From ea229ea7f3aec46bb52bbeeffb6c697683c7efc0 Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Mon, 25 May 2026 10:25:10 -0600
Subject: [PATCH 01/26] feat(runtime): server-authoritative resumable chat
 turns (RunBus)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Decouple a chat turn's lifecycle from the originating HTTP request. A turn
now runs to completion on the server regardless of the client connection;
the client is a viewer that attaches to a replayable per-conversation event
log (RunBus), replays the in-flight turn, then tails live events. Refresh /
conversation-switch / disconnect never lose or duplicate work — they detach
and re-attach. Only the Stop button (RunBus.cancel) aborts generation.

- RunBus: in-memory, replayable, monotonic-seq turn log with grace-window
  retention for late re-attach; threads its own AbortSignal into the engine.
- runtime.startTurn: detached turn driver; seeds user.message into the log.
  Runtime also exposes isTurnActive / activeTurnConversationIds / turnSeq /
  getTurnReplay / attachTurn / cancelTurn.
- Per-conversation SSE: ConversationEventManager + /v1/conversations/:id/events
  route with subscribed{isActive} frame + buffered replay; /v1/chat/start and
  cancel endpoints.
- Emit conversation.title (workspace-scoped) + data.changed (global) on the
  workspace-level SSE when a title generates, so viewers update without a
  turn-stream connection.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 src/api/conversation-events.ts              |  53 ++++-
 src/api/events.ts                           |   5 +
 src/api/handlers.ts                         |  77 ++++++
 src/api/routes/chat.ts                      |  62 +++--
 src/api/routes/conversation-events.ts       |  29 ++-
 src/api/server.ts                           |   7 +
 src/conversation/event-sourced-store.ts     |   2 +-
 src/conversation/types.ts                   |   4 +
 src/engine/types.ts                         |   1 +
 src/runtime/run-bus.ts                      | 247 ++++++++++++++++++++
 src/runtime/runtime.ts                      | 203 +++++++++++++++-
 test/integration/detached-turn-http.test.ts | 120 ++++++++++
 test/integration/detached-turn.test.ts      |  99 ++++++++
 test/unit/run-bus.test.ts                   | 154 ++++++++++++
 14 files changed, 1025 insertions(+), 38 deletions(-)
 create mode 100644 src/runtime/run-bus.ts
 create mode 100644 test/integration/detached-turn-http.test.ts
 create mode 100644 test/integration/detached-turn.test.ts
 create mode 100644 test/unit/run-bus.test.ts
diff --git a/src/api/conversation-events.ts b/src/api/conversation-events.ts
index 368110e6..e36a3c3e 100644
--- a/src/api/conversation-events.ts
+++ b/src/api/conversation-events.ts
@@ -8,6 +8,8 @@
  * Separate from SseEventManager which handles workspace-level events.
  */
 
+import type { BufferedRunEvent } from "../runtime/run-bus.ts";
+
 /** A subscriber watching a specific conversation's events. */
 interface ConversationSubscriber {
   id: string;
@@ -19,6 +21,13 @@ interface ConversationSubscriber {
 
 const encoder = new TextEncoder();
 
+/** Encode one SSE frame. A non-null `seq` is written as the `id:` line so a
+ *  reconnecting viewer can resume from the last sequence number it saw. */
+function frame(eventType: string, data: unknown, seq?: number): Uint8Array {
+  const id = seq == null ? "" : `id: ${seq}\n`;
+  return encoder.encode(`event: ${eventType}\n${id}data: ${JSON.stringify(data)}\n\n`);
+}
+
 export class ConversationEventManager {
   private subscribers = new Map<string, ConversationSubscriber>();
   private heartbeatTimer: ReturnType<typeof setInterval> | null = null;
@@ -73,6 +82,8 @@ export class ConversationEventManager {
   addSubscriber(
     conversationId: string,
     userId: string,
+    replay?: BufferedRunEvent[],
+    meta?: { isActive: boolean; activeSeq: number },
   ): { stream: ReadableStream<Uint8Array>; subscriberId: string } {
     const id = crypto.randomUUID();
     let sub: ConversationSubscriber;
@@ -80,9 +91,24 @@ export class ConversationEventManager {
     const stream = new ReadableStream<Uint8Array>({
       start: (controller) => {
         sub = { id, userId, conversationId, controller, closed: false };
+        // The subscribed frame tells the client whether a turn is in flight
+        // (so it can trim a stale in-flight turn from disk history before the
+        // RunBus replay rebuilds it) and its current seq.
+        controller.enqueue(
+          frame("subscribed", {
+            subscriberId: id,
+            isActive: meta?.isActive ?? false,
+            activeSeq: meta?.activeSeq ?? 0,
+          }),
+        );
+        // Replay the in-flight turn (if any) BEFORE registering for live
+        // fan-out. start() runs synchronously and we add to the subscribers
+        // map only after replaying, so no live event can interleave ahead of
+        // the replay — viewers never see out-of-order deltas.
+        if (replay) {
+          for (const e of replay) controller.enqueue(frame(e.type, e.data, e.seq));
+        }
         this.subscribers.set(id, sub);
-        const subscribedMsg = `event: subscribed\ndata: ${JSON.stringify({ subscriberId: id })}\n\n`;
-        controller.enqueue(encoder.encode(subscribedMsg));
       },
       cancel: () => {
         this.removeSubscriber(id);
@@ -92,6 +118,29 @@ export class ConversationEventManager {
     return { stream, subscriberId: id };
   }
 
+  /**
+   * Deliver one live run event, tagged with its sequence number, to every
+   * subscriber watching `conversationId`. Viewers use the seq to discard
+   * events they already got from replay and to resume after a reconnect.
+   */
+  publishEvent(conversationId: string, event: BufferedRunEvent): void {
+    const payload = frame(event.type, event.data, event.seq);
+    for (const [subscriberId, subscriber] of this.subscribers) {
+      if (subscriber.closed) {
+        // Prune subscribers already flagged closed, whatever they watched.
+        this.subscribers.delete(subscriberId);
+      } else if (subscriber.conversationId === conversationId) {
+        try {
+          subscriber.controller.enqueue(payload);
+        } catch (err) {
+          console.warn("[conversation-events] SSE write failed:", err);
+          this.closeSub(subscriber);
+          this.subscribers.delete(subscriberId);
+        }
+      }
+    }
+  }
+
   /** Remove a specific subscriber. */
   removeSubscriber(subscriberId: string): void {
     const sub = this.subscribers.get(subscriberId);
diff --git a/src/api/events.ts b/src/api/events.ts
index 235da077..e2f96572 100644
--- a/src/api/events.ts
+++ b/src/api/events.ts
@@ -59,6 +59,11 @@ const SSE_ROUTES: Partial<Record<EngineEventType, SseRoute>> = {
   // existing "broadcast to all clients in this process" behavior to avoid
   // silently breaking iframe refresh. Revisit when payload grows wsId.
   "data.changed": { scope: "global" },
+  // Live conversation-title update (auto-title generation completes after the
+  // turn). Workspace-scoped via the conversation's workspaceId breadcrumb so
+  // it doesn't leak across tenants. The shell routes it to the matching
+  // conversation slice by `conversationId`.
+  "conversation.title": { scope: "workspace", wsIdField: "wsId" },
   // Org-level config (model preferences, feature flags). Affects every
   // workspace; broadcast to all.
   "config.changed": { scope: "global" },
diff --git a/src/api/handlers.ts b/src/api/handlers.ts
index 1988d0fa..26dfede0 100644
--- a/src/api/handlers.ts
+++ b/src/api/handlers.ts
@@ -8,6 +8,7 @@ import { ingestFiles, isAllowedMime, type UploadedFile } from "../files/ingest.t
 import { createFileStore } from "../files/store.ts";
 import type { FileEntry } from "../files/types.ts";
 import type { IdentityProvider, UserIdentity } from "../identity/provider.ts";
+import { DEV_IDENTITY } from "../identity/providers/dev.ts";
 import {
   ConversationAccessDeniedError,
   ConversationCorruptedError,
@@ -141,6 +142,82 @@ function runInProgressResponse(conversationId: string): Response {
   );
 }
 
+/**
+ * Handle POST /v1/chat/start — kick off a detached, server-authoritative turn
+ * and return the conversation id immediately. The turn runs to completion on
+ * the server regardless of this request's lifecycle (closing the tab does NOT
+ * cancel it). Clients watch the turn via GET /v1/conversations/:id/events,
+ * which replays the in-flight turn then tails live.
+ */
+export async function handleChatStart(
+  request: Request,
+  runtime: Runtime,
+  features: ResolvedFeatures,
+  identity?: UserIdentity,
+  workspaceId?: string,
+): Promise<Response> {
+  const parsed = await parseChatBody(request, runtime, features, identity, workspaceId);
+  if (parsed instanceof Response) return parsed;
+  try {
+    const { conversationId } = await runtime.startTurn(parsed);
+    return Response.json({ conversationId });
+  } catch (err) {
+    if (err instanceof RunInProgressError) {
+      return runInProgressResponse(parsed.conversationId ?? "");
+    }
+    if (err instanceof ConversationAccessDeniedError) {
+      return apiError(
+        403,
+        "conversation_access_denied",
+        "You do not have access to this conversation.",
+        { conversationId: parsed.conversationId },
+      );
+    }
+    throw err;
+  }
+}
+
+/**
+ * Handle POST /v1/conversations/:id/cancel — the explicit Stop button. The
+ * ONLY thing that aborts generation; client disconnect does not. Ownership is
+ * enforced (same posture as the events route).
+ */
+export async function handleChatCancel(
+  conversationId: string,
+  runtime: Runtime,
+  identity?: UserIdentity,
+): Promise<Response> {
+  const callerId = identity?.id ?? (runtime.getIdentityProvider() ? null : DEV_IDENTITY.id);
+  if (!callerId) {
+    return apiError(401, "authentication_required", "Authentication required.");
+  }
+  const conversation = await runtime.findConversation(conversationId).catch((err) => {
+    if (err instanceof ConversationCorruptedError) return err;
+    throw err;
+  });
+  if (conversation instanceof ConversationCorruptedError) {
+    return apiError(422, "conversation_corrupted", conversation.message, {
+      conversationId: conversation.conversationId,
+      reason: conversation.reason,
+    });
+  }
+  if (!conversation) {
+    return apiError(404, "not_found", "Conversation not found");
+  }
+  if (conversation.ownerId !== callerId) {
+    return apiError(
+      403,
+      "conversation_access_denied",
+      "You do not have access to this conversation.",
+      {
+        conversationId,
+      },
+    );
+  }
+  const cancelled = runtime.cancelTurn(conversationId);
+  return Response.json({ cancelled });
+}
+
 function conversationAccessDeniedResponse(conversationId: string): Response {
   return apiError(
     403,
diff --git a/src/api/routes/chat.ts b/src/api/routes/chat.ts
index 5ec79d3a..f14405fb 100644
--- a/src/api/routes/chat.ts
+++ b/src/api/routes/chat.ts
@@ -1,5 +1,5 @@
 import { Hono } from "hono";
-import { handleChat, handleChatStream } from "../handlers.ts";
+import { handleChat, handleChatCancel, handleChatStart, handleChatStream } from "../handlers.ts";
 import { requireAuth } from "../middleware/auth.ts";
 import { bodyLimit } from "../middleware/body-limit.ts";
 import { errorLog } from "../middleware/error-log.ts";
@@ -15,28 +15,40 @@ export function chatRoutes(ctx: AppContext) {
   const chatBodyLimit = bodyLimit(1_048_576, {
     multipart: ctx.runtime.getFilesConfig().maxTotalSize,
   });
-  return new Hono<AppEnv>()
-    .use("*", requireAuth(ctx.authOptions))
-    .use("*", requireWorkspace(ctx.workspaceStore))
-    .use("*", errorLog(ctx))
-    .post("/v1/chat", chatBodyLimit, rl, (c) =>
-      handleChat(
-        c.req.raw,
-        ctx.runtime,
-        ctx.features,
-        c.var.identity,
-        c.var.workspaceId,
-        ctx.conversationEventManager,
-      ),
-    )
-    .post("/v1/chat/stream", chatBodyLimit, rl, (c) =>
-      handleChatStream(
-        c.req.raw,
-        ctx.runtime,
-        ctx.features,
-        c.var.identity,
-        c.var.workspaceId,
-        ctx.conversationEventManager,
-      ),
-    );
+  return (
+    new Hono<AppEnv>()
+      .use("*", requireAuth(ctx.authOptions))
+      .use("*", requireWorkspace(ctx.workspaceStore))
+      .use("*", errorLog(ctx))
+      .post("/v1/chat", chatBodyLimit, rl, (c) =>
+        handleChat(
+          c.req.raw,
+          ctx.runtime,
+          ctx.features,
+          c.var.identity,
+          c.var.workspaceId,
+          ctx.conversationEventManager,
+        ),
+      )
+      .post("/v1/chat/stream", chatBodyLimit, rl, (c) =>
+        handleChatStream(
+          c.req.raw,
+          ctx.runtime,
+          ctx.features,
+          c.var.identity,
+          c.var.workspaceId,
+          ctx.conversationEventManager,
+        ),
+      )
+      // Server-authoritative entry point: starts a detached turn and returns
+      // the conversation id immediately. The client then watches via
+      // GET /v1/conversations/:id/events. Generation survives client disconnect.
+      .post("/v1/chat/start", chatBodyLimit, rl, (c) =>
+        handleChatStart(c.req.raw, ctx.runtime, ctx.features, c.var.identity, c.var.workspaceId),
+      )
+      // Explicit Stop — the only way to abort an in-flight turn.
+      .post("/v1/conversations/:id/cancel", (c) =>
+        handleChatCancel(c.req.param("id"), ctx.runtime, c.var.identity),
+      )
+  );
 }
diff --git a/src/api/routes/conversation-events.ts b/src/api/routes/conversation-events.ts
index 0b150026..d0acdf4f 100644
--- a/src/api/routes/conversation-events.ts
+++ b/src/api/routes/conversation-events.ts
@@ -92,13 +92,28 @@ export function conversationEventRoutes(ctx: AppContext) {
         );
       }
 
-      // Create SSE stream for this subscriber. The first frame
-      // (event: subscribed) carries the server-generated subscriberId
-      // so the client can pass it back as `X-Origin-Subscriber-Id` on
-      // any chat-stream POST it originates — that prevents the
-      // chat-stream's broadcast from echoing back to this same
-      // subscription.
-      const { stream } = ctx.conversationEventManager.addSubscriber(conversationId, callerId);
+      // Resume point: the client passes the highest sequence number it has
+      // already rendered (0 / absent = full replay of the in-flight turn).
+      const afterSeqRaw = c.req.query("afterSeq");
+      const afterSeq = afterSeqRaw ? Number.parseInt(afterSeqRaw, 10) : 0;
+      const replay = ctx.runtime.getTurnReplay(
+        conversationId,
+        Number.isFinite(afterSeq) ? afterSeq : 0,
+      );
+
+      // Create the SSE stream. The manager replays the buffered in-flight turn
+      // (events with seq > afterSeq) before registering for live fan-out, so a
+      // page refresh reconstructs the in-progress assistant message and then
+      // tails the rest with no gap or duplication.
+      const { stream } = ctx.conversationEventManager.addSubscriber(
+        conversationId,
+        callerId,
+        replay,
+        {
+          isActive: ctx.runtime.isTurnActive(conversationId),
+          activeSeq: ctx.runtime.turnSeq(conversationId),
+        },
+      );
 
       return new Response(stream, {
         headers: {
diff --git a/src/api/server.ts b/src/api/server.ts
index 3c1c3122..5b4288d9 100644
--- a/src/api/server.ts
+++ b/src/api/server.ts
@@ -73,6 +73,13 @@ export function startServer(options: ServerOptions): ServerHandle {
   const conversationEventManager = new ConversationEventManager();
   conversationEventManager.start();
 
+  // Bridge detached-turn events (RunBus) to the per-conversation SSE manager
+  // so connected viewers tail live. Replay-on-connect is sourced separately
+  // from the RunBus buffer (see the conversation-events route).
+  runtime.onTurnEvent = (conversationId, event) => {
+    conversationEventManager.publishEvent(conversationId, event);
+  };
+
   // Login rate limiter — per-IP brute-force protection
   const rateLimiter = new LoginRateLimiter();
   rateLimiter.start();
diff --git a/src/conversation/event-sourced-store.ts b/src/conversation/event-sourced-store.ts
index 7b3e5a45..e386f6c0 100644
--- a/src/conversation/event-sourced-store.ts
+++ b/src/conversation/event-sourced-store.ts
@@ -129,7 +129,7 @@ export class EventSourcedConversationStore implements ConversationStore, EventSi
   // =========================================================================
 
   async create(options: CreateConversationOptions): Promise<Conversation> {
-    const id = `conv_${crypto.randomUUID().replace(/-/g, "").slice(0, 16)}`;
+    const id = options.id ?? `conv_${crypto.randomUUID().replace(/-/g, "").slice(0, 16)}`;
     const now = new Date().toISOString();
     const conversation: Conversation = {
       id,
diff --git a/src/conversation/types.ts b/src/conversation/types.ts
index 69016424..133d536b 100644
--- a/src/conversation/types.ts
+++ b/src/conversation/types.ts
@@ -75,6 +75,10 @@ export interface CreateConversationOptions {
   workspaceId?: string;
   ownerId: string;
   metadata?: Record<string, unknown>;
+  /** Create with a specific id instead of a generated one. Used by the
+   *  detached-turn path so the conversation id is known to the caller before
+   *  the engine run starts. */
+  id?: string;
 }
 
 /** Fields that can be updated on a conversation. */
diff --git a/src/engine/types.ts b/src/engine/types.ts
index a320be3e..b20ade40 100644
--- a/src/engine/types.ts
+++ b/src/engine/types.ts
@@ -95,6 +95,7 @@ export type EngineEventType =
    */
   | "connection.state_changed"
   | "data.changed"
+  | "conversation.title"
   | "config.changed"
   | "skill.created"
   | "skill.updated"
diff --git a/src/runtime/run-bus.ts b/src/runtime/run-bus.ts
new file mode 100644
index 00000000..f69cc31e
--- /dev/null
+++ b/src/runtime/run-bus.ts
@@ -0,0 +1,247 @@
+/**
+ * RunBus — server-authoritative, replayable per-conversation turn log.
+ *
+ * A chat turn runs to completion on the server regardless of any client
+ * connection. The RunBus is the in-memory source of truth for an in-flight
+ * turn: it owns the turn's cancellation handle, an ordered event log with
+ * monotonic sequence numbers, and the set of live subscribers.
+ *
+ * Why it exists (issue #254 follow-up — conversation-tab rewrite):
+ *   - The client is a *viewer*. It attaches to a run, replays everything
+ *     emitted so far (so a page refresh reconstructs the in-progress
+ *     assistant message), then tails live events. Disconnect / refresh /
+ *     conversation-switch never lose or duplicate work — they just detach
+ *     and re-attach.
+ *   - The turn's lifecycle is decoupled from the originating HTTP request.
+ *     Closing the tab does NOT abort generation; only an explicit
+ *     {@link RunBus.cancel} (the Stop button) does.
+ *
+ * Scope: single-process, in-memory. Multi-replica (`platform.replicas > 1`)
+ * needs a Redis-backed log + conversationId-sticky routing — deferred,
+ * mirrors the `SessionRegistry` pattern.
+ */
+
+import { RunInProgressError } from "./errors.ts";
+
+export type RunStatus = "running" | "done" | "error" | "cancelled";
+
+/** A single buffered event in a run's log. `seq` is 1-based and monotonic. */
+export interface BufferedRunEvent {
+  seq: number;
+  type: string;
+  data: unknown;
+}
+
+interface RunLog {
+  conversationId: string;
+  seq: number;
+  events: BufferedRunEvent[];
+  status: RunStatus;
+  startedAt: number;
+  endedAt?: number;
+  abort: AbortController;
+  eventListeners: Set<(e: BufferedRunEvent) => void>;
+  endListeners: Set<(s: RunStatus) => void>;
+  gcTimer?: ReturnType<typeof setTimeout>;
+}
+
+/** Detach callback returned by {@link RunBus.attach}. */
+export type DetachFn = () => void;
+
+export class RunBus {
+  private runs = new Map<string, RunLog>();
+  /** How long a terminal run's log is retained for late re-attach. */
+  private readonly graceMs: number;
+
+  constructor(graceMs = 30_000) {
+    this.graceMs = graceMs;
+  }
+
+  /**
+   * Begin a turn for a conversation. Throws {@link RunInProgressError} if one
+   * is already running. Returns the turn's `AbortSignal` — the engine threads
+   * this (NOT the HTTP request's signal), so generation survives client
+   * disconnect and is only stopped by {@link cancel}.
+   */
+  begin(conversationId: string): AbortSignal {
+    const existing = this.runs.get(conversationId);
+    if (existing && existing.status === "running") {
+      throw new RunInProgressError(conversationId);
+    }
+    // A terminal log lingering in its grace window is replaced by the new turn.
+    if (existing?.gcTimer) clearTimeout(existing.gcTimer);
+
+    const log: RunLog = {
+      conversationId,
+      seq: 0,
+      events: [],
+      status: "running",
+      startedAt: Date.now(),
+      abort: new AbortController(),
+      eventListeners: new Set(),
+      endListeners: new Set(),
+    };
+    this.runs.set(conversationId, log);
+    return log.abort.signal;
+  }
+
+  /** Whether a turn is currently generating for this conversation. */
+  isActive(conversationId: string): boolean {
+    return this.runs.get(conversationId)?.status === "running";
+  }
+
+  /** Last sequence number assigned for this conversation's current/last run. */
+  currentSeq(conversationId: string): number {
+    return this.runs.get(conversationId)?.seq ?? 0;
+  }
+
+  /** Status of the conversation's current/last (still-retained) run. */
+  getStatus(conversationId: string): RunStatus | undefined {
+    return this.runs.get(conversationId)?.status;
+  }
+
+  /** Conversation ids with an actively generating turn. */
+  activeConversationIds(): string[] {
+    const ids: string[] = [];
+    for (const [id, log] of this.runs) {
+      if (log.status === "running") ids.push(id);
+    }
+    return ids;
+  }
+
+  /**
+   * Append an event to the run's log and fan it out to live subscribers.
+   * No-op if the run isn't active (defensive — late engine events after a
+   * cancel shouldn't resurrect a terminated log).
+   */
+  publish(conversationId: string, type: string, data: unknown): BufferedRunEvent | null {
+    const log = this.runs.get(conversationId);
+    if (!log || log.status !== "running") return null;
+    log.seq += 1;
+    const evt: BufferedRunEvent = { seq: log.seq, type, data };
+    log.events.push(evt);
+    for (const fn of log.eventListeners) {
+      try {
+        fn(evt);
+      } catch {
+        // A failing subscriber must not break the fan-out to others.
+      }
+    }
+    return evt;
+  }
+
+  /**
+   * Snapshot of buffered events with `seq > afterSeq` (no live subscription).
+   * Used to replay an in-progress turn to a freshly connecting SSE subscriber
+   * before it starts receiving live fan-out. Empty if no retained run.
+   */
+  bufferedSince(conversationId: string, afterSeq: number): BufferedRunEvent[] {
+    const log = this.runs.get(conversationId);
+    if (!log) return [];
+    return log.events.filter((e) => e.seq > afterSeq);
+  }
+
+  /** Mark a run terminal, notify end-listeners, and schedule log GC. */
+  end(conversationId: string, status: Exclude<RunStatus, "running">): void {
+    const log = this.runs.get(conversationId);
+    if (!log || log.status !== "running") return;
+    log.status = status;
+    log.endedAt = Date.now();
+    for (const fn of log.endListeners) {
+      try {
+        fn(status);
+      } catch {
+        // ignore
+      }
+    }
+    this.scheduleGc(log);
+  }
+
+  /**
+   * Explicitly cancel an active run (the Stop button). Aborts the turn's signal
+   * (engine stops cooperatively) and marks it `cancelled`; later publishes no-op.
+   */
+  cancel(conversationId: string): boolean {
+    const log = this.runs.get(conversationId);
+    if (!log || log.status !== "running") return false;
+    log.abort.abort();
+    this.end(conversationId, "cancelled");
+    return true;
+  }
+
+  /**
+   * Attach a viewer. Synchronously replays every buffered event with
+   * `seq > afterSeq`, then streams live events as they're published. If the
+   * run is already terminal, replays the tail then fires `onEnd`.
+   *
+   * Pass `afterSeq = 0` for a fresh attach (full replay), or the highest seq
+   * the client already rendered (from a prior connection) to resume without
+   * gaps or duplicates.
+   *
+   * Returns a detach function. No-op attach (returns a noop) when there's no
+   * retained run for the conversation — the caller then renders only
+   * persisted history.
+   */
+  attach(
+    conversationId: string,
+    afterSeq: number,
+    onEvent: (e: BufferedRunEvent) => void,
+    onEnd?: (s: RunStatus) => void,
+  ): DetachFn {
+    const log = this.runs.get(conversationId);
+    if (!log) return () => {};
+
+    // Snapshot the replay set before registering the live listener. JS is
+    // single-threaded and publish() is synchronous, so nothing can interleave
+    // between the filter and the add — no gaps, no double-delivery.
+    const replay = log.events.filter((e) => e.seq > afterSeq);
+    const liveListener = (e: BufferedRunEvent) => onEvent(e);
+    log.eventListeners.add(liveListener);
+
+    let endListener: ((s: RunStatus) => void) | undefined;
+    if (onEnd) {
+      endListener = (s) => onEnd(s);
+      log.endListeners.add(endListener);
+    }
+
+    for (const e of replay) onEvent(e);
+    // Already-terminal run: deliver the terminal status after the replay.
+    if (log.status !== "running" && onEnd) onEnd(log.status);
+
+    return () => {
+      log.eventListeners.delete(liveListener);
+      if (endListener) log.endListeners.delete(endListener);
+    };
+  }
+
+  /** Drop a retained terminal log immediately (test/GC helper). */
+  evict(conversationId: string): void {
+    const log = this.runs.get(conversationId);
+    if (log?.gcTimer) clearTimeout(log.gcTimer);
+    this.runs.delete(conversationId);
+  }
+
+  /** Cancel all active runs and clear state (shutdown / reset). */
+  reset(): void {
+    for (const log of this.runs.values()) {
+      if (log.gcTimer) clearTimeout(log.gcTimer);
+      if (log.status === "running") log.abort.abort();
+    }
+    this.runs.clear();
+  }
+
+  private scheduleGc(log: RunLog): void {
+    if (this.graceMs <= 0) {
+      this.runs.delete(log.conversationId);
+      return;
+    }
+    log.gcTimer = setTimeout(() => {
+      // Only GC if a newer run hasn't replaced this one.
+      if (this.runs.get(log.conversationId) === log) {
+        this.runs.delete(log.conversationId);
+      }
+    }, this.graceMs);
+    // Don't keep the process alive solely for log GC.
+    log.gcTimer.unref?.();
+  }
+}
diff --git a/src/runtime/runtime.ts b/src/runtime/runtime.ts
index d6497409..96ad3c41 100644
--- a/src/runtime/runtime.ts
+++ b/src/runtime/runtime.ts
@@ -95,6 +95,7 @@ import {
   type RequestContext,
   runWithRequestContext,
 } from "./request-context.ts";
+import { type BufferedRunEvent, RunBus, type RunStatus } from "./run-bus.ts";
 import { buildSkillsLoadedPayload } from "./skills-loaded-payload.ts";
 import { surfaceTools } from "./tools.ts";
 import type { ChatRequest, ChatResult, ModelSlots, RuntimeConfig, TurnUsage } from "./types.ts";
@@ -254,6 +255,14 @@ export class Runtime {
    */
   private readonly activeConversations = new Set<string>();
 
+  /**
+   * Server-authoritative, replayable log of in-flight turns. Detached web
+   * chats run through {@link startTurn}; their engine events are published
+   * here so any viewer (live, reconnecting, or cross-tab) can replay + tail.
+   * The turn's cancellation lives here too — client disconnect does NOT abort.
+   */
+  private readonly runBus = new RunBus();
+
   private constructor(
     _engine: AgentEngine,
     resolveModelFn: (modelString: string) => LanguageModelV3,
@@ -726,6 +735,183 @@ export class Runtime {
     }
   }
 
+  // ===========================================================================
+  // Detached, server-authoritative turns (conversation-tab rewrite).
+  //
+  // `startTurn` runs a chat turn to completion regardless of the caller's
+  // connection. The conversation id is resolved up front and returned
+  // immediately; the engine run continues in the background, publishing every
+  // event to the RunBus. Clients are viewers — they `attachTurn` to replay +
+  // tail. Client disconnect does NOT abort; only `cancelTurn` (Stop) does.
+  // ===========================================================================
+
+  /** Whether a detached turn is currently generating for this conversation. */
+  isTurnActive(conversationId: string): boolean {
+    return this.runBus.isActive(conversationId);
+  }
+
+  /** Conversation ids with an actively generating turn (drives the list dot). */
+  activeTurnConversationIds(): string[] {
+    return this.runBus.activeConversationIds();
+  }
+
+  /** Highest event sequence number for a conversation's current/last run. */
+  turnSeq(conversationId: string): number {
+    return this.runBus.currentSeq(conversationId);
+  }
+
+  /**
+   * Attach a viewer to a conversation's in-flight turn: replays buffered
+   * events with `seq > afterSeq`, then tails live ones. Returns a detach fn
+   * (a safe no-op when nothing is running). Detaching never cancels the turn.
+   */
+  attachTurn(
+    conversationId: string,
+    afterSeq: number,
+    onEvent: (e: BufferedRunEvent) => void,
+    onEnd?: (s: RunStatus) => void,
+  ): () => void {
+    return this.runBus.attach(conversationId, afterSeq, onEvent, onEnd);
+  }
+
+  /** Stop button: publish `cancelled` first (the bus drops post-end events), then abort. */
+  cancelTurn(conversationId: string): boolean {
+    this.publishTurnEvent(conversationId, "cancelled", {});
+    return this.runBus.cancel(conversationId);
+  }
+
+  /**
+   * Start a chat turn that runs to completion server-side, decoupled from the
+   * caller's connection. Resolves (creating if new) the conversation id up
+   * front, reserves the run on the RunBus, then runs the engine in the
+   * background — publishing every event to the bus so viewers can replay +
+   * tail via {@link attachTurn}. Returns once the id is known; the turn keeps
+   * running after the HTTP request that called this returns. Throws
+   * {@link RunInProgressError} if a turn is already active for the conversation.
+   */
+  async startTurn(request: ChatRequest): Promise<{ conversationId: string }> {
+    if (!request.workspaceId) {
+      throw new Error("workspaceId is required. Every chat request must be workspace-scoped.");
+    }
+    const store = this.findConversationStore();
+    const ownerId = this.resolveOwnerId(request);
+    const createOpts: CreateConversationOptions = {
+      ownerId,
+      workspaceId: request.workspaceId,
+      ...(request.metadata ? { metadata: request.metadata } : {}),
+    };
+
+    let isNew = true;
+    let conversationId: string;
+    if (request.conversationId) {
+      const existing = await store.load(request.conversationId);
+      if (existing && existing.ownerId !== ownerId) {
+        throw new ConversationAccessDeniedError(request.conversationId, ownerId);
+      }
+      isNew = !existing;
+      conversationId =
+        existing?.id ?? (await store.create({ ...createOpts, id: request.conversationId })).id;
+    } else {
+      conversationId = (await store.create(createOpts)).id;
+    }
+
+    // Reserve the run (throws if already active). The returned signal is the
+    // RunBus's — NOT the HTTP request's — so client disconnect won't abort.
+    const signal = this.runBus.begin(conversationId);
+
+    // Seed the run stream with the user's message so the turn is
+    // self-contained: any viewer (sender, other tab, post-refresh) can
+    // reconstruct user + assistant from replay alone, no optimistic client
+    // state required.
+    this.publishTurnEvent(conversationId, "user.message", {
+      content: request.message,
+      ...(ownerId ? { userId: ownerId } : {}),
+      timestamp: new Date().toISOString(),
+    });
+
+    // Tell conversation-list UIs when this call created the conversation — also
+    // via a caller-supplied id — so its row + streaming dot appear immediately.
+    if (isNew) this.emitConversationsChanged();
+
+    const busSink = this.createRunBusSink(conversationId);
+    // Detached: run to completion regardless of the caller's connection.
+    void this.chat({ ...request, conversationId, signal }, busSink)
+      .then((result) => {
+        // Publish a terminal `done` carrying the final result so viewers
+        // finalize the assistant message, then close the run.
+        this.publishTurnEvent(conversationId, "done", {
+          response: result.response,
+          conversationId: result.conversationId,
+          toolCalls: result.toolCalls,
+          stopReason: result.stopReason,
+          usage: result.usage,
+        });
+        this.runBus.end(conversationId, "done");
+      })
+      .catch((err) => {
+        if (signal.aborted) {
+          this.publishTurnEvent(conversationId, "cancelled", {});
+          this.runBus.end(conversationId, "cancelled");
+        } else {
+          this.publishTurnEvent(conversationId, "error", {
+            error: "engine_error",
+            message: err instanceof Error ? err.message : String(err),
+          });
+          this.runBus.end(conversationId, "error");
+        }
+      })
+      .finally(() => {
+        // Refresh list UIs so the row's dot clears and the final title shows.
+        this.emitConversationsChanged();
+      });
+
+    return { conversationId };
+  }
+
+  /**
+   * Live fan-out hook for detached-turn events. The API layer sets this to
+   * forward each published event to the per-conversation SSE manager so
+   * connected viewers tail in real time. Buffering/replay stays in the RunBus;
+   * this is purely the live edge.
+   */
+  onTurnEvent?: (conversationId: string, event: BufferedRunEvent) => void;
+
+  /** Replay snapshot of an in-flight turn for a newly connecting viewer. */
+  getTurnReplay(conversationId: string, afterSeq: number): BufferedRunEvent[] {
+    return this.runBus.bufferedSince(conversationId, afterSeq);
+  }
+
+  /** Publish to the RunBus (buffer/replay) and fan out live (SSE viewers). */
+  private publishTurnEvent(conversationId: string, type: string, data: unknown): void {
+    const buffered = this.runBus.publish(conversationId, type, data);
+    if (buffered) this.onTurnEvent?.(conversationId, buffered);
+  }
+
+  /** EventSink that forwards engine events into the RunBus for one turn. */
+  private createRunBusSink(conversationId: string): EventSink {
+    return {
+      emit: (event: EngineEvent) => {
+        this.publishTurnEvent(conversationId, event.type, event.data);
+      },
+    };
+  }
+
+  /** Broadcast a conversations-list change on the global sink (→ SSE → iframe). */
+  private emitConversationsChanged(): void {
+    this.defaultEvents.emit({
+      type: "data.changed",
+      data: { server: "conversations", tool: "list" },
+    });
+  }
+
+  private resolveOwnerId(request: ChatRequest): string {
+    if (request.identity?.id) return request.identity.id;
+    if (!this._identityProvider) return "usr_default";
+    throw new Error(
+      "[runtime.startTurn] no identity on request — the auth middleware must populate " +
+        "request.identity before the turn starts.",
+    );
+  }
+
   private async _chatInner(request: ChatRequest, requestSink?: EventSink): Promise<ChatResult> {
     if (!request.workspaceId) {
       throw new Error("workspaceId is required. Every chat request must be workspace-scoped.");
@@ -1211,15 +1397,33 @@ export class Runtime {
       });
     }
 
-    // Fire-and-forget title generation on first turn (use "fast" slot for cost savings)
+    // Fire-and-forget title generation on first turn (use "fast" slot for cost
+    // savings). Decoupled from the turn lifecycle: when it resolves we persist
+    // the title, then broadcast `conversation.title` on the global SSE so any
+    // live viewer's panel header updates in place, and refresh the
+    // conversations list. The global channel (not the turn stream, which the
+    // client closes on `done`) means delivery is reliable after the turn ends
+    // and across tabs — routed to the right conversation by `conversationId`.
     if (conversation.title === null) {
       const titleModel = this.resolveModelFn(this.getModelSlot("fast"));
       const titleInput =
         request.message ||
         `[Uploaded: ${request.fileRefs?.map((f) => f.filename).join(", ") || "files"}]`;
       void generateTitle(titleModel, titleInput, result.output).then(
-        (title) => {
-          void store.update(conversation.id, { title });
+        async (title) => {
+          // A throw in this fulfilment handler is NOT routed to the sibling
+          // rejection handler below, and the chain is `void`-ed — so a failed
+          // persist/broadcast must be caught here or it goes unhandled.
+          try {
+            await store.update(conversation.id, { title });
+            this.defaultEvents.emit({
+              type: "conversation.title",
+              data: { conversationId: conversation.id, title, wsId },
+            });
+            this.emitConversationsChanged();
+          } catch (err) {
+            console.error("[runtime] title persist/broadcast failed:", err);
+          }
         },
         (err) => console.error("[runtime] title generation failed:", err),
       );
diff --git a/test/integration/detached-turn-http.test.ts b/test/integration/detached-turn-http.test.ts
new file mode 100644
index 00000000..c79d52ee
--- /dev/null
+++ b/test/integration/detached-turn-http.test.ts
@@ -0,0 +1,120 @@
+import { afterAll, beforeAll, describe, expect, it } from "bun:test";
+import { mkdirSync, rmSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import { type ServerHandle, startServer } from "../../src/api/server.ts";
+import { Runtime } from "../../src/runtime/runtime.ts";
+import { createEchoModel } from "../helpers/echo-model.ts";
+import { TEST_WORKSPACE_ID, provisionTestWorkspace } from "../helpers/test-workspace.ts";
+
+let runtime: Runtime;
+let handle: ServerHandle;
+let baseUrl: string;
+const testDir = join(tmpdir(), `nimblebrain-detached-http-${Date.now()}`); // timestamped scratch dir under the OS temp dir
+
+beforeAll(async () => {
+  mkdirSync(testDir, { recursive: true });
+  runtime = await Runtime.start({
+    model: { provider: "custom", adapter: createEchoModel() }, // echo adapter from the test helpers stands in for a real model
+    noDefaultBundles: true,
+    logging: { disabled: true },
+    workDir: testDir,
+  });
+  await provisionTestWorkspace(runtime);
+  handle = startServer({ runtime, port: 0 }); // port 0 requested; the actual port is read back from the handle below
+  baseUrl = `http://localhost:${handle.port}`;
+});
+
+afterAll(async () => {
+  handle.stop(true); // stop the HTTP server before shutting the runtime down
+  await runtime.shutdown();
+  rmSync(testDir, { recursive: true, force: true });
+});
+
+/** Read an SSE response body for a bounded window, returning event types seen. */
+async function readSse(res: Response, ms: number): Promise<string[]> {
+  const reader = res.body!.getReader();
+  const decoder = new TextDecoder();
+  const types: string[] = [];
+  let buffer = "";
+  let timer: ReturnType<typeof setTimeout> | undefined;
+  // One window-wide timer (cleared in `finally`) instead of a fresh, never-cleared one per read.
+  const timedOut = new Promise<{ done: true; value: undefined }>((resolve) => {
+    timer = setTimeout(() => resolve({ done: true, value: undefined }), ms);
+  });
+  try {
+    for (;;) {
+      const chunk = await Promise.race([reader.read(), timedOut]);
+      if (chunk.done || !chunk.value) break;
+      buffer += decoder.decode(chunk.value, { stream: true });
+      const lines = buffer.split("\n");
+      buffer = lines.pop() ?? "";
+      for (const line of lines) {
+        if (line.startsWith("event: ")) types.push(line.slice(7).trim());
+      }
+    }
+  } finally {
+    clearTimeout(timer);
+    await reader.cancel().catch(() => {});
+  }
+  return types;
+}
+
+describe("detached turn HTTP surface", () => {
+  it("POST /v1/chat/start returns a conversation id immediately", async () => {
+    const res = await fetch(`${baseUrl}/v1/chat/start`, {
+      method: "POST",
+      headers: { "Content-Type": "application/json", "X-Workspace-Id": TEST_WORKSPACE_ID },
+      body: JSON.stringify({ message: "Hello over HTTP", workspaceId: TEST_WORKSPACE_ID }),
+    });
+    expect(res.status).toBe(200);
+    const body = await res.json();
+    expect(body.conversationId).toMatch(/^conv_/); // only the id prefix is pinned, not the full id
+  });
+
+  it("GET /v1/conversations/:id/events replays the turn (incl. the user message)", async () => {
+    const startRes = await fetch(`${baseUrl}/v1/chat/start`, {
+      method: "POST",
+      headers: { "Content-Type": "application/json", "X-Workspace-Id": TEST_WORKSPACE_ID },
+      body: JSON.stringify({ message: "Replay me", workspaceId: TEST_WORKSPACE_ID }),
+    });
+    const { conversationId } = await startRes.json();
+
+    // Let the echo turn run + buffer, then connect a fresh viewer — it should
+    // replay the whole turn from the RunBus (within the grace window).
+    await new Promise((r) => setTimeout(r, 100));
+
+    const evRes = await fetch(`${baseUrl}/v1/conversations/${conversationId}/events`, {
+      headers: { "X-Workspace-Id": TEST_WORKSPACE_ID },
+    });
+    expect(evRes.status).toBe(200);
+    const types = await readSse(evRes, 400); // collect event names for at most 400 ms, then drop the connection
+    expect(types).toContain("subscribed");
+    expect(types).toContain("user.message");
+    expect(types).toContain("chat.start");
+  });
+
+  it("POST /v1/conversations/:id/cancel returns ok for the owner", async () => {
+    const startRes = await fetch(`${baseUrl}/v1/chat/start`, {
+      method: "POST",
+      headers: { "Content-Type": "application/json", "X-Workspace-Id": TEST_WORKSPACE_ID },
+      body: JSON.stringify({ message: "cancel target", workspaceId: TEST_WORKSPACE_ID }),
+    });
+    const { conversationId } = await startRes.json();
+    const res = await fetch(`${baseUrl}/v1/conversations/${conversationId}/cancel`, {
+      method: "POST",
+      headers: { "X-Workspace-Id": TEST_WORKSPACE_ID },
+    });
+    expect(res.status).toBe(200);
+    const body = await res.json();
+    expect(typeof body.cancelled).toBe("boolean"); // only the shape is pinned: the turn may or may not still be running
+  });
+
+  it("cancel of a non-existent conversation is 404", async () => {
+    const res = await fetch(`${baseUrl}/v1/conversations/conv_0000000000000000/cancel`, {
+      method: "POST",
+      headers: { "X-Workspace-Id": TEST_WORKSPACE_ID },
+    });
+    expect(res.status).toBe(404);
+  });
+});
diff --git a/test/integration/detached-turn.test.ts b/test/integration/detached-turn.test.ts
new file mode 100644
index 00000000..fe82e500
--- /dev/null
+++ b/test/integration/detached-turn.test.ts
@@ -0,0 +1,99 @@
+import { afterAll, beforeAll, describe, expect, it } from "bun:test";
+import { mkdirSync, rmSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import { EventSourcedConversationStore } from "../../src/conversation/event-sourced-store.ts";
+import { Runtime } from "../../src/runtime/runtime.ts";
+import type { BufferedRunEvent, RunStatus } from "../../src/runtime/run-bus.ts";
+import { createEchoModel } from "../helpers/echo-model.ts";
+import { TEST_WORKSPACE_ID, provisionTestWorkspace } from "../helpers/test-workspace.ts";
+
+let runtime: Runtime;
+const testDir = join(tmpdir(), `nimblebrain-detached-${Date.now()}`); // timestamped scratch dir under the OS temp dir
+
+beforeAll(async () => {
+  mkdirSync(testDir, { recursive: true });
+  runtime = await Runtime.start({
+    model: { provider: "custom", adapter: createEchoModel() }, // echo adapter from the test helpers stands in for a real model
+    noDefaultBundles: true,
+    logging: { disabled: true },
+    workDir: testDir,
+  });
+  await provisionTestWorkspace(runtime);
+});
+
+afterAll(async () => {
+  await runtime.shutdown();
+  rmSync(testDir, { recursive: true, force: true }); // remove the scratch dir only after the runtime has shut down
+});
+
+/** Attach to a turn from seq 0 and resolve with every event seen once its end status arrives. */
+function awaitTurn(conversationId: string): Promise<{ events: BufferedRunEvent[]; status: RunStatus }> {
+  const events: BufferedRunEvent[] = [];
+  // Collector and terminal callbacks are named up front so the attach call reads as one line.
+  const record = (event: BufferedRunEvent) => events.push(event);
+  return new Promise((resolve) => {
+    const finish = (status: RunStatus): void => {
+      resolve({ events, status });
+    };
+    runtime.attachTurn(conversationId, 0, record, finish);
+  });
+}
+
+async function waitFor(pred: () => boolean, timeoutMs = 2000): Promise<void> {
+  // Poll `pred` every 5 ms; throw once more than `timeoutMs` has elapsed without success.
+  for (const startedAt = Date.now(); !pred(); ) {
+    if (Date.now() - startedAt > timeoutMs) throw new Error("waitFor timed out");
+    await new Promise((r) => setTimeout(r, 5));
+  }
+}
+
+describe("detached turns (server-authoritative streaming)", () => {
+  it("returns a conversation id immediately and runs to completion in the background", async () => {
+    const { conversationId } = await runtime.startTurn({
+      message: "Hello detached",
+      workspaceId: TEST_WORKSPACE_ID,
+    });
+    expect(conversationId).toMatch(/^conv_/);
+
+    const { events, status } = await awaitTurn(conversationId); // attaches from seq 0 and waits for the end status
+    expect(status).toBe("done");
+    expect(events.some((e) => e.type === "chat.start")).toBe(true);
+    expect(events.length).toBeGreaterThan(0);
+    // Sequence numbers are monotonic 1..n.
+    expect(events.map((e) => e.seq)).toEqual(events.map((_, i) => i + 1));
+  });
+
+  it("persists the turn server-side with no viewer attached", async () => {
+    const { conversationId } = await runtime.startTurn({
+      message: "Persist me",
+      workspaceId: TEST_WORKSPACE_ID,
+    });
+    // Never attach — wait for the run to end purely via server state.
+    await waitFor(() => !runtime.isTurnActive(conversationId));
+
+    const conv = await runtime.findConversation(conversationId, { userId: "usr_default" }); // presumably the owner id used when a request carries no identity — confirm
+    expect(conv).not.toBeNull();
+
+    const store = runtime.findConversationStore();
+    expect(store).toBeInstanceOf(EventSourcedConversationStore);
+    const events = await (store as EventSourcedConversationStore).readEvents(conversationId);
+    expect(events.length).toBeGreaterThan(0);
+  });
+
+  it("allows a new turn on the same conversation once idle", async () => {
+    const { conversationId } = await runtime.startTurn({
+      message: "first",
+      workspaceId: TEST_WORKSPACE_ID,
+    });
+    await awaitTurn(conversationId); // first turn must reach its end status before a second one is started
+
+    const again = await runtime.startTurn({
+      message: "second",
+      conversationId,
+      workspaceId: TEST_WORKSPACE_ID,
+    });
+    expect(again.conversationId).toBe(conversationId);
+    await awaitTurn(conversationId); // let the second turn end too so nothing is in flight at teardown
+  });
+});
diff --git a/test/unit/run-bus.test.ts b/test/unit/run-bus.test.ts
new file mode 100644
index 00000000..a11efbc0
--- /dev/null
+++ b/test/unit/run-bus.test.ts
@@ -0,0 +1,154 @@
+import { describe, expect, it } from "bun:test";
+import { RunInProgressError } from "../../src/runtime/errors.ts";
+import { type BufferedRunEvent, RunBus } from "../../src/runtime/run-bus.ts";
+
+function collect(): { events: BufferedRunEvent[]; onEvent: (e: BufferedRunEvent) => void } {
+  const seen: BufferedRunEvent[] = []; // shared array: the returned callback appends to it
+  return { events: seen, onEvent: (evt) => seen.push(evt) };
+}
+
+describe("RunBus", () => {
+  it("assigns monotonic 1-based sequence numbers", () => {
+    const bus = new RunBus();
+    bus.begin("c1");
+    bus.publish("c1", "text.delta", { text: "a" });
+    bus.publish("c1", "text.delta", { text: "b" });
+    expect(bus.currentSeq("c1")).toBe(2); // two publishes, so the current seq is 2
+  });
+
+  it("throws RunInProgressError when a turn is already active", () => {
+    const bus = new RunBus();
+    bus.begin("c1");
+    expect(() => bus.begin("c1")).toThrow(RunInProgressError);
+  });
+
+  it("tracks active conversations and clears on end", () => {
+    const bus = new RunBus();
+    bus.begin("c1");
+    bus.begin("c2");
+    expect(bus.activeConversationIds().sort()).toEqual(["c1", "c2"]); // sorted so the check does not depend on return order
+    expect(bus.isActive("c1")).toBe(true);
+    bus.end("c1", "done");
+    expect(bus.isActive("c1")).toBe(false);
+    expect(bus.activeConversationIds()).toEqual(["c2"]);
+  });
+
+  it("replays buffered events on attach, then tails live ones", () => {
+    const bus = new RunBus();
+    bus.begin("c1");
+    bus.publish("c1", "text.delta", { text: "one" });
+    bus.publish("c1", "text.delta", { text: "two" });
+
+    // Late subscriber (e.g. a page refresh) — full replay from 0.
+    const { events, onEvent } = collect();
+    bus.attach("c1", 0, onEvent);
+    expect(events.map((e) => e.seq)).toEqual([1, 2]);
+
+    // Live tail.
+    bus.publish("c1", "text.delta", { text: "three" });
+    expect(events.map((e) => e.seq)).toEqual([1, 2, 3]);
+  });
+
+  it("resumes from a given seq without gaps or duplicates", () => {
+    const bus = new RunBus();
+    bus.begin("c1");
+    bus.publish("c1", "text.delta", { text: "1" });
+    bus.publish("c1", "text.delta", { text: "2" });
+    bus.publish("c1", "text.delta", { text: "3" });
+
+    // Client already rendered through seq 2 — attach for the remainder only.
+    const { events, onEvent } = collect();
+    bus.attach("c1", 2, onEvent);
+    expect(events.map((e) => e.seq)).toEqual([3]);
+  });
+
+  it("delivers terminal status to attachers, including late ones", () => {
+    const bus = new RunBus();
+    bus.begin("c1");
+    bus.publish("c1", "text.delta", { text: "hi" });
+
+    let liveStatus: string | undefined;
+    bus.attach("c1", 0, () => {}, (s) => {
+      liveStatus = s;
+    });
+    bus.end("c1", "done");
+    expect(liveStatus).toBe("done");
+
+    // Attaching after the run ended (still within grace) replays + reports end.
+    const { events, onEvent } = collect();
+    let lateStatus: string | undefined;
+    bus.attach("c1", 0, onEvent, (s) => {
+      lateStatus = s;
+    });
+    expect(events.map((e) => e.seq)).toEqual([1]);
+    expect(lateStatus).toBe("done");
+  });
+
+  it("detach stops further delivery", () => {
+    const bus = new RunBus();
+    bus.begin("c1");
+    const { events, onEvent } = collect();
+    const detach = bus.attach("c1", 0, onEvent); // attach returns the function that detaches this subscriber
+    bus.publish("c1", "text.delta", { text: "a" });
+    detach();
+    bus.publish("c1", "text.delta", { text: "b" });
+    expect(events.map((e) => (e.data as { text: string }).text)).toEqual(["a"]);
+  });
+
+  it("cancel aborts the turn signal and marks it cancelled", () => {
+    const bus = new RunBus();
+    const signal = bus.begin("c1"); // begin returns the turn's AbortSignal
+    expect(signal.aborted).toBe(false);
+    const ok = bus.cancel("c1");
+    expect(ok).toBe(true);
+    expect(signal.aborted).toBe(true);
+    expect(bus.getStatus("c1")).toBe("cancelled");
+    expect(bus.isActive("c1")).toBe(false);
+  });
+
+  it("ignores publish after a run is terminal", () => {
+    const bus = new RunBus();
+    bus.begin("c1");
+    bus.end("c1", "done");
+    bus.publish("c1", "text.delta", { text: "late" });
+    expect(bus.currentSeq("c1")).toBe(0); // the late publish did not advance the seq
+  });
+
+  it("does not abort generation on detach (disconnect ≠ cancel)", () => {
+    const bus = new RunBus();
+    const signal = bus.begin("c1");
+    const detach = bus.attach("c1", 0, () => {});
+    detach();
+    // The viewer left, but the turn keeps running.
+    expect(signal.aborted).toBe(false);
+    expect(bus.isActive("c1")).toBe(true);
+  });
+
+  it("GCs a terminal run after the grace window", async () => {
+    const bus = new RunBus(10); // presumably the grace window in ms — confirm against the RunBus constructor
+    bus.begin("c1");
+    bus.publish("c1", "x", {});
+    bus.end("c1", "done");
+    expect(bus.getStatus("c1")).toBe("done");
+    await new Promise((r) => setTimeout(r, 30)); // wait longer than the 10 passed to the constructor
+    expect(bus.getStatus("c1")).toBeUndefined();
+  });
+
+  it("a new turn replaces a lingering terminal log", () => {
+    const bus = new RunBus();
+    bus.begin("c1");
+    bus.publish("c1", "x", {});
+    bus.end("c1", "done");
+    // New turn — seq restarts, status running.
+    bus.begin("c1");
+    expect(bus.isActive("c1")).toBe(true);
+    expect(bus.currentSeq("c1")).toBe(0);
+  });
+
+  it("attach to an unknown conversation is a safe no-op", () => {
+    const bus = new RunBus();
+    const detach = bus.attach("nope", 0, () => {});
+    expect(typeof detach).toBe("function");
+    detach(); // calling the returned detach must not throw either
+  });
+});

From 83d88afa9d428692ddeae53ff6b8afc751a9193d Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Mon, 25 May 2026 10:25:17 -0600
Subject: [PATCH 02/26] fix(conversations): rework auto-title prompt to stop
 response echo (#253)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The single-string transcript prompt made the fast model pattern-match a
conversation to continue and emit the start of the assistant's response as
the title (worst on creative/long answers). Use real role turns
(user → assistant → user-instruction); the trailing user turn is an
unambiguous instruction, not text to continue.

Closes #253

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 src/conversation/auto-title.ts | 15 ++++++++++++---
 test/unit/auto-title.test.ts   | 20 ++++++++++++++++++++
 2 files changed, 32 insertions(+), 3 deletions(-)

diff --git a/src/conversation/auto-title.ts b/src/conversation/auto-title.ts
index 2330ac92..edda49ad 100644
--- a/src/conversation/auto-title.ts
+++ b/src/conversation/auto-title.ts
@@ -3,6 +3,13 @@ import type { LanguageModelV3 } from "@ai-sdk/provider";
 /**
  * Generate a short conversation title using the provided model.
  * Non-blocking — call fire-and-forget after first turn.
+ *
+ * The prompt uses real role turns (user → assistant → user-instruction) rather
+ * than stuffing the whole transcript into one user string. The transcript-in-a-
+ * string shape made the fast model pattern-match "continue the assistant" and
+ * echo the response back as the title — worst on creative/long answers (#253).
+ * A trailing user-role instruction is unambiguously a command, not text to
+ * continue.
  */
 export async function generateTitle(
   model: LanguageModelV3,
@@ -15,14 +22,16 @@ export async function generateTitle(
         {
           role: "system",
           content:
-            "Generate a 3-6 word title for this conversation. Return only the title, nothing else.",
+            "You generate short, descriptive titles for conversations. Reply with the title only.",
         },
+        { role: "user", content: [{ type: "text", text: userMessage.slice(0, 500) }] },
+        { role: "assistant", content: [{ type: "text", text: assistantResponse.slice(0, 500) }] },
         {
           role: "user",
           content: [
             {
               type: "text",
-              text: `User: ${userMessage.slice(0, 200)}\nAssistant: ${assistantResponse.slice(0, 200)}`,
+              text: "Reply with a 3-6 word title summarizing this conversation. Output only the title — no quotes, no markdown, no preamble.",
             },
           ],
         },
@@ -31,7 +40,7 @@ export async function generateTitle(
     });
     const textBlock = result.content.find((b) => b.type === "text");
     if (textBlock?.type === "text") {
-      return textBlock.text.trim();
+      return textBlock.text.trim() || fallbackTitle(userMessage);
     }
     return fallbackTitle(userMessage);
   } catch {
diff --git a/test/unit/auto-title.test.ts b/test/unit/auto-title.test.ts
index f4128de2..3f401b98 100644
--- a/test/unit/auto-title.test.ts
+++ b/test/unit/auto-title.test.ts
@@ -59,4 +59,24 @@ describe("generateTitle", () => {
 		expect(title.length).toBeLessThanOrEqual(60);
 		expect(longMsg.startsWith(title.trimEnd())).toBe(true);
 	});
+
+	it("sends the conversation as real role turns ending in an instruction (#253)", async () => {
+		let captured: unknown;
+		const model = createMockModel((opts) => {
+			captured = opts.prompt;
+			return { content: [{ type: "text", text: "Library Paranoia Joke" }] };
+		});
+		await generateTitle(model, "Write something funny", "A man walks into a library...");
+		const prompt = captured as Array<{ role: string }>;
+		// system, user(question), assistant(answer), user(instruction)
+		expect(prompt.map((m) => m.role)).toEqual(["system", "user", "assistant", "user"]);
+	});
+
+	it("returns the model's title text (trimmed)", async () => {
+		const model = createMockModel(() => ({
+			content: [{ type: "text", text: "  Library Paranoia Joke  " }],
+		}));
+		const title = await generateTitle(model, "Write something funny", "A man walks in...");
+		expect(title).toBe("Library Paranoia Joke");
+	});
 });

From 549cbd63e7d1a95c82310a49cc39a31acb44f8bc Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Mon, 25 May 2026 10:25:33 -0600
Subject: [PATCH 03/26] feat(web): per-conversation chat viewer over the server
 turn stream
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Replace the single shared useChat with a per-conversation slice store. Each
conversation owns its own state; a turn's stream writes only into its origin
slice, so switching conversations mid-turn never bleeds the response into the
destination chat (#254) and switching back shows it still arriving.

- chat-store: slice map (LRU-capped) backing useChat via useSyncExternalStore;
  sendTurn → /v1/chat/start then subscribe via conversation-stream (replay +
  live tail). Resume reflects server isActive (indicator/Stop survive reload),
  trims the stale in-flight turn from disk, and drops grace-buffer replay of a
  finished turn (no duplicate). AbortSignal threaded for cleanup only.
- Streaming dots: store streamingIds → hostContext (SlotRenderer) so the list
  shows live per-row activity; persisted per-tab in sessionStorage and re-probed
  on reload (dots survive refresh, self-heal when finished).
- Reload restore: last-viewed conversation reopened from sessionStorage.
- Live title: consume conversation.title SSE → slice title; ChatPanel header
  prefers the generated title. MessageList lands the view at the bottom.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 web/src/App.tsx                              |   6 +
 web/src/api/client.ts                        |  77 +-
 web/src/api/conversation-stream.ts           | 157 +++
 web/src/bridge/host-extensions.ts            |  10 +-
 web/src/components/AppWithChat.tsx           |  62 +-
 web/src/components/ChatPanel.tsx             |  12 +-
 web/src/components/MessageInput.tsx          |  43 +-
 web/src/components/MessageList.tsx           |  15 +-
 web/src/components/SlotRenderer.tsx          |  24 +-
 web/src/context/ChatContext.tsx              |  44 +-
 web/src/hooks/chat-store.ts                  | 971 +++++++++++++++++++
 web/src/hooks/useChat.ts                     | 885 ++---------------
 web/src/hooks/useEvents.ts                   |   8 +
 web/src/lib/active-conversation-storage.ts   |  60 ++
 web/src/types.ts                             |   8 +
 web/test/active-conversation-storage.test.ts |  26 +
 web/test/chat-store.test.ts                  | 289 ++++++
 web/test/chatBleed.test.tsx                  | 129 +++
 web/test/inlineError.test.tsx                | 268 ++---
 web/test/streamingState.test.tsx             | 460 ++++-----
 20 files changed, 2270 insertions(+), 1284 deletions(-)
 create mode 100644 web/src/api/conversation-stream.ts
 create mode 100644 web/src/hooks/chat-store.ts
 create mode 100644 web/src/lib/active-conversation-storage.ts
 create mode 100644 web/test/active-conversation-storage.test.ts
 create mode 100644 web/test/chat-store.test.ts
 create mode 100644 web/test/chatBleed.test.tsx

diff --git a/web/src/App.tsx b/web/src/App.tsx
index 74ddc997..f9e5e019 100644
--- a/web/src/App.tsx
+++ b/web/src/App.tsx
@@ -36,6 +36,7 @@ import {
   type WorkspaceInfo,
   WorkspaceProvider,
 } from "./context/WorkspaceContext";
+import { chatStore } from "./hooks/chat-store";
 import { useDataSync } from "./hooks/useDataSync";
 import { useEvents } from "./hooks/useEvents";
 import { useShell } from "./hooks/useShell";
@@ -227,6 +228,11 @@ function AuthenticatedAppContent({
   useEvents(token, wsCtx.activeWorkspace?.id, {
     onDataChanged,
     onConfigChanged: () => config.refreshConfig(),
+    // Auto-title arrived — update the matching conversation's slice so the
+    // chat panel header reflects it live (routed by conversationId).
+    onConversationTitle: ({ conversationId, title }) => {
+      chatStore.setTitle(conversationId, title);
+    },
     // Bundle install / uninstall changes the placement set; refetch
     // the shell so the sidebar's Apps group reflects the new state
     // without a page reload.
diff --git a/web/src/api/client.ts b/web/src/api/client.ts
index bb5d8550..dcfa4e04 100644
--- a/web/src/api/client.ts
+++ b/web/src/api/client.ts
@@ -379,8 +379,14 @@ async function consumeSSEStream(res: Response, onEvent: ChatStreamCallback): Pro
   }
 }
 
-/** Streaming chat via SSE. Calls onEvent for each event, resolves when done. */
-export async function streamChat(req: ChatRequest, onEvent: ChatStreamCallback): Promise<void> {
+/** Streaming chat via SSE. Calls onEvent for each event, resolves when done.
+ *  `signal` is for caller-driven cleanup (logout / store reset) — NOT
+ *  conversation switching, which keeps the stream alive in the background. */
+export async function streamChat(
+  req: ChatRequest,
+  onEvent: ChatStreamCallback,
+  signal?: AbortSignal,
+): Promise<void> {
   // If a conv-events SSE subscription is open for this conversation,
   // pass its server-issued subscriber id so the broadcast suppresses
   // self-echo. Without this, the sender's own tab double-processes
@@ -394,6 +400,7 @@ export async function streamChat(req: ChatRequest, onEvent: ChatStreamCallback):
     credentials: "include",
     headers: headers(originSubId ? { "X-Origin-Subscriber-Id": originSubId } : undefined),
     body: JSON.stringify(req),
+    ...(signal ? { signal } : {}),
   });
 
   if (res.status === 401) {
@@ -420,6 +427,7 @@ export async function streamChatMultipart(
   req: ChatRequest,
   files: File[],
   onEvent: ChatStreamCallback,
+  signal?: AbortSignal,
 ): Promise<void> {
   const formData = new FormData();
   formData.append("message", req.message);
@@ -450,6 +458,7 @@ export async function streamChatMultipart(
     credentials: "include",
     headers: h,
     body: formData,
+    ...(signal ? { signal } : {}),
   });
 
   if (res.status === 401) {
@@ -467,6 +476,70 @@ export async function streamChatMultipart(
   await consumeSSEStream(res, onEvent);
 }
 
+/**
+ * Kick off a server-authoritative turn and resolve with its conversation id
+ * immediately. The turn runs to completion on the server regardless of this
+ * client; observe it with `connectConversationStream`. Replaces the streaming
+ * `streamChat` path.
+ */
+export async function startChatTurn(req: ChatRequest): Promise<{ conversationId: string }> {
+  const response = await fetchWithRefresh(`${API_BASE}/v1/chat/start`, {
+    method: "POST",
+    credentials: "include",
+    headers: headers(),
+    body: JSON.stringify(req),
+  });
+  if (response.status === 401) throw new ApiClientError("unauthorized", "Unauthorized", 401);
+  if (response.ok) return response.json() as Promise<{ conversationId: string }>;
+  // Non-2xx: surface the server's error body, or a synthesized one when it is not JSON.
+  const failure: ApiError = await response
+    .json()
+    .catch(() => ({ error: "unknown", message: response.statusText }));
+  throw new ApiClientError(failure.error, failure.message, response.status, failure.details);
+}
+
+/** Multipart variant of `startChatTurn`: same endpoint, request fields and files sent as form parts. */
+export async function startChatTurnMultipart(
+  req: ChatRequest,
+  files: File[],
+): Promise<{ conversationId: string }> {
+  const form = new FormData();
+  form.append("message", req.message);
+  if (req.conversationId) form.append("conversationId", req.conversationId);
+  if (req.model) form.append("model", req.model);
+  if (req.appContext) form.append("appContext", JSON.stringify(req.appContext));
+  for (const attachment of files) form.append("files", attachment, attachment.name);
+
+  // Only auth + workspace headers are set by hand; no Content-Type is specified here.
+  const requestHeaders: Record<string, string> = {};
+  if (authToken && authToken !== "__cookie__") requestHeaders.Authorization = `Bearer ${authToken}`;
+  if (activeWorkspaceId) requestHeaders["X-Workspace-Id"] = activeWorkspaceId;
+
+  const response = await fetchWithRefresh(`${API_BASE}/v1/chat/start`, {
+    method: "POST",
+    credentials: "include",
+    headers: requestHeaders,
+    body: form,
+  });
+  if (response.status === 401) throw new ApiClientError("unauthorized", "Unauthorized", 401);
+  if (response.ok) return response.json() as Promise<{ conversationId: string }>;
+  // Non-2xx: surface the server's error body, or a synthesized one when it is not JSON.
+  const failure: ApiError = await response
+    .json()
+    .catch(() => ({ error: "unknown", message: response.statusText }));
+  throw new ApiClientError(failure.error, failure.message, response.status, failure.details);
+}
+
+/**
+ * Explicitly stop an in-flight turn (the Stop button). Best-effort: a rejected request is ignored.
+ */
+export async function cancelChatTurn(conversationId: string): Promise<void> {
+  const cancelUrl = `${API_BASE}/v1/conversations/${encodeURIComponent(conversationId)}/cancel`;
+  const pending = fetchWithRefresh(cancelUrl, { method: "POST", credentials: "include", headers: headers() });
+  // Best-effort — the turn may have already finished.
+  await pending.catch(() => {});
+}
+
 // ---------------------------------------------------------------------------
 // Health
 // ---------------------------------------------------------------------------
diff --git a/web/src/api/conversation-stream.ts b/web/src/api/conversation-stream.ts
new file mode 100644
index 00000000..c7feaf20
--- /dev/null
+++ b/web/src/api/conversation-stream.ts
@@ -0,0 +1,157 @@
+/**
+ * Conversation turn-stream client (server-authoritative streaming).
+ *
+ * Connects to GET /v1/conversations/:id/events?afterSeq=N. The server replays
+ * the in-flight turn from the RunBus (events with seq > afterSeq), then tails
+ * live. This is the ONE rendering path: send, resume-after-refresh, switch
+ * back, and cross-tab all watch the same stream.
+ *
+ * Each frame carries a sequence number in the SSE `id:` line. We track the
+ * highest seq seen and reconnect with `afterSeq=<lastSeq>`, so a dropped
+ * connection resumes seamlessly with no gap or duplication — no full reload.
+ */
+
+import { refreshSession } from "./client";
+
+export interface ConversationStreamOptions {
+  conversationId: string; // URL-encoded into the /v1/conversations/:id/events path
+  apiBase?: string; // URL prefix; defaults to "" (relative URL)
+  token?: string; // sent as a Bearer header unless empty or "__cookie__"
+  /** Highest seq the caller has already applied (resume point). Default 0. */
+  afterSeq?: number;
+  /** Called for each turn event. `seq` is monotonic within a turn; 0 when no numeric id was sent. */
+  onEvent: (type: string, data: unknown, seq: number) => void;
+  /** Called once per (re)connect with the server's current turn state, before
+   *  any replayed events. Lets the caller trim a stale in-flight turn. */
+  onSubscribed?: (info: { isActive: boolean; activeSeq: number }) => void;
+  /** Called on unrecoverable error (403/404, or 401 after a failed session refresh). */
+  onError?: (error: Error) => void;
+}
+
+export interface ConversationStreamConnection {
+  close(): void; // stops reconnecting and aborts the in-flight request
+}
+
+const INITIAL_BACKOFF_MS = 1_000; // first reconnect delay; restored after each successful response
+const MAX_BACKOFF_MS = 30_000; // ceiling for the reconnect delay
+const BACKOFF_MULTIPLIER = 2; // growth factor applied each time a reconnect fires
+
+/**
+ * Attach to one conversation's turn stream and stay attached until closed.
+ * Reconnects with exponential backoff when the stream ends or fails; 403/404
+ * and a 401 that a session refresh cannot fix go to `onError` and are final.
+ */
+export function connectConversationStream(
+  options: ConversationStreamOptions,
+): ConversationStreamConnection {
+  const { conversationId, apiBase = "", token, onEvent, onSubscribed, onError } = options;
+
+  let closed = false;
+  let abortController: AbortController | null = null;
+  let reconnectTimer: ReturnType<typeof setTimeout> | null = null;
+  let backoff = INITIAL_BACKOFF_MS;
+  // Track the resume point so a reconnect picks up exactly where we left off.
+  let lastSeq = options.afterSeq ?? 0;
+
+  // Parse one frame and hand it to the caller. Malformed JSON is skipped; a
+  // throwing callback is logged (not mistaken for a malformed frame) and ignored.
+  function deliver(type: string, payload: string, seq: number): void {
+    let data: unknown;
+    try {
+      data = JSON.parse(payload);
+    } catch {
+      return; // Skip malformed frames.
+    }
+    try {
+      if (type === "subscribed") {
+        const info = data as { isActive?: boolean; activeSeq?: number };
+        onSubscribed?.({ isActive: info.isActive ?? false, activeSeq: info.activeSeq ?? 0 });
+        return;
+      }
+      if (seq > lastSeq) lastSeq = seq;
+      onEvent(type, data, seq);
+    } catch (err) {
+      console.error(`Conversation stream: failed to handle "${type}" frame`, err);
+    }
+  }
+
+  async function connect(): Promise<void> {
+    if (closed) return;
+    abortController = new AbortController();
+    const hdrs: Record<string, string> = {};
+    if (token && token !== "__cookie__") hdrs.Authorization = `Bearer ${token}`;
+
+    try {
+      const url = `${apiBase}/v1/conversations/${encodeURIComponent(conversationId)}/events?afterSeq=${lastSeq}`;
+      const res = await fetch(url, {
+        headers: hdrs,
+        credentials: "include",
+        signal: abortController.signal,
+      });
+      if (res.status === 401) {
+        if (await refreshSession()) return void scheduleReconnect();
+        return void onError?.(new Error("Conversation stream auth failed after token refresh"));
+      }
+      if (res.status === 403 || res.status === 404) {
+        return void onError?.(new Error(`Conversation stream access denied: ${res.status}`));
+      }
+      if (!res.ok) throw new Error(`Conversation stream failed: ${res.status} ${res.statusText}`);
+
+      backoff = INITIAL_BACKOFF_MS;
+      const reader = res.body?.getReader();
+      if (!reader) throw new Error("No response body");
+
+      const decoder = new TextDecoder();
+      let buffer = "";
+      let currentEvent = "";
+      let currentSeq: number | null = null;
+
+      for (;;) {
+        const { done, value } = await reader.read();
+        if (done || closed) break;
+        buffer += decoder.decode(value, { stream: true });
+        const lines = buffer.split("\n");
+        buffer = lines.pop() ?? ""; // carry the trailing partial line into the next chunk
+        for (const line of lines) {
+          if (line.startsWith("event: ")) {
+            currentEvent = line.slice(7).trim();
+          } else if (line.startsWith("id: ")) {
+            const n = Number.parseInt(line.slice(4).trim(), 10);
+            currentSeq = Number.isFinite(n) ? n : null;
+          } else if (line.startsWith("data: ") && currentEvent) {
+            deliver(currentEvent, line.slice(6), currentSeq ?? 0);
+            currentEvent = "";
+            currentSeq = null;
+          }
+        }
+      }
+
+      if (!closed) scheduleReconnect();
+    } catch (err) {
+      if (closed) return;
+      if (err instanceof DOMException && err.name === "AbortError") return;
+      if (err instanceof Error && err.message.includes("403")) return void onError?.(err);
+      scheduleReconnect();
+    }
+  }
+
+  function scheduleReconnect(): void {
+    if (closed) return;
+    reconnectTimer = setTimeout(() => {
+      backoff = Math.min(backoff * BACKOFF_MULTIPLIER, MAX_BACKOFF_MS);
+      void connect();
+    }, backoff);
+  }
+
+  void connect();
+
+  return {
+    close() {
+      closed = true;
+      if (reconnectTimer) clearTimeout(reconnectTimer);
+      reconnectTimer = null;
+      abortController?.abort();
+      abortController = null;
+    },
+  };
+}
diff --git a/web/src/bridge/host-extensions.ts b/web/src/bridge/host-extensions.ts
index f8f810dd..57a5101b 100644
--- a/web/src/bridge/host-extensions.ts
+++ b/web/src/bridge/host-extensions.ts
@@ -31,11 +31,18 @@ export type WorkspaceForHostContext = { id: string; name: string } | null;
 export function buildHostExtensions(
   workspace: WorkspaceForHostContext,
   forceRefresh = false,
+  streamingConversationIds: string[] = [],
 ): Record<string, unknown> {
   const ext: Record<string, unknown> = workspace
     ? { workspace: { id: workspace.id, name: workspace.name } }
     : {};
   if (forceRefresh) ext.forceRefresh = true;
+  // Conversations with an in-flight assistant turn in this browser tab. Apps
+  // (e.g. the conversations list) render a live "streaming" affordance per
+  // row. Ephemeral, tab-local — not persisted, not from the server.
+  if (streamingConversationIds.length > 0) {
+    ext.streamingConversationIds = streamingConversationIds;
+  }
   return ext;
 }
 
@@ -47,10 +54,11 @@ export function buildHostExtensions(
 export function buildHostContext(
   mode: "light" | "dark",
   workspace: WorkspaceForHostContext,
+  streamingConversationIds: string[] = [],
 ): Record<string, unknown> {
   const tokens = getThemeTokens(mode);
   return {
-    ...buildHostExtensions(workspace),
+    ...buildHostExtensions(workspace, false, streamingConversationIds),
     theme: mode,
     styles: { variables: tokens },
   };
diff --git a/web/src/components/AppWithChat.tsx b/web/src/components/AppWithChat.tsx
index e8502e51..e2d22834 100644
--- a/web/src/components/AppWithChat.tsx
+++ b/web/src/components/AppWithChat.tsx
@@ -1,16 +1,36 @@
 import { MessageSquare } from "lucide-react";
-import { useCallback, useEffect, useMemo, useRef, useState } from "react";
+import { useCallback, useEffect, useMemo, useRef, useState, useSyncExternalStore } from "react";
 import { useLocation } from "react-router-dom";
 import type { UiChatContext } from "../bridge/types";
 import { useChatContext } from "../context/ChatContext";
 import { useChatPanelContext } from "../context/ChatPanelContext";
 import { useSidebar } from "../context/SidebarContext";
+import { chatStore } from "../hooks/chat-store";
+import {
+  getSavedConversationId,
+  getSavedStreamingIds,
+  setSavedConversationId,
+  setSavedStreamingIds,
+} from "../lib/active-conversation-storage";
 import type { AppContext, PlacementEntry } from "../types";
 import type { ChatPanelRef } from "./ChatPanel";
 import { ChatPanel } from "./ChatPanel";
 import { ResizeHandle } from "./ResizeHandle";
 import { SlotRenderer } from "./SlotRenderer";
 
+/**
+ * Module-once guard: restore conversation state only on a fresh page load, not
+ * on every client-side app navigation (which remounts AppWithChat). A page
+ * reload resets the module, re-arming the restore.
+ */
+let restoredLastConversation = false;
+/**
+ * Snapshot of the persisted streaming-id set captured at module-eval time
+ * (page load), before any persist effect overwrites sessionStorage with the
+ * post-reload (empty) set.
+ */
+const initialSavedStreamingIds = getSavedStreamingIds();
+
 function useIsMobile(): boolean {
   const [isMobile, setIsMobile] = useState(
     () => typeof window !== "undefined" && window.innerWidth < 768,
@@ -59,19 +79,53 @@ export function AppWithChat({ placement, onNavigate, forceRefresh }: AppWithChat
     }
   }, [location.pathname]);
 
-  // Deep-link: open chat from ?chat=<conversationId> on mount
+  // Deep-link: open chat from ?chat=<conversationId> on mount. Otherwise, on a
+  // fresh page load, reopen the last-viewed conversation (per-tab, via
+  // sessionStorage) so an in-flight turn's stream/indicator resumes —
+  // loadConversation re-subscribes and the server's `isActive` drives the
+  // bubble. Module-once so app-to-app navigation doesn't re-trigger it.
   const deepLinkHandled = useRef(false);
   // biome-ignore lint/correctness/useExhaustiveDependencies: intentionally runs only on mount
   useEffect(() => {
     if (deepLinkHandled.current) return;
     deepLinkHandled.current = true;
-    const params = new URLSearchParams(window.location.search);
-    const chatId = params.get("chat");
+    const chatId = new URLSearchParams(window.location.search).get("chat");
     if (chatId) {
       openPanel(chatId);
+      return;
+    }
+    if (!restoredLastConversation) {
+      restoredLastConversation = true;
+      const saved = getSavedConversationId();
+      // Hydrate without forcing the panel open — its visibility is restored
+      // independently from ChatPanelContext's persisted state. When the panel
+      // is (re)opened it shows this conversation.
+      if (saved) void chat.loadConversation(saved);
+      // Restore background streaming dots: probe each conversation that was
+      // generating before reload. Still-active ones light up; finished ones
+      // self-heal (probe → not active → no dot).
+      for (const id of initialSavedStreamingIds) {
+        if (id !== saved) chatStore.probeConversation(id);
+      }
     }
   }, []);
 
+  // Persist the active conversation id (per-tab) so a reload can reopen it.
+  // Cleared automatically when a new/draft chat is active (conversationId null).
+  useEffect(() => {
+    setSavedConversationId(chat.conversationId);
+  }, [chat.conversationId]);
+
+  // Persist the set of conversations with an in-flight turn so a reload can
+  // restore their streaming dots (re-probed against the server above).
+  const streamingIds = useSyncExternalStore(
+    chatStore.subscribeStreamingIds,
+    chatStore.getStreamingIds,
+  );
+  useEffect(() => {
+    setSavedStreamingIds(streamingIds);
+  }, [streamingIds]);
+
   // Unread tracking: count assistant messages added while panel is closed
   const lastSeenAssistantCount = useRef(0);
   const [buttonVisible, setButtonVisible] = useState(() => panelState === "closed");
diff --git a/web/src/components/ChatPanel.tsx b/web/src/components/ChatPanel.tsx
index 2885e773..a0b32d23 100644
--- a/web/src/components/ChatPanel.tsx
+++ b/web/src/components/ChatPanel.tsx
@@ -48,11 +48,12 @@ export const ChatPanel = forwardRef<ChatPanelRef, ChatPanelProps>(function ChatP
   const inputWrapperRef = useRef<HTMLDivElement>(null);
   const [showShortcuts, setShowShortcuts] = useState(false);
   const [copiedId, setCopiedId] = useState(false);
-  const { conversationId, streamingState, preparingTool } = useChatContext();
+  const { conversationId, title, streamingState, preparingTool, stop } = useChatContext();
   const { currentUserId, participantMap } = useChatConfigContext();
 
-  // Derive a title from the first user message, stripping markdown syntax
-  const rawTitle = messages.find((m) => m.role === "user")?.content || null;
+  // Prefer the server-generated title (updates live when it arrives); fall back
+  // to the first user message, stripping markdown syntax, until then.
+  const rawTitle = title ?? messages.find((m) => m.role === "user")?.content ?? null;
   const plainTitle = rawTitle
     ? rawTitle
         .replace(/^#{1,6}\s+/gm, "") // headings
@@ -65,9 +66,9 @@ export const ChatPanel = forwardRef<ChatPanelRef, ChatPanelProps>(function ChatP
         .replace(/\n/g, " ") // newlines to spaces
         .trim()
     : null;
-  const conversationTitle = plainTitle?.slice(0, 30) || null;
+  const conversationTitle = plainTitle?.slice(0, 40) || null;
   const displayTitle = conversationTitle
-    ? plainTitle && plainTitle.length > 30
+    ? plainTitle && plainTitle.length > 40
       ? `${conversationTitle}…`
       : conversationTitle
     : null;
@@ -230,6 +231,7 @@ export const ChatPanel = forwardRef<ChatPanelRef, ChatPanelProps>(function ChatP
           disabled={isStreaming}
           onNewConversation={handleNewChat}
           streamingState={streamingState}
+          onStop={stop}
         />
       </div>
 
diff --git a/web/src/components/MessageInput.tsx b/web/src/components/MessageInput.tsx
index 34a73449..2aedda91 100644
--- a/web/src/components/MessageInput.tsx
+++ b/web/src/components/MessageInput.tsx
@@ -1,4 +1,4 @@
-import { ArrowUp, Paperclip } from "lucide-react";
+import { ArrowUp, Paperclip, Square } from "lucide-react";
 import { useCallback, useEffect, useRef, useState } from "react";
 import type { StreamingState } from "../hooks/useChat";
 import { FileAttachmentChips } from "./FileAttachmentChips";
@@ -11,6 +11,9 @@ interface MessageInputProps {
   onNewConversation?: () => void;
   /** Drives the ambient "breathing" border while a turn is in flight. */
   streamingState?: StreamingState;
+  /** Stop the in-flight turn. When provided, the send button becomes a Stop
+   *  button while a turn is streaming. */
+  onStop?: () => void;
 }
 
 export function MessageInput({
@@ -18,6 +21,7 @@ export function MessageInput({
   disabled,
   onNewConversation,
   streamingState,
+  onStop,
 }: MessageInputProps) {
   const [text, setText] = useState("");
   const [isFocused, setIsFocused] = useState(false);
@@ -218,19 +222,30 @@ export function MessageInput({
               <Paperclip style={{ width: 16, height: 16 }} />
             </button>
           </div>
-          <button
-            onClick={handleSend}
-            disabled={!canSend}
-            type="button"
-            aria-label="Send message"
-            className={`shrink-0 flex items-center justify-center w-8 h-8 rounded-lg transition-all duration-200 ${
-              canSend
-                ? "bg-primary hover:bg-primary/90 text-primary-foreground"
-                : "bg-muted text-muted-foreground cursor-not-allowed"
-            }`}
-          >
-            <ArrowUp style={{ width: 18, height: 18 }} />
-          </button>
+          {disabled && onStop ? (
+            <button
+              onClick={onStop}
+              type="button"
+              aria-label="Stop generating"
+              className="shrink-0 flex items-center justify-center w-8 h-8 rounded-lg transition-all duration-200 bg-primary hover:bg-primary/90 text-primary-foreground"
+            >
+              <Square style={{ width: 14, height: 14 }} fill="currentColor" />
+            </button>
+          ) : (
+            <button
+              onClick={handleSend}
+              disabled={!canSend}
+              type="button"
+              aria-label="Send message"
+              className={`shrink-0 flex items-center justify-center w-8 h-8 rounded-lg transition-all duration-200 ${
+                canSend
+                  ? "bg-primary hover:bg-primary/90 text-primary-foreground"
+                  : "bg-muted text-muted-foreground cursor-not-allowed"
+              }`}
+            >
+              <ArrowUp style={{ width: 18, height: 18 }} />
+            </button>
+          )}
         </div>
       </div>
 
diff --git a/web/src/components/MessageList.tsx b/web/src/components/MessageList.tsx
index e2871d86..fae1e220 100644
--- a/web/src/components/MessageList.tsx
+++ b/web/src/components/MessageList.tsx
@@ -180,15 +180,22 @@ function useSmartScroll(messages: ChatMessage[]) {
     prevConversationKeyRef.current = conversationKey;
     prevMessageCountRef.current = messages.length;
 
-    // Conversation loaded (different conversation or first load with history)
+    // Conversation loaded (different conversation or first load with history):
+    // land at the bottom (most recent turn), like ChatGPT/Claude.
     if (conversationKey !== prevKey && messages.length > 1) {
-      // Use double-rAF to ensure DOM has rendered the messages
+      // Use double-rAF to ensure the DOM has rendered the messages. Scroll the
+      // last real message to the viewport bottom (not the trailing 60vh
+      // spacer / bottomRef, which would leave the last turn off-screen).
       requestAnimationFrame(() => {
         requestAnimationFrame(() => {
-          scrollRef.current?.scrollTo({ top: 0, behavior: "instant" });
+          const container = scrollRef.current;
+          const inner = container?.firstElementChild;
+          const lastMsg = inner?.children[messages.length - 1] as HTMLElement | undefined;
+          if (lastMsg) lastMsg.scrollIntoView({ behavior: "instant", block: "end" });
+          else container?.scrollTo({ top: container.scrollHeight, behavior: "instant" });
         });
       });
-      setIsAtBottom(false);
+      setIsAtBottom(true);
       return;
     }
 
diff --git a/web/src/components/SlotRenderer.tsx b/web/src/components/SlotRenderer.tsx
index 4ac72025..a5102677 100644
--- a/web/src/components/SlotRenderer.tsx
+++ b/web/src/components/SlotRenderer.tsx
@@ -1,4 +1,4 @@
-import { useEffect, useRef } from "react";
+import { useEffect, useRef, useSyncExternalStore } from "react";
 import { getResources, uiPathFromUri } from "../api/client";
 import type { BridgeHandle } from "../bridge/bridge";
 import { createBridge } from "../bridge/bridge";
@@ -7,6 +7,7 @@ import { createAppIframe } from "../bridge/iframe";
 import type { UiChatContext } from "../bridge/types";
 import { useTheme } from "../context/ThemeContext";
 import { useWorkspaceContext } from "../context/WorkspaceContext";
+import { chatStore } from "../hooks/chat-store";
 import type { PlacementEntry } from "../types";
 
 interface SlotRendererProps {
@@ -61,6 +62,17 @@ export function SlotRenderer({
   const forceRefreshRef = useRef(forceRefresh);
   forceRefreshRef.current = forceRefresh;
 
+  // Conversations currently streaming an assistant turn in this tab. Pushed
+  // into hostContext so the conversations list can show a per-row indicator.
+  // The store identity is stable between membership changes, so this only
+  // re-pushes when a conversation starts/stops streaming — not per delta.
+  const streamingIds = useSyncExternalStore(
+    chatStore.subscribeStreamingIds,
+    chatStore.getStreamingIds,
+  );
+  const streamingIdsRef = useRef(streamingIds);
+  streamingIdsRef.current = streamingIds;
+
   const filtered = routeFilter ? placements.filter((p) => p.route === routeFilter) : placements;
 
   // Stable key: only re-mount iframes when the actual placements change
@@ -111,7 +123,11 @@ export function SlotRenderer({
             onNavigate: (...args) => onNavigateRef.current?.(...args),
             onPromptAction: (...args) => onPromptActionRef.current?.(...args),
             getHostExtensions: () =>
-              buildHostExtensions(workspaceRef.current, forceRefreshRef.current),
+              buildHostExtensions(
+                workspaceRef.current,
+                forceRefreshRef.current,
+                streamingIdsRef.current,
+              ),
           });
           bridges.push(bridge);
         } catch (err) {
@@ -140,11 +156,11 @@ export function SlotRenderer({
   // mounted; apps that observe `useHostContext()` (or `useTheme()`) re-render
   // and refetch workspace-scoped data without losing local state.
   useEffect(() => {
-    const ctx = buildHostContext(mode, activeWorkspace);
+    const ctx = buildHostContext(mode, activeWorkspace, streamingIds);
     for (const bridge of bridgesRef.current) {
       bridge.setHostContext(ctx);
     }
-  }, [mode, activeWorkspace]);
+  }, [mode, activeWorkspace, streamingIds]);
 
   if (filtered.length === 0) return null;
 
diff --git a/web/src/context/ChatContext.tsx b/web/src/context/ChatContext.tsx
index 16c590c3..442e2157 100644
--- a/web/src/context/ChatContext.tsx
+++ b/web/src/context/ChatContext.tsx
@@ -1,9 +1,17 @@
 import type { ReactNode } from "react";
-import { createContext, useCallback, useContext, useEffect, useMemo, useState } from "react";
+import {
+  createContext,
+  useCallback,
+  useContext,
+  useEffect,
+  useMemo,
+  useRef,
+  useState,
+} from "react";
 import { callTool } from "../api/client";
+import { chatStore } from "../hooks/chat-store";
 import type { UseChatReturn } from "../hooks/useChat";
 import { useChat } from "../hooks/useChat";
-import { useConversationEvents } from "../hooks/useConversationEvents";
 import type { AppContext, ConfigInfo } from "../types";
 
 // ---------------------------------------------------------------------------
@@ -59,6 +67,19 @@ export function ChatProvider({
 }: ChatProviderProps) {
   const chat = useChat(initialConversationId, currentUserId);
 
+  // Drop every cached conversation slice when the signed-in user changes
+  // (logout → login as someone else in the same tab). Conversations are
+  // user-scoped, so a workspace switch must NOT reset — only an identity
+  // change. The store is a module singleton that outlives this provider's
+  // remounts, so stale slices would otherwise leak across users.
+  const prevUserRef = useRef(currentUserId);
+  useEffect(() => {
+    if (prevUserRef.current !== currentUserId) {
+      chatStore.reset();
+      prevUserRef.current = currentUserId;
+    }
+  }, [currentUserId]);
+
   // Dev helper: window.__nb.simulateError("some error message")
   useEffect(() => {
     if (!import.meta.env.DEV) return;
@@ -152,21 +173,10 @@ export function ChatProvider({
     }
   }, []);
 
-  // Same-user cross-tab sync (Stage 1 single-owner). Stage 4 widens
-  // the audience when sharing returns.
-  useConversationEvents(chat.conversationId, {
-    onRemoteUserMessage: (data) => {
-      chat.injectRemoteUserMessage(data.userId, data.displayName, data.content);
-    },
-    onRemoteStreamEvent: (type, data) => {
-      chat.processRemoteStreamEvent(type, data);
-    },
-    onReconnect: () => {
-      if (chat.conversationId) {
-        chat.loadConversation(chat.conversationId);
-      }
-    },
-  });
+  // Cross-tab / refresh sync is now handled by the per-conversation turn
+  // stream itself (server-authoritative): every viewer attaches to
+  // GET /v1/conversations/:id/events, which replays the in-flight turn and
+  // tails live. No separate remote-event bridge needed.
 
   const wrappedSendMessage = useCallback(
     (text: string, appContext?: AppContext, files?: File[]) => {
diff --git a/web/src/hooks/chat-store.ts b/web/src/hooks/chat-store.ts
new file mode 100644
index 00000000..0d5a4ca2
--- /dev/null
+++ b/web/src/hooks/chat-store.ts
@@ -0,0 +1,971 @@
+import {
+  callTool,
+  cancelChatTurn,
+  getAuthToken,
+  startChatTurn,
+  startChatTurnMultipart,
+} from "../api/client";
+import {
+  type ConversationStreamConnection,
+  connectConversationStream,
+} from "../api/conversation-stream";
+import { formatSendError } from "../api/format-error";
+import type {
+  AppContext,
+  ChatRequest,
+  ChatResult,
+  LlmDoneEvent,
+  ReasoningDeltaEvent,
+  StreamErrorEvent,
+  TextDeltaEvent,
+  ToolDoneEvent,
+  ToolPreparingEvent,
+  ToolStartEvent,
+} from "../types";
+
+// ===========================================================================
+// Public display types (shared across the chat UI). These live here — not in
+// useChat — because the slice store is the lowest layer that owns them and
+// `useChat` re-exports them for backward-compatible imports.
+// ===========================================================================
+
+export type StreamingState =
+  | null
+  | "thinking"
+  | "streaming"
+  | "preparing"
+  | "working"
+  | "analyzing";
+
+/** Identifies the tool the model is currently building a call for. */
+export interface PreparingTool {
+  id: string;
+  name: string;
+}
+
+/** Typed tool result shape forwarded through the bridge. */
+export interface ToolResultForUI {
+  content: Array<{ type: string; text?: string; [key: string]: unknown }>;
+  structuredContent?: Record<string, unknown>;
+  isError: boolean;
+}
+
+/** Tool call with UI state for streaming display. */
+export interface ToolCallDisplay {
+  id: string;
+  name: string;
+  status: "running" | "done" | "error";
+  ok?: boolean;
+  ms?: number;
+  resourceUri?: string;
+  resourceLinks?: Array<{
+    uri: string;
+    name?: string;
+    mimeType?: string;
+    description?: string;
+  }>;
+  result?: ToolResultForUI;
+  input?: Record<string, unknown>;
+  appName?: string;
+}
+
+/** A block in the assistant message stream — text, reasoning, or tool group. */
+export type ContentBlock =
+  | { type: "text"; text: string }
+  | { type: "reasoning"; text: string }
+  | { type: "tool"; toolCalls: ToolCallDisplay[] };
+
+/** Live iteration progress during streaming. */
+export interface IterationProgress {
+  n: number;
+  inputTokens: number;
+  outputTokens: number;
+}
+
+/** File metadata attached to a message. */
+export interface MessageFileAttachment {
+  id: string;
+  filename: string;
+  mimeType: string;
+  size: number;
+  extracted: boolean;
+}
+
+/** A chat message with ordered content blocks for display. */
+export interface ChatMessage {
+  role: "user" | "assistant";
+  content: string;
+  blocks?: ContentBlock[];
+  toolCalls?: ToolCallDisplay[];
+  iteration?: IterationProgress;
+  timestamp?: string;
+  userId?: string;
+  files?: MessageFileAttachment[];
+  stopReason?: string;
+  error?: string;
+  usage?: {
+    inputTokens: number;
+    outputTokens: number;
+    cacheReadTokens?: number;
+    cacheWriteTokens?: number;
+    reasoningTokens?: number;
+    model: string;
+    llmMs: number;
+  };
+}
+
+/** Conversation-level metadata (Stage 1: single-owner only). */
+export interface LoadedConversationMeta {
+  ownerId?: string;
+}
+
+// ===========================================================================
+// Snapshot — the immutable view a React component renders for one conversation.
+// ===========================================================================
+
+export interface ChatSnapshot {
+  conversationId: string | null;
+  /** Server-generated conversation title (null until generated/loaded). */
+  title: string | null;
+  messages: ChatMessage[];
+  isStreaming: boolean;
+  streamingState: StreamingState;
+  preparingTool: PreparingTool | null;
+  meta: LoadedConversationMeta | null;
+  error: string | null;
+}
+
+const EMPTY_MESSAGES: ChatMessage[] = [];
+const EMPTY_SNAPSHOT: ChatSnapshot = {
+  conversationId: null,
+  title: null,
+  messages: EMPTY_MESSAGES,
+  isStreaming: false,
+  streamingState: null,
+  preparingTool: null,
+  meta: null,
+  error: null,
+};
+
+// ===========================================================================
+// Slice — mutable per-conversation viewer state.
+//
+// The server is authoritative: a turn runs to completion server-side and its
+// events are published to a per-conversation stream. This slice is a *view*
+// over that stream plus the persisted history. Switching away / refreshing
+// just detaches; re-attaching replays the in-flight turn (issue #254 +
+// server-authoritative streaming follow-up).
+// ===========================================================================
+
+interface ConversationSlice {
+  keys: Set<string>;
+  conversationId: string | null;
+  title: string | null;
+  messages: ChatMessage[];
+  isStreaming: boolean;
+  streamingState: StreamingState;
+  preparingTool: PreparingTool | null;
+  meta: LoadedConversationMeta | null;
+  error: string | null;
+  // streaming scratch
+  blocks: ContentBlock[];
+  toolCalls: ToolCallDisplay[];
+  iteration?: IterationProgress;
+  // live subscription to the server turn stream (null when detached)
+  connection: ConversationStreamConnection | null;
+  /** The next streamed `user.message` echoes a turn we optimistically added —
+   *  consume it instead of appending a duplicate. */
+  pendingEcho: boolean;
+  /** First `subscribed` frame of a resume should trim a stale in-flight turn
+   *  from disk history (the replay rebuilds it). */
+  resumeOnSubscribe: boolean;
+  /** True once full history is loaded (loadConversation) or the conversation
+   *  was authored in this session (sendTurn / new draft). A dot-only probe
+   *  leaves it false so opening the conversation still fetches full history. */
+  hydrated: boolean;
+  lastActiveAt: number;
+  snapshot: ChatSnapshot;
+}
+
+export interface StartTurnHooks {
+  onConversationId?: (id: string) => void;
+}
+
+export interface StartTurnParams {
+  text: string;
+  appContext?: AppContext;
+  model?: string;
+  files?: File[];
+  currentUserId?: string;
+}
+
+// ---------------------------------------------------------------------------
+// Pure helpers
+// ---------------------------------------------------------------------------
+
+function cloneBlocks(blocks: ContentBlock[]): ContentBlock[] {
+  // Copies each block and, for tool blocks, the toolCalls array; entries stay shared.
+  return blocks.map((block) =>
+    block.type === "tool" ? { ...block, toolCalls: [...block.toolCalls] } : { ...block },
+  );
+}
+
+function textFromBlocks(blocks: ContentBlock[]): string {
+  // Joins the text of every "text" block in order; other block types are skipped.
+  const parts: string[] = [];
+  for (const block of blocks) if (block.type === "text") parts.push(block.text);
+  return parts.join("");
+}
+
+function wrapStringResult(text: string, isError = false): ToolResultForUI {
+  return { content: [{ type: "text", text }], isError }; // plain string becomes one text part
+}
+
+// Builds a mapper that folds a ToolDoneEvent into the tool call with the same
+// id and returns every other call untouched.
+const updateTool =
+  (evt: ToolDoneEvent) =>
+  (tc: ToolCallDisplay): ToolCallDisplay => {
+    if (tc.id !== evt.id) return tc;
+    const links = evt.resourceLinks;
+    return {
+      ...tc,
+      status: evt.ok ? "done" : "error",
+      ok: evt.ok,
+      ms: evt.ms,
+      resourceUri: tc.resourceUri ?? evt.resourceUri, // a URI already on the call is kept
+      resourceLinks: links != null && links.length > 0 ? links : tc.resourceLinks,
+      result: evt.result != null ? (evt.result as ToolResultForUI) : tc.result,
+    };
+  };
+
+// ---------------------------------------------------------------------------
+// Key helpers
+// ---------------------------------------------------------------------------
+
+const DRAFT_PREFIX = "draft:";
+let draftCounter = 0;
+
+export function freshDraftKey(): string {
+  // Pre-increment: the counter starts at 0, so the first key is "draft:1".
+  return `${DRAFT_PREFIX}${++draftCounter}`;
+}
+
+export function isDraftKey(key: string): boolean {
+  return key.startsWith(DRAFT_PREFIX); // the prefix freshDraftKey puts on every key it mints
+}
+
+// ---------------------------------------------------------------------------
+// Store
+// ---------------------------------------------------------------------------
+
+const MAX_SLICES = 30;
+
+export interface ChatStore {
+  ensureSlice(key: string, opts?: { conversationId?: string | null }): void;
+  getSnapshot(key: string): ChatSnapshot;
+  subscribeSlice(key: string, cb: () => void): () => void;
+  getStreamingIds(): string[];
+  subscribeStreamingIds(cb: () => void): () => void;
+  markActive(key: string): void;
+  markInactive(key: string): void;
+  /** Send a message: start a server turn, then watch its stream. No-op while already streaming. */
+  sendTurn(key: string, params: StartTurnParams, hooks?: StartTurnHooks): Promise<void>;
+  /** Load persisted history and attach to any in-flight turn; load failures surface as `error`. */
+  loadConversation(id: string): Promise<void>;
+  /** Probe whether a conversation is generating (restores dots on reload),
+   *  without fetching message history. */
+  probeConversation(id: string): void;
+  /** Set a conversation's title (from the live `conversation.title` SSE).
+   *  No-op if the conversation has no slice in this tab. */
+  setTitle(conversationId: string, title: string): void;
+  /** Ask the server to stop an in-flight turn (the only thing that aborts generation). */
+  cancelTurn(key: string): void;
+  retryLastMessage(key: string): string | null;
+  simulateError(key: string, message: string): void;
+  reset(): void;
+  sliceCount(): number;
+}
+
+export function createChatStore(): ChatStore {
+  const byKey = new Map<string, ConversationSlice>();
+  const allSlices = new Set<ConversationSlice>();
+  const listeners = new Map<string, Set<() => void>>();
+  const activeCounts = new Map<string, number>();
+
+  let streamingIds: string[] = [];
+  const streamingListeners = new Set<() => void>();
+
+  // -- snapshot + notification --
+
+  /**
+   * Copy the slice's render-facing fields into a new snapshot object. Values
+   * are copied by reference; scratch and bookkeeping fields are left out.
+   */
+  function buildSnapshot(slice: ConversationSlice): ChatSnapshot {
+    const { conversationId, title, messages, isStreaming } = slice;
+    const { streamingState, preparingTool, meta, error } = slice;
+    const core = { conversationId, title, messages, isStreaming };
+    // Spread first so the key order stays: core fields, then stream state,
+    // then meta/error.
+    return { ...core, streamingState, preparingTool, meta, error };
+  }
+
+  /** Invoke every listener subscribed to `key`; does nothing when the key has none. */
+  function notifyKey(key: string): void {
+    const callbacks = listeners.get(key);
+    if (callbacks) for (const notify of callbacks) notify();
+  }
+
+  /** Recompute the sorted, de-duplicated ids of streaming slices; notify only when they change. */
+  function recomputeStreamingIds(): void {
+    const seen = new Set<string>();
+    for (const s of allSlices) if (s.isStreaming && s.conversationId) seen.add(s.conversationId);
+    const next = Array.from(seen).sort();
+    const same =
+      next.length === streamingIds.length && next.every((id, i) => id === streamingIds[i]);
+    if (same) return; // keep the previous array instance when nothing changed
+    streamingIds = next;
+    streamingListeners.forEach((cb) => cb());
+  }
+
+  function commit(slice: ConversationSlice): void {
+    slice.snapshot = buildSnapshot(slice); // rebuilt first so listeners read the new snapshot
+    slice.keys.forEach((key) => notifyKey(key)); // every alias key of the slice is notified
+    recomputeStreamingIds();
+  }
+
+  // -- slice lifecycle --
+
+  /**
+   * True when any key of the slice currently has a positive active count.
+   */
+  function isActive(slice: ConversationSlice): boolean {
+    return [...slice.keys].some((key) => (activeCounts.get(key) ?? 0) > 0);
+  }
+
+  /** Drop a slice from the store: close its stream, then unregister every key and the slice. */
+  function removeSlice(slice: ConversationSlice): void {
+    closeConnection(slice);
+    slice.keys.forEach((key) => byKey.delete(key));
+    allSlices.delete(slice);
+  }
+
+  /**
+   * Evict oldest-idle slices down toward MAX_SLICES. Busy slices and `keep` are never evicted.
+   */
+  function evict(keep?: ConversationSlice): void {
+    const over = allSlices.size - MAX_SLICES;
+    if (over <= 0) return;
+    const idle = [...allSlices]
+      .filter((s) => s !== keep && !s.isStreaming && !isActive(s))
+      .sort((a, b) => a.lastActiveAt - b.lastActiveAt);
+    for (const s of idle.slice(0, over)) removeSlice(s);
+  }
+
+  /** Create, register and return an empty slice under `key` (may evict older idle slices). */
+  function createSlice(key: string, conversationId: string | null): ConversationSlice {
+    const slice: ConversationSlice = {
+      keys: new Set([key]),
+      conversationId,
+      title: null,
+      messages: [],
+      isStreaming: false,
+      streamingState: null,
+      preparingTool: null,
+      meta: null,
+      error: null,
+      blocks: [],
+      toolCalls: [],
+      iteration: undefined,
+      connection: null,
+      pendingEcho: false,
+      resumeOnSubscribe: false,
+      // A fresh draft is fully "loaded" (empty IS its full history); a slice
+      // keyed by a real conversation id starts unhydrated until fetched.
+      hydrated: isDraftKey(key),
+      lastActiveAt: Date.now(),
+      snapshot: EMPTY_SNAPSHOT,
+    };
+    slice.snapshot = buildSnapshot(slice);
+    byKey.set(key, slice);
+    allSlices.add(slice);
+    evict(slice); // the new slice is idle too — without `keep` it could evict itself
+    return slice;
+  }
+
+  /**
+   * Touch the slice for `key`, creating it when missing. A `conversationId` option, when the
+   * property is present, wins; otherwise draft keys get null and other keys are their own id.
+   */
+  function ensureSlice(key: string, opts?: { conversationId?: string | null }): void {
+    const found = byKey.get(key);
+    if (found) {
+      found.lastActiveAt = Date.now();
+      return;
+    }
+    let convId: string | null = isDraftKey(key) ? null : key;
+    if (opts && "conversationId" in opts) convId = opts.conversationId ?? null;
+    createSlice(key, convId);
+  }
+
+  function aliasSlice(slice: ConversationSlice, conversationId: string): void {
+    if (slice.keys.has(conversationId)) return; // already one of this slice's keys
+    slice.keys.add(conversationId);
+    byKey.set(conversationId, slice); // lookups by conversation id now reach the same slice
+  }
+
+  // -- streaming scratch --
+
+  /** Clear the per-turn streaming accumulators (blocks, tool calls, iteration progress). */
+  function resetScratch(slice: ConversationSlice): void {
+    const cleared = { blocks: [], toolCalls: [], iteration: undefined };
+    Object.assign(slice, cleared);
+  }
+
+  /** Snapshot the streaming scratch as an assistant message, copying blocks and tool calls. */
+  function assistantFromScratch(slice: ConversationSlice): ChatMessage {
+    const { blocks, toolCalls, iteration } = slice;
+    const message: ChatMessage = { role: "assistant", content: textFromBlocks(blocks) };
+    message.blocks = cloneBlocks(blocks);
+    message.toolCalls = toolCalls.slice();
+    message.iteration = iteration ? { ...iteration } : undefined;
+    return message;
+  }
+
+  function flush(slice: ConversationSlice): void {
+    const msgs = slice.messages; // replace a trailing assistant message, otherwise append
+    const kept = msgs[msgs.length - 1]?.role === "assistant" ? msgs.slice(0, -1) : msgs;
+    slice.messages = [...kept, assistantFromScratch(slice)];
+    commit(slice);
+  }
+
+  /**
+   * Cut the message list just before its last user message, dropping that
+   * message and everything after it. Leaves the list untouched when it holds
+   * no user message.
+   */
+  function trimTrailingTurn(slice: ConversationSlice): void {
+    const cut = slice.messages.map((m) => m.role).lastIndexOf("user");
+    if (cut >= 0) slice.messages = slice.messages.slice(0, cut);
+  }
+
+  // -- subscription --
+
+  function closeConnection(slice: ConversationSlice): void {
+    slice.connection?.close(); // no-op when nothing is attached
+    slice.connection = null;
+  }
+
+  /**
+   * (Re)attach the slice to its conversation stream, replaying from seq 0.
+   * `resume` marks an attach to a possibly in-flight turn: the `subscribed`
+   * callback then decides whether to rebuild the live turn or detach.
+   */
+  function openConnection(slice: ConversationSlice, conversationId: string, resume: boolean): void {
+    closeConnection(slice);
+    slice.resumeOnSubscribe = resume;
+    // A resume that finds no active turn may still be sent the last finished
+    // turn from the server's grace buffer. That turn is already in the loaded
+    // disk history, so applying it would duplicate it — mute the stream.
+    let muted = false;
+    slice.connection = connectConversationStream({
+      conversationId,
+      token: getAuthToken() ?? undefined,
+      afterSeq: 0,
+      onSubscribed: (info) => {
+        if (!slice.resumeOnSubscribe) return;
+        slice.resumeOnSubscribe = false;
+        if (info.isActive) {
+          // Live turn: drop the stale copy loaded from disk (the replay
+          // rebuilds it from the top) and show the streaming indicator / Stop
+          // button now instead of waiting for the first replayed event.
+          trimTrailingTurn(slice);
+          resetScratch(slice);
+          slice.isStreaming = true;
+          if (!slice.streamingState) slice.streamingState = "thinking";
+          commit(slice);
+          return;
+        }
+        if (slice.isStreaming) return; // a send is in progress; keep watching
+        // Idle conversation: ignore the grace-buffer replay and detach.
+        muted = true;
+        closeConnection(slice);
+      },
+      onEvent: (type, data) => {
+        if (!muted) applyStreamEvent(slice, type, data);
+      },
+      onError: () => {
+        // Leave the slice intact; the persisted history still renders.
+      },
+    });
+  }
+
+  // -- stream reducer --
+
+  function applyStreamEvent(slice: ConversationSlice, type: string, data: unknown): void {
+    switch (type) { // one case per stream event; unrecognized types leave the slice untouched
+      case "user.message": {
+        const evt = data as { content: string; userId?: string; timestamp?: string };
+        resetScratch(slice);
+        if (slice.pendingEcho) {
+          // Our optimistic user message + assistant placeholder are already in
+          // place; the deltas will fill the placeholder.
+          slice.pendingEcho = false;
+        } else {
+          const userMsg: ChatMessage = {
+            role: "user",
+            content: evt.content,
+            ...(evt.timestamp ? { timestamp: evt.timestamp } : {}),
+            ...(evt.userId ? { userId: evt.userId } : {}),
+          };
+          const assistantMsg: ChatMessage = {
+            role: "assistant",
+            content: "",
+            blocks: [],
+            toolCalls: [],
+            timestamp: new Date().toISOString(),
+          };
+          slice.messages = [...slice.messages, userMsg, assistantMsg];
+        }
+        slice.isStreaming = true;
+        slice.streamingState = "thinking";
+        commit(slice);
+        break;
+      }
+      case "chat.start": {
+        const evt = data as { conversationId: string };
+        if (evt.conversationId && slice.conversationId !== evt.conversationId) {
+          slice.conversationId = evt.conversationId;
+          aliasSlice(slice, evt.conversationId);
+          commit(slice);
+        }
+        break;
+      }
+      case "text.delta": {
+        const evt = data as TextDeltaEvent;
+        slice.streamingState = "streaming";
+        slice.preparingTool = null;
+        const last = slice.blocks[slice.blocks.length - 1];
+        if (last && last.type === "text") last.text += evt.text;
+        else slice.blocks.push({ type: "text", text: evt.text });
+        flush(slice);
+        break;
+      }
+      case "reasoning.delta": {
+        const evt = data as ReasoningDeltaEvent;
+        slice.streamingState = "streaming";
+        slice.preparingTool = null;
+        const last = slice.blocks[slice.blocks.length - 1];
+        if (last && last.type === "reasoning") last.text += evt.text;
+        else slice.blocks.push({ type: "reasoning", text: evt.text });
+        flush(slice);
+        break;
+      }
+      case "tool.preparing": {
+        const evt = data as ToolPreparingEvent;
+        slice.streamingState = "preparing";
+        slice.preparingTool = { id: evt.id, name: evt.name };
+        commit(slice);
+        break;
+      }
+      case "tool.preparing.done": // no-op: `tool.start` or the next delta clears `preparingTool`
+        break;
+      case "tool.start": {
+        const evt = data as ToolStartEvent;
+        slice.streamingState = "working";
+        slice.preparingTool = null;
+        const separatorIdx = evt.name.indexOf("__"); // text before the first "__" becomes appName
+        const newTool: ToolCallDisplay = {
+          id: evt.id,
+          name: evt.name,
+          status: "running",
+          resourceUri: evt.resourceUri,
+          input: evt.input,
+          appName: separatorIdx !== -1 ? evt.name.slice(0, separatorIdx) : undefined,
+        };
+        slice.toolCalls = [...slice.toolCalls, newTool];
+        const last = slice.blocks[slice.blocks.length - 1];
+        if (last && last.type === "tool") last.toolCalls = [...last.toolCalls, newTool];
+        else slice.blocks.push({ type: "tool", toolCalls: [newTool] });
+        flush(slice);
+        break;
+      }
+      case "tool.done": {
+        const evt = data as ToolDoneEvent;
+        const updater = updateTool(evt);
+        slice.toolCalls = slice.toolCalls.map(updater);
+        for (const block of slice.blocks) {
+          if (block.type === "tool") block.toolCalls = block.toolCalls.map(updater);
+        }
+        const anyRunning = slice.toolCalls.some((tc) => tc.status === "running");
+        slice.streamingState = anyRunning ? "working" : "analyzing";
+        flush(slice);
+        break;
+      }
+      case "llm.done": {
+        const evt = data as LlmDoneEvent;
+        slice.iteration = { // running totals: one more iteration, token counts summed
+          n: (slice.iteration?.n ?? 0) + 1,
+          inputTokens: (slice.iteration?.inputTokens ?? 0) + (evt.usage?.inputTokens ?? 0),
+          outputTokens: (slice.iteration?.outputTokens ?? 0) + (evt.usage?.outputTokens ?? 0),
+        };
+        flush(slice);
+        break;
+      }
+      case "done": {
+        const result = data as ChatResult;
+        slice.streamingState = null;
+        slice.preparingTool = null;
+        slice.isStreaming = false;
+        // Backfill tool calls that still lack a result, using the final result's tool outputs.
+        if (result.toolCalls) {
+          const outputMap = new Map(result.toolCalls.map((tc) => [tc.id, tc.output]));
+          const backfill = (tc: ToolCallDisplay): ToolCallDisplay => {
+            if (tc.result != null) return tc;
+            const output = outputMap.get(tc.id);
+            return output != null ? { ...tc, result: wrapStringResult(output) } : tc;
+          };
+          for (const block of slice.blocks) {
+            if (block.type === "tool") block.toolCalls = block.toolCalls.map(backfill);
+          }
+          slice.toolCalls = slice.toolCalls.map(backfill);
+        }
+        // Freeze scratch into the final message; `toolCalls` is left undefined when none ran.
+        const finalBlocks = cloneBlocks(slice.blocks);
+        const finalTools = slice.toolCalls.length > 0 ? [...slice.toolCalls] : undefined;
+        const usage = result.usage
+          ? {
+              inputTokens: result.usage.inputTokens,
+              outputTokens: result.usage.outputTokens,
+              cacheReadTokens: result.usage.cacheReadTokens,
+              cacheWriteTokens: result.usage.cacheWriteTokens,
+              reasoningTokens: result.usage.reasoningTokens,
+              model: result.usage.model,
+              llmMs: result.usage.llmMs,
+            }
+          : undefined;
+        const resultFiles = (result as unknown as Record<string, unknown>).files as
+          | MessageFileAttachment[]
+          | undefined;
+        // Only finalize when the tail is an assistant message; otherwise messages stay as they are.
+        const updated = [...slice.messages];
+        if (updated.length > 0 && updated[updated.length - 1].role === "assistant") {
+          updated[updated.length - 1] = {
+            role: "assistant",
+            content: result.response,
+            blocks: finalBlocks,
+            toolCalls: finalTools,
+            usage,
+            ...(result.stopReason && result.stopReason !== "complete"
+              ? { stopReason: result.stopReason }
+              : {}),
+            ...(resultFiles && resultFiles.length > 0 ? { files: resultFiles } : {}),
+          };
+          slice.messages = updated;
+        }
+        resetScratch(slice);
+        commit(slice);
+        closeConnection(slice); // terminal event: stop watching this turn
+        break;
+      }
+      case "error": {
+        const evt = data as StreamErrorEvent;
+        slice.streamingState = null;
+        slice.preparingTool = null;
+        slice.isStreaming = false;
+        const updated = [...slice.messages];
+        const last = updated[updated.length - 1];
+        if (last?.role === "assistant") {
+          updated[updated.length - 1] = { ...last, error: evt.message }; // keeps any partial content
+          slice.messages = updated;
+        } else {
+          slice.error = evt.message;
+        }
+        commit(slice);
+        closeConnection(slice);
+        break;
+      }
+      case "cancelled": {
+        slice.streamingState = null;
+        slice.preparingTool = null;
+        slice.isStreaming = false;
+        commit(slice);
+        closeConnection(slice);
+        break;
+      }
+    }
+  }
+
+  // -- send (start a server turn, then watch it) --
+
+  async function sendTurn(
+    key: string,
+    params: StartTurnParams,
+    hooks?: StartTurnHooks,
+  ): Promise<void> {
+    ensureSlice(key);
+    const slice = byKey.get(key);
+    if (!slice || slice.isStreaming) return;
+    // Flip to streaming before the start request so a second send hits the guard above.
+    slice.error = null;
+    slice.isStreaming = true;
+    slice.streamingState = "thinking";
+    slice.pendingEcho = true;
+    // Authoring a turn means the full conversation lives in memory.
+    slice.hydrated = true;
+    resetScratch(slice);
+
+    // Optimistic user message + assistant placeholder for snappy UX. The
+    // streamed `user.message` echo is consumed (pendingEcho), not duplicated.
+    const userFiles: MessageFileAttachment[] | undefined = params.files?.map((f) => ({
+      id: `pending_${f.name}_${f.size}`,
+      filename: f.name,
+      mimeType: f.type || "application/octet-stream",
+      size: f.size,
+      extracted: false,
+    }));
+    const userMsg: ChatMessage = {
+      role: "user",
+      content: params.text,
+      timestamp: new Date().toISOString(),
+      ...(params.currentUserId ? { userId: params.currentUserId } : {}),
+      ...(userFiles && userFiles.length > 0 ? { files: userFiles } : {}),
+    };
+    const assistantMsg: ChatMessage = {
+      role: "assistant",
+      content: "",
+      blocks: [],
+      toolCalls: [],
+      timestamp: new Date().toISOString(),
+    };
+    slice.messages = [...slice.messages, userMsg, assistantMsg];
+    commit(slice);
+    // `conversationId` is only sent when the slice already has one.
+    const req: ChatRequest = {
+      message: params.text,
+      ...(slice.conversationId ? { conversationId: slice.conversationId } : {}),
+      ...(params.appContext ? { appContext: params.appContext } : {}),
+      ...(params.model ? { model: params.model } : {}),
+    };
+
+    let conversationId: string;
+    try {
+      const result =
+        params.files && params.files.length > 0
+          ? await startChatTurnMultipart(req, params.files)
+          : await startChatTurn(req);
+      conversationId = result.conversationId;
+    } catch (err) {
+      handleTurnError(slice, err);
+      slice.isStreaming = false;
+      slice.streamingState = null;
+      slice.pendingEcho = false;
+      commit(slice);
+      return;
+    }
+    // New or changed id: alias the slice under it and tell the caller via `onConversationId`.
+    if (slice.conversationId !== conversationId) {
+      slice.conversationId = conversationId;
+      aliasSlice(slice, conversationId);
+      hooks?.onConversationId?.(conversationId);
+      commit(slice);
+    }
+
+    // Watch the turn we just started (fresh turn — not a resume).
+    openConnection(slice, conversationId, false);
+  }
+
+  /** Roll back a hard start failure: drop the optimistic user+assistant pair, record the error. */
+  function handleTurnError(slice: ConversationSlice, err: unknown): void {
+    slice.messages = slice.messages.filter((_, i, all) => i < all.length - 2);
+    slice.error = formatSendError(err);
+  }
+
+  // -- load from disk + attach --
+
+  /** Load persisted history into the slice, then resume-attach; failures land in `error`. */
+  async function loadConversation(id: string): Promise<void> {
+    const existing = byKey.get(id);
+    // Already fully loaded and live — keep the stream, don't refetch. A dot-only probe
+    // (connection but not hydrated) falls through so opening it fetches its full history.
+    if (existing?.hydrated && (existing.isStreaming || existing.connection)) {
+      existing.lastActiveAt = Date.now();
+      return;
+    }
+    ensureSlice(id, { conversationId: id });
+    const slice = byKey.get(id);
+    if (slice) slice.error = null;
+    try {
+      const res = await callTool("conversations", "get", { id, expand: "full" });
+      const current = byKey.get(id);
+      if (!current) return;
+      if (res.isError) {
+        const errText = res.content?.map((b) => b.text ?? "").filter(Boolean).join("\n");
+        throw new Error(errText || "Failed to load conversation");
+      }
+      let raw: unknown = res.structuredContent;
+      if (!raw && res.content?.[0]?.text) {
+        try {
+          raw = JSON.parse(res.content[0].text);
+        } catch {
+          raw = null; // unparseable body — rejected by the shape check below
+        }
+      }
+      const parsed = (raw ?? {}) as {
+        metadata?: { id?: unknown; ownerId?: string; title?: string | null };
+        messages?: ChatMessage[];
+      };
+      // Shape-check first: a missing id would otherwise surface as a raw TypeError in the UI.
+      const loadedId = parsed.metadata?.id;
+      if (typeof loadedId !== "string") throw new Error("Failed to load conversation");
+      current.conversationId = loadedId;
+      aliasSlice(current, loadedId);
+      current.meta = { ownerId: parsed.metadata?.ownerId };
+      current.title = parsed.metadata?.title ?? null;
+      current.messages = Array.isArray(parsed.messages) ? parsed.messages : [];
+      current.hydrated = true;
+      commit(current);
+      // Attach to any in-flight turn (resume — trims a stale in-flight turn
+      // from the loaded history if the server says one is active).
+      openConnection(current, loadedId, true);
+    } catch (err) {
+      const slc = byKey.get(id);
+      if (slc) {
+        slc.error = err instanceof Error ? err.message : "Failed to load conversation";
+        commit(slc);
+      }
+    }
+  }
+
+  /** Ask the server to stop the turn for `key`; a slice without a conversation id is ignored. */
+  function cancelTurn(key: string): void {
+    const conversationId = byKey.get(key)?.conversationId;
+    // Fire-and-forget: the server's terminal `cancelled` event finalizes the
+    // slice, so nothing is mutated optimistically here.
+    if (conversationId) void cancelChatTurn(conversationId);
+  }
+
+  /**
+   * Cheap "is it generating?" check, used on reload to restore background
+   * streaming dots without fetching messages. Opens a resume subscription: an
+   * active turn flips the slice to streaming (→ `getStreamingIds` → dot) and is
+   * tailed live; otherwise the connection closes and the slice stays idle.
+   * `hydrated` is not touched, so an unhydrated slice still loads when opened.
+   */
+  function probeConversation(id: string): void {
+    const known = byKey.get(id);
+    const watching = Boolean(known?.isStreaming || known?.connection);
+    if (watching) return; // already live/probed
+    ensureSlice(id, { conversationId: id });
+    const target = byKey.get(id);
+    if (target) openConnection(target, id, true);
+  }
+
+  // -- retry / simulate --
+
+  /**
+   * Rewind to just before the last user message and clear error/streaming
+   * state so the caller can re-send. Returns that message's text, or null when
+   * the slice is unknown or holds no user message.
+   */
+  function retryLastMessage(key: string): string | null {
+    const slice = byKey.get(key);
+    if (!slice) return null;
+    const at = slice.messages.map((m) => m.role).lastIndexOf("user");
+    const text = at >= 0 ? slice.messages[at].content : null;
+    if (at >= 0) slice.messages = slice.messages.slice(0, at);
+    slice.error = null;
+    slice.isStreaming = false;
+    slice.streamingState = null;
+    slice.preparingTool = null;
+    commit(slice);
+    return text;
+  }
+
+  /**
+   * Dev helper: mark the trailing assistant message (or a newly appended one) as errored.
+   */
+  function simulateError(key: string, message: string): void {
+    const slice = byKey.get(key);
+    if (!slice || slice.messages.length === 0) return;
+    const tail = slice.messages[slice.messages.length - 1];
+    slice.messages =
+      tail?.role === "assistant"
+        ? [...slice.messages.slice(0, -1), { ...tail, error: message }]
+        : [...slice.messages, { role: "assistant", content: "", error: message }];
+    slice.streamingState = null;
+    slice.preparingTool = null;
+    slice.isStreaming = false;
+    commit(slice);
+  }
+
+  /** Drop all slices and active counts, closing their streams, then wake every listener. */
+  function reset(): void {
+    allSlices.forEach((slice) => slice.connection?.close());
+    byKey.clear();
+    allSlices.clear();
+    activeCounts.clear();
+    streamingIds = [];
+    // Listener registrations are kept; they are called so readers pick up the cleared state.
+    listeners.forEach((set) => set.forEach((cb) => cb()));
+    streamingListeners.forEach((cb) => cb());
+  }
+
+  // Public surface: thin closures over the state and functions defined above.
+  return {
+    ensureSlice,
+    // Unknown keys read as the shared EMPTY_SNAPSHOT.
+    getSnapshot: (key) => byKey.get(key)?.snapshot ?? EMPTY_SNAPSHOT,
+    // Listeners are keyed by slice key, independently of whether the slice exists yet.
+    subscribeSlice(key, cb) {
+      const set = listeners.get(key) ?? new Set<() => void>();
+      listeners.set(key, set);
+      set.add(cb);
+      return () => {
+        const current = listeners.get(key);
+        if (!current) return;
+        current.delete(cb);
+        // Drop emptied sets so the map does not accumulate dead keys.
+        if (current.size === 0) listeners.delete(key);
+      };
+    },
+    // Returns the same array instance until the set of streaming ids changes.
+    getStreamingIds: () => streamingIds,
+    subscribeStreamingIds(cb) {
+      streamingListeners.add(cb);
+      return () => streamingListeners.delete(cb);
+    },
+    // markActive/markInactive keep a per-key counter; `isActive` treats > 0 as in use.
+    markActive(key) {
+      const count = activeCounts.get(key) ?? 0;
+      activeCounts.set(key, count + 1);
+      const slice = byKey.get(key);
+      if (slice) slice.lastActiveAt = Date.now();
+    },
+    markInactive(key) {
+      const remaining = (activeCounts.get(key) ?? 0) - 1;
+      if (remaining > 0) activeCounts.set(key, remaining);
+      else activeCounts.delete(key); // also absorbs an unbalanced markInactive
+    },
+    sendTurn,
+    loadConversation,
+    probeConversation,
+    // Commits only when the slice exists and the title actually changed.
+    setTitle(conversationId, title) {
+      const slice = byKey.get(conversationId);
+      if (!slice || slice.title === title) return;
+      slice.title = title;
+      commit(slice);
+    },
+    cancelTurn,
+    retryLastMessage,
+    simulateError,
+    reset,
+    // Number of distinct slices (aliases of one slice count once).
+    sliceCount: () => allSlices.size,
+  };
+}
+
+/** Module-singleton store. */
+export const chatStore = createChatStore();
diff --git a/web/src/hooks/useChat.ts b/web/src/hooks/useChat.ts
index ce1a1024..53a7d918 100644
--- a/web/src/hooks/useChat.ts
+++ b/web/src/hooks/useChat.ts
@@ -1,136 +1,27 @@
-import { useCallback, useEffect, useRef, useState } from "react";
-import { ApiClientError, callTool, streamChat, streamChatMultipart } from "../api/client";
-import { formatSendError } from "../api/format-error";
+import { useCallback, useEffect, useMemo, useState, useSyncExternalStore } from "react";
 import { captureEvent } from "../telemetry";
+import type { AppContext } from "../types";
 import type {
-  AppContext,
-  ChatRequest,
-  ChatResult,
-  ChatStreamEventMap,
-  ChatStreamEventType,
-  LlmDoneEvent,
-  ReasoningDeltaEvent,
-  StreamErrorEvent,
-  TextDeltaEvent,
-  ToolDoneEvent,
-  ToolPreparingEvent,
-  ToolStartEvent,
-} from "../types";
-
-/**
- * Streaming state machine:
- *
- *   null → thinking → streaming ↔ preparing → working → analyzing → streaming → null
- *                                                              ↘ working (next tool.start)
- *
- * `analyzing` fills the gap between the last tool.done (all tools finished)
- * and the next text.delta / tool.start, when the model is inferring on tool
- * results but the UI would otherwise look frozen.
- *
- * `preparing` fills the model-side gap: after text/reasoning has streamed
- * within an iteration, the model may continue emitting a large tool-call
- * input block (45 KB+ for full-document writes). No deltas fire during
- * that window — without `preparing`, the indicator goes dark for as long
- * as it takes the LLM to emit the args. `tool.preparing` fires on
- * `tool-input-start` from the AI SDK; `tool.start` follows once the
- * iteration finishes and the engine begins execution.
- *
- * Any `tool.start` can re-enter `working` from a non-terminal state.
- */
-export type StreamingState =
-  | null
-  | "thinking"
-  | "streaming"
-  | "preparing"
-  | "working"
-  | "analyzing";
-
-/** Identifies the tool the model is currently building a call for. */
-export interface PreparingTool {
-  id: string;
-  name: string;
-}
-
-/** Typed tool result shape forwarded through the bridge. */
-export interface ToolResultForUI {
-  content: Array<{ type: string; text?: string; [key: string]: unknown }>;
-  structuredContent?: Record<string, unknown>;
-  isError: boolean;
-}
-
-/** Tool call with UI state for streaming display. */
-export interface ToolCallDisplay {
-  id: string;
-  name: string;
-  status: "running" | "done" | "error";
-  ok?: boolean;
-  ms?: number;
-  resourceUri?: string;
-  /** MCP `resource_link` blocks returned by the tool result, if any. */
-  resourceLinks?: Array<{
-    uri: string;
-    name?: string;
-    mimeType?: string;
-    description?: string;
-  }>;
-  result?: ToolResultForUI;
-  input?: Record<string, unknown>;
-  appName?: string;
-}
-
-/** A block in the assistant message stream — text, reasoning, or tool call group, in temporal order. */
-export type ContentBlock =
-  | { type: "text"; text: string }
-  | { type: "reasoning"; text: string }
-  | { type: "tool"; toolCalls: ToolCallDisplay[] };
-
-/** Live iteration progress during streaming. */
-export interface IterationProgress {
-  n: number;
-  inputTokens: number;
-  outputTokens: number;
-}
-
-/** File metadata attached to a message. */
-export interface MessageFileAttachment {
-  id: string;
-  filename: string;
-  mimeType: string;
-  size: number;
-  extracted: boolean;
-}
-
-/** A chat message with ordered content blocks for display. */
-export interface ChatMessage {
-  role: "user" | "assistant";
-  content: string;
-  blocks?: ContentBlock[];
-  toolCalls?: ToolCallDisplay[];
-  iteration?: IterationProgress;
-  timestamp?: string;
-  userId?: string;
-  files?: MessageFileAttachment[];
-  stopReason?: string;
-  /** Set when the engine errors mid-stream — renders inline on the message. */
-  error?: string;
-  usage?: {
-    inputTokens: number;
-    outputTokens: number;
-    cacheReadTokens?: number;
-    cacheWriteTokens?: number;
-    reasoningTokens?: number;
-    model: string;
-    llmMs: number;
-  };
-}
-
-/**
- * Conversation-level metadata. Stage 1: single-owner only — sharing
- * was removed (returns in Stage 4 with policy gating).
- */
-export interface LoadedConversationMeta {
-  ownerId?: string;
-}
+  ChatMessage,
+  LoadedConversationMeta,
+  PreparingTool,
+  StreamingState,
+} from "./chat-store";
+import { chatStore, freshDraftKey } from "./chat-store";
+
+// Re-export the display types so existing `from "../hooks/useChat"` imports
+// keep working — the slice store now owns the definitions.
+export type {
+  ChatMessage,
+  ContentBlock,
+  IterationProgress,
+  LoadedConversationMeta,
+  MessageFileAttachment,
+  PreparingTool,
+  StreamingState,
+  ToolCallDisplay,
+  ToolResultForUI,
+} from "./chat-store";
 
 export interface UseChatReturn {
   messages: ChatMessage[];
@@ -139,6 +30,8 @@ export interface UseChatReturn {
   /** Set while streamingState === "preparing"; null otherwise. */
   preparingTool: PreparingTool | null;
   conversationId: string | null;
+  /** Server-generated title; null until generated/loaded. */
+  title: string | null;
   conversationMeta: LoadedConversationMeta | null;
   error: string | null;
   sendMessage: (
@@ -149,687 +42,117 @@ export interface UseChatReturn {
   ) => Promise<void>;
   newConversation: () => void;
   loadConversation: (id: string) => Promise<void>;
-  /** Inject a user message from another participant (remote stream). */
-  injectRemoteUserMessage: (userId: string, displayName: string, content: string) => void;
-  /** Process a streaming event from a remote participant's assistant response. */
-  processRemoteStreamEvent: (type: string, data: unknown) => void;
+  /** Stop the in-flight turn (the only thing that aborts generation). */
+  stop: () => void;
   /** Retry the last failed message (removes errored pair and re-sends). */
   retryLastMessage: () => void;
   /** Inject a synthetic error for demoing the error UX (dev only). */
   simulateError: (message: string) => void;
 }
 
-/** Deep-copy blocks for immutable state updates. */
-function cloneBlocks(blocks: ContentBlock[]): ContentBlock[] {
-  return blocks.map((b) => {
-    if (b.type === "tool") return { ...b, toolCalls: [...b.toolCalls] };
-    return { ...b }; // text or reasoning — both shaped { type, text }
+/**
+ * Per-conversation chat state, backed by the module-singleton {@link chatStore}.
+ *
+ * `activeKey` selects which conversation's slice this hook renders. A stream
+ * started for one conversation writes only into that conversation's slice
+ * (captured at send time), so switching conversations mid-turn never bleeds
+ * the in-flight response into the destination chat (issue #254). Switching
+ * back shows the still-arriving response because the background stream kept
+ * filling its origin slice.
+ */
+export function useChat(initialConversationId?: string, currentUserId?: string): UseChatReturn {
+  const [activeKey, setActiveKey] = useState(() => {
+    const key = initialConversationId ?? freshDraftKey();
+    chatStore.ensureSlice(
+      key,
+      initialConversationId ? { conversationId: initialConversationId } : undefined,
+    );
+    return key;
   });
-}
-
-/** Derive full visible text from blocks. Reasoning is NOT included
- *  (it's collapsed-by-default UI and shouldn't pollute the message body). */
-function textFromBlocks(blocks: ContentBlock[]): string {
-  return blocks
-    .filter((b): b is ContentBlock & { type: "text" } => b.type === "text")
-    .map((b) => b.text)
-    .join("");
-}
-
-/** Wrap a plain string result into a ToolResultForUI. */
-function wrapStringResult(text: string, isError = false): ToolResultForUI {
-  return { content: [{ type: "text", text }], isError };
-}
 
-const updateTool =
-  (evt: ToolDoneEvent) =>
-  (tc: ToolCallDisplay): ToolCallDisplay =>
-    tc.id === evt.id
-      ? {
-          ...tc,
-          status: evt.ok ? ("done" as const) : ("error" as const),
-          ok: evt.ok,
-          ms: evt.ms,
-          resourceUri: tc.resourceUri ?? evt.resourceUri,
-          resourceLinks:
-            evt.resourceLinks != null && evt.resourceLinks.length > 0
-              ? evt.resourceLinks
-              : tc.resourceLinks,
-          result: evt.result != null ? (evt.result as ToolResultForUI) : tc.result,
-        }
-      : tc;
-
-export function useChat(initialConversationId?: string, currentUserId?: string): UseChatReturn {
-  const [messages, setMessages] = useState<ChatMessage[]>([]);
-  const [isStreaming, setIsStreaming] = useState(false);
-  const [conversationId, setConversationId] = useState<string | null>(
-    initialConversationId ?? null,
+  const subscribe = useCallback(
+    (cb: () => void) => chatStore.subscribeSlice(activeKey, cb),
+    [activeKey],
   );
-  const [error, setError] = useState<string | null>(null);
-  const [streamingState, setStreamingState] = useState<StreamingState>(null);
-  const [preparingTool, setPreparingTool] = useState<PreparingTool | null>(null);
-  const [conversationMeta, setConversationMeta] = useState<LoadedConversationMeta | null>(null);
-
-  // Refs for building the current assistant message during streaming.
-  const blocksRef = useRef<ContentBlock[]>([]);
-  const toolCallsRef = useRef<ToolCallDisplay[]>([]);
-  const iterationRef = useRef<IterationProgress | undefined>(undefined);
+  const getSnapshot = useCallback(() => chatStore.getSnapshot(activeKey), [activeKey]);
+  const snap = useSyncExternalStore(subscribe, getSnapshot);
 
-  /** Push current refs into the last assistant message. */
-  function flushToMessage() {
-    const currentBlocks = cloneBlocks(blocksRef.current);
-    const currentText = textFromBlocks(blocksRef.current);
-    const currentTools = [...toolCallsRef.current];
-    const currentIteration = iterationRef.current ? { ...iterationRef.current } : undefined;
-    setMessages((prev) => {
-      const updated = [...prev];
-      updated[updated.length - 1] = {
-        role: "assistant",
-        content: currentText,
-        blocks: currentBlocks,
-        toolCalls: currentTools,
-        iteration: currentIteration,
-      };
-      return updated;
-    });
-  }
+  // Mark the active slice so the LRU never evicts what the user is viewing.
+  useEffect(() => {
+    chatStore.markActive(activeKey);
+    return () => chatStore.markInactive(activeKey);
+  }, [activeKey]);
 
   const sendMessage = useCallback(
     async (text: string, appContext?: AppContext, model?: string, files?: File[]) => {
-      if (isStreaming) return;
-
-      setError(null);
-      setIsStreaming(true);
-      setStreamingState("thinking");
-      blocksRef.current = [];
-      toolCallsRef.current = [];
-      iterationRef.current = undefined;
-
-      // Add user message (with file previews if attached)
-      const userFiles: MessageFileAttachment[] | undefined = files?.map((f) => ({
-        id: `pending_${f.name}_${f.size}`,
-        filename: f.name,
-        mimeType: f.type || "application/octet-stream",
-        size: f.size,
-        extracted: false,
-      }));
-      const userMsg: ChatMessage = {
-        role: "user",
-        content: text,
-        timestamp: new Date().toISOString(),
-        ...(currentUserId ? { userId: currentUserId } : {}),
-        ...(userFiles && userFiles.length > 0 ? { files: userFiles } : {}),
-      };
-      setMessages((prev) => [...prev, userMsg]);
-
-      // Add placeholder assistant message
-      const assistantMsg: ChatMessage = {
-        role: "assistant",
-        content: "",
-        blocks: [],
-        toolCalls: [],
-        timestamp: new Date().toISOString(),
-      };
-      setMessages((prev) => [...prev, assistantMsg]);
-
-      // Enrich appContext with latest app state from the bridge (Synapse Feature 2)
+      // Enrich appContext with the latest app state from the bridge
+      // (Synapse Feature 2). Kept here — the store stays bridge-agnostic.
       let enrichedContext = appContext;
       if (appContext) {
         const { getAppState } = await import("../bridge/bridge");
         const appStateEntry = getAppState(appContext.serverName);
-        if (appStateEntry) {
-          enrichedContext = { ...appContext, appState: appStateEntry };
-        }
-      }
-
-      const req: ChatRequest = {
-        message: text,
-        ...(conversationId ? { conversationId } : {}),
-        ...(enrichedContext ? { appContext: enrichedContext } : {}),
-        ...(model ? { model } : {}),
-      };
-
-      try {
-        const onEvent = <K extends ChatStreamEventType>(type: K, data: ChatStreamEventMap[K]) => {
-          switch (type) {
-            case "chat.start": {
-              const evt = data as { conversationId: string };
-              if (evt.conversationId) {
-                setConversationId(evt.conversationId);
-              }
-              break;
-            }
-            case "text.delta": {
-              const evt = data as TextDeltaEvent;
-              setStreamingState((prev) => (prev !== "streaming" ? "streaming" : prev));
-              // Defensive: keeps `preparingTool` paired with the
-              // `"preparing"` streamingState. Render sites gate on the
-              // state, so stale data never shows today, but a future
-              // caller reading `preparingTool` directly would otherwise
-              // see a tool name from a long-finished iteration.
-              setPreparingTool(null);
-              // Append to last text block or create a new one
-              const blocks = blocksRef.current;
-              const lastBlock = blocks[blocks.length - 1];
-              if (lastBlock && lastBlock.type === "text") {
-                lastBlock.text += evt.text;
-              } else {
-                blocks.push({ type: "text", text: evt.text });
-              }
-              flushToMessage();
-              break;
-            }
-            case "reasoning.delta": {
-              const evt = data as ReasoningDeltaEvent;
-              setStreamingState((prev) => (prev !== "streaming" ? "streaming" : prev));
-              setPreparingTool(null);
-              const blocks = blocksRef.current;
-              const lastBlock = blocks[blocks.length - 1];
-              if (lastBlock && lastBlock.type === "reasoning") {
-                lastBlock.text += evt.text;
-              } else {
-                blocks.push({ type: "reasoning", text: evt.text });
-              }
-              flushToMessage();
-              break;
-            }
-            case "tool.preparing": {
-              const evt = data as ToolPreparingEvent;
-              setStreamingState("preparing");
-              setPreparingTool({ id: evt.id, name: evt.name });
-              break;
-            }
-            case "tool.preparing.done": {
-              // No state change — `tool.start` follows once the iteration
-              // ends and the engine begins execution. Holding `preparing`
-              // through the gap keeps the indicator stable.
-              break;
-            }
-            case "tool.start": {
-              const evt = data as ToolStartEvent;
-              setStreamingState("working");
-              setPreparingTool(null);
-              const separatorIdx = evt.name.indexOf("__");
-              const newTool: ToolCallDisplay = {
-                id: evt.id,
-                name: evt.name,
-                status: "running",
-                resourceUri: evt.resourceUri,
-                input: evt.input,
-                appName: separatorIdx !== -1 ? evt.name.slice(0, separatorIdx) : undefined,
-              };
-              // Flat ref
-              toolCallsRef.current = [...toolCallsRef.current, newTool];
-              // Blocks — group consecutive tool calls
-              const blocks = blocksRef.current;
-              const lastBlock = blocks[blocks.length - 1];
-              if (lastBlock && lastBlock.type === "tool") {
-                lastBlock.toolCalls = [...lastBlock.toolCalls, newTool];
-              } else {
-                blocks.push({ type: "tool", toolCalls: [newTool] });
-              }
-              flushToMessage();
-              break;
-            }
-            case "tool.done": {
-              const evt = data as ToolDoneEvent;
-              const updater = updateTool(evt);
-              // Update flat ref
-              toolCallsRef.current = toolCallsRef.current.map(updater);
-              // Update in blocks
-              for (const block of blocksRef.current) {
-                if (block.type === "tool") {
-                  block.toolCalls = block.toolCalls.map(updater);
-                }
-              }
-              // Hold `working` while other parallel tools are still running;
-              // only flip to `analyzing` when the last tool in the batch lands,
-              // so the indicator reflects "model is inferring on results."
-              const anyRunning = toolCallsRef.current.some((tc) => tc.status === "running");
-              setStreamingState(anyRunning ? "working" : "analyzing");
-              flushToMessage();
-              break;
-            }
-            case "llm.done": {
-              const evt = data as LlmDoneEvent;
-              iterationRef.current = {
-                n: (iterationRef.current?.n ?? 0) + 1,
-                inputTokens:
-                  (iterationRef.current?.inputTokens ?? 0) + (evt.usage?.inputTokens ?? 0),
-                outputTokens:
-                  (iterationRef.current?.outputTokens ?? 0) + (evt.usage?.outputTokens ?? 0),
-              };
-              flushToMessage();
-              break;
-            }
-            case "done": {
-              const result = data as ChatResult;
-              setStreamingState(null);
-              setPreparingTool(null);
-              setConversationId(result.conversationId);
-
-              // Backfill tool results from done event
-              if (result.toolCalls) {
-                const outputMap = new Map(result.toolCalls.map((tc) => [tc.id, tc.output]));
-                const backfill = (tc: ToolCallDisplay): ToolCallDisplay => {
-                  if (tc.result != null) return tc;
-                  const output = outputMap.get(tc.id);
-                  return output != null ? { ...tc, result: wrapStringResult(output) } : tc;
-                };
-                for (const block of blocksRef.current) {
-                  if (block.type === "tool") {
-                    block.toolCalls = block.toolCalls.map(backfill);
-                  }
-                }
-                toolCallsRef.current = toolCallsRef.current.map(backfill);
-              }
-
-              const finalBlocks = cloneBlocks(blocksRef.current);
-              const finalTools =
-                toolCallsRef.current.length > 0 ? [...toolCallsRef.current] : undefined;
-              const usage = result.usage
-                ? {
-                    inputTokens: result.usage.inputTokens,
-                    outputTokens: result.usage.outputTokens,
-                    cacheReadTokens: result.usage.cacheReadTokens,
-                    cacheWriteTokens: result.usage.cacheWriteTokens,
-                    reasoningTokens: result.usage.reasoningTokens,
-                    model: result.usage.model,
-                    llmMs: result.usage.llmMs,
-                  }
-                : undefined;
-              // Parse file attachments from done event metadata
-              const resultFiles = (result as unknown as Record<string, unknown>).files as
-                | MessageFileAttachment[]
-                | undefined;
-
-              setMessages((prev) => {
-                const updated = [...prev];
-                updated[updated.length - 1] = {
-                  role: "assistant",
-                  content: result.response,
-                  blocks: finalBlocks,
-                  toolCalls: finalTools,
-                  usage,
-                  ...(result.stopReason && result.stopReason !== "complete"
-                    ? { stopReason: result.stopReason }
-                    : {}),
-                  ...(resultFiles && resultFiles.length > 0 ? { files: resultFiles } : {}),
-                };
-                return updated;
-              });
-              break;
-            }
-            case "error": {
-              const evt = data as StreamErrorEvent;
-              setStreamingState(null);
-              setPreparingTool(null);
-              // Stamp the error on the last assistant message so it renders
-              // inline — not as a disconnected banner at the top.
-              setMessages((prev) => {
-                const updated = [...prev];
-                const last = updated[updated.length - 1];
-                if (last?.role === "assistant") {
-                  updated[updated.length - 1] = { ...last, error: evt.message };
-                } else {
-                  // No assistant message to attach to — fall back to banner
-                  setError(evt.message);
-                }
-                return updated;
-              });
-              break;
-            }
-          }
-        };
-        if (files && files.length > 0) {
-          await streamChatMultipart(req, files, onEvent);
-        } else {
-          await streamChat(req, onEvent);
-        }
-        captureEvent("web.chat_sent", {
-          is_resume: !!conversationId,
-          has_app_context: !!appContext,
-        });
-      } catch (err) {
-        if (err instanceof ApiClientError && err.code === "run_in_progress") {
-          // Server rejected because a previous run is still in flight.
-          // Drop the optimistic user+assistant placeholders so the failed
-          // message doesn't stick in history as if it had succeeded.
-          setMessages((prev) => prev.slice(0, -2));
-          captureEvent("web.chat_run_in_progress", {
-            conversation_id: conversationId ?? null,
-            has_app_context: !!appContext,
-          });
-          // Banner only — nothing in this turn to mark inline
-          setError(formatSendError(err));
-          return;
-        }
-        const msg = formatSendError(err);
-        // Stamp on the last assistant message if one exists;
-        // only fall back to banner when there's no message to attach to.
-        setMessages((prev) => {
-          const last = prev[prev.length - 1];
-          if (last?.role === "assistant") {
-            const updated = [...prev];
-            updated[updated.length - 1] = { ...last, error: msg };
-            return updated;
-          }
-          // No assistant message — fall back to banner
-          setError(msg);
-          return prev;
-        });
-      } finally {
-        setIsStreaming(false);
-        setStreamingState(null);
-        setPreparingTool(null);
+        if (appStateEntry) enrichedContext = { ...appContext, appState: appStateEntry };
       }
+      const hadConversation = !!chatStore.getSnapshot(activeKey).conversationId;
+      await chatStore.sendTurn(
+        activeKey,
+        { text, appContext: enrichedContext, model, files, currentUserId },
+        { onConversationId: (id) => setActiveKey(id) },
+      );
+      captureEvent("web.chat_sent", {
+        is_resume: hadConversation,
+        has_app_context: !!appContext,
+      });
     },
-    // biome-ignore lint/correctness/useExhaustiveDependencies: sendMessage captures streaming/conversation state via refs
-    [isStreaming, conversationId, currentUserId, flushToMessage],
+    [activeKey, currentUserId],
   );
 
   const newConversation = useCallback(() => {
-    setMessages([]);
-    setConversationId(null);
-    setConversationMeta(null);
-    setError(null);
-    setIsStreaming(false);
-    setStreamingState(null);
-    setPreparingTool(null);
-    blocksRef.current = [];
-    toolCallsRef.current = [];
-    iterationRef.current = undefined;
+    const key = freshDraftKey();
+    chatStore.ensureSlice(key);
+    setActiveKey(key);
   }, []);
 
   const loadConversation = useCallback(async (id: string) => {
-    setError(null);
-    try {
-      // expand:"full" — the shell is rendering the entire chat, not
-      // sampling for an LLM. The bounded default (`expand:"messages"`,
-      // last 20) exists to keep agent tool-results small; the trusted
-      // web shell needs every turn or the UI silently shows only the tail.
-      const res = await callTool("conversations", "get", { id, expand: "full" });
-      if (res.isError) {
-        const errText = res.content
-          ?.map((b) => b.text ?? "")
-          .filter(Boolean)
-          .join("\n");
-        throw new Error(errText || "Failed to load conversation");
-      }
-      // Prefer structuredContent; fall back to parsing first text block.
-      let raw: unknown = res.structuredContent;
-      if (!raw && res.content?.[0]?.text) {
-        try {
-          raw = JSON.parse(res.content[0].text);
-        } catch {
-          raw = {};
-        }
-      }
-      // The API already returns DisplayMessage[] in the exact shape ChatMessage
-      // expects — one message per turn, blocks in iteration order, tool calls
-      // hydrated with status+result. No reshaping needed here.
-      const data = raw as {
-        metadata: {
-          id: string;
-          ownerId?: string;
-        };
-        messages: ChatMessage[];
-      };
-      setConversationId(data.metadata.id);
-      setConversationMeta({ ownerId: data.metadata.ownerId });
-      setMessages(data.messages);
-    } catch (err) {
-      const msg = err instanceof Error ? err.message : "Failed to load conversation";
-      setError(msg);
-    }
+    setActiveKey(id);
+    await chatStore.loadConversation(id);
   }, []);
 
-  // --- Remote participant event injection ---
+  const stop = useCallback(() => {
+    chatStore.cancelTurn(activeKey);
+  }, [activeKey]);
 
-  const injectRemoteUserMessage = useCallback(
-    (userId: string, _displayName: string, content: string) => {
-      // Reset streaming refs for the incoming remote assistant response
-      blocksRef.current = [];
-      toolCallsRef.current = [];
-      iterationRef.current = undefined;
+  const retryLastMessage = useCallback(() => {
+    const text = chatStore.retryLastMessage(activeKey);
+    if (text != null) void sendMessage(text);
+  }, [activeKey, sendMessage]);
 
-      const userMsg: ChatMessage = {
-        role: "user",
-        content,
-        timestamp: new Date().toISOString(),
-        userId,
-      };
-      const assistantMsg: ChatMessage = {
-        role: "assistant",
-        content: "",
-        blocks: [],
-        toolCalls: [],
-        timestamp: new Date().toISOString(),
-      };
-      setMessages((prev) => [...prev, userMsg, assistantMsg]);
-      setIsStreaming(true);
-      setStreamingState("thinking");
+  const simulateError = useCallback(
+    (message: string) => {
+      chatStore.simulateError(activeKey, message);
     },
-    [],
+    [activeKey],
   );
 
-  const processRemoteStreamEvent = useCallback(
-    (type: string, data: unknown) => {
-      switch (type) {
-        case "text.delta": {
-          const evt = data as TextDeltaEvent;
-          setStreamingState((prev) => (prev !== "streaming" ? "streaming" : prev));
-          setPreparingTool(null);
-          const blocks = blocksRef.current;
-          const lastBlock = blocks[blocks.length - 1];
-          if (lastBlock && lastBlock.type === "text") {
-            lastBlock.text += evt.text;
-          } else {
-            blocks.push({ type: "text", text: evt.text });
-          }
-          flushToMessage();
-          break;
-        }
-        case "reasoning.delta": {
-          const evt = data as ReasoningDeltaEvent;
-          setStreamingState((prev) => (prev !== "streaming" ? "streaming" : prev));
-          setPreparingTool(null);
-          const blocks = blocksRef.current;
-          const lastBlock = blocks[blocks.length - 1];
-          if (lastBlock && lastBlock.type === "reasoning") {
-            lastBlock.text += evt.text;
-          } else {
-            blocks.push({ type: "reasoning", text: evt.text });
-          }
-          flushToMessage();
-          break;
-        }
-        case "tool.preparing": {
-          const evt = data as ToolPreparingEvent;
-          setStreamingState("preparing");
-          setPreparingTool({ id: evt.id, name: evt.name });
-          break;
-        }
-        case "tool.preparing.done": {
-          break;
-        }
-        case "tool.start": {
-          const evt = data as ToolStartEvent;
-          setStreamingState("working");
-          setPreparingTool(null);
-          const separatorIdx = evt.name.indexOf("__");
-          const newTool: ToolCallDisplay = {
-            id: evt.id,
-            name: evt.name,
-            status: "running",
-            resourceUri: evt.resourceUri,
-            input: evt.input,
-            appName: separatorIdx !== -1 ? evt.name.slice(0, separatorIdx) : undefined,
-          };
-          toolCallsRef.current = [...toolCallsRef.current, newTool];
-          const blocks = blocksRef.current;
-          const lastBlock = blocks[blocks.length - 1];
-          if (lastBlock && lastBlock.type === "tool") {
-            lastBlock.toolCalls = [...lastBlock.toolCalls, newTool];
-          } else {
-            blocks.push({ type: "tool", toolCalls: [newTool] });
-          }
-          flushToMessage();
-          break;
-        }
-        case "tool.done": {
-          const evt = data as ToolDoneEvent;
-          const updater = updateTool(evt);
-          toolCallsRef.current = toolCallsRef.current.map(updater);
-          for (const block of blocksRef.current) {
-            if (block.type === "tool") {
-              block.toolCalls = block.toolCalls.map(updater);
-            }
-          }
-          const anyRunning = toolCallsRef.current.some((tc) => tc.status === "running");
-          setStreamingState(anyRunning ? "working" : "analyzing");
-          flushToMessage();
-          break;
-        }
-        case "llm.done": {
-          const evt = data as LlmDoneEvent;
-          iterationRef.current = {
-            n: (iterationRef.current?.n ?? 0) + 1,
-            inputTokens: (iterationRef.current?.inputTokens ?? 0) + (evt.usage?.inputTokens ?? 0),
-            outputTokens:
-              (iterationRef.current?.outputTokens ?? 0) + (evt.usage?.outputTokens ?? 0),
-          };
-          flushToMessage();
-          break;
-        }
-        case "done": {
-          const result = data as ChatResult;
-          setStreamingState(null);
-          setPreparingTool(null);
-          setIsStreaming(false);
-
-          if (result.toolCalls) {
-            const outputMap = new Map(result.toolCalls.map((tc) => [tc.id, tc.output]));
-            const backfill = (tc: ToolCallDisplay): ToolCallDisplay => {
-              if (tc.result != null) return tc;
-              const output = outputMap.get(tc.id);
-              return output != null ? { ...tc, result: wrapStringResult(output) } : tc;
-            };
-            for (const block of blocksRef.current) {
-              if (block.type === "tool") {
-                block.toolCalls = block.toolCalls.map(backfill);
-              }
-            }
-            toolCallsRef.current = toolCallsRef.current.map(backfill);
-          }
-
-          const finalBlocks = cloneBlocks(blocksRef.current);
-          const finalTools =
-            toolCallsRef.current.length > 0 ? [...toolCallsRef.current] : undefined;
-          const usage = result.usage
-            ? {
-                inputTokens: result.usage.inputTokens,
-                outputTokens: result.usage.outputTokens,
-                cacheReadTokens: result.usage.cacheReadTokens,
-                cacheWriteTokens: result.usage.cacheWriteTokens,
-                reasoningTokens: result.usage.reasoningTokens,
-                model: result.usage.model,
-                llmMs: result.usage.llmMs,
-              }
-            : undefined;
-
-          setMessages((prev) => {
-            const updated = [...prev];
-            updated[updated.length - 1] = {
-              role: "assistant",
-              content: result.response,
-              blocks: finalBlocks,
-              toolCalls: finalTools,
-              usage,
-              ...(result.stopReason && result.stopReason !== "complete"
-                ? { stopReason: result.stopReason }
-                : {}),
-            };
-            return updated;
-          });
-          break;
-        }
-      }
-      // biome-ignore lint/correctness/useExhaustiveDependencies: SSE handler intentionally captures only flushToMessage
-    },
-    [flushToMessage],
+  return useMemo<UseChatReturn>(
+    () => ({
+      messages: snap.messages,
+      isStreaming: snap.isStreaming,
+      streamingState: snap.streamingState,
+      preparingTool: snap.preparingTool,
+      // Drafts carry a null conversationId on the slice, so this is null until
+      // the server assigns a real id on chat.start.
+      conversationId: snap.conversationId,
+      title: snap.title,
+      conversationMeta: snap.meta,
+      error: snap.error,
+      sendMessage,
+      newConversation,
+      loadConversation,
+      stop,
+      retryLastMessage,
+      simulateError,
+    }),
+    [snap, sendMessage, newConversation, loadConversation, stop, retryLastMessage, simulateError],
   );
-
-  // Pending retry text — set by retryLastMessage, consumed by an effect
-  const retryRef = useRef<string | null>(null);
-
-  const retryLastMessage = useCallback(() => {
-    // Find the last user message, stash its text, remove the failed pair
-    setMessages((prev) => {
-      for (let i = prev.length - 1; i >= 0; i--) {
-        if (prev[i].role === "user") {
-          retryRef.current = prev[i].content;
-          return prev.slice(0, i);
-        }
-      }
-      return prev;
-    });
-    // Clear error + streaming state so sendMessage's guard passes
-    setError(null);
-    setIsStreaming(false);
-    setStreamingState(null);
-    setPreparingTool(null);
-  }, []);
-
-  // Effect: once isStreaming is false and there's a pending retry, fire it.
-  // We can't call sendMessage synchronously from retryLastMessage because
-  // sendMessage is memoized with isStreaming in its dep list — the closure
-  // still sees isStreaming=true until React re-renders with the new state.
-  // This effect fires after React flushes the state updates, at which point
-  // sendMessage has been recreated with isStreaming=false.
-  // NOTE: this depends on sendMessage's identity changing when isStreaming
-  // changes (via flushToMessage in its dep list). Do not memoize
-  // flushToMessage without verifying this still fires.
-  useEffect(() => {
-    if (!isStreaming && retryRef.current) {
-      const text = retryRef.current;
-      retryRef.current = null;
-      sendMessage(text);
-    }
-  }, [isStreaming, sendMessage]);
-
-  const simulateError = useCallback((message: string) => {
-    setMessages((prev) => {
-      if (prev.length === 0) return prev;
-      const updated = [...prev];
-      const last = updated[updated.length - 1];
-      if (last?.role === "assistant") {
-        updated[updated.length - 1] = { ...last, error: message };
-      } else {
-        // Append a synthetic assistant message with the error
-        updated.push({ role: "assistant", content: "", error: message });
-      }
-      return updated;
-    });
-    setStreamingState(null);
-    setPreparingTool(null);
-    setIsStreaming(false);
-  }, []);
-
-  return {
-    messages,
-    isStreaming,
-    streamingState,
-    preparingTool,
-    conversationId,
-    conversationMeta,
-    error,
-    sendMessage,
-    newConversation,
-    loadConversation,
-    injectRemoteUserMessage,
-    processRemoteStreamEvent,
-    retryLastMessage,
-    simulateError,
-  };
 }
diff --git a/web/src/hooks/useEvents.ts b/web/src/hooks/useEvents.ts
index 2920c586..b7c7cc4b 100644
--- a/web/src/hooks/useEvents.ts
+++ b/web/src/hooks/useEvents.ts
@@ -4,6 +4,7 @@ import { connectEvents } from "../api/sse";
 import type {
   ConfigChangedEvent,
   ConnectionStateChangedEvent,
+  ConversationTitleEvent,
   DataChangedEvent,
   SseEventMap,
   SseEventType,
@@ -14,6 +15,8 @@ export interface UseEventsOptions {
   onDataChanged?: (event: DataChangedEvent) => void;
   /** Called when a config.changed SSE event is received. */
   onConfigChanged?: (event: ConfigChangedEvent) => void;
+  /** Called when an auto-generated conversation title arrives. */
+  onConversationTitle?: (event: ConversationTitleEvent) => void;
   /** Called when a per-Connection state transition fires (URL bundles). */
   onConnectionStateChanged?: (event: ConnectionStateChangedEvent) => void;
   /**
@@ -41,6 +44,8 @@ export function useEvents(
   onDataChangedRef.current = options?.onDataChanged;
   const onConfigChangedRef = useRef(options?.onConfigChanged);
   onConfigChangedRef.current = options?.onConfigChanged;
+  const onConversationTitleRef = useRef(options?.onConversationTitle);
+  onConversationTitleRef.current = options?.onConversationTitle;
   const onConnectionStateChangedRef = useRef(options?.onConnectionStateChanged);
   onConnectionStateChangedRef.current = options?.onConnectionStateChanged;
   const onBundleLifecycleChangedRef = useRef(options?.onBundleLifecycleChanged);
@@ -59,6 +64,9 @@ export function useEvents(
         if (type === "config.changed") {
           onConfigChangedRef.current?.(data as ConfigChangedEvent);
         }
+        if (type === "conversation.title") {
+          onConversationTitleRef.current?.(data as ConversationTitleEvent);
+        }
         if (type === "connection.state_changed") {
           onConnectionStateChangedRef.current?.(data as ConnectionStateChangedEvent);
         }
diff --git a/web/src/lib/active-conversation-storage.ts b/web/src/lib/active-conversation-storage.ts
new file mode 100644
index 00000000..cf5c9d7d
--- /dev/null
+++ b/web/src/lib/active-conversation-storage.ts
@@ -0,0 +1,60 @@
+/**
+ * Per-tab persistence of the last-viewed conversation id (plus ids of still-streaming conversations).
+ *
+ * Stored in `sessionStorage` so it is:
+ *   - site-scoped (per-origin) and never sent to the server,
+ *   - per-tab (two tabs don't clobber each other's active conversation),
+ *   - cleared automatically when the tab closes (no stale-id cleanup).
+ *
+ * On a fresh page load the chat panel reads this and re-opens the
+ * conversation, which re-subscribes to the server turn stream — so an
+ * in-flight turn's streaming indicator resumes (the actual stream lives
+ * server-side; only the id needs remembering). The `/chat/:id` route
+ * restores from the URL instead and doesn't use this.
+ */
+
+const KEY = "nb:activeConversationId";
+const STREAMING_KEY = "nb:streamingConversationIds";
+
+export function getSavedConversationId(): string | null {
+  try {
+    return sessionStorage.getItem(KEY);
+  } catch {
+    // sessionStorage can throw in private-mode / sandboxed contexts.
+    return null;
+  }
+}
+
+export function setSavedConversationId(id: string | null): void {
+  try {
+    if (id) sessionStorage.setItem(KEY, id);
+    else sessionStorage.removeItem(KEY);
+  } catch {
+    // Best-effort — persistence is an enhancement, not a correctness path.
+  }
+}
+
+/**
+ * Conversation ids that had an in-flight turn when the page was last alive.
+ * On reload these are re-probed against the server (`isActive`) to restore the
+ * list's streaming dots; finished ones self-heal (probe → not active → no dot).
+ */
+export function getSavedStreamingIds(): string[] {
+  try {
+    const raw = sessionStorage.getItem(STREAMING_KEY);
+    if (!raw) return [];
+    const parsed: unknown = JSON.parse(raw);
+    return Array.isArray(parsed) ? parsed.filter((x): x is string => typeof x === "string") : [];
+  } catch {
+    return [];
+  }
+}
+
+export function setSavedStreamingIds(ids: string[]): void {
+  try {
+    if (ids.length > 0) sessionStorage.setItem(STREAMING_KEY, JSON.stringify(ids));
+    else sessionStorage.removeItem(STREAMING_KEY);
+  } catch {
+    // Best-effort.
+  }
+}
diff --git a/web/src/types.ts b/web/src/types.ts
index c3f014ab..f17be2b4 100644
--- a/web/src/types.ts
+++ b/web/src/types.ts
@@ -163,6 +163,13 @@ export interface ConfigChangedEvent {
   timestamp: string;
 }
 
+/** Live auto-generated conversation title (routed to a slice by conversationId). */
+export interface ConversationTitleEvent {
+  conversationId: string;
+  title: string;
+  wsId?: string;
+}
+
 /** SSE event type to payload mapping. */
 export interface SseEventMap {
   "bundle.installed": BundleInstalledEvent;
@@ -172,6 +179,7 @@ export interface SseEventMap {
   "bundle.dead": BundleDeadEvent;
   "connection.state_changed": ConnectionStateChangedEvent;
   "data.changed": DataChangedEvent;
+  "conversation.title": ConversationTitleEvent;
   "config.changed": ConfigChangedEvent;
   heartbeat: HeartbeatEvent;
 }
diff --git a/web/test/active-conversation-storage.test.ts b/web/test/active-conversation-storage.test.ts
new file mode 100644
index 00000000..ff30a483
--- /dev/null
+++ b/web/test/active-conversation-storage.test.ts
@@ -0,0 +1,26 @@
+import { beforeEach, describe, expect, it } from "bun:test";
+import {
+  getSavedConversationId,
+  setSavedConversationId,
+} from "../src/lib/active-conversation-storage";
+
+describe("active-conversation-storage", () => {
+  beforeEach(() => {
+    sessionStorage.clear();
+  });
+
+  it("returns null when nothing is saved", () => {
+    expect(getSavedConversationId()).toBeNull();
+  });
+
+  it("round-trips a conversation id", () => {
+    setSavedConversationId("conv_abc123");
+    expect(getSavedConversationId()).toBe("conv_abc123");
+  });
+
+  it("clears the saved id when set to null (new/draft chat)", () => {
+    setSavedConversationId("conv_abc123");
+    setSavedConversationId(null);
+    expect(getSavedConversationId()).toBeNull();
+  });
+});
diff --git a/web/test/chat-store.test.ts b/web/test/chat-store.test.ts
new file mode 100644
index 00000000..7f7d455c
--- /dev/null
+++ b/web/test/chat-store.test.ts
@@ -0,0 +1,289 @@
+import { beforeEach, describe, expect, it, mock } from "bun:test";
+import type { ChatMessage } from "../src/hooks/chat-store.ts";
+
+// ---------------------------------------------------------------------------
+// Drive the chat store directly (no React). The store is now a *viewer* over
+// the server turn stream: sendTurn → startChatTurn (POST) → subscribe via
+// connectConversationStream. We mock both seams and drive the captured
+// stream callback to simulate server events.
+//
+// Bun module mocks are process-global; we spread the real client and override
+// only the turn transport and `callTool` so sibling suites keep the other real exports.
+// ---------------------------------------------------------------------------
+
+interface CapturedStream {
+  conversationId: string;
+  onEvent: (type: string, data: unknown, seq: number) => void;
+  onSubscribed?: (info: { isActive: boolean; activeSeq: number }) => void;
+  closed: boolean;
+}
+let streams: CapturedStream[] = [];
+let convCounter = 0;
+
+const LOADED: ChatMessage[] = [
+  { role: "user", content: "loaded-q" },
+  { role: "assistant", content: "loaded-a", blocks: [{ type: "text", text: "loaded-a" }] },
+];
+
+mock.module("../src/api/conversation-stream", () => ({
+  connectConversationStream: (opts: {
+    conversationId: string;
+    onEvent: (type: string, data: unknown, seq: number) => void;
+    onSubscribed?: (info: { isActive: boolean; activeSeq: number }) => void;
+  }) => {
+    const entry: CapturedStream = {
+      conversationId: opts.conversationId,
+      onEvent: opts.onEvent,
+      onSubscribed: opts.onSubscribed,
+      closed: false,
+    };
+    streams.push(entry);
+    return {
+      close() {
+        entry.closed = true;
+      },
+    };
+  },
+}));
+
+const actualClient = await import("../src/api/client");
+mock.module("../src/api/client", () => ({
+  ...actualClient,
+  startChatTurn: (req: { conversationId?: string }) => {
+    convCounter += 1;
+    return Promise.resolve({ conversationId: req.conversationId ?? `conv_${convCounter}` });
+  },
+  startChatTurnMultipart: (req: { conversationId?: string }) => {
+    convCounter += 1;
+    return Promise.resolve({ conversationId: req.conversationId ?? `conv_${convCounter}` });
+  },
+  cancelChatTurn: () => Promise.resolve(),
+  callTool: (_server: string, _action: string, args?: Record<string, unknown>) =>
+    Promise.resolve({
+      isError: false,
+      structuredContent: { metadata: { id: args?.id }, messages: LOADED },
+    }),
+}));
+
+import { createChatStore, freshDraftKey } from "../src/hooks/chat-store.ts";
+
+function lastAssistant(messages: ChatMessage[]): ChatMessage | undefined {
+  for (let i = messages.length - 1; i >= 0; i--) {
+    if (messages[i].role === "assistant") return messages[i];
+  }
+  return undefined;
+}
+
+/** The most-recently-opened stream (from the latest sendTurn, loadConversation, or probeConversation). */
+function latestStream(): CapturedStream {
+  return streams[streams.length - 1];
+}
+
+describe("chat-store viewer", () => {
+  beforeEach(() => {
+    streams = [];
+    convCounter = 0;
+  });
+
+  it("renders a sent turn from the server stream (echo consumed, no dup)", async () => {
+    const store = createChatStore();
+    await store.sendTurn("draft-1", { text: "hello" });
+    const s = latestStream();
+
+    // Server echoes the user message (consumed by the optimistic placeholder),
+    // then streams the assistant.
+    s.onEvent("user.message", { content: "hello" }, 1);
+    s.onEvent("text.delta", { text: "hi " }, 2);
+    s.onEvent("text.delta", { text: "there" }, 3);
+
+    const snap = store.getSnapshot("draft-1");
+    const users = snap.messages.filter((m) => m.role === "user");
+    expect(users).toHaveLength(1); // not duplicated
+    expect(users[0].content).toBe("hello");
+    expect(lastAssistant(snap.messages)?.content).toBe("hi there");
+  });
+
+  it("isolates concurrent turns into their own slices", async () => {
+    const store = createChatStore();
+    await store.sendTurn("kA", { text: "a" });
+    const aStream = latestStream();
+    await store.sendTurn("kB", { text: "b" });
+    const bStream = latestStream();
+
+    aStream.onEvent("user.message", { content: "a" }, 1);
+    aStream.onEvent("text.delta", { text: "a1" }, 2);
+    bStream.onEvent("user.message", { content: "b" }, 1);
+    bStream.onEvent("text.delta", { text: "b1" }, 2);
+    aStream.onEvent("text.delta", { text: "a2" }, 3);
+
+    expect(lastAssistant(store.getSnapshot("kA").messages)?.content).toBe("a1a2");
+    expect(lastAssistant(store.getSnapshot("kB").messages)?.content).toBe("b1");
+  });
+
+  it("remaps a draft to the real conversation id", async () => {
+    const store = createChatStore();
+    const draft = freshDraftKey();
+    const seen: string[] = [];
+    await store.sendTurn(draft, { text: "hi" }, { onConversationId: (id) => seen.push(id) });
+    expect(seen).toEqual(["conv_1"]);
+    expect(store.getSnapshot(draft).conversationId).toBe("conv_1");
+    // The real id resolves to the same live slice.
+    latestStream().onEvent("user.message", { content: "hi" }, 1);
+    latestStream().onEvent("text.delta", { text: "yo" }, 2);
+    expect(lastAssistant(store.getSnapshot("conv_1").messages)?.content).toBe("yo");
+  });
+
+  it("enforces per-slice single-flight", async () => {
+    const store = createChatStore();
+    const p1 = store.sendTurn("kA", { text: "first" });
+    const p2 = store.sendTurn("kA", { text: "second" }); // ignored — already streaming
+    await Promise.all([p1, p2]);
+    // Only one turn started → one stream opened.
+    expect(streams).toHaveLength(1);
+  });
+
+  it("finalizes on the terminal done event and closes the stream", async () => {
+    const store = createChatStore();
+    await store.sendTurn("kA", { text: "go" });
+    const s = latestStream();
+    s.onEvent("user.message", { content: "go" }, 1);
+    s.onEvent("text.delta", { text: "partial" }, 2);
+    s.onEvent("done", { response: "final answer", conversationId: "conv_1" }, 3);
+
+    const snap = store.getSnapshot("kA");
+    expect(snap.isStreaming).toBe(false);
+    expect(lastAssistant(snap.messages)?.content).toBe("final answer");
+    expect(s.closed).toBe(true);
+  });
+
+  it("does not clobber a slice that is streaming on loadConversation", async () => {
+    const store = createChatStore();
+    await store.sendTurn("conv_1", { text: "go" });
+    latestStream().onEvent("user.message", { content: "go" }, 1);
+    latestStream().onEvent("text.delta", { text: "streaming-text" }, 2);
+
+    await store.loadConversation("conv_1");
+    expect(lastAssistant(store.getSnapshot("conv_1").messages)?.content).toBe("streaming-text");
+  });
+
+  it("loads persisted history into an idle slice and trims a stale in-flight turn on resume", async () => {
+    const store = createChatStore();
+    await store.loadConversation("conv_X");
+    const s = latestStream();
+    // Server says a turn is in flight → the stale in-flight turn (last user
+    // message + after) is trimmed, then replay rebuilds it.
+    s.onSubscribed?.({ isActive: true, activeSeq: 2 });
+    // In the loaded "loaded-q"/"loaded-a" pair, "loaded-q" is the last user
+    // message, so the trim drops it and the trailing assistant reply.
+    expect(store.getSnapshot("conv_X").messages).toHaveLength(0);
+    // Server says a turn is active → the streaming indicator shows immediately,
+    // before any replayed event arrives.
+    expect(store.getSnapshot("conv_X").isStreaming).toBe(true);
+
+    s.onEvent("user.message", { content: "loaded-q" }, 1);
+    s.onEvent("text.delta", { text: "fresh" }, 2);
+    expect(lastAssistant(store.getSnapshot("conv_X").messages)?.content).toBe("fresh");
+  });
+
+  it("closes an idle resume connection when nothing is in flight", async () => {
+    const store = createChatStore();
+    await store.loadConversation("conv_Y");
+    const s = latestStream();
+    s.onSubscribed?.({ isActive: false, activeSeq: 0 });
+    expect(s.closed).toBe(true);
+    // History still present.
+    expect(store.getSnapshot("conv_Y").messages).toHaveLength(LOADED.length);
+  });
+
+  it("tracks streaming ids and clears on terminal", async () => {
+    const store = createChatStore();
+    await store.sendTurn(freshDraftKey(), { text: "a" });
+    latestStream().onEvent("user.message", { content: "a" }, 1);
+    expect(store.getStreamingIds()).toEqual(["conv_1"]);
+    latestStream().onEvent("done", { response: "x", conversationId: "conv_1" }, 2);
+    expect(store.getStreamingIds()).toEqual([]);
+  });
+
+  it("caps idle slices via LRU but keeps streaming ones", async () => {
+    const store = createChatStore();
+    await store.sendTurn(freshDraftKey(), { text: "go" });
+    latestStream().onEvent("user.message", { content: "go" }, 1);
+    for (let i = 0; i < 60; i++) store.ensureSlice(`idle-${i}`);
+    expect(store.sliceCount()).toBeLessThanOrEqual(30);
+    expect(store.getSnapshot("conv_1").isStreaming).toBe(true);
+  });
+
+  it("reset drops every slice and closes streams", async () => {
+    const store = createChatStore();
+    await store.sendTurn("kA", { text: "a" });
+    const s = latestStream();
+    expect(store.sliceCount()).toBeGreaterThan(0);
+    store.reset();
+    expect(store.sliceCount()).toBe(0);
+    expect(s.closed).toBe(true);
+    expect(store.getSnapshot("conv_1").messages).toEqual([]);
+  });
+
+  it("probeConversation lights a dot for an active conversation (no history fetch)", () => {
+    const store = createChatStore();
+    store.probeConversation("conv_live");
+    latestStream().onSubscribed?.({ isActive: true, activeSeq: 3 });
+
+    expect(store.getStreamingIds()).toEqual(["conv_live"]);
+    // No message history was fetched — only the probe subscription.
+    expect(store.getSnapshot("conv_live").messages).toEqual([]);
+  });
+
+  it("probeConversation closes and shows no dot for an inactive conversation", () => {
+    const store = createChatStore();
+    store.probeConversation("conv_done");
+    const s = latestStream();
+    s.onSubscribed?.({ isActive: false, activeSeq: 0 });
+
+    expect(store.getStreamingIds()).toEqual([]);
+    expect(s.closed).toBe(true);
+  });
+
+  it("opening a probed conversation still loads full history", async () => {
+    const store = createChatStore();
+    store.probeConversation("conv_x");
+    latestStream().onSubscribed?.({ isActive: true, activeSeq: 3 });
+    // Probe left it unhydrated despite streaming — loadConversation must fetch.
+    await store.loadConversation("conv_x");
+    expect(lastAssistant(store.getSnapshot("conv_x").messages)?.content).toBe("loaded-a");
+  });
+
+  it("setTitle updates a conversation's slice title (live conversation.title SSE)", async () => {
+    const store = createChatStore();
+    await store.sendTurn("kA", { text: "a" });
+    latestStream().onEvent("chat.start", { conversationId: "A" }, 1);
+    expect(store.getSnapshot("A").title).toBeNull();
+
+    store.setTitle("A", "Library Paranoia Joke");
+    expect(store.getSnapshot("A").title).toBe("Library Paranoia Joke");
+  });
+
+  it("setTitle is a no-op for a conversation with no slice in this tab", () => {
+    const store = createChatStore();
+    store.setTitle("conv_absent", "Whatever");
+    expect(store.getSnapshot("conv_absent").title).toBeNull();
+  });
+
+  it("does not duplicate a finished turn whose grace-buffer replay still arrives", async () => {
+    const store = createChatStore();
+    // Disk already has the completed turn.
+    await store.loadConversation("conv_done");
+    expect(store.getSnapshot("conv_done").messages).toEqual(LOADED);
+
+    // Resume finds no active turn, but the server still replays the recently
+    // finished turn from its grace buffer. Those events must be dropped, not
+    // re-appended on top of the disk history.
+    const s = latestStream();
+    s.onSubscribed?.({ isActive: false, activeSeq: 0 });
+    s.onEvent("user.message", { content: "loaded-q" }, 1);
+    s.onEvent("text.delta", { text: "loaded-a" }, 2);
+    s.onEvent("done", { conversationId: "conv_done", response: "loaded-a" }, 3);
+
+    expect(store.getSnapshot("conv_done").messages).toEqual(LOADED);
+  });
+});
diff --git a/web/test/chatBleed.test.tsx b/web/test/chatBleed.test.tsx
new file mode 100644
index 00000000..351eca0b
--- /dev/null
+++ b/web/test/chatBleed.test.tsx
@@ -0,0 +1,129 @@
+import { act, renderHook } from "@testing-library/react";
+import { beforeEach, describe, expect, it, mock } from "bun:test";
+import type { ReactNode } from "react";
+import { ChatProvider, useChatContext } from "../src/context/ChatContext.tsx";
+import type { ChatMessage } from "../src/hooks/useChat.ts";
+
+// ---------------------------------------------------------------------------
+// Regression for #254 under the server-authoritative model: a turn streaming
+// in conversation A must NOT bleed into B when the user switches mid-turn.
+// Each conversation is a viewer over its own server stream; switching away
+// keeps A's stream filling A's slice in the background.
+// ---------------------------------------------------------------------------
+
+type StreamCb = (type: string, data: unknown, seq: number) => void;
+const streamsByConv = new Map<string, StreamCb>();
+const subscribedByConv = new Map<string, (info: { isActive: boolean; activeSeq: number }) => void>();
+
+const B_MESSAGES: ChatMessage[] = [
+  { role: "user", content: "b-question" },
+  { role: "assistant", content: "b-answer", blocks: [{ type: "text", text: "b-answer" }] },
+];
+
+mock.module("../src/api/conversation-stream", () => ({
+  connectConversationStream: (opts: {
+    conversationId: string;
+    onEvent: StreamCb;
+    onSubscribed?: (info: { isActive: boolean; activeSeq: number }) => void;
+  }) => {
+    streamsByConv.set(opts.conversationId, opts.onEvent);
+    if (opts.onSubscribed) subscribedByConv.set(opts.conversationId, opts.onSubscribed);
+    return {
+      close() {
+        streamsByConv.delete(opts.conversationId);
+        subscribedByConv.delete(opts.conversationId);
+      },
+    };
+  },
+}));
+
+const actualClient = await import("../src/api/client");
+mock.module("../src/api/client", () => ({
+  ...actualClient,
+  startChatTurn: () => Promise.resolve({ conversationId: "conv-A" }),
+  startChatTurnMultipart: () => Promise.resolve({ conversationId: "conv-A" }),
+  cancelChatTurn: () => Promise.resolve(),
+  callTool: (server: string, action: string, args?: Record<string, unknown>) => {
+    if (server === "conversations" && action === "get") {
+      return Promise.resolve({
+        isError: false,
+        structuredContent: { metadata: { id: args?.id }, messages: B_MESSAGES },
+      });
+    }
+    return Promise.resolve({ isError: false, structuredContent: {} });
+  },
+}));
+
+function wrapper({ children }: { children: ReactNode }) {
+  return <ChatProvider>{children}</ChatProvider>;
+}
+
+function lastAssistant(messages: ChatMessage[]): ChatMessage | undefined {
+  for (let i = messages.length - 1; i >= 0; i--) {
+    if (messages[i].role === "assistant") return messages[i];
+  }
+  return undefined;
+}
+
+describe("#254 mid-turn conversation switch (server-authoritative)", () => {
+  beforeEach(() => {
+    streamsByConv.clear();
+    subscribedByConv.clear();
+  });
+
+  it("does not bleed A's streaming deltas into conversation B", async () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+
+    await act(async () => {
+      await result.current.sendMessage("a-question");
+    });
+
+    act(() => {
+      streamsByConv.get("conv-A")?.("user.message", { content: "a-question" }, 1);
+      streamsByConv.get("conv-A")?.("text.delta", { text: "A-part1" }, 2);
+    });
+
+    await act(async () => {
+      await result.current.loadConversation("conv-B");
+    });
+    act(() => {
+      subscribedByConv.get("conv-B")?.({ isActive: false, activeSeq: 0 });
+    });
+
+    expect(result.current.conversationId).toBe("conv-B");
+    expect(lastAssistant(result.current.messages)?.content).toBe("b-answer");
+
+    // A keeps streaming in the background.
+    act(() => {
+      streamsByConv.get("conv-A")?.("text.delta", { text: "A-part2" }, 3);
+    });
+
+    expect(lastAssistant(result.current.messages)?.content).toBe("b-answer");
+  });
+
+  it("keeps A's background stream so switching back shows the response", async () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+
+    await act(async () => {
+      await result.current.sendMessage("a-question");
+    });
+    act(() => {
+      streamsByConv.get("conv-A")?.("user.message", { content: "a-question" }, 1);
+      streamsByConv.get("conv-A")?.("text.delta", { text: "A1" }, 2);
+    });
+
+    await act(async () => {
+      await result.current.loadConversation("conv-B");
+    });
+    act(() => {
+      subscribedByConv.get("conv-B")?.({ isActive: false, activeSeq: 0 });
+      streamsByConv.get("conv-A")?.("text.delta", { text: "A2" }, 3);
+    });
+
+    await act(async () => {
+      await result.current.loadConversation("conv-A");
+    });
+    expect(result.current.conversationId).toBe("conv-A");
+    expect(lastAssistant(result.current.messages)?.content).toBe("A1A2");
+  });
+});
diff --git a/web/test/inlineError.test.tsx b/web/test/inlineError.test.tsx
index 0079baed..92e67bab 100644
--- a/web/test/inlineError.test.tsx
+++ b/web/test/inlineError.test.tsx
@@ -1,183 +1,119 @@
-import { describe, expect, it, mock, beforeEach } from "bun:test";
-import { renderHook, act } from "@testing-library/react";
+import { act, renderHook } from "@testing-library/react";
+import { beforeEach, describe, expect, it, mock } from "bun:test";
 import type { ReactNode } from "react";
 import { ChatProvider, useChatContext } from "../src/context/ChatContext.tsx";
 
 // ---------------------------------------------------------------------------
-// Mock streamChat so we can control SSE events in tests
+// Inline error UX under the server-authoritative path. We capture the turn
+// stream's onEvent and push synthetic server events.
 // ---------------------------------------------------------------------------
 
-type StreamCallback = (type: string, data: unknown) => void;
+type StreamCb = (type: string, data: unknown, seq: number) => void;
+let capturedOnEvent: StreamCb | null = null;
 
-let capturedCallback: StreamCallback | null = null;
-let resolveStream: (() => void) | null = null;
-let rejectStream: ((err: Error) => void) | null = null;
+mock.module("../src/api/conversation-stream", () => ({
+  connectConversationStream: (opts: { onEvent: StreamCb }) => {
+    capturedOnEvent = opts.onEvent;
+    return { close() {} };
+  },
+}));
 
+const actualClient = await import("../src/api/client");
 mock.module("../src/api/client", () => ({
-	streamChat: (_req: unknown, cb: StreamCallback) => {
-		capturedCallback = cb;
-		return new Promise<void>((resolve, reject) => {
-			resolveStream = resolve;
-			rejectStream = reject;
-		});
-	},
-	getConversationHistory: mock(() =>
-		Promise.resolve({ conversationId: "c1", messages: [] }),
-	),
+  ...actualClient,
+  startChatTurn: () => Promise.resolve({ conversationId: "c1" }),
+  startChatTurnMultipart: () => Promise.resolve({ conversationId: "c1" }),
+  cancelChatTurn: () => Promise.resolve(),
 }));
 
-// ---------------------------------------------------------------------------
-// Helpers
-// ---------------------------------------------------------------------------
-
 function wrapper({ children }: { children: ReactNode }) {
-	return <ChatProvider>{children}</ChatProvider>;
+  return <ChatProvider>{children}</ChatProvider>;
 }
 
-// ---------------------------------------------------------------------------
-// Tests
-// ---------------------------------------------------------------------------
+let seq = 0;
+function emit(type: string, data: unknown): void {
+  seq += 1;
+  capturedOnEvent?.(type, data, seq);
+}
 
 describe("inline error UX", () => {
-	beforeEach(() => {
-		capturedCallback = null;
-		resolveStream = null;
-		rejectStream = null;
-	});
-
-	it("stream error event stamps error on last assistant message, not banner", async () => {
-		const { result } = renderHook(() => useChatContext(), { wrapper });
-
-		act(() => {
-			result.current.sendMessage("hello");
-		});
-		await act(async () => {});
-
-		// Simulate some streaming content first
-		act(() => {
-			capturedCallback?.("text.delta", { text: "Here is my response" });
-		});
-
-		// Fire SSE error event
-		act(() => {
-			capturedCallback?.("error", {
-				error: "json_parse",
-				message: "JSON Parse error: Unable to parse JSON string",
-			});
-		});
-
-		// Error should be on the last assistant message
-		const lastMsg = result.current.messages[result.current.messages.length - 1];
-		expect(lastMsg?.role).toBe("assistant");
-		expect(lastMsg?.error).toBe("JSON Parse error: Unable to parse JSON string");
-
-		// Banner error should NOT be set
-		expect(result.current.error).toBeNull();
-	});
-
-	it("simulateError is a no-op when there are no messages", () => {
-		const { result } = renderHook(() => useChatContext(), { wrapper });
-
-		expect(result.current.messages).toHaveLength(0);
-
-		act(() => {
-			result.current.simulateError("Something broke");
-		});
-
-		// No messages to stamp on — stays empty
-		expect(result.current.messages).toHaveLength(0);
-		expect(result.current.isStreaming).toBe(false);
-		expect(result.current.streamingState).toBeNull();
-	});
-
-	it("simulateError stamps on existing assistant message", async () => {
-		const { result } = renderHook(() => useChatContext(), { wrapper });
-
-		act(() => {
-			result.current.sendMessage("hello");
-		});
-		await act(async () => {});
-
-		act(() => {
-			capturedCallback?.("text.delta", { text: "response text" });
-		});
-
-		// Complete the stream so isStreaming is false
-		act(() => {
-			capturedCallback?.("done", {
-				response: "response text",
-				conversationId: "c1",
-				toolCalls: [],
-				inputTokens: 10,
-				outputTokens: 5,
-				stopReason: "complete",
-			});
-		});
-		act(() => {
-			resolveStream?.();
-		});
-		await act(async () => {});
-
-		const msgCountBefore = result.current.messages.length;
-
-		act(() => {
-			result.current.simulateError("Simulated crash");
-		});
-
-		// Should stamp on existing message, not add a new one
-		expect(result.current.messages).toHaveLength(msgCountBefore);
-		const lastMsg = result.current.messages[result.current.messages.length - 1];
-		expect(lastMsg?.role).toBe("assistant");
-		expect(lastMsg?.error).toBe("Simulated crash");
-	});
-
-	it("retryLastMessage removes failed pair and re-sends", async () => {
-		const { result } = renderHook(() => useChatContext(), { wrapper });
-
-		// Send a message
-		act(() => {
-			result.current.sendMessage("try this");
-		});
-		await act(async () => {});
-
-		// Simulate some content then error
-		act(() => {
-			capturedCallback?.("text.delta", { text: "partial" });
-		});
-		act(() => {
-			capturedCallback?.("error", {
-				error: "crash",
-				message: "Engine crashed",
-			});
-		});
-
-		// Complete the stream promise so isStreaming clears
-		act(() => {
-			resolveStream?.();
-		});
-		await act(async () => {});
-
-		// Should have user + errored assistant
-		expect(result.current.messages).toHaveLength(2);
-		expect(result.current.messages[1].error).toBe("Engine crashed");
-
-		// Reset mocks for the retry
-		capturedCallback = null;
-		resolveStream = null;
-
-		// Retry
-		act(() => {
-			result.current.retryLastMessage();
-		});
-		await act(async () => {});
-
-		// retryLastMessage removes the failed pair and triggers a new send.
-		// After retry fires, we should have a new user + assistant placeholder.
-		// The callback should be captured again from the new sendMessage call.
-		// Give it another tick for the effect to fire sendMessage
-		await act(async () => {});
-
-		// The retry effect should have fired sendMessage, creating new messages
-		expect(result.current.isStreaming).toBe(true);
-	});
+  beforeEach(() => {
+    capturedOnEvent = null;
+    seq = 0;
+  });
+
+  it("stream error event stamps error on last assistant message, not banner", async () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+    await act(async () => {
+      await result.current.sendMessage("hello");
+    });
+
+    act(() => emit("text.delta", { text: "Here is my response" }));
+    act(() =>
+      emit("error", {
+        error: "json_parse",
+        message: "JSON Parse error: Unable to parse JSON string",
+      }),
+    );
+
+    const lastMsg = result.current.messages[result.current.messages.length - 1];
+    expect(lastMsg?.role).toBe("assistant");
+    expect(lastMsg?.error).toBe("JSON Parse error: Unable to parse JSON string");
+    expect(result.current.error).toBeNull();
+  });
+
+  it("simulateError is a no-op when there are no messages", () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+    expect(result.current.messages).toHaveLength(0);
+    act(() => {
+      result.current.simulateError("Something broke");
+    });
+    expect(result.current.messages).toHaveLength(0);
+    expect(result.current.isStreaming).toBe(false);
+    expect(result.current.streamingState).toBeNull();
+  });
+
+  it("simulateError stamps on existing assistant message", async () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+    await act(async () => {
+      await result.current.sendMessage("hello");
+    });
+    act(() => emit("text.delta", { text: "response text" }));
+    act(() =>
+      emit("done", {
+        response: "response text",
+        conversationId: "c1",
+        toolCalls: [],
+        stopReason: "complete",
+      }),
+    );
+
+    const msgCountBefore = result.current.messages.length;
+    act(() => {
+      result.current.simulateError("Simulated crash");
+    });
+    expect(result.current.messages).toHaveLength(msgCountBefore);
+    const lastMsg = result.current.messages[result.current.messages.length - 1];
+    expect(lastMsg?.role).toBe("assistant");
+    expect(lastMsg?.error).toBe("Simulated crash");
+  });
+
+  it("retryLastMessage removes failed pair and re-sends", async () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+    await act(async () => {
+      await result.current.sendMessage("try this");
+    });
+    act(() => emit("text.delta", { text: "partial" }));
+    act(() => emit("error", { error: "crash", message: "Engine crashed" }));
+
+    expect(result.current.messages).toHaveLength(2);
+    expect(result.current.messages[1].error).toBe("Engine crashed");
+
+    await act(async () => {
+      result.current.retryLastMessage();
+    });
+    await act(async () => {});
+
+    expect(result.current.isStreaming).toBe(true);
+  });
 });
diff --git a/web/test/streamingState.test.tsx b/web/test/streamingState.test.tsx
index 5f8d7877..5f8f8d58 100644
--- a/web/test/streamingState.test.tsx
+++ b/web/test/streamingState.test.tsx
@@ -1,305 +1,193 @@
-import { describe, expect, it, mock, beforeEach } from "bun:test";
-import { renderHook, act } from "@testing-library/react";
+import { act, renderHook } from "@testing-library/react";
+import { beforeEach, describe, expect, it, mock } from "bun:test";
 import type { ReactNode } from "react";
 import { ChatProvider, useChatContext } from "../src/context/ChatContext.tsx";
 import type { StreamingState } from "../src/hooks/useChat.ts";
 
 // ---------------------------------------------------------------------------
-// Mock streamChat so we can control SSE events in tests
+// Drive the streaming state machine through the server-authoritative path:
+// sendMessage → startChatTurn (POST) → subscribe via connectConversationStream.
+// We capture the stream's onEvent and push synthetic server events.
 // ---------------------------------------------------------------------------
 
-type StreamCallback = (type: string, data: unknown) => void;
+type StreamCb = (type: string, data: unknown, seq: number) => void;
+let capturedOnEvent: StreamCb | null = null;
 
-let capturedCallback: StreamCallback | null = null;
-let resolveStream: (() => void) | null = null;
+mock.module("../src/api/conversation-stream", () => ({
+  connectConversationStream: (opts: { onEvent: StreamCb }) => {
+    capturedOnEvent = opts.onEvent;
+    return { close() {} };
+  },
+}));
 
+const actualClient = await import("../src/api/client");
 mock.module("../src/api/client", () => ({
-	streamChat: (_req: unknown, cb: StreamCallback) => {
-		capturedCallback = cb;
-		return new Promise<void>((resolve) => {
-			resolveStream = resolve;
-		});
-	},
-	getConversationHistory: mock(() =>
-		Promise.resolve({ conversationId: "c1", messages: [] }),
-	),
+  ...actualClient,
+  startChatTurn: () => Promise.resolve({ conversationId: "c1" }),
+  startChatTurnMultipart: () => Promise.resolve({ conversationId: "c1" }),
+  cancelChatTurn: () => Promise.resolve(),
 }));
 
-// ---------------------------------------------------------------------------
-// Helpers
-// ---------------------------------------------------------------------------
-
 function wrapper({ children }: { children: ReactNode }) {
-	return <ChatProvider>{children}</ChatProvider>;
+  return <ChatProvider>{children}</ChatProvider>;
 }
 
-function useStreamingState() {
-	const ctx = useChatContext();
-	return ctx;
+let seq = 0; // last seq passed to the stream handler; reset in beforeEach
+function emit(type: string, data: unknown): void { // push one synthetic server event
+  if (!capturedOnEvent) throw new Error(`emit("${type}") called before the stream subscribed`);
+  capturedOnEvent(type, data, ++seq); // throwing above beats silently dropping the event
+}
 
-// ---------------------------------------------------------------------------
-// Tests
-// ---------------------------------------------------------------------------
-
 describe("streamingState state machine", () => {
-	beforeEach(() => {
-		capturedCallback = null;
-		resolveStream = null;
-	});
-
-	it("starts as null", () => {
-		const { result } = renderHook(() => useStreamingState(), { wrapper });
-		expect(result.current.streamingState).toBeNull();
-	});
-
-	it("transitions to thinking when sendMessage is called", async () => {
-		const { result } = renderHook(() => useStreamingState(), { wrapper });
-
-		// sendMessage returns a promise; don't await (stream is pending)
-		act(() => {
-			result.current.sendMessage("hello");
-		});
-
-		// Wait a tick for state to settle
-		await act(async () => {});
-
-		expect(result.current.streamingState).toBe("thinking" as StreamingState);
-	});
-
-	it("transitions thinking → streaming on first text.delta", async () => {
-		const { result } = renderHook(() => useStreamingState(), { wrapper });
-
-		act(() => {
-			result.current.sendMessage("hello");
-		});
-		await act(async () => {});
-
-		expect(result.current.streamingState).toBe("thinking");
-
-		act(() => {
-			capturedCallback?.("text.delta", { text: "Hi" });
-		});
-
-		expect(result.current.streamingState).toBe("streaming");
-	});
-
-	it("transitions streaming → working on tool.start", async () => {
-		const { result } = renderHook(() => useStreamingState(), { wrapper });
-
-		act(() => {
-			result.current.sendMessage("hello");
-		});
-		await act(async () => {});
-
-		act(() => {
-			capturedCallback?.("text.delta", { text: "Let me check" });
-		});
-		expect(result.current.streamingState).toBe("streaming");
-
-		act(() => {
-			capturedCallback?.("tool.start", { id: "t1", name: "search" });
-		});
-		expect(result.current.streamingState).toBe("working");
-	});
-
-	it("transitions working → analyzing on last tool.done", async () => {
-		const { result } = renderHook(() => useStreamingState(), { wrapper });
-
-		act(() => {
-			result.current.sendMessage("hello");
-		});
-		await act(async () => {});
-
-		act(() => {
-			capturedCallback?.("text.delta", { text: "x" });
-		});
-		act(() => {
-			capturedCallback?.("tool.start", { id: "t1", name: "search" });
-		});
-		expect(result.current.streamingState).toBe("working");
-
-		act(() => {
-			capturedCallback?.("tool.done", { id: "t1", name: "search", ok: true, ms: 100 });
-		});
-		// No in-flight tools remain → model is inferring on the result.
-		expect(result.current.streamingState).toBe("analyzing");
-	});
-
-	it("holds working while parallel tools are still in flight, then analyzing", async () => {
-		const { result } = renderHook(() => useStreamingState(), { wrapper });
-
-		act(() => {
-			result.current.sendMessage("hello");
-		});
-		await act(async () => {});
-
-		act(() => {
-			capturedCallback?.("tool.start", { id: "a", name: "search" });
-			capturedCallback?.("tool.start", { id: "b", name: "fetch" });
-		});
-		expect(result.current.streamingState).toBe("working");
-
-		// First of two completes — the other is still running, so stay `working`.
-		act(() => {
-			capturedCallback?.("tool.done", { id: "a", name: "search", ok: true, ms: 10 });
-		});
-		expect(result.current.streamingState).toBe("working");
-
-		// Last one lands → flip to `analyzing`.
-		act(() => {
-			capturedCallback?.("tool.done", { id: "b", name: "fetch", ok: false, ms: 725 });
-		});
-		expect(result.current.streamingState).toBe("analyzing");
-	});
-
-	it("transitions analyzing → streaming on the next text.delta", async () => {
-		const { result } = renderHook(() => useStreamingState(), { wrapper });
-
-		act(() => {
-			result.current.sendMessage("hello");
-		});
-		await act(async () => {});
-
-		act(() => {
-			capturedCallback?.("tool.start", { id: "t1", name: "search" });
-			capturedCallback?.("tool.done", { id: "t1", name: "search", ok: true, ms: 10 });
-		});
-		expect(result.current.streamingState).toBe("analyzing");
-
-		act(() => {
-			capturedCallback?.("text.delta", { text: "Based on that…" });
-		});
-		expect(result.current.streamingState).toBe("streaming");
-	});
-
-	it("transitions analyzing → working when the model calls another tool", async () => {
-		const { result } = renderHook(() => useStreamingState(), { wrapper });
-
-		act(() => {
-			result.current.sendMessage("hello");
-		});
-		await act(async () => {});
-
-		act(() => {
-			capturedCallback?.("tool.start", { id: "t1", name: "search" });
-			capturedCallback?.("tool.done", { id: "t1", name: "search", ok: true, ms: 10 });
-		});
-		expect(result.current.streamingState).toBe("analyzing");
-
-		act(() => {
-			capturedCallback?.("tool.start", { id: "t2", name: "fetch" });
-		});
-		expect(result.current.streamingState).toBe("working");
-	});
-
-	it("transitions to null on done event", async () => {
-		const { result } = renderHook(() => useStreamingState(), { wrapper });
-
-		act(() => {
-			result.current.sendMessage("hello");
-		});
-		await act(async () => {});
-
-		act(() => {
-			capturedCallback?.("text.delta", { text: "Hi" });
-		});
-		expect(result.current.streamingState).toBe("streaming");
-
-		act(() => {
-			capturedCallback?.("done", {
-				conversationId: "c1",
-				response: "Hi",
-			});
-		});
-		expect(result.current.streamingState).toBeNull();
-	});
-
-	it("transitions to null on error event", async () => {
-		const { result } = renderHook(() => useStreamingState(), { wrapper });
-
-		act(() => {
-			result.current.sendMessage("hello");
-		});
-		await act(async () => {});
-
-		expect(result.current.streamingState).toBe("thinking");
-
-		act(() => {
-			capturedCallback?.("error", { error: "fail", message: "fail" });
-		});
-		expect(result.current.streamingState).toBeNull();
-	});
-
-	it("transitions to null in finally after stream resolves", async () => {
-		const { result } = renderHook(() => useStreamingState(), { wrapper });
-
-		act(() => {
-			result.current.sendMessage("hello");
-		});
-		await act(async () => {});
-
-		expect(result.current.streamingState).toBe("thinking");
-
-		// Resolve the stream promise (triggers finally block)
-		await act(async () => {
-			resolveStream?.();
-		});
-
-		expect(result.current.streamingState).toBeNull();
-	});
-
-	it("newConversation resets streamingState to null", async () => {
-		const { result } = renderHook(() => useStreamingState(), { wrapper });
-
-		act(() => {
-			result.current.newConversation();
-		});
-
-		expect(result.current.streamingState).toBeNull();
-	});
-
-	it("full cycle: thinking → streaming → working → analyzing → streaming → null", async () => {
-		const { result } = renderHook(() => useStreamingState(), { wrapper });
-
-		act(() => {
-			result.current.sendMessage("hello");
-		});
-		await act(async () => {});
-		expect(result.current.streamingState).toBe("thinking");
-
-		act(() => {
-			capturedCallback?.("text.delta", { text: "Let me " });
-		});
-		expect(result.current.streamingState).toBe("streaming");
-
-		act(() => {
-			capturedCallback?.("tool.start", { id: "t1", name: "lookup" });
-		});
-		expect(result.current.streamingState).toBe("working");
-
-		act(() => {
-			capturedCallback?.("tool.done", { id: "t1", name: "lookup", ok: true, ms: 50 });
-		});
-		expect(result.current.streamingState).toBe("analyzing");
-
-		act(() => {
-			capturedCallback?.("text.delta", { text: "here you go" });
-		});
-		expect(result.current.streamingState).toBe("streaming");
-
-		act(() => {
-			capturedCallback?.("done", {
-				conversationId: "c1",
-				response: "Let me here you go",
-			});
-		});
-		expect(result.current.streamingState).toBeNull();
-
-		// Resolve the stream so the finally block runs
-		await act(async () => {
-			resolveStream?.();
-		});
-		expect(result.current.streamingState).toBeNull();
-	});
+  beforeEach(() => {
+    capturedOnEvent = null;
+    seq = 0;
+  });
+
+  it("starts as null", () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+    expect(result.current.streamingState).toBeNull();
+  });
+
+  it("transitions to thinking when sendMessage is called", async () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+    await act(async () => {
+      await result.current.sendMessage("hello");
+    });
+    expect(result.current.streamingState).toBe("thinking" as StreamingState);
+  });
+
+  it("transitions thinking → streaming on first text.delta", async () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+    await act(async () => {
+      await result.current.sendMessage("hello");
+    });
+    expect(result.current.streamingState).toBe("thinking");
+    act(() => emit("text.delta", { text: "Hi" }));
+    expect(result.current.streamingState).toBe("streaming");
+  });
+
+  it("transitions streaming → working on tool.start", async () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+    await act(async () => {
+      await result.current.sendMessage("hello");
+    });
+    act(() => emit("text.delta", { text: "Let me check" }));
+    expect(result.current.streamingState).toBe("streaming");
+    act(() => emit("tool.start", { id: "t1", name: "search" }));
+    expect(result.current.streamingState).toBe("working");
+  });
+
+  it("transitions working → analyzing on last tool.done", async () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+    await act(async () => {
+      await result.current.sendMessage("hello");
+    });
+    act(() => emit("text.delta", { text: "x" }));
+    act(() => emit("tool.start", { id: "t1", name: "search" }));
+    expect(result.current.streamingState).toBe("working");
+    act(() => emit("tool.done", { id: "t1", name: "search", ok: true, ms: 100 }));
+    expect(result.current.streamingState).toBe("analyzing");
+  });
+
+  it("holds working while parallel tools are still in flight, then analyzing", async () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+    await act(async () => {
+      await result.current.sendMessage("hello");
+    });
+    act(() => {
+      emit("tool.start", { id: "a", name: "search" });
+      emit("tool.start", { id: "b", name: "fetch" });
+    });
+    expect(result.current.streamingState).toBe("working");
+    act(() => emit("tool.done", { id: "a", name: "search", ok: true, ms: 10 }));
+    expect(result.current.streamingState).toBe("working");
+    act(() => emit("tool.done", { id: "b", name: "fetch", ok: false, ms: 725 }));
+    expect(result.current.streamingState).toBe("analyzing");
+  });
+
+  it("transitions analyzing → streaming on the next text.delta", async () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+    await act(async () => {
+      await result.current.sendMessage("hello");
+    });
+    act(() => {
+      emit("tool.start", { id: "t1", name: "search" });
+      emit("tool.done", { id: "t1", name: "search", ok: true, ms: 10 });
+    });
+    expect(result.current.streamingState).toBe("analyzing");
+    act(() => emit("text.delta", { text: "Based on that…" }));
+    expect(result.current.streamingState).toBe("streaming");
+  });
+
+  it("transitions analyzing → working when the model calls another tool", async () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+    await act(async () => {
+      await result.current.sendMessage("hello");
+    });
+    act(() => {
+      emit("tool.start", { id: "t1", name: "search" });
+      emit("tool.done", { id: "t1", name: "search", ok: true, ms: 10 });
+    });
+    expect(result.current.streamingState).toBe("analyzing");
+    act(() => emit("tool.start", { id: "t2", name: "fetch" }));
+    expect(result.current.streamingState).toBe("working");
+  });
+
+  it("transitions to null on done event", async () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+    await act(async () => {
+      await result.current.sendMessage("hello");
+    });
+    act(() => emit("text.delta", { text: "Hi" }));
+    expect(result.current.streamingState).toBe("streaming");
+    act(() => emit("done", { conversationId: "c1", response: "Hi" }));
+    expect(result.current.streamingState).toBeNull();
+  });
+
+  it("transitions to null on error event", async () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+    await act(async () => {
+      await result.current.sendMessage("hello");
+    });
+    expect(result.current.streamingState).toBe("thinking");
+    act(() => emit("error", { error: "fail", message: "fail" }));
+    expect(result.current.streamingState).toBeNull();
+  });
+
+  it("transitions to null on cancelled event", async () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+    await act(async () => {
+      await result.current.sendMessage("hello");
+    });
+    expect(result.current.streamingState).toBe("thinking");
+    act(() => emit("cancelled", {}));
+    expect(result.current.streamingState).toBeNull();
+  });
+
+  it("newConversation resets streamingState to null", () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+    act(() => {
+      result.current.newConversation();
+    });
+    expect(result.current.streamingState).toBeNull();
+  });
+
+  it("full cycle: thinking → streaming → working → analyzing → streaming → null", async () => {
+    const { result } = renderHook(() => useChatContext(), { wrapper });
+    await act(async () => {
+      await result.current.sendMessage("hello");
+    });
+    expect(result.current.streamingState).toBe("thinking");
+    act(() => emit("text.delta", { text: "Let me " }));
+    expect(result.current.streamingState).toBe("streaming");
+    act(() => emit("tool.start", { id: "t1", name: "lookup" }));
+    expect(result.current.streamingState).toBe("working");
+    act(() => emit("tool.done", { id: "t1", name: "lookup", ok: true, ms: 50 }));
+    expect(result.current.streamingState).toBe("analyzing");
+    act(() => emit("text.delta", { text: "here you go" }));
+    expect(result.current.streamingState).toBe("streaming");
+    act(() => emit("done", { conversationId: "c1", response: "Let me here you go" }));
+    expect(result.current.streamingState).toBeNull();
+  });
 });

From fd7fceacf6485263684ecb67b196f9c97a54f50a Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Mon, 25 May 2026 10:25:43 -0600
Subject: [PATCH 04/26] feat(conversations): live streaming dots + flicker-free
 list
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Per-row streaming indicator: read host-pushed streamingConversationIds
  (useHostContext) and render a pulsing dot on conversations with an in-flight
  turn.
- No more list flicker on updates: data.changed refreshes run in the
  background (no skeleton swap) and only for conversation changes;
  data.changed events from other apps are ignored. The skeleton is still
  shown for the initial load and view switches.
- New conversations appear immediately: ConversationIndex.flushPending() picks
  up a just-created file on the read path instead of racing the fs.watch
  debounce.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 src/bundles/conversations/CHANGELOG.md        | 17 +++++
 src/bundles/conversations/src/index-cache.ts  | 23 +++++++
 src/bundles/conversations/ui/src/App.tsx      |  2 +-
 .../conversations/ui/src/ConversationList.tsx | 16 ++++-
 .../conversations/ui/src/Dashboard.tsx        | 68 ++++++++++++-------
 src/bundles/conversations/ui/src/index.css    | 18 +++++
 src/tools/platform/conversations.ts           |  4 ++
 test/unit/conversations-index-flush.test.ts   | 56 +++++++++++++++
 8 files changed, 178 insertions(+), 26 deletions(-)
 create mode 100644 test/unit/conversations-index-flush.test.ts

diff --git a/src/bundles/conversations/CHANGELOG.md b/src/bundles/conversations/CHANGELOG.md
index cb2721be..ba8315aa 100644
--- a/src/bundles/conversations/CHANGELOG.md
+++ b/src/bundles/conversations/CHANGELOG.md
@@ -1,5 +1,22 @@
 # Changelog
 
+## 0.4.0
+
+### Changed
+
+- List no longer flickers on live updates. `data.changed` refreshes now run in
+  the background (no skeleton swap) and only for conversation changes;
+  `data.changed` events from other apps are ignored. Initial load and view
+  switches still show the skeleton.
+
+## 0.3.0
+
+### Added
+
+- Live streaming indicator: a pulsing dot marks any conversation with an
+  in-flight assistant turn. Driven by host-pushed `streamingConversationIds`
+  (`useHostContext`), so it reflects real-time tab state without polling.
+
 ## 0.2.0
 
 **Breaking — tool output shape.** The bundle now returns a display-oriented
diff --git a/src/bundles/conversations/src/index-cache.ts b/src/bundles/conversations/src/index-cache.ts
index c937e2dd..cb4d7d30 100644
--- a/src/bundles/conversations/src/index-cache.ts
+++ b/src/bundles/conversations/src/index-cache.ts
@@ -105,6 +105,29 @@ export class ConversationIndex {
     });
   }
 
+  /**
+   * Catch the index up immediately instead of waiting for the fs.watch debounce.
+   *
+   * Cancels the pending debounce timer, processes whatever watch events are
+   * already queued, then indexes every conversation file in the directory
+   * that is not in `fileToId` yet (e.g. a just-created conversation whose
+   * watch event has not fired). Read paths call this so a `data.changed`
+   * refresh sees a brand-new conversation without racing the 500ms debounce.
+   */
+  async flushPending(): Promise<void> {
+    const timer = this.debounceTimer;
+    if (timer) {
+      this.debounceTimer = null;
+      clearTimeout(timer);
+    }
+    await this.processPendingFiles();
+    if (!this.dir) return; // no directory to scan
+    for (const filePath of listConversationFiles(this.dir)) {
+      const alreadyIndexed = this.fileToId.has(basename(filePath));
+      if (!alreadyIndexed) await this.indexFile(filePath);
+    }
+  }
+
   /** Stop watching. */
   stopWatching(): void {
     if (this.watcher) {
diff --git a/src/bundles/conversations/ui/src/App.tsx b/src/bundles/conversations/ui/src/App.tsx
index 2b23c1bb..d0e86196 100644
--- a/src/bundles/conversations/ui/src/App.tsx
+++ b/src/bundles/conversations/ui/src/App.tsx
@@ -3,7 +3,7 @@ import { Dashboard } from "./Dashboard";
 
 export function App() {
   return (
-    <SynapseProvider name="@nimblebraininc/conversations" version="0.2.0">
+    <SynapseProvider name="@nimblebraininc/conversations" version="0.4.0">
       <Dashboard />
     </SynapseProvider>
   );
diff --git a/src/bundles/conversations/ui/src/ConversationList.tsx b/src/bundles/conversations/ui/src/ConversationList.tsx
index 8a7f433c..23a9e305 100644
--- a/src/bundles/conversations/ui/src/ConversationList.tsx
+++ b/src/bundles/conversations/ui/src/ConversationList.tsx
@@ -10,6 +10,8 @@ interface Props {
   groups: DateGroup[];
   activeFilter: FilterKey;
   totalConversations: number;
+  /** Conversation ids with an in-flight assistant turn (host-pushed). */
+  streamingIds?: Set<string>;
   onOpen: (id: string) => void;
 }
 
@@ -18,6 +20,7 @@ export function ConversationList({
   groups,
   activeFilter,
   totalConversations,
+  streamingIds,
   onOpen,
 }: Props) {
   if (loading) {
@@ -60,10 +63,21 @@ export function ConversationList({
           {showSectionLabels && <div className="section-label">{group.label}</div>}
           {group.items.map((c) => {
             const title = c.title || c.preview || c.id;
+            const isStreaming = streamingIds?.has(c.id) ?? false;
             return (
               <button type="button" key={c.id} className="conv-item" onClick={() => onOpen(c.id)}>
                 <div className="conv-item-top">
-                  <span className="conv-title">{truncate(title, 80)}</span>
+                  <span className="conv-title">
+                    {isStreaming && (
+                      <span
+                        className="conv-streaming-dot"
+                        role="img"
+                        aria-label="Responding"
+                        title="Responding…"
+                      />
+                    )}
+                    {truncate(title, 80)}
+                  </span>
                   <span className="conv-time">{relativeTime(c.updatedAt || c.createdAt)}</span>
                 </div>
                 {c.preview && <div className="conv-preview">{truncate(c.preview, 120)}</div>}
diff --git a/src/bundles/conversations/ui/src/Dashboard.tsx b/src/bundles/conversations/ui/src/Dashboard.tsx
index bc81de9e..1d597007 100644
--- a/src/bundles/conversations/ui/src/Dashboard.tsx
+++ b/src/bundles/conversations/ui/src/Dashboard.tsx
@@ -1,4 +1,4 @@
-import { useAction, useDataSync, useSynapse } from "@nimblebrain/synapse/react";
+import { useAction, useDataSync, useHostContext, useSynapse } from "@nimblebrain/synapse/react";
 import { useCallback, useEffect, useMemo, useState } from "react";
 import { ConversationList } from "./ConversationList";
 import { groupByDate } from "./dateUtils";
@@ -11,6 +11,13 @@ type View = "list" | "search";
 export function Dashboard() {
   const synapse = useSynapse();
   const action = useAction();
+  // Conversations with an in-flight assistant turn in this tab — pushed by the
+  // host via hostContext. Drives a live per-row streaming indicator.
+  const { streamingConversationIds } = useHostContext<{ streamingConversationIds?: string[] }>();
+  const streamingIds = useMemo(
+    () => new Set(streamingConversationIds ?? []),
+    [streamingConversationIds],
+  );
 
   const [view, setView] = useState<View>("list");
   const [conversations, setConversations] = useState<ListResult["conversations"]>([]);
@@ -20,29 +27,38 @@ export function Dashboard() {
   const [loading, setLoading] = useState(true);
   const [error, setError] = useState<string | null>(null);
 
-  const loadList = useCallback(async () => {
-    setLoading(true);
-    setError(null);
-    try {
-      const result = await synapse.callTool<Record<string, never>, ListResult>("list", {});
-      if (result.isError) {
-        setError("Failed to load conversations");
-        return;
+  // `background: true` refreshes data in place without flipping to the skeleton
+  // state — used for live data-changed refreshes so the list doesn't flicker.
+  // Rows are keyed by id, so React reconciles the swapped data without a
+  // visible reload. Skeletons are reserved for the initial load + view switches.
+  const loadList = useCallback(
+    async (opts?: { background?: boolean }) => {
+      if (!opts?.background) setLoading(true);
+      setError(null);
+      try {
+        const result = await synapse.callTool<Record<string, never>, ListResult>("list", {});
+        if (result.isError) {
+          setError("Failed to load conversations");
+          return;
+        }
+        setConversations(result.data.conversations || []);
+      } catch (err) {
+        setError(err instanceof Error ? err.message : "Failed to load conversations");
+      } finally {
+        if (!opts?.background) setLoading(false);
       }
-      setConversations(result.data.conversations || []);
-    } catch (err) {
-      setError(err instanceof Error ? err.message : "Failed to load conversations");
-    } finally {
-      setLoading(false);
-    }
-  }, [synapse]);
+    },
+    [synapse],
+  );
 
   const runSearch = useCallback(
-    async (query: string) => {
+    async (query: string, opts?: { background?: boolean }) => {
       setView("search");
       setSearchQuery(query);
-      setSearchResults(null);
-      setLoading(true);
+      if (!opts?.background) {
+        setSearchResults(null);
+        setLoading(true);
+      }
       setError(null);
       try {
         const result = await synapse.callTool<{ query: string }, SearchResultData>("search", {
@@ -56,7 +72,7 @@ export function Dashboard() {
       } catch (err) {
         setError(err instanceof Error ? err.message : "Search failed");
       } finally {
-        setLoading(false);
+        if (!opts?.background) setLoading(false);
       }
     },
     [synapse],
@@ -67,12 +83,15 @@ export function Dashboard() {
     loadList();
   }, [loadList]);
 
-  // Reload list/search on host data-changed broadcasts.
-  useDataSync(() => {
+  // Refresh on host data-changed broadcasts — but only for conversation
+  // changes (ignore unrelated apps' data.changed), and in the background so
+  // the list updates in place without a skeleton flicker.
+  useDataSync((event) => {
+    if (event.server !== "conversations") return;
     if (view === "list") {
-      loadList();
+      loadList({ background: true });
     } else if (view === "search" && searchQuery) {
-      runSearch(searchQuery);
+      runSearch(searchQuery, { background: true });
     }
   });
 
@@ -155,6 +174,7 @@ export function Dashboard() {
             groups={groups}
             activeFilter={activeFilter}
             totalConversations={conversations.length}
+            streamingIds={streamingIds}
             onOpen={handleOpenConversation}
           />
         )}
diff --git a/src/bundles/conversations/ui/src/index.css b/src/bundles/conversations/ui/src/index.css
index 7c5f4143..712cc7d2 100644
--- a/src/bundles/conversations/ui/src/index.css
+++ b/src/bundles/conversations/ui/src/index.css
@@ -189,6 +189,24 @@ body {
   color: var(--color-text-secondary, #737373);
   flex-shrink: 0;
 }
+/* Live indicator: a conversation with an in-flight assistant turn. */
+.conv-streaming-dot {
+  display: inline-block;
+  width: 7px;
+  height: 7px;
+  margin-right: 7px;
+  border-radius: 50%;
+  background: var(--color-text-accent, #0055ff);
+  vertical-align: middle;
+  animation: conv-streaming-pulse 1.2s ease-in-out infinite;
+}
+@keyframes conv-streaming-pulse {
+  0%, 100% { opacity: 1; transform: scale(1); }
+  50% { opacity: 0.4; transform: scale(0.7); }
+}
+@media (prefers-reduced-motion: reduce) {
+  .conv-streaming-dot { animation: none; }
+}
 .conv-preview {
   margin-top: 4px; font-size: 13px;
   color: var(--color-text-secondary, #737373);
diff --git a/src/tools/platform/conversations.ts b/src/tools/platform/conversations.ts
index ae431f99..78f9e643 100644
--- a/src/tools/platform/conversations.ts
+++ b/src/tools/platform/conversations.ts
@@ -61,6 +61,10 @@ export async function createConversationsSource(
       await cachedIndex.build(dir);
       cachedIndex.startWatching(dir);
     }
+    // Pick up brand-new conversations deterministically rather than racing the
+    // fs.watch debounce — a `data.changed` refresh fires the instant a turn
+    // starts, before the watch has re-indexed the new file.
+    await cachedIndex.flushPending();
     return { index: cachedIndex, dir };
   }
 
diff --git a/test/unit/conversations-index-flush.test.ts b/test/unit/conversations-index-flush.test.ts
new file mode 100644
index 00000000..1750e700
--- /dev/null
+++ b/test/unit/conversations-index-flush.test.ts
@@ -0,0 +1,56 @@
+import { afterEach, beforeEach, describe, expect, it } from "bun:test";
+import { mkdirSync, rmSync, writeFileSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import { ConversationIndex } from "../../src/bundles/conversations/src/index-cache.ts";
+
+// flushPending() must surface a brand-new conversation deterministically —
+// the conversations-list refresh fires the instant a turn starts, before the
+// fs.watch debounce re-indexes the new file (the "new conversation doesn't
+// show up" bug).
+
+function writeConversation(dir: string, id: string): void {
+  // Fixture: `<dir>/<id>.jsonl` holding a metadata line, then one user message line.
+  const at = "2025-01-01T00:00:00.000Z";
+  // Property order below is the serialized key order, so keep it stable.
+  const header = { id, ownerId: "usr_test", createdAt: at, updatedAt: at, title: null };
+  const stats = { totalInputTokens: 0, totalOutputTokens: 0, lastModel: null };
+  const message = { role: "user", content: "Hello", timestamp: at };
+  const jsonl = [{ ...header, ...stats }, message]
+    .map((record) => JSON.stringify(record))
+    .map((line) => `${line}\n`)
+    .join("");
+  const target = join(dir, `${id}.jsonl`);
+  writeFileSync(target, jsonl);
+}
+
+describe("ConversationIndex.flushPending", () => {
+  let dir: string;
+  let index: ConversationIndex;
+  // Each test gets its own freshly created temp directory and an index built over it.
+  beforeEach(async () => {
+    dir = join(tmpdir(), `nb-flush-test-${crypto.randomUUID()}`);
+    mkdirSync(dir, { recursive: true });
+    index = new ConversationIndex();
+    await index.build(dir);
+  });
+  // Teardown: stop any watcher first, then remove the temp directory.
+  afterEach(() => {
+    index.stopWatching();
+    rmSync(dir, { recursive: true, force: true });
+  });
+
+  it("picks up a newly written conversation file without waiting for the watch debounce", async () => {
+    expect(index.list().totalCount).toBe(0);
+
+    // A new conversation lands on disk (as runtime.startTurn's store.create does).
+    writeConversation(dir, "conv_brandnew000001");
+    // Without flushing, the in-memory index hasn't seen it yet.
+    expect(index.list().totalCount).toBe(0);
+
+    await index.flushPending();
+    const result = index.list();
+    expect(result.totalCount).toBe(1);
+    expect(result.conversations[0].id).toBe("conv_brandnew000001");
+  });
+});

From 00f424481d7b30facf7dac5a672aea92fc81a052 Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Mon, 25 May 2026 10:47:03 -0600
Subject: [PATCH 05/26] refactor(web): remove old streaming-chat client
 orphaned by the rewrite
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The per-conversation viewer replaced the old streaming path, leaving the
client-side pieces unreferenced:

- client.ts: streamChat / streamChatMultipart / consumeSSEStream (callers
  now use startChatTurn + connectConversationStream).
- conversation-sse.ts and useConversationEvents.ts (the old cross-tab SSE
  hook) — zero importers.

The server `/v1/chat/stream` + handleChatStream stay (still a valid REST
surface, exercised by integration tests). Also comment the one ported
`as unknown as` cast for the done-payload `files` field.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 web/src/api/client.ts                  | 138 ---------------
 web/src/api/conversation-sse.ts        | 235 -------------------------
 web/src/hooks/chat-store.ts            |   2 +
 web/src/hooks/useConversationEvents.ts |  81 ---------
 4 files changed, 2 insertions(+), 454 deletions(-)
 delete mode 100644 web/src/api/conversation-sse.ts
 delete mode 100644 web/src/hooks/useConversationEvents.ts

diff --git a/web/src/api/client.ts b/web/src/api/client.ts
index dcfa4e04..f0bb414c 100644
--- a/web/src/api/client.ts
+++ b/web/src/api/client.ts
@@ -5,13 +5,10 @@ import type {
   BootstrapResponse,
   ChatRequest,
   ChatResult,
-  ChatStreamEventMap,
-  ChatStreamEventType,
   HealthInfo,
   PlacementEntry,
   ToolCallResult,
 } from "../types";
-import { getConversationSubscriberId } from "./conversation-sse";
 import { createFetchWithRefresh } from "./fetch-with-refresh";
 
 // ---------------------------------------------------------------------------
@@ -341,141 +338,6 @@ export async function chat(req: ChatRequest): Promise<ChatResult> {
   });
 }
 
-type ChatStreamCallback = <K extends ChatStreamEventType>(
-  type: K,
-  data: ChatStreamEventMap[K],
-) => void;
-
-/** Parse SSE events from a streaming response body. */
-async function consumeSSEStream(res: Response, onEvent: ChatStreamCallback): Promise<void> {
-  const reader = res.body?.getReader();
-  if (!reader) throw new Error("No response body");
-
-  const decoder = new TextDecoder();
-  let buffer = "";
-
-  for (;;) {
-    const { done, value } = await reader.read();
-    if (done) break;
-
-    buffer += decoder.decode(value, { stream: true });
-    const lines = buffer.split("\n");
-    buffer = lines.pop() ?? "";
-
-    let currentEvent = "";
-    for (const line of lines) {
-      if (line.startsWith("event: ")) {
-        currentEvent = line.slice(7).trim();
-      } else if (line.startsWith("data: ") && currentEvent) {
-        try {
-          const data = JSON.parse(line.slice(6));
-          onEvent(currentEvent as ChatStreamEventType, data);
-        } catch {
-          // Skip malformed data lines
-        }
-        currentEvent = "";
-      }
-    }
-  }
-}
-
-/** Streaming chat via SSE. Calls onEvent for each event, resolves when done.
- *  `signal` is for caller-driven cleanup (logout / store reset) — NOT
- *  conversation switching, which keeps the stream alive in the background. */
-export async function streamChat(
-  req: ChatRequest,
-  onEvent: ChatStreamCallback,
-  signal?: AbortSignal,
-): Promise<void> {
-  // If a conv-events SSE subscription is open for this conversation,
-  // pass its server-issued subscriber id so the broadcast suppresses
-  // self-echo. Without this, the sender's own tab double-processes
-  // every event (once via the streamed HTTP response below, once via
-  // its conv-events subscription).
-  const originSubId = req.conversationId
-    ? getConversationSubscriberId(req.conversationId)
-    : undefined;
-  const res = await fetchWithRefresh(`${API_BASE}/v1/chat/stream`, {
-    method: "POST",
-    credentials: "include",
-    headers: headers(originSubId ? { "X-Origin-Subscriber-Id": originSubId } : undefined),
-    body: JSON.stringify(req),
-    ...(signal ? { signal } : {}),
-  });
-
-  if (res.status === 401) {
-    throw new ApiClientError("unauthorized", "Unauthorized", 401);
-  }
-
-  if (!res.ok) {
-    const body: ApiError = await res.json().catch(() => ({
-      error: "unknown",
-      message: res.statusText,
-    }));
-    throw new ApiClientError(body.error, body.message, res.status, body.details);
-  }
-
-  await consumeSSEStream(res, onEvent);
-}
-
-/**
- * Streaming chat via SSE with file attachments (multipart/form-data).
- * When files are present, sends a FormData body instead of JSON.
- * SSE streaming works identically for both content types.
- */
-export async function streamChatMultipart(
-  req: ChatRequest,
-  files: File[],
-  onEvent: ChatStreamCallback,
-  signal?: AbortSignal,
-): Promise<void> {
-  const formData = new FormData();
-  formData.append("message", req.message);
-  if (req.conversationId) formData.append("conversationId", req.conversationId);
-  if (req.model) formData.append("model", req.model);
-  if (req.appContext) formData.append("appContext", JSON.stringify(req.appContext));
-  for (const file of files) {
-    formData.append("files", file, file.name);
-  }
-
-  // Build headers WITHOUT Content-Type — let the browser set multipart boundary
-  const h: Record<string, string> = {};
-  if (authToken && authToken !== "__cookie__") {
-    h.Authorization = `Bearer ${authToken}`;
-  }
-  if (activeWorkspaceId) {
-    h["X-Workspace-Id"] = activeWorkspaceId;
-  }
-  // Suppress self-echo on the conv-events subscription — see
-  // `streamChat` above for why this matters.
-  if (req.conversationId) {
-    const originSubId = getConversationSubscriberId(req.conversationId);
-    if (originSubId) h["X-Origin-Subscriber-Id"] = originSubId;
-  }
-
-  const res = await fetchWithRefresh(`${API_BASE}/v1/chat/stream`, {
-    method: "POST",
-    credentials: "include",
-    headers: h,
-    body: formData,
-    ...(signal ? { signal } : {}),
-  });
-
-  if (res.status === 401) {
-    throw new ApiClientError("unauthorized", "Unauthorized", 401);
-  }
-
-  if (!res.ok) {
-    const body: ApiError = await res.json().catch(() => ({
-      error: "unknown",
-      message: res.statusText,
-    }));
-    throw new ApiClientError(body.error, body.message, res.status, body.details);
-  }
-
-  await consumeSSEStream(res, onEvent);
-}
-
 /**
  * Start a server-authoritative turn. Returns the conversation id immediately;
  * the turn runs to completion on the server regardless of this client. Watch
diff --git a/web/src/api/conversation-sse.ts b/web/src/api/conversation-sse.ts
deleted file mode 100644
index fed65f27..00000000
--- a/web/src/api/conversation-sse.ts
+++ /dev/null
@@ -1,235 +0,0 @@
-/**
- * Per-conversation SSE client.
- *
- * Connects to GET /v1/conversations/:id/events to receive real-time
- * chat events from other participants in a shared conversation.
- *
- * Same pattern as sse.ts (fetch + ReadableStream for custom auth headers).
- * Auto-reconnects with exponential backoff. On reconnect, calls onReconnect
- * so the caller can reload the full conversation to catch missed messages.
- */
-
-import { refreshSession } from "./client";
-
-/**
- * Per-conversation `subscriberId` registry.
- *
- * The server-issued subscriber id arrives in the first SSE frame
- * (`event: subscribed`) once a conversation event stream opens. We
- * stash it here so the chat-stream POST path can pick it up via
- * `getConversationSubscriberId(convId)` and forward it as
- * `X-Origin-Subscriber-Id` — that makes the broadcast skip this
- * tab's own conv-events subscription and prevents the sender from
- * double-handling every event (once via the chat-stream HTTP
- * response, once via the broadcast hitting its own subscription).
- *
- * Cleared on stream cancel / close to avoid stale ids leaking into
- * a future stream attempt for the same conv.
- */
-const conversationSubscriberIds = new Map<string, string>();
-
-export function getConversationSubscriberId(conversationId: string): string | undefined {
-  return conversationSubscriberIds.get(conversationId);
-}
-
-function setConversationSubscriberId(conversationId: string, subscriberId: string): void {
-  conversationSubscriberIds.set(conversationId, subscriberId);
-}
-
-function clearConversationSubscriberId(conversationId: string): void {
-  conversationSubscriberIds.delete(conversationId);
-}
-
-/** Options for connecting to a conversation event stream. */
-export interface ConversationSseOptions {
-  conversationId: string;
-  /** Base URL. Defaults to empty string (same-origin). */
-  apiBase?: string;
-  /** Bearer token for authorization. */
-  token?: string;
-  /** Called when an SSE event is received. */
-  onEvent: (type: string, data: unknown) => void;
-  /** Called on successful reconnection (caller should reload conversation). */
-  onReconnect?: () => void;
-  /** Called when the connection is lost (before reconnect). */
-  onDisconnect?: () => void;
-  /** Called on unrecoverable error (e.g. 403 after participant removal). */
-  onError?: (error: Error) => void;
-}
-
-/** Handle to close the conversation SSE connection. */
-export interface ConversationSseConnection {
-  close(): void;
-}
-
-const INITIAL_BACKOFF_MS = 1_000;
-const MAX_BACKOFF_MS = 30_000;
-const BACKOFF_MULTIPLIER = 2;
-
-export function connectConversationEvents(
-  options: ConversationSseOptions,
-): ConversationSseConnection {
-  const {
-    conversationId,
-    apiBase = "",
-    token,
-    onEvent,
-    onReconnect,
-    onDisconnect,
-    onError,
-  } = options;
-
-  let closed = false;
-  let abortController: AbortController | null = null;
-  let reconnectTimer: ReturnType<typeof setTimeout> | null = null;
-  let backoff = INITIAL_BACKOFF_MS;
-  let hasConnectedBefore = false;
-
-  async function connect(): Promise<void> {
-    if (closed) return;
-
-    abortController = new AbortController();
-    const hdrs: Record<string, string> = {};
-    if (token && token !== "__cookie__") {
-      hdrs.Authorization = `Bearer ${token}`;
-    }
-
-    try {
-      const res = await fetch(
-        `${apiBase}/v1/conversations/${encodeURIComponent(conversationId)}/events`,
-        {
-          headers: hdrs,
-          credentials: "include",
-          signal: abortController.signal,
-        },
-      );
-
-      if (res.status === 401) {
-        // Attempt silent token refresh before giving up
-        const refreshed = await refreshSession();
-        if (refreshed) {
-          scheduleReconnect();
-          return;
-        }
-        onError?.(new Error("Conversation SSE auth failed after token refresh"));
-        return;
-      }
-
-      if (!res.ok) {
-        // 403/404 = access denied or removed — don't reconnect
-        if (res.status === 403 || res.status === 404) {
-          onError?.(new Error(`Conversation access denied: ${res.status}`));
-          return;
-        }
-        throw new Error(`Conversation SSE failed: ${res.status} ${res.statusText}`);
-      }
-
-      // Connected successfully — reset backoff
-      backoff = INITIAL_BACKOFF_MS;
-
-      // If this is a reconnect, notify so caller can reload missed messages
-      if (hasConnectedBefore) {
-        onReconnect?.();
-      }
-      hasConnectedBefore = true;
-
-      const reader = res.body?.getReader();
-      if (!reader) throw new Error("No response body");
-
-      const decoder = new TextDecoder();
-      let buffer = "";
-
-      for (;;) {
-        const { done, value } = await reader.read();
-        if (done || closed) break;
-
-        buffer += decoder.decode(value, { stream: true });
-        const lines = buffer.split("\n");
-        buffer = lines.pop() ?? "";
-
-        let currentEvent = "";
-        for (const line of lines) {
-          if (line.startsWith("event: ")) {
-            currentEvent = line.slice(7).trim();
-          } else if (line.startsWith("data: ") && currentEvent) {
-            try {
-              const data = JSON.parse(line.slice(6));
-              if (currentEvent === "subscribed") {
-                // Server-issued subscriber id — record it so the
-                // chat-stream POST can suppress self-echo. We
-                // deliberately don't surface this event to onEvent;
-                // it's plumbing, not a chat event.
-                const subscriberId = (data as { subscriberId?: unknown })?.subscriberId;
-                if (typeof subscriberId === "string") {
-                  setConversationSubscriberId(conversationId, subscriberId);
-                }
-              } else {
-                onEvent(currentEvent, data);
-              }
-            } catch {
-              // Skip malformed data lines
-            }
-            currentEvent = "";
-          }
-        }
-      }
-
-      // Stream ended — reconnect unless closed
-      if (!closed) {
-        onDisconnect?.();
-        scheduleReconnect();
-      }
-    } catch (err) {
-      if (closed) return;
-      if (err instanceof DOMException && err.name === "AbortError") return;
-
-      onDisconnect?.();
-
-      // 403 is unrecoverable (access denied). 401 — try refresh first.
-      if (err instanceof Error && err.message.includes("401")) {
-        const refreshed = await refreshSession();
-        if (refreshed) {
-          scheduleReconnect();
-          return;
-        }
-        onError?.(err);
-        return;
-      }
-      if (err instanceof Error && err.message.includes("403")) {
-        onError?.(err);
-        return;
-      }
-
-      scheduleReconnect();
-    }
-  }
-
-  function scheduleReconnect(): void {
-    if (closed) return;
-    reconnectTimer = setTimeout(() => {
-      backoff = Math.min(backoff * BACKOFF_MULTIPLIER, MAX_BACKOFF_MS);
-      connect();
-    }, backoff);
-  }
-
-  connect();
-
-  return {
-    close() {
-      closed = true;
-      if (reconnectTimer) {
-        clearTimeout(reconnectTimer);
-        reconnectTimer = null;
-      }
-      if (abortController) {
-        abortController.abort();
-        abortController = null;
-      }
-      // Drop the cached subscriber id — the next subscription gets a
-      // fresh server-issued id, so a stale entry would mislead the
-      // chat-stream POST into excluding a subscriber that no longer
-      // exists.
-      clearConversationSubscriberId(conversationId);
-    },
-  };
-}
diff --git a/web/src/hooks/chat-store.ts b/web/src/hooks/chat-store.ts
index 0d5a4ca2..1622e488 100644
--- a/web/src/hooks/chat-store.ts
+++ b/web/src/hooks/chat-store.ts
@@ -645,6 +645,8 @@ export function createChatStore(): ChatStore {
               llmMs: result.usage.llmMs,
             }
           : undefined;
+        // Cast: `files` is attached to the done payload by the server but isn't
+        // on the typed ChatResult — read it defensively.
         const resultFiles = (result as unknown as Record<string, unknown>).files as
           | MessageFileAttachment[]
           | undefined;
diff --git a/web/src/hooks/useConversationEvents.ts b/web/src/hooks/useConversationEvents.ts
deleted file mode 100644
index d701b820..00000000
--- a/web/src/hooks/useConversationEvents.ts
+++ /dev/null
@@ -1,81 +0,0 @@
-/**
- * React hook for subscribing to per-conversation SSE events.
- *
- * Stage 1: conversations are single-owner; the broadcast still fires
- * server-side so this subscription is the same-user cross-tab sync
- * path (one user, multiple browser tabs/devices on the same
- * conversation). Stage 4 reintroduces multi-user sharing and this
- * hook's audience widens.
- *
- * Disconnects on cleanup or when the conversation changes. On
- * reconnect, triggers a full conversation reload to catch missed
- * messages.
- */
-
-import { useEffect, useRef } from "react";
-import { getAuthToken } from "../api/client";
-import { type ConversationSseConnection, connectConversationEvents } from "../api/conversation-sse";
-
-export interface ConversationEventCallbacks {
-  /** A user message arrived from another participant. */
-  onRemoteUserMessage: (data: {
-    userId: string;
-    displayName: string;
-    content: string;
-    timestamp: string;
-  }) => void;
-  /** A streaming event arrived from the assistant (responding to another user's message). */
-  onRemoteStreamEvent: (type: string, data: unknown) => void;
-  /** Connection was re-established — reload the conversation to catch missed messages. */
-  onReconnect: () => void;
-}
-
-export function useConversationEvents(
-  conversationId: string | null,
-  callbacks: ConversationEventCallbacks,
-): void {
-  // Keep callbacks in a ref so we don't reconnect on every render
-  const callbacksRef = useRef(callbacks);
-  callbacksRef.current = callbacks;
-
-  useEffect(() => {
-    // Subscribe whenever a conversation is open — same-user cross-tab
-    // sync (and, post-Stage-4, multi-user sharing).
-    if (!conversationId) return;
-
-    const token = getAuthToken();
-    let connection: ConversationSseConnection | null = null;
-
-    connection = connectConversationEvents({
-      conversationId,
-      token: token ?? undefined,
-      onEvent: (type, data) => {
-        if (type === "user.message") {
-          callbacksRef.current.onRemoteUserMessage(
-            data as {
-              userId: string;
-              displayName: string;
-              content: string;
-              timestamp: string;
-            },
-          );
-        } else if (type === "heartbeat") {
-          // Ignore heartbeats
-        } else {
-          // text.delta, tool.start, tool.done, llm.done, done
-          callbacksRef.current.onRemoteStreamEvent(type, data);
-        }
-      },
-      onReconnect: () => {
-        callbacksRef.current.onReconnect();
-      },
-      onError: (err) => {
-        console.warn("[conversation-sse] Error:", err.message);
-      },
-    });
-
-    return () => {
-      connection?.close();
-    };
-  }, [conversationId]);
-}

From a86bafdced44fa9b77067acd12980fefe1c94717 Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Mon, 25 May 2026 10:58:49 -0600
Subject: [PATCH 06/26] test(conversations): fix auto-title detection after
 #253 prompt change

The capturing-model test helper skipped auto-title model calls by matching
the old prompt string ("Generate a 3-6 word title"). The #253 rework changed
the title system prompt, so the guard stopped recognizing title calls and they
polluted the captured chat system prompt. Match the new prompt instead.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 test/integration/appcontext-wiring.test.ts   | 2 +-
 test/integration/dependency-checking.test.ts | 2 +-
 test/integration/runtime.test.ts             | 2 +-
 test/integration/skill-lifecycle.test.ts     | 2 +-
 4 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/test/integration/appcontext-wiring.test.ts b/test/integration/appcontext-wiring.test.ts
index ea1d5b0f..480eeeab 100644
--- a/test/integration/appcontext-wiring.test.ts
+++ b/test/integration/appcontext-wiring.test.ts
@@ -13,7 +13,7 @@ function createCapturingModel() {
 		const systemMsg = options.prompt.find((m) => m.role === "system");
 		if (systemMsg && typeof systemMsg.content === "string") {
 			// Skip auto-title calls
-			if (!systemMsg.content.includes("Generate a 3-6 word title")) {
+			if (!systemMsg.content.includes("descriptive titles for conversations")) {
 				capturedSystem = systemMsg.content;
 			}
 		}
diff --git a/test/integration/dependency-checking.test.ts b/test/integration/dependency-checking.test.ts
index e62ec72a..6b9ead22 100644
--- a/test/integration/dependency-checking.test.ts
+++ b/test/integration/dependency-checking.test.ts
@@ -21,7 +21,7 @@ function createCapturingModel(): { model: LanguageModelV3; getSystem: () => stri
     const systemMsg = options.prompt.find((m) => m.role === "system");
     if (systemMsg && typeof systemMsg.content === "string") {
       // Skip auto-title calls (they have a short, distinctive system prompt)
-      if (!systemMsg.content.includes("Generate a 3-6 word title")) {
+      if (!systemMsg.content.includes("descriptive titles for conversations")) {
         capturedSystem = systemMsg.content;
       }
     }
diff --git a/test/integration/runtime.test.ts b/test/integration/runtime.test.ts
index 4e831dc2..bd8b78d1 100644
--- a/test/integration/runtime.test.ts
+++ b/test/integration/runtime.test.ts
@@ -217,7 +217,7 @@ I am Nira, your AI assistant. You work at Acme Corp.
       const systemMsg = options.prompt.find((m) => m.role === "system");
       if (systemMsg && typeof systemMsg.content === "string") {
         // Skip auto-title calls
-        if (!systemMsg.content.includes("Generate a 3-6 word title")) {
+        if (!systemMsg.content.includes("descriptive titles for conversations")) {
           capturedSystem = systemMsg.content;
         }
       }
diff --git a/test/integration/skill-lifecycle.test.ts b/test/integration/skill-lifecycle.test.ts
index 98708a10..0f0e93e1 100644
--- a/test/integration/skill-lifecycle.test.ts
+++ b/test/integration/skill-lifecycle.test.ts
@@ -22,7 +22,7 @@ function createCapturingModel(): { model: LanguageModelV3; getSystem: () => stri
 		const systemMsg = options.prompt.find((m) => m.role === "system");
 		if (systemMsg && typeof systemMsg.content === "string") {
 			// Skip auto-title calls (they have a short, distinctive system prompt)
-			if (!systemMsg.content.includes("Generate a 3-6 word title")) {
+			if (!systemMsg.content.includes("descriptive titles for conversations")) {
 				capturedSystem = systemMsg.content;
 			}
 		}

From 9ddfd2e59abccb3407011cc0a7324e2b049ec56e Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Mon, 25 May 2026 10:58:49 -0600
Subject: [PATCH 07/26] fix(adapters): log sinks must not throw into the
 event-emit path
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Detached turns emit events after the originating request ends; if the workdir
is gone (test teardown) or a write otherwise fails (disk full, perms), the
unguarded appendFileSync threw out of emit() as an unhandled error. Wrap the
write in a best-effort try/catch — a failed log line must never crash the
caller.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 src/adapters/structured-log-sink.ts | 8 +++++++-
 src/adapters/workspace-log-sink.ts  | 8 +++++++-
 2 files changed, 14 insertions(+), 2 deletions(-)

diff --git a/src/adapters/structured-log-sink.ts b/src/adapters/structured-log-sink.ts
index 0d37a270..8c10a511 100644
--- a/src/adapters/structured-log-sink.ts
+++ b/src/adapters/structured-log-sink.ts
@@ -92,7 +92,13 @@ export class StructuredLogSink implements EventSink {
   private writeLine(record: Record<string, unknown>): void {
     const today = new Date().toISOString().slice(0, 10); // YYYY-MM-DD
     const filename = `nimblebrain-${today}.jsonl`;
-    appendFileSync(join(this.dir, filename), `${JSON.stringify(record)}\n`);
+    try {
+      appendFileSync(join(this.dir, filename), `${JSON.stringify(record)}\n`);
+    } catch {
+      // Best-effort logging: a write failure (disk full, perms, or a detached
+      // turn emitting after the workdir was torn down) must never throw into
+      // the event-emit path and crash the caller.
+    }
   }
 
   /** Remove log files older than the retention threshold. */
diff --git a/src/adapters/workspace-log-sink.ts b/src/adapters/workspace-log-sink.ts
index 7df6ddd3..a140884d 100644
--- a/src/adapters/workspace-log-sink.ts
+++ b/src/adapters/workspace-log-sink.ts
@@ -64,7 +64,13 @@ export class WorkspaceLogSink implements EventSink {
 
     const today = new Date().toISOString().slice(0, 10); // YYYY-MM-DD
     const filename = `${today}.jsonl`;
-    appendFileSync(join(this.dir, filename), `${JSON.stringify(record)}\n`);
+    try {
+      appendFileSync(join(this.dir, filename), `${JSON.stringify(record)}\n`);
+    } catch {
+      // Best-effort logging: a write failure (disk full, perms, or a detached
+      // turn emitting after the workdir was torn down) must never throw into
+      // the event-emit path and crash the caller.
+    }
   }
 
   /** No-op — kept for API compatibility. Writes are synchronous. */

From 46d775b6f6f750eba79744fe22228433bfa873ad Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Mon, 25 May 2026 11:22:11 -0600
Subject: [PATCH 08/26] fix(runtime): deliver `cancelled` frame to live viewers
 on Stop

RunBus.cancel() flips the run to terminal synchronously, after which publish()
is a no-op. The engine's post-abort `cancelled` publish (startTurn's catch)
therefore never reached the SSE feed (onTurnEvent), so the Stop button aborted
generation but left the UI stuck streaming until a reload. done/error work
because they publish before ending while the run is still active.

Publish `cancelled` in cancelTurn BEFORE RunBus.cancel ends the run. The
engine's later cancelled publish becomes a harmless no-op. Adds a regression
test on the live onTurnEvent path (the attach/onEnd path the old tests used
did not cover this).

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 src/runtime/runtime.ts                 |  7 ++++
 test/integration/detached-turn.test.ts | 54 ++++++++++++++++++++++++++
 2 files changed, 61 insertions(+)

diff --git a/src/runtime/runtime.ts b/src/runtime/runtime.ts
index 96ad3c41..ab3e82b0 100644
--- a/src/runtime/runtime.ts
+++ b/src/runtime/runtime.ts
@@ -776,6 +776,13 @@ export class Runtime {
 
   /** Explicitly cancel an in-flight turn (the Stop button). */
   cancelTurn(conversationId: string): boolean {
+    if (!this.runBus.isActive(conversationId)) return false;
+    // Publish the terminal `cancelled` frame to live viewers BEFORE ending the
+    // run. `RunBus.cancel` flips status to terminal synchronously, after which
+    // `publish` is a no-op — so the engine's own post-abort `cancelled` publish
+    // (in startTurn's catch) never reaches the SSE. Without this, the Stop
+    // button aborts generation but the UI stays stuck streaming until a reload.
+    this.publishTurnEvent(conversationId, "cancelled", {});
     return this.runBus.cancel(conversationId);
   }
 
diff --git a/test/integration/detached-turn.test.ts b/test/integration/detached-turn.test.ts
index fe82e500..7cc1bf3e 100644
--- a/test/integration/detached-turn.test.ts
+++ b/test/integration/detached-turn.test.ts
@@ -6,6 +6,7 @@ import { EventSourcedConversationStore } from "../../src/conversation/event-sour
 import { Runtime } from "../../src/runtime/runtime.ts";
 import type { BufferedRunEvent, RunStatus } from "../../src/runtime/run-bus.ts";
 import { createEchoModel } from "../helpers/echo-model.ts";
+import { createMockModel } from "../helpers/mock-model.ts";
 import { TEST_WORKSPACE_ID, provisionTestWorkspace } from "../helpers/test-workspace.ts";
 
 let runtime: Runtime;
@@ -97,3 +98,56 @@ describe("detached turns (server-authoritative streaming)", () => {
     await awaitTurn(conversationId);
   });
 });
+
+describe("cancel delivers a terminal frame to live viewers (Stop button)", () => {
+  let rt: Runtime;
+  const dir = join(tmpdir(), `nimblebrain-cancel-${Date.now()}`);
+  // Gate the model so the turn stays active until we cancel it mid-run.
+  let release!: () => void;
+  const gate = new Promise<void>((r) => {
+    release = r;
+  });
+
+  beforeAll(async () => {
+    mkdirSync(dir, { recursive: true });
+    rt = await Runtime.start({
+      model: {
+        provider: "custom",
+        adapter: createMockModel(async () => {
+          await gate;
+          return { content: [{ type: "text", text: "unreached" }] };
+        }),
+      },
+      noDefaultBundles: true,
+      logging: { disabled: true },
+      workDir: dir,
+    });
+    await provisionTestWorkspace(rt);
+  });
+
+  afterAll(async () => {
+    release(); // let the gated engine task unwind before shutdown
+    await rt.shutdown();
+    rmSync(dir, { recursive: true, force: true });
+  });
+
+  it("publishes `cancelled` on the live onTurnEvent path (not just RunBus onEnd)", async () => {
+    // Capture the SSE feed path: server.ts wires runtime.onTurnEvent →
+    // ConversationEventManager. This is the channel the bug bypassed.
+    const captured: BufferedRunEvent[] = [];
+    rt.onTurnEvent = (_cid, e) => captured.push(e);
+
+    const { conversationId } = await rt.startTurn({
+      message: "hang",
+      workspaceId: TEST_WORKSPACE_ID,
+    });
+    await waitFor(() => rt.isTurnActive(conversationId));
+
+    const ok = rt.cancelTurn(conversationId);
+    expect(ok).toBe(true);
+    // The terminal frame must reach live viewers — RunBus.cancel ends the run
+    // synchronously, so publishing after it (engine's catch) would no-op.
+    expect(captured.some((e) => e.type === "cancelled")).toBe(true);
+    expect(rt.isTurnActive(conversationId)).toBe(false);
+  });
+});

From f2c0c33bc7cc48c92829605d6ac92072c80091dc Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Mon, 25 May 2026 11:25:16 -0600
Subject: [PATCH 09/26] fix(api): map ConversationCorruptedError to 422 in
 handleChatStart
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

startTurn → store.load throws ConversationCorruptedError for a pre-migration
(ownerless) conversation on the resume path, but handleChatStart let it fall
through to a raw 500. handleChat and handleChatCancel both already map it to
422 via conversationCorruptedResponse — match them. Adds an HTTP test
asserting /v1/chat/start on an ownerless conversation returns 422.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 src/api/handlers.ts                         |  6 ++++
 test/integration/detached-turn-http.test.ts | 31 ++++++++++++++++++++-
 2 files changed, 36 insertions(+), 1 deletion(-)

diff --git a/src/api/handlers.ts b/src/api/handlers.ts
index 26dfede0..686bf991 100644
--- a/src/api/handlers.ts
+++ b/src/api/handlers.ts
@@ -173,6 +173,12 @@ export async function handleChatStart(
         { conversationId: parsed.conversationId },
       );
     }
+    // startTurn → store.load can throw on a pre-migration (ownerless)
+    // conversation. Map to 422 — parity with handleChat / handleChatCancel —
+    // instead of leaking a raw 500.
+    if (err instanceof ConversationCorruptedError) {
+      return conversationCorruptedResponse(err);
+    }
     throw err;
   }
 }
diff --git a/test/integration/detached-turn-http.test.ts b/test/integration/detached-turn-http.test.ts
index c79d52ee..95645623 100644
--- a/test/integration/detached-turn-http.test.ts
+++ b/test/integration/detached-turn-http.test.ts
@@ -1,5 +1,5 @@
 import { afterAll, beforeAll, describe, expect, it } from "bun:test";
-import { mkdirSync, rmSync } from "node:fs";
+import { mkdirSync, rmSync, writeFileSync } from "node:fs";
 import { tmpdir } from "node:os";
 import { join } from "node:path";
 import { type ServerHandle, startServer } from "../../src/api/server.ts";
@@ -117,4 +117,33 @@ describe("detached turn HTTP surface", () => {
     });
     expect(res.status).toBe(404);
   });
+
+  it("start on a pre-migration (ownerless) conversation is 422, not 500", async () => {
+    // Seed a corrupted conversation: line-1 metadata without ownerId makes the
+    // store throw ConversationCorruptedError on load (the resume path).
+    const convId = "conv_dead00000000beef"; // conv_ + 16 hex
+    const convDir = join(testDir, "conversations");
+    mkdirSync(convDir, { recursive: true });
+    const meta = JSON.stringify({
+      id: convId,
+      createdAt: "2025-01-01T00:00:00.000Z",
+      updatedAt: "2025-01-01T00:00:00.000Z",
+      title: null,
+      format: "events",
+    });
+    writeFileSync(join(convDir, `${convId}.jsonl`), `${meta}\n`);
+
+    const res = await fetch(`${baseUrl}/v1/chat/start`, {
+      method: "POST",
+      headers: { "Content-Type": "application/json", "X-Workspace-Id": TEST_WORKSPACE_ID },
+      body: JSON.stringify({
+        message: "resume corrupt",
+        conversationId: convId,
+        workspaceId: TEST_WORKSPACE_ID,
+      }),
+    });
+    expect(res.status).toBe(422);
+    const body = await res.json();
+    expect(body.error).toBe("conversation_corrupted");
+  });
 });

From 66210e108ac14e276dd5db1b35ca7d74af6c739b Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Mon, 25 May 2026 11:38:51 -0600
Subject: [PATCH 10/26] fix(runtime): serialize startTurn create to prevent a
 double-create race
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Two concurrent starts with the same not-yet-existing conversationId could both
load()->null then both create({id}) — and create is a truncating writeFile with
no exists-guard, so the loser would clobber the winner's in-progress file.
runBus.begin serializes the run, but it ran AFTER create, too late to help.

For a provided id, reserve the run (begin) BEFORE touching storage: the loser
now throws RunInProgressError before it can create. On any load/create failure
we evict to release the reservation so a failed start can't leave the id stuck
"running". Adds a regression test (delayed load forces the window; asserts
create runs exactly once).

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 src/runtime/runtime.ts                 | 33 +++++++++++++++------
 test/integration/detached-turn.test.ts | 41 +++++++++++++++++++++++++-
 2 files changed, 64 insertions(+), 10 deletions(-)

diff --git a/src/runtime/runtime.ts b/src/runtime/runtime.ts
index ab3e82b0..6350cfe6 100644
--- a/src/runtime/runtime.ts
+++ b/src/runtime/runtime.ts
@@ -807,23 +807,38 @@ export class Runtime {
       ...(request.metadata ? { metadata: request.metadata } : {}),
     };
 
+    // Reserve the run (throws RunInProgressError if one is already active). The
+    // returned signal is the RunBus's — NOT the HTTP request's — so a client
+    // disconnect won't abort generation.
+    //
+    // For a provided id we begin BEFORE touching storage: `begin` is the
+    // serialization point, so a concurrent start with the same id is rejected
+    // here instead of both racing load()->null->create() and clobbering the
+    // file (create is a truncating writeFile with no exists-guard). On any
+    // load/create failure we `evict` to release the reservation — otherwise a
+    // failed start would leave the id stuck "running" and block future turns.
+    // A fresh conversation has no id until create(), so that path begins after.
     const isNew = !request.conversationId;
     let conversationId: string;
+    let signal: AbortSignal;
     if (request.conversationId) {
-      const existing = await store.load(request.conversationId);
-      if (existing && existing.ownerId !== ownerId) {
-        throw new ConversationAccessDeniedError(request.conversationId, ownerId);
+      signal = this.runBus.begin(request.conversationId);
+      try {
+        const existing = await store.load(request.conversationId);
+        if (existing && existing.ownerId !== ownerId) {
+          throw new ConversationAccessDeniedError(request.conversationId, ownerId);
+        }
+        conversationId =
+          existing?.id ?? (await store.create({ ...createOpts, id: request.conversationId })).id;
+      } catch (err) {
+        this.runBus.evict(request.conversationId);
+        throw err;
       }
-      conversationId =
-        existing?.id ?? (await store.create({ ...createOpts, id: request.conversationId })).id;
     } else {
       conversationId = (await store.create(createOpts)).id;
+      signal = this.runBus.begin(conversationId);
     }
 
-    // Reserve the run (throws if already active). The returned signal is the
-    // RunBus's — NOT the HTTP request's — so client disconnect won't abort.
-    const signal = this.runBus.begin(conversationId);
-
     // Seed the run stream with the user's message so the turn is
     // self-contained: any viewer (sender, other tab, post-refresh) can
     // reconstruct user + assistant from replay alone, no optimistic client
diff --git a/test/integration/detached-turn.test.ts b/test/integration/detached-turn.test.ts
index 7cc1bf3e..c3ccd5b5 100644
--- a/test/integration/detached-turn.test.ts
+++ b/test/integration/detached-turn.test.ts
@@ -1,8 +1,10 @@
-import { afterAll, beforeAll, describe, expect, it } from "bun:test";
+import { afterAll, beforeAll, describe, expect, it, spyOn } from "bun:test";
 import { mkdirSync, rmSync } from "node:fs";
 import { tmpdir } from "node:os";
 import { join } from "node:path";
 import { EventSourcedConversationStore } from "../../src/conversation/event-sourced-store.ts";
+import type { ConversationAccessContext } from "../../src/conversation/types.ts";
+import { RunInProgressError } from "../../src/runtime/errors.ts";
 import { Runtime } from "../../src/runtime/runtime.ts";
 import type { BufferedRunEvent, RunStatus } from "../../src/runtime/run-bus.ts";
 import { createEchoModel } from "../helpers/echo-model.ts";
@@ -82,6 +84,43 @@ describe("detached turns (server-authoritative streaming)", () => {
     expect(events.length).toBeGreaterThan(0);
   });
 
+  it("does not double-create on concurrent starts with the same provided id", async () => {
+    // Force both starts into the load→create window by delaying load. With the
+    // race fix (begin before storage), the loser's begin throws before it can
+    // create — so create runs exactly once. Without it, both create and the
+    // loser's truncating writeFile would clobber the winner's file.
+    const proto = EventSourcedConversationStore.prototype;
+    const realLoad = proto.load;
+    const loadSpy = spyOn(proto, "load").mockImplementation(async function (
+      this: EventSourcedConversationStore,
+      id: string,
+      access?: ConversationAccessContext,
+    ) {
+      await new Promise((r) => setTimeout(r, 25));
+      return realLoad.call(this, id, access);
+    });
+    const createSpy = spyOn(proto, "create");
+    try {
+      const id = "conv_face0000face0001"; // conv_ + 16 hex, not yet on disk
+      const results = await Promise.allSettled([
+        runtime.startTurn({ message: "a", conversationId: id, workspaceId: TEST_WORKSPACE_ID }),
+        runtime.startTurn({ message: "b", conversationId: id, workspaceId: TEST_WORKSPACE_ID }),
+      ]);
+
+      const createsForId = createSpy.mock.calls.filter(
+        (c) => (c[0] as { id?: string })?.id === id,
+      );
+      expect(createsForId.length).toBe(1);
+
+      const rejected = results.filter((r) => r.status === "rejected");
+      expect(rejected.length).toBe(1);
+      expect((rejected[0] as PromiseRejectedResult).reason).toBeInstanceOf(RunInProgressError);
+    } finally {
+      loadSpy.mockRestore();
+      createSpy.mockRestore();
+    }
+  });
+
   it("allows a new turn on the same conversation once idle", async () => {
     const { conversationId } = await runtime.startTurn({
       message: "first",

From 75e01e3a675b6104848ae786205df9a6a5885a44 Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Mon, 25 May 2026 11:53:59 -0600
Subject: [PATCH 11/26] fix(web): clear stuck streaming on reconnect after the
 turn ended
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

connectConversationStream reconnects with backoff up to 30s; RunBus GCs a
terminal turn 30s after it ends. If a turn finishes while a viewer is
disconnected, and the viewer stays disconnected past that grace window, the
reconnect's subscribed{isActive:false} carries no replayed terminal frame — and
the client only reconciled on the first (resume) subscribed frame, so the slice
stayed isStreaming=true until a manual reload.

Reconcile on any subscribed frame: if the server reports no active turn while
the slice still thinks it's streaming, clear the streaming state (the server is
authoritative). A terminal frame still within grace replays right after and
finalizes the content; if GC'd, the partial is kept and a reload fetches the
final — either way the spinner no longer hangs.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 web/src/hooks/chat-store.ts | 19 ++++++++++++++++++-
 web/test/chat-store.test.ts | 18 ++++++++++++++++++
 2 files changed, 36 insertions(+), 1 deletion(-)

diff --git a/web/src/hooks/chat-store.ts b/web/src/hooks/chat-store.ts
index 1622e488..3d1c8119 100644
--- a/web/src/hooks/chat-store.ts
+++ b/web/src/hooks/chat-store.ts
@@ -483,13 +483,30 @@ export function createChatStore(): ChatStore {
             slice.isStreaming = true;
             if (!slice.streamingState) slice.streamingState = "thinking";
             commit(slice);
-          } else if (!slice.isStreaming) {
+            return;
+          }
+          if (!slice.isStreaming) {
             // Nothing in flight and we're not sending — ignore the trailing
             // grace-buffer replay (already in disk history) and detach.
             dropEvents = true;
             closeConnection(slice);
+            return;
           }
         }
+        // Server-authoritative reconcile: the server says no turn is running,
+        // but we still think we're streaming. Happens when a viewer reconnects
+        // after the turn ended while disconnected past the RunBus grace window
+        // — the terminal frame was GC'd, so it will never replay and the spinner
+        // would hang forever. Clear it. A terminal frame still within grace
+        // arrives in the replay that follows and finalizes the content; if it
+        // was GC'd, the slice keeps its last-seen partial (a reload fetches the
+        // final) — either way we stop hanging.
+        if (!info.isActive && slice.isStreaming) {
+          slice.isStreaming = false;
+          slice.streamingState = null;
+          slice.preparingTool = null;
+          commit(slice);
+        }
       },
       onEvent: (type, data) => {
         if (dropEvents) return;
diff --git a/web/test/chat-store.test.ts b/web/test/chat-store.test.ts
index 7f7d455c..dd4a3f24 100644
--- a/web/test/chat-store.test.ts
+++ b/web/test/chat-store.test.ts
@@ -269,6 +269,24 @@ describe("chat-store viewer", () => {
     expect(store.getSnapshot("conv_absent").title).toBeNull();
   });
 
+  it("clears a stuck stream when a reconnect reports the turn already ended", async () => {
+    const store = createChatStore();
+    await store.sendTurn("kA", { text: "a" });
+    const s = latestStream();
+    s.onEvent("chat.start", { conversationId: "A" }, 1);
+    s.onEvent("text.delta", { text: "partial" }, 2);
+    expect(store.getSnapshot("A").isStreaming).toBe(true);
+
+    // Reconnect after the turn ended while disconnected past the grace window:
+    // server says not active and the terminal frame was GC'd (no replay).
+    s.onSubscribed?.({ isActive: false, activeSeq: 0 });
+
+    expect(store.getSnapshot("A").isStreaming).toBe(false);
+    expect(store.getSnapshot("A").streamingState).toBeNull();
+    // Last-seen partial is retained (a reload would fetch the final transcript).
+    expect(lastAssistant(store.getSnapshot("A").messages)?.content).toBe("partial");
+  });
+
   it("does not duplicate a finished turn whose grace-buffer replay still arrives", async () => {
     const store = createChatStore();
     // Disk already has the completed turn.

From 2ce8d73d3c457b2566cffcc9d4ca2e486a4fcbb6 Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Mon, 25 May 2026 12:39:19 -0600
Subject: [PATCH 12/26] fix(conversations): complete a partial disk snapshot on
 resume (no flicker)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

loadConversation reads disk then subscribes. A short turn ending in that window
left a partial snapshot, and onSubscribed hit the drop branch — discarding the
grace-buffer replay that held the full `done`, so the final response only showed
after a reload.

Mark the gap precisely instead of always recombining (which would flicker every
recently-finished conversation on open): the reader flags an assistant turn with
no run.done/run.error as `pending`. On resume the client now branches on it:

- live turn, or pending tail + retained run (activeSeq>0) → trim + apply replay
  (rebuilds the full turn, no duplicate);
- pending tail + run GC'd → refetch the now-complete transcript;
- complete tail → ignore the grace replay (no dup, no flicker — the common
  open-a-recent-conversation path is untouched).

A trailing user message (no assistant yet) also counts as pending. Probe slices
have no messages, so they're unaffected.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 src/bundles/conversations/src/jsonl-reader.ts | 14 ++++++
 .../conversations/jsonl-reader.test.ts        | 47 +++++++++++++++++++
 web/src/hooks/chat-store.ts                   | 46 ++++++++++++++----
 web/test/chat-store.test.ts                   | 41 +++++++++++++++-
 4 files changed, 137 insertions(+), 11 deletions(-)

diff --git a/src/bundles/conversations/src/jsonl-reader.ts b/src/bundles/conversations/src/jsonl-reader.ts
index f15a8ab6..faaf4dcf 100644
--- a/src/bundles/conversations/src/jsonl-reader.ts
+++ b/src/bundles/conversations/src/jsonl-reader.ts
@@ -47,6 +47,13 @@ export interface DisplayMessage {
   files?: DisplayFile[];
   /** Non-"complete" run terminations bubble up here ("max_iterations", "error"). */
   stopReason?: string;
+  /**
+   * True when this assistant turn has no terminal event yet (no run.done /
+   * run.error) — i.e. the run was still in flight when the file was read. Lets
+   * a live viewer tell a partial disk snapshot from a finished turn and decide
+   * whether to reconcile against the server's replay.
+   */
+  pending?: boolean;
 }
 
 export type DisplayBlock =
@@ -452,6 +459,10 @@ function collectRun(
 
   let endTs = events[start]?.ts ?? "";
   let stopReason: string | undefined;
+  // A run is "terminated" only when we see its run.done/run.error. If the loop
+  // runs out of events first, the turn was still in flight when the file was
+  // read → mark the message pending.
+  let terminated = false;
 
   let i = start + 1;
   while (i < events.length) {
@@ -459,12 +470,14 @@ function collectRun(
     if (isRunDone(inner) && inner.runId === runId) {
       endTs = inner.ts;
       stopReason = inner.stopReason;
+      terminated = true;
       i++;
       break;
     }
     if (isRunError(inner) && inner.runId === runId) {
       endTs = inner.ts;
       stopReason = "error";
+      terminated = true;
       i++;
       break;
     }
@@ -588,6 +601,7 @@ function collectRun(
     ...(flatToolCalls.length > 0 ? { toolCalls: flatToolCalls } : {}),
     usage,
     ...(stopReason && stopReason !== "complete" ? { stopReason } : {}),
+    ...(terminated ? {} : { pending: true }),
   };
   return [msg, i];
 }
diff --git a/test/unit/bundles/conversations/jsonl-reader.test.ts b/test/unit/bundles/conversations/jsonl-reader.test.ts
index b322cf44..b3902fec 100644
--- a/test/unit/bundles/conversations/jsonl-reader.test.ts
+++ b/test/unit/bundles/conversations/jsonl-reader.test.ts
@@ -254,6 +254,53 @@ describe("readConversation (event format)", () => {
 		expect(assistant.timestamp).toBe("2025-06-01T00:00:06.000Z");
 	});
 
+	test("flags an in-flight run (no run.done) as pending", async () => {
+		const runId = "run_pending";
+		const lines = [
+			JSON.stringify(eventMeta("conv_pending01")),
+			JSON.stringify({ ts: "2025-06-01T00:00:00.000Z", type: "run.start", runId }),
+			JSON.stringify({
+				ts: "2025-06-01T00:00:01.000Z",
+				type: "llm.response",
+				runId,
+				model: "m1",
+				content: [{ type: "text", text: "partial" }],
+				usage: { inputTokens: 5, outputTokens: 2 },
+				llmMs: 30,
+			}),
+			// No run.done — the run was still in flight when the file was read.
+		];
+		const path = writeTmpFile("conv_pending01.jsonl", lines);
+
+		const result = await readConversation(path);
+		expect(result).not.toBeNull();
+		const asst = result!.messages.at(-1)!;
+		expect(asst.role).toBe("assistant");
+		expect(asst.pending).toBe(true);
+	});
+
+	test("a completed run (run.done) is not pending", async () => {
+		const runId = "run_complete";
+		const lines = [
+			JSON.stringify(eventMeta("conv_complete01")),
+			JSON.stringify({ ts: "2025-06-01T00:00:00.000Z", type: "run.start", runId }),
+			JSON.stringify({
+				ts: "2025-06-01T00:00:01.000Z",
+				type: "llm.response",
+				runId,
+				model: "m1",
+				content: [{ type: "text", text: "done" }],
+				usage: { inputTokens: 5, outputTokens: 2 },
+				llmMs: 30,
+			}),
+			JSON.stringify({ ts: "2025-06-01T00:00:02.000Z", type: "run.done", runId, stopReason: "complete" }),
+		];
+		const path = writeTmpFile("conv_complete01.jsonl", lines);
+
+		const result = await readConversation(path);
+		expect(result!.messages.at(-1)!.pending).toBeUndefined();
+	});
+
 	test("sets status='error' and isError=true for a failed tool call", async () => {
 		const runId = "run_b";
 		const lines = [
diff --git a/web/src/hooks/chat-store.ts b/web/src/hooks/chat-store.ts
index 3d1c8119..429d0445 100644
--- a/web/src/hooks/chat-store.ts
+++ b/web/src/hooks/chat-store.ts
@@ -102,6 +102,9 @@ export interface ChatMessage {
   userId?: string;
   files?: MessageFileAttachment[];
   stopReason?: string;
+  /** Loaded-from-disk turn with no terminal event yet (run still in flight when
+   *  read). Drives the resume reconcile — a partial snapshot vs a finished turn. */
+  pending?: boolean;
   error?: string;
   usage?: {
     inputTokens: number;
@@ -450,6 +453,15 @@ export function createChatStore(): ChatStore {
     }
   }
 
+  /** True when the loaded disk tail is an unfinished turn — a trailing user
+   *  message (no assistant yet) or an assistant flagged `pending` (read before
+   *  its run.done). Distinguishes a partial snapshot from a finished turn. */
+  function hasPendingTail(slice: ConversationSlice): boolean {
+    const last = slice.messages[slice.messages.length - 1];
+    if (!last) return false;
+    return last.role === "user" || last.pending === true;
+  }
+
   // -- subscription --
 
   function closeConnection(slice: ConversationSlice): void {
@@ -472,22 +484,36 @@ export function createChatStore(): ChatStore {
       onSubscribed: (info) => {
         if (slice.resumeOnSubscribe) {
           slice.resumeOnSubscribe = false;
-          if (info.isActive) {
-            // A turn is in flight — trim the stale in-flight turn loaded from
-            // disk; the RunBus replay rebuilds it from the top. Reflect the
-            // server's "is generating" truth immediately so the streaming
-            // indicator (and Stop button) show on resume without waiting for
-            // the first replayed event.
+          const pendingTail = hasPendingTail(slice);
+          if (info.isActive || (pendingTail && info.activeSeq > 0)) {
+            // Either a live turn, OR a turn that finished in the load→subscribe
+            // window but is still retained in the RunBus grace buffer (partial
+            // disk tail + a retained run). Either way the replay carries the
+            // full trailing turn — trim the stale/partial disk copy so the
+            // replay rebuilds it without duplicating. For a live turn, reflect
+            // the streaming indicator immediately; for a just-finished one the
+            // replayed `done` finalizes it.
             trimTrailingTurn(slice);
             resetScratch(slice);
-            slice.isStreaming = true;
-            if (!slice.streamingState) slice.streamingState = "thinking";
+            if (info.isActive) {
+              slice.isStreaming = true;
+              if (!slice.streamingState) slice.streamingState = "thinking";
+            }
             commit(slice);
             return;
           }
+          if (pendingTail) {
+            // Partial disk tail but the run is gone (grace GC'd) — no replay can
+            // complete it. Refetch the now-complete transcript.
+            dropEvents = true;
+            closeConnection(slice);
+            void loadConversation(conversationId);
+            return;
+          }
           if (!slice.isStreaming) {
-            // Nothing in flight and we're not sending — ignore the trailing
-            // grace-buffer replay (already in disk history) and detach.
+            // Complete disk tail (or idle) — ignore any stray grace-buffer
+            // replay; it would duplicate (and flicker) a turn already fully on
+            // disk.
             dropEvents = true;
             closeConnection(slice);
             return;
diff --git a/web/test/chat-store.test.ts b/web/test/chat-store.test.ts
index dd4a3f24..dca8a29b 100644
--- a/web/test/chat-store.test.ts
+++ b/web/test/chat-store.test.ts
@@ -25,6 +25,12 @@ const LOADED: ChatMessage[] = [
   { role: "assistant", content: "loaded-a", blocks: [{ type: "text", text: "loaded-a" }] },
 ];
 
+// A partial disk snapshot: the trailing assistant has no terminal event yet.
+const PENDING_LOADED: ChatMessage[] = [
+  { role: "user", content: "loaded-q" },
+  { role: "assistant", content: "part", blocks: [{ type: "text", text: "part" }], pending: true },
+];
+
 mock.module("../src/api/conversation-stream", () => ({
   connectConversationStream: (opts: {
     conversationId: string;
@@ -61,7 +67,10 @@ mock.module("../src/api/client", () => ({
   callTool: (_server: string, _action: string, args?: Record<string, unknown>) =>
     Promise.resolve({
       isError: false,
-      structuredContent: { metadata: { id: args?.id }, messages: LOADED },
+      structuredContent: {
+        metadata: { id: args?.id },
+        messages: args?.id === "conv_pending" ? PENDING_LOADED : LOADED,
+      },
     }),
 }));
 
@@ -287,6 +296,36 @@ describe("chat-store viewer", () => {
     expect(lastAssistant(store.getSnapshot("A").messages)?.content).toBe("partial");
   });
 
+  it("completes a partial disk tail from the grace replay on resume (no dup)", async () => {
+    const store = createChatStore();
+    await store.loadConversation("conv_pending");
+    expect(lastAssistant(store.getSnapshot("conv_pending").messages)?.content).toBe("part");
+
+    // Turn finished in the load→subscribe window but is still graced: not
+    // active, retained run (activeSeq>0). The replay carries the full turn.
+    const s = latestStream();
+    s.onSubscribed?.({ isActive: false, activeSeq: 5 });
+    s.onEvent("user.message", { content: "loaded-q" }, 1);
+    s.onEvent("text.delta", { text: "full answer" }, 2);
+    s.onEvent("done", { conversationId: "conv_pending", response: "full answer" }, 3);
+
+    const msgs = store.getSnapshot("conv_pending").messages;
+    expect(lastAssistant(msgs)?.content).toBe("full answer");
+    expect(msgs.filter((m) => m.role === "user").length).toBe(1); // no duplicate turn
+  });
+
+  it("keeps a complete disk tail intact when a graced replay is available (no flicker)", async () => {
+    const store = createChatStore();
+    await store.loadConversation("conv_done2");
+    const s = latestStream();
+    // Complete tail + retained run: the grace replay must be ignored (not
+    // trimmed+rebuilt) so the just-opened turn doesn't blink out and back.
+    s.onSubscribed?.({ isActive: false, activeSeq: 9 });
+    s.onEvent("user.message", { content: "loaded-q" }, 1);
+    s.onEvent("done", { conversationId: "conv_done2", response: "loaded-a" }, 2);
+    expect(store.getSnapshot("conv_done2").messages).toEqual(LOADED);
+  });
+
   it("does not duplicate a finished turn whose grace-buffer replay still arrives", async () => {
     const store = createChatStore();
     // Disk already has the completed turn.

From f4e4a627caf835c42d4595bb6e5ea70c42847996 Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Mon, 25 May 2026 16:47:27 -0600
Subject: [PATCH 13/26] docs(conversations): note legacy seq-less broadcast vs
 RunBus viewer
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

conversation-stream viewers track the RunBus seq (id: line) for replay/resume.
The legacy /v1/chat and /v1/chat/stream endpoints fan out via
broadcastToConversation, which is seq-less — those frames apply live but don't
advance lastSeq and have no resume. The web shell is RunBus-only; only an
external caller hitting the legacy endpoints while a web tab watches the same
conversation would mix the two. Document the boundary on both sides.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 src/api/conversation-events.ts     | 5 +++++
 web/src/api/conversation-stream.ts | 8 ++++++++
 2 files changed, 13 insertions(+)

diff --git a/src/api/conversation-events.ts b/src/api/conversation-events.ts
index e36a3c3e..95b41aa2 100644
--- a/src/api/conversation-events.ts
+++ b/src/api/conversation-events.ts
@@ -170,6 +170,11 @@ export class ConversationEventManager {
    * explicit policy gates; until then, this is the only exclusion
    * shape needed.
    *
+   * Seq-less: unlike {@link publishEvent} (the RunBus path), these frames carry
+   * no `id:` sequence. A seq-tracking `conversation-stream` viewer applies them
+   * live but can't replay/resume them. Only `/v1/chat` + `/v1/chat/stream` use
+   * this; the web shell is RunBus-only.
+   *
    * @param conversationId - Target conversation
    * @param eventType - SSE event type (e.g. "text.delta", "user.message")
    * @param data - Event data payload
diff --git a/web/src/api/conversation-stream.ts b/web/src/api/conversation-stream.ts
index c7feaf20..30a44afd 100644
--- a/web/src/api/conversation-stream.ts
+++ b/web/src/api/conversation-stream.ts
@@ -9,6 +9,14 @@
  * Each frame carries a sequence number in the SSE `id:` line. We track the
  * highest seq seen and reconnect with `afterSeq=<lastSeq>`, so a dropped
  * connection resumes seamlessly with no gap or duplication — no full reload.
+ *
+ * This viewer assumes the RunBus (seq'd) path. The legacy `/v1/chat` and
+ * `/v1/chat/stream` endpoints fan out to the same conversation subscribers via
+ * `broadcastToConversation`, which is seq-less (no `id:` line) and not RunBus-
+ * backed — those frames apply live but don't advance `lastSeq` and have no
+ * replay/resume. The web shell doesn't use those endpoints; only an external
+ * caller hitting them while a web tab watches the same conversation would mix
+ * the two streams.
  */
 
 import { refreshSession } from "./client";

From 1c2d75f3f551f097ea0a0ee25228a85cbc2c07b1 Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Tue, 26 May 2026 12:16:22 -0600
Subject: [PATCH 14/26] fix(adapters): warn once per failure episode in
 best-effort log sinks
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The earlier hardening (commit 9ddfd2e) silenced log-sink throws to keep emit()
safe, but a real disk-full / perms incident produced zero operator signal.
Surface the first write failure of an episode with console.warn, then suppress
further warnings until a successful write re-arms the flag — the first failure
is visible, a sustained outage doesn't spam, and a failure after intermittent
recovery warns again.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 src/adapters/structured-log-sink.ts | 18 ++++++++++++++++--
 src/adapters/workspace-log-sink.ts  | 16 ++++++++++++++--
 2 files changed, 30 insertions(+), 4 deletions(-)

diff --git a/src/adapters/structured-log-sink.ts b/src/adapters/structured-log-sink.ts
index 8c10a511..acecbaf6 100644
--- a/src/adapters/structured-log-sink.ts
+++ b/src/adapters/structured-log-sink.ts
@@ -39,6 +39,10 @@ export class StructuredLogSink implements EventSink {
   private conversationId: string | undefined;
   private userId: string | undefined;
   private workspaceId: string | undefined;
+  /** True after a write failure surfaced a console.warn; reset on the next
+   *  successful write so a recurring failure (after intermittent recovery)
+   *  warns again. Avoids spamming during a sustained outage. */
+  private writeWarned = false;
 
   constructor(config: StructuredLogConfig) {
     this.dir = config.dir;
@@ -94,10 +98,20 @@ export class StructuredLogSink implements EventSink {
     const filename = `nimblebrain-${today}.jsonl`;
     try {
       appendFileSync(join(this.dir, filename), `${JSON.stringify(record)}\n`);
-    } catch {
+      this.writeWarned = false;
+    } catch (err) {
       // Best-effort logging: a write failure (disk full, perms, or a detached
       // turn emitting after the workdir was torn down) must never throw into
-      // the event-emit path and crash the caller.
+      // the event-emit path and crash the caller. Surface the first failure of
+      // an episode so operators see disk/perms incidents; suppress until a
+      // subsequent success re-arms.
+      if (!this.writeWarned) {
+        this.writeWarned = true;
+        console.warn(
+          `[structured-log-sink] write to ${this.dir} failed (further failures suppressed until recovery):`,
+          err instanceof Error ? err.message : err,
+        );
+      }
     }
   }
 
diff --git a/src/adapters/workspace-log-sink.ts b/src/adapters/workspace-log-sink.ts
index a140884d..45ef4491 100644
--- a/src/adapters/workspace-log-sink.ts
+++ b/src/adapters/workspace-log-sink.ts
@@ -43,6 +43,8 @@ export interface WorkspaceLogConfig {
  */
 export class WorkspaceLogSink implements EventSink {
   private dir: string;
+  /** First-failure-of-an-episode flag — see structured-log-sink. */
+  private writeWarned = false;
 
   constructor(config: WorkspaceLogConfig) {
     this.dir = join(config.dir, "workspace");
@@ -66,10 +68,20 @@ export class WorkspaceLogSink implements EventSink {
     const filename = `${today}.jsonl`;
     try {
       appendFileSync(join(this.dir, filename), `${JSON.stringify(record)}\n`);
-    } catch {
+      this.writeWarned = false;
+    } catch (err) {
       // Best-effort logging: a write failure (disk full, perms, or a detached
       // turn emitting after the workdir was torn down) must never throw into
-      // the event-emit path and crash the caller.
+      // the event-emit path and crash the caller. Surface the first failure of
+      // an episode so operators see disk/perms incidents; suppress until a
+      // subsequent success re-arms.
+      if (!this.writeWarned) {
+        this.writeWarned = true;
+        console.warn(
+          `[workspace-log-sink] write to ${this.dir} failed (further failures suppressed until recovery):`,
+          err instanceof Error ? err.message : err,
+        );
+      }
     }
   }
 

From 014492b21d417a1c2824d491dc767b81e44d5220 Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Tue, 26 May 2026 12:32:20 -0600
Subject: [PATCH 15/26] docs+chore: surface RunBus single-process limit when
 replicas > 1
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

A viewer landing on a different pod than the one running the turn sees
isActive:false and silently drops resume — RunBus is single-process and isn't
yet clustered. Sticky routing on Mcp-Session-Id (prereq #2) mitigates this for
the active tab; a pod restart or any cross-pod viewer still loses the in-flight
turn. Two changes so this isn't a silent regression:

- AGENTS.md: add a "Known limitation under replicas > 1" note under the four
  prereqs, pointing at run-bus.ts and the deferred clustered RunBus.
- serve.ts: emit a loud startup warn when sessionStore.type === "redis" (the
  one strong signal of multi-replica intent) so operators see the gap at boot.

Not a hard error — sticky routing is sufficient for many cases, and operators
may accept the limit until the clustered RunBus lands.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 AGENTS.md                 |  2 ++
 src/cli/commands/serve.ts | 17 +++++++++++++++++
 2 files changed, 19 insertions(+)

diff --git a/AGENTS.md b/AGENTS.md
index 41ae0e3a..5ccfd4fd 100644
--- a/AGENTS.md
+++ b/AGENTS.md
@@ -329,6 +329,8 @@ Routing requests to the process owning a session's transport is the **load balan
 3. `sessionStore.type: "redis"`. Each tenant gets its own Redis instance in its own namespace (see `infra/CLAUDE.md` per-tenant Redis pattern). Default `nb:mcp:session:` keyPrefix is correct under that model.
 4. `platform.strategy.type: RollingUpdate`. Only after (1).
 
+**Known limitation under `replicas > 1`: RunBus is single-process.** Chat turn replay/resume (the SSE-stream-backed viewer attaches to a per-conversation event log) lives in-memory on the pod that started the turn. A viewer landing on a different pod sees `isActive:false` for an in-flight turn elsewhere and the live frames don't fan out cross-pod. Sticky routing on `Mcp-Session-Id` (prereq #2) mitigates for the active tab; a pod restart or any cross-pod viewer (other tab/device) still drops resume mid-turn. The clustered Redis-backed RunBus is deferred work, tracked in `src/runtime/run-bus.ts` — `serve` warns at boot when `sessionStore.type === "redis"` so the gap is visible.
+
 **TTL units: seconds at the surface, ms internally.** Operator-facing: `MCP_SESSION_TTL_SECONDS` env (highest priority) > `sessionStore.ttlSeconds` config > 8h default. Conversion to ms happens in `Runtime.getSessionStoreTtlMs()` only — registry constructors and the host's idle sweep both take ms from there. Don't add mixed-unit code elsewhere.
 
 ## MCP App Bridge Rules
diff --git a/src/cli/commands/serve.ts b/src/cli/commands/serve.ts
index be59de56..62bc0354 100644
--- a/src/cli/commands/serve.ts
+++ b/src/cli/commands/serve.ts
@@ -42,6 +42,23 @@ export function createServeCommand(telemetry: TelemetryManager): Command {
       // boot loudly instead of every individual MCP request.
       const sessionStoreConfig = resolveSessionStoreConfig(runtime.getSessionStoreConfig());
       const sessionRegistry = await createSessionRegistry(sessionStoreConfig);
+      // Multi-replica intent (Redis-backed sessions) implies the operator may
+      // run platform.replicas > 1. RunBus is still single-process — turn
+      // replay/resume only works on the pod that holds the run. Sticky routing
+      // on Mcp-Session-Id (CLAUDE.md prereq #2) mitigates for the active tab
+      // but a pod restart / cross-pod viewer still drops the in-flight turn.
+      // Loud heads-up at boot; not a hard error (sticky routing is enough for
+      // most cases, and operators may accept the gap until the clustered
+      // RunBus lands).
+      if (sessionStoreConfig.type === "redis") {
+        log.warn(
+          "[nimblebrain] sessionStore=redis detected. RunBus is still single-process; " +
+            "if platform.replicas > 1, a viewer that hits a different pod sees " +
+            "isActive:false for an in-flight turn. Ensure Mcp-Session-Id sticky " +
+            "routing is in place (CLAUDE.md replicas>1 prereq #2); RunBus Redis port " +
+            "is tracked as deferred work.",
+        );
+      }
 
       const port = Number(process.env.PORT) || Number(opts.port) || 27247;
       await startServerWithShutdown({ runtime, port, sessionRegistry });

From 96d5e651326f95f6892ac84a41d11aedbddc9ba3 Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Wed, 27 May 2026 12:09:33 -0500
Subject: [PATCH 16/26] fix(runtime): cap per-run RunBus event buffer to
 prevent unbounded growth
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

A runaway or adversarial event producer — a model stream looping
pathologically, a chatty tool spamming progress events — could push
log.events past safe memory limits before the grace-window GC fired.
Tens of thousands of token deltas held in-process for the grace window
on a multi-tenant deployment is real heap pressure.

Cap at 500k events per run with discard-as-error semantics: on overflow,
abort the turn's signal, append a synthetic terminal `error` event with
`error: "buffer_overflow"` so viewers see the cause, end the run as
`error`, and warn once. Subsequent publishes drop via the standard
`status !== "running"` guard.

500k sits ~10x over the worst legit run we can measure (extended-thinking
turn with chatty tool progress: ~30-50k events). Hitting it requires
the kind of pathological producer that is exactly what this cap exists
to terminate cleanly.

Configurable via the RunBus constructor for tests; production leaves it
at the default.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 src/runtime/run-bus.ts    | 64 ++++++++++++++++++++++++++++++++++++++-
 test/unit/run-bus.test.ts | 53 ++++++++++++++++++++++++++++++++
 2 files changed, 116 insertions(+), 1 deletion(-)

diff --git a/src/runtime/run-bus.ts b/src/runtime/run-bus.ts
index f69cc31e..c8aa8e02 100644
--- a/src/runtime/run-bus.ts
+++ b/src/runtime/run-bus.ts
@@ -43,8 +43,27 @@ interface RunLog {
   eventListeners: Set<(e: BufferedRunEvent) => void>;
   endListeners: Set<(s: RunStatus) => void>;
   gcTimer?: ReturnType<typeof setTimeout>;
+  /** Set once when the per-run event cap is exceeded, so the overflow
+   *  handler only fires once per run (subsequent publishes during the
+   *  same tick are dropped silently). */
+  bufferOverflowed?: boolean;
 }
 
+/**
+ * Hard cap on buffered events per run. A defense against a runaway or
+ * adversarial event producer holding unbounded memory for the grace window.
+ *
+ * Sized to sit comfortably above legitimate worst cases: a Synapse-research
+ * style extended-thinking turn emits roughly 30-50k events (token
+ * deltas + tool progress + status). 500k gives ~10x headroom over the
+ * worst legit run we've measured. Hitting it requires either a model
+ * stream looping pathologically or an adversarial tool spamming progress
+ * events — either way, terminating the run with a clear error is the
+ * correct response. Operators see a warn log; the agent's next turn can
+ * pick up from persisted history.
+ */
+const DEFAULT_MAX_EVENTS_PER_RUN = 500_000;
+
 /** Detach callback returned by {@link RunBus.attach}. */
 export type DetachFn = () => void;
 
@@ -52,9 +71,13 @@ export class RunBus {
   private runs = new Map<string, RunLog>();
   /** How long a terminal run's log is retained for late re-attach. */
   private readonly graceMs: number;
+  /** Per-run event cap. See {@link DEFAULT_MAX_EVENTS_PER_RUN}. Configurable
+   *  via constructor for tests; production should leave it at the default. */
+  private readonly maxEventsPerRun: number;
 
-  constructor(graceMs = 30_000) {
+  constructor(graceMs = 30_000, maxEventsPerRun = DEFAULT_MAX_EVENTS_PER_RUN) {
     this.graceMs = graceMs;
+    this.maxEventsPerRun = maxEventsPerRun;
   }
 
   /**
@@ -113,10 +136,49 @@ export class RunBus {
    * Append an event to the run's log and fan it out to live subscribers.
    * No-op if the run isn't active (defensive — late engine events after a
    * cancel shouldn't resurrect a terminated log).
+   *
+   * If appending this event would exceed {@link maxEventsPerRun}, the run
+   * is aborted, a synthetic terminal `error` event is appended and fanned
+   * out (so viewers see the cause rather than a silent stop), and the run
+   * is marked `error`. Subsequent publishes during the same tick are
+   * dropped by the standard `status !== "running"` guard.
    */
   publish(conversationId: string, type: string, data: unknown): BufferedRunEvent | null {
     const log = this.runs.get(conversationId);
     if (!log || log.status !== "running") return null;
+
+    // Overflow check BEFORE seq increment / push: the terminal error event
+    // itself counts toward seq but is intentionally allowed past the cap so
+    // viewers always see why generation stopped.
+    if (!log.bufferOverflowed && log.events.length >= this.maxEventsPerRun) {
+      log.bufferOverflowed = true;
+      console.warn(
+        `[run-bus] conversation=${conversationId} hit per-run event cap ` +
+          `(${this.maxEventsPerRun}); aborting turn. This indicates a runaway ` +
+          `producer (model stream looping or tool spamming progress events).`,
+      );
+      log.abort.abort();
+      log.seq += 1;
+      const errEvt: BufferedRunEvent = {
+        seq: log.seq,
+        type: "error",
+        data: {
+          error: "buffer_overflow",
+          message: `Per-run event cap exceeded (${this.maxEventsPerRun}). Turn aborted.`,
+        },
+      };
+      log.events.push(errEvt);
+      for (const fn of log.eventListeners) {
+        try {
+          fn(errEvt);
+        } catch {
+          // A failing subscriber must not break the fan-out to others.
+        }
+      }
+      this.end(conversationId, "error");
+      return errEvt;
+    }
+
     log.seq += 1;
     const evt: BufferedRunEvent = { seq: log.seq, type, data };
     log.events.push(evt);
diff --git a/test/unit/run-bus.test.ts b/test/unit/run-bus.test.ts
index a11efbc0..dc482bf5 100644
--- a/test/unit/run-bus.test.ts
+++ b/test/unit/run-bus.test.ts
@@ -151,4 +151,57 @@ describe("RunBus", () => {
     expect(typeof detach).toBe("function");
     detach();
   });
+
+  it("caps per-run event buffer and ends the run with a terminal error", () => {
+    // Tiny cap for testability. Production uses 500k.
+    const bus = new RunBus(30_000, 10);
+    const signal = bus.begin("c1");
+
+    const { events, onEvent } = collect();
+    const endStatuses: string[] = [];
+    bus.attach("c1", 0, onEvent, (s) => endStatuses.push(s));
+
+    // Fill exactly to the cap — these should all succeed.
+    for (let i = 0; i < 10; i++) {
+      bus.publish("c1", "text.delta", { text: String(i) });
+    }
+    expect(bus.isActive("c1")).toBe(true);
+
+    // 11th publish trips the cap — turn aborts, terminal error appended.
+    const overflow = bus.publish("c1", "text.delta", { text: "boom" });
+
+    expect(overflow).not.toBeNull();
+    expect(overflow?.type).toBe("error");
+    expect((overflow?.data as { error: string }).error).toBe("buffer_overflow");
+    expect(signal.aborted).toBe(true);
+    expect(bus.getStatus("c1")).toBe("error");
+    expect(bus.isActive("c1")).toBe(false);
+    expect(endStatuses).toEqual(["error"]);
+
+    // The viewer saw 10 deltas + 1 terminal error.
+    expect(events.length).toBe(11);
+    expect(events[events.length - 1]?.type).toBe("error");
+
+    // Further publishes are dropped by the standard not-running guard.
+    const after = bus.publish("c1", "text.delta", { text: "late" });
+    expect(after).toBeNull();
+  });
+
+  it("overflow error event is included in a late attacher's replay", () => {
+    const bus = new RunBus(30_000, 3);
+    bus.begin("c1");
+    bus.publish("c1", "text.delta", { text: "1" });
+    bus.publish("c1", "text.delta", { text: "2" });
+    bus.publish("c1", "text.delta", { text: "3" });
+    bus.publish("c1", "text.delta", { text: "4" }); // trips cap
+
+    const { events, onEvent } = collect();
+    let lateStatus: string | undefined;
+    bus.attach("c1", 0, onEvent, (s) => {
+      lateStatus = s;
+    });
+    expect(lateStatus).toBe("error");
+    expect(events[events.length - 1]?.type).toBe("error");
+    expect((events[events.length - 1]?.data as { error: string }).error).toBe("buffer_overflow");
+  });
 });

From 5818db5bab997cb8bf8cd6a89b0b3fe775351fb0 Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Wed, 27 May 2026 12:09:48 -0500
Subject: [PATCH 17/26] fix(tests): hard-error on missing workDir under bun
 test, fix 8 leakers
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

`Runtime.start({})` defaulted `workDir` to `~/.nimblebrain`, so any
integration test that forgot the field silently wrote echo-model
conversations, test workspaces, and bundle data straight into the
developer's real workdir. They then showed up in the conversations tab
on `bun run dev` — confusing diagnosis that looked like a title-pipeline
bug but was really 268 of 282 convs being test fixtures with
`workspaceId: "ws_test"`.

`resolveWorkDir` now throws under `NODE_ENV=test` (bun:test sets this
automatically) when `workDir` is missing, with a clear example fix.
Catches future regressions of this category at construction time.

Eight test files were leaking:
- chat-stream-concurrent
- appcontext-wiring (3 Runtime.starts)
- dependency-checking (6 starts; share file-scope testDir)
- conversation-integration
- remote-integration (3 starts)
- runtime (7 starts; one needed its own workDir to avoid skill bleed
  from earlier same-file tests writing to the shared global skill dir)
- security/workspace-isolation
- usage-integration

New helper `test/helpers/test-workdir.ts` exposes `makeTestWorkDir(label)`
that returns `{workDir, cleanup}` for tests that want per-test isolation.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 src/runtime/runtime.ts                        | 17 +++++++++-
 test/helpers/test-workdir.ts                  | 33 +++++++++++++++++++
 test/integration/appcontext-wiring.test.ts    | 15 +++++++++
 .../chat-stream-concurrent.test.ts            | 12 +++++++
 .../conversation-integration.test.ts          |  4 +++
 test/integration/dependency-checking.test.ts  |  6 ++++
 test/integration/remote-integration.test.ts   |  3 ++
 test/integration/runtime.test.ts              | 14 +++++++-
 .../security/workspace-isolation.test.ts      |  8 +++++
 test/integration/usage-integration.test.ts    |  2 ++
 10 files changed, 112 insertions(+), 2 deletions(-)
 create mode 100644 test/helpers/test-workdir.ts

diff --git a/src/runtime/runtime.ts b/src/runtime/runtime.ts
index 6350cfe6..28e4002c 100644
--- a/src/runtime/runtime.ts
+++ b/src/runtime/runtime.ts
@@ -131,7 +131,22 @@ function parseAliasRef(s: string): ModelSlot | null {
 }
 
 function resolveWorkDir(config: RuntimeConfig): string {
-  return config.workDir ?? DEFAULT_WORK_DIR;
+  if (config.workDir) return config.workDir;
+  // Hard guard: under `bun test` (NODE_ENV=test is set automatically by the
+  // bun test runner), defaulting to `~/.nimblebrain` would pollute the
+  // developer's real workdir with test conversations / workspaces / bundles.
+  // Force every test to pass an explicit (typically tmpdir-based) workDir.
+  // Without this, a test that forgets `workDir` silently writes echo-model
+  // conversations into the user's dev environment and they show up in the
+  // real app's conversations tab.
+  if (process.env.NODE_ENV === "test") {
+    throw new Error(
+      "Runtime.start({}) called without `workDir` under bun test. " +
+        "Pass an explicit tmpdir-based workDir to avoid polluting the developer's ~/.nimblebrain. " +
+        "Example: workDir: join(tmpdir(), 'nb-test-' + Date.now()).",
+    );
+  }
+  return DEFAULT_WORK_DIR;
 }
 
 function globalSkillDir(config: RuntimeConfig): string {
diff --git a/test/helpers/test-workdir.ts b/test/helpers/test-workdir.ts
new file mode 100644
index 00000000..934de436
--- /dev/null
+++ b/test/helpers/test-workdir.ts
@@ -0,0 +1,33 @@
+import { mkdirSync, rmSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+
+/**
+ * Allocate an isolated, ephemeral workDir for an integration test.
+ *
+ * Why this exists: outside of tests, `Runtime.start({})` defaults `workDir`
+ * to `~/.nimblebrain`. A test that relied on that default would write
+ * echo-model conversations, test workspaces, and bundle data straight into
+ * the developer's real workdir, where they then show up in the conversations
+ * tab and lifecycle tools. To prevent that, `Runtime.start` throws under
+ * `NODE_ENV=test` if `workDir` is missing — this helper is the canonical fix.
+ *
+ * Returns the path and a cleanup function. Call cleanup in `afterEach` /
+ * `afterAll` after `runtime.shutdown()`.
+ *
+ * @example
+ *   const { workDir, cleanup } = makeTestWorkDir("chat-stream-concurrent");
+ *   afterEach(async () => { await runtime.shutdown(); cleanup(); });
+ *   const runtime = await Runtime.start({ workDir, ... });
+ */
+export function makeTestWorkDir(label = "test"): { workDir: string; cleanup: () => void } {
+  const workDir = join(
+    tmpdir(),
+    `nb-${label}-${Date.now()}-${Math.floor(Math.random() * 1e9).toString(36)}`,
+  );
+  mkdirSync(workDir, { recursive: true });
+  return {
+    workDir,
+    cleanup: () => rmSync(workDir, { recursive: true, force: true }),
+  };
+}
diff --git a/test/integration/appcontext-wiring.test.ts b/test/integration/appcontext-wiring.test.ts
index 480eeeab..ec62bd85 100644
--- a/test/integration/appcontext-wiring.test.ts
+++ b/test/integration/appcontext-wiring.test.ts
@@ -4,6 +4,7 @@ import type { ToolSource } from "../../src/tools/types.ts";
 import type { ToolResult } from "../../src/engine/types.ts";
 import { textContent } from "../../src/engine/content-helpers.ts";
 import { createMockModel } from "../helpers/mock-model.ts";
+import { makeTestWorkDir } from "../helpers/test-workdir.ts";
 import { TEST_WORKSPACE_ID, provisionTestWorkspace } from "../helpers/test-workspace.ts";
 
 /** Minimal model adapter that captures the system prompt for assertions. */
@@ -50,9 +51,21 @@ function createFakeSource(name: string, tools: Array<{ localName: string; descri
 }
 
 describe("Runtime.chat() appContext wiring", () => {
+	const cleanups: Array<() => void> = [];
+	afterAll(() => {
+		for (const c of cleanups) c();
+	});
+
+	function freshWorkDir(): string {
+		const { workDir, cleanup } = makeTestWorkDir("appcontext-wiring");
+		cleanups.push(cleanup);
+		return workDir;
+	}
+
 	it("passes focusedApp to composeSystemPrompt when appContext matches a source", async () => {
 		const { adapter, getSystem } = createCapturingModel();
 		const runtime = await Runtime.start({
+			workDir: freshWorkDir(),
 			model: { provider: "custom", adapter },
 			noDefaultBundles: true,
 			logging: { disabled: true },
@@ -86,6 +99,7 @@ describe("Runtime.chat() appContext wiring", () => {
 	it("does not inject focusedApp when appContext is absent", async () => {
 		const { adapter, getSystem } = createCapturingModel();
 		const runtime = await Runtime.start({
+			workDir: freshWorkDir(),
 			model: { provider: "custom", adapter },
 			noDefaultBundles: true,
 			logging: { disabled: true },
@@ -104,6 +118,7 @@ describe("Runtime.chat() appContext wiring", () => {
 	it("skips silently when serverName does not match any source", async () => {
 		const { adapter, getSystem } = createCapturingModel();
 		const runtime = await Runtime.start({
+			workDir: freshWorkDir(),
 			model: { provider: "custom", adapter },
 			noDefaultBundles: true,
 			logging: { disabled: true },
diff --git a/test/integration/chat-stream-concurrent.test.ts b/test/integration/chat-stream-concurrent.test.ts
index 38cd3fbb..ee8376d0 100644
--- a/test/integration/chat-stream-concurrent.test.ts
+++ b/test/integration/chat-stream-concurrent.test.ts
@@ -15,6 +15,7 @@ import { startServer } from "../../src/api/server.ts";
 import { Runtime } from "../../src/runtime/runtime.ts";
 import { createEchoModel } from "../helpers/echo-model.ts";
 import { createMockModel } from "../helpers/mock-model.ts";
+import { makeTestWorkDir } from "../helpers/test-workdir.ts";
 import { TEST_WORKSPACE_ID, provisionTestWorkspace } from "../helpers/test-workspace.ts";
 
 interface SSEEvent {
@@ -39,14 +40,23 @@ function parseSSE(text: string): SSEEvent[] {
 describe("POST /v1/chat/stream — concurrency protection", () => {
   let handle: ServerHandle | null = null;
   let runtime: Runtime | null = null;
+  let cleanupDir: (() => void) | null = null;
 
   afterEach(async () => {
     handle?.stop(true);
     await runtime?.shutdown();
+    cleanupDir?.();
     handle = null;
     runtime = null;
+    cleanupDir = null;
   });
 
+  function makeWorkDir(): string {
+    const w = makeTestWorkDir("chat-stream-concurrent");
+    cleanupDir = w.cleanup;
+    return w.workDir;
+  }
+
   test("returns HTTP 409 when pre-check sees an in-flight run on the same conversation", async () => {
     // A gated model lets us hold runtime.chat() open deterministically. The
     // first call to doGenerate awaits the gate; releasing it lets the seed
@@ -67,6 +77,7 @@ describe("POST /v1/chat/stream — concurrency protection", () => {
     });
 
     runtime = await Runtime.start({
+      workDir: makeWorkDir(),
       model: { provider: "custom", adapter: gatedModel },
       noDefaultBundles: true,
       logging: { disabled: true },
@@ -112,6 +123,7 @@ describe("POST /v1/chat/stream — concurrency protection", () => {
 
   test("concurrent stream requests produce exactly one successful run; the rest are rejected", async () => {
     runtime = await Runtime.start({
+      workDir: makeWorkDir(),
       model: { provider: "custom", adapter: createEchoModel() },
       noDefaultBundles: true,
       logging: { disabled: true },
diff --git a/test/integration/conversation-integration.test.ts b/test/integration/conversation-integration.test.ts
index 0833ffae..41a6f4b6 100644
--- a/test/integration/conversation-integration.test.ts
+++ b/test/integration/conversation-integration.test.ts
@@ -217,9 +217,12 @@ describe("API full-flow integration", () => {
 	let runtime: Runtime;
 	let handle: ServerHandle;
 	let baseUrl: string;
+	let runtimeWorkDir: string;
 
 	beforeAll(async () => {
+		runtimeWorkDir = tempDir();
 		runtime = await Runtime.start({
+			workDir: runtimeWorkDir,
 			model: { provider: "custom", adapter: createEchoModel() },
 			noDefaultBundles: true,
 			logging: { disabled: true },
@@ -232,6 +235,7 @@ describe("API full-flow integration", () => {
 	afterAll(async () => {
 		handle.stop(true);
 		await runtime.shutdown();
+		rmSync(runtimeWorkDir, { recursive: true, force: true });
 	});
 
 	it.skip("chat → list → rename → search → fork → delete → verify gone", async () => {
diff --git a/test/integration/dependency-checking.test.ts b/test/integration/dependency-checking.test.ts
index 6b9ead22..88a44989 100644
--- a/test/integration/dependency-checking.test.ts
+++ b/test/integration/dependency-checking.test.ts
@@ -60,6 +60,7 @@ You are a friendly greeter.
 
     const { model, getSystem } = createCapturingModel();
     const runtime = await Runtime.start({
+      workDir: testDir,
       model: { provider: "custom", adapter: model },
       noDefaultBundles: true,
       skillDirs: [skillDir],
@@ -96,6 +97,7 @@ You are a helper.
 
     const { model, getSystem } = createCapturingModel();
     const runtime = await Runtime.start({
+      workDir: testDir,
       model: { provider: "custom", adapter: model },
       noDefaultBundles: true,
       skillDirs: [skillDir],
@@ -138,6 +140,7 @@ You are a data analyst.
 
     const { model, getSystem } = createCapturingModel();
     const runtime = await Runtime.start({
+      workDir: testDir,
       model: { provider: "custom", adapter: model },
       noDefaultBundles: true,
       skillDirs: [skillDir],
@@ -178,6 +181,7 @@ You use multiple tools.
 
     const { model, getSystem } = createCapturingModel();
     const runtime = await Runtime.start({
+      workDir: testDir,
       model: { provider: "custom", adapter: model },
       noDefaultBundles: true,
       skillDirs: [skillDir],
@@ -223,6 +227,7 @@ Original body.
 
     const { model, getSystem } = createCapturingModel();
     const runtime = await Runtime.start({
+      workDir: testDir,
       model: { provider: "custom", adapter: model },
       noDefaultBundles: true,
       skillDirs: [skillDir],
@@ -265,6 +270,7 @@ Matching body.
 
     const { model } = createCapturingModel();
     const runtime = await Runtime.start({
+      workDir: testDir,
       model: { provider: "custom", adapter: model },
       noDefaultBundles: true,
       skillDirs: [skillDir],
diff --git a/test/integration/remote-integration.test.ts b/test/integration/remote-integration.test.ts
index bb3644f7..0b692556 100644
--- a/test/integration/remote-integration.test.ts
+++ b/test/integration/remote-integration.test.ts
@@ -225,6 +225,7 @@ describe.skip("Remote integration: POST /v1/apps/install with url", () => {
 		writeFileSync(configPath, JSON.stringify({ bundles: [] }, null, 2));
 
 		runtime = await Runtime.start({
+			workDir: testDir,
 			model: { provider: "custom", adapter: createEchoModel() },
 			noDefaultBundles: true,
 			logging: { disabled: true },
@@ -350,6 +351,7 @@ describe("Remote integration: registering remote bundles in workspace registry",
 
 	it("remote bundle can be registered into a workspace registry and provides tools", async () => {
 		const runtime = await Runtime.start({
+			workDir: testDir,
 			model: { provider: "custom", adapter: createEchoModel() },
 			noDefaultBundles: true,
 			logging: { disabled: true },
@@ -375,6 +377,7 @@ describe("Remote integration: registering remote bundles in workspace registry",
 
 	it("failed remote bundle does not pollute registry while successful one registers", async () => {
 		const runtime = await Runtime.start({
+			workDir: testDir,
 			model: { provider: "custom", adapter: createEchoModel() },
 			noDefaultBundles: true,
 			logging: { disabled: true },
diff --git a/test/integration/runtime.test.ts b/test/integration/runtime.test.ts
index bd8b78d1..be65be86 100644
--- a/test/integration/runtime.test.ts
+++ b/test/integration/runtime.test.ts
@@ -57,6 +57,7 @@ describe("filterTools", () => {
 describe("Runtime", () => {
   it("starts with echo model and processes a chat", async () => {
     const runtime = await Runtime.start({
+      workDir: testDir,
       model: { provider: "custom", adapter: createEchoModel() },
       noDefaultBundles: true,
     });
@@ -96,6 +97,7 @@ describe("Runtime", () => {
 
   it("creates new conversation when no id provided", async () => {
     const runtime = await Runtime.start({
+      workDir: testDir,
       model: { provider: "custom", adapter: createEchoModel() },
       noDefaultBundles: true,
     });
@@ -182,6 +184,7 @@ You are a friendly greeter. Always respond with enthusiasm!
     );
 
     const runtime = await Runtime.start({
+      workDir: testDir,
       model: { provider: "custom", adapter: createEchoModel() },
       noDefaultBundles: true,
       skillDirs: [skillDir],
@@ -229,6 +232,7 @@ I am Nira, your AI assistant. You work at Acme Corp.
     });
 
     const runtime = await Runtime.start({
+      workDir: testDir,
       model: { provider: "custom", adapter: model },
       noDefaultBundles: true,
       skillDirs: [skillDir],
@@ -244,10 +248,16 @@ I am Nira, your AI assistant. You work at Acme Corp.
   });
 
   it("reloads skills dynamically", async () => {
-    const skillDir = join(testDir, "dynamic-skills");
+    // Isolated workDir — earlier tests in this file write to `testDir/skills`
+    // (the global skill dir), which would otherwise pre-load `greeter` here
+    // and break the "No skills initially" assertion below.
+    const isolatedWorkDir = join(testDir, `reload-skills-${Date.now()}`);
+    mkdirSync(isolatedWorkDir, { recursive: true });
+    const skillDir = join(isolatedWorkDir, "dynamic-skills");
     mkdirSync(skillDir, { recursive: true });
 
     const runtime = await Runtime.start({
+      workDir: isolatedWorkDir,
       model: { provider: "custom", adapter: createEchoModel() },
       noDefaultBundles: true,
       skillDirs: [skillDir],
@@ -290,6 +300,7 @@ Greet with enthusiasm!
     };
 
     const runtime = await Runtime.start({
+      workDir: testDir,
       model: { provider: "custom", adapter: createEchoModel() },
       noDefaultBundles: true,
       events: [sink],
@@ -306,6 +317,7 @@ Greet with enthusiasm!
 
   it("reports available tools (empty when no bundles)", async () => {
     const runtime = await Runtime.start({
+      workDir: testDir,
       model: { provider: "custom", adapter: createEchoModel() },
       noDefaultBundles: true,
     });
diff --git a/test/integration/security/workspace-isolation.test.ts b/test/integration/security/workspace-isolation.test.ts
index f00dc959..079a78fb 100644
--- a/test/integration/security/workspace-isolation.test.ts
+++ b/test/integration/security/workspace-isolation.test.ts
@@ -11,6 +11,9 @@
  *    install the same bundle (the briefing/nav leak class)
  */
 
+import { mkdirSync, rmSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
 import { afterAll, beforeAll, describe, expect, it } from "bun:test";
 import type {
   BriefingBlock,
@@ -31,10 +34,14 @@ import type { Tool, ToolSource } from "../../../src/tools/types.ts";
 let runtime: Runtime;
 let handle: ServerHandle;
 let baseUrl: string;
+let workDir: string;
 const TEST_KEY = "security-test-key-12345";
 
 beforeAll(async () => {
+  workDir = join(tmpdir(), `nb-workspace-isolation-${Date.now()}`);
+  mkdirSync(workDir, { recursive: true });
   runtime = await Runtime.start({
+    workDir,
     model: { provider: "custom", adapter: createEchoModel() },
     noDefaultBundles: true,
     logging: { disabled: true },
@@ -51,6 +58,7 @@ beforeAll(async () => {
 afterAll(async () => {
   handle.stop(true);
   await runtime.shutdown();
+  rmSync(workDir, { recursive: true, force: true });
 });
 
 function authHeaders(extra?: Record<string, string>): Record<string, string> {
diff --git a/test/integration/usage-integration.test.ts b/test/integration/usage-integration.test.ts
index e6dd79be..00bd42e2 100644
--- a/test/integration/usage-integration.test.ts
+++ b/test/integration/usage-integration.test.ts
@@ -14,10 +14,12 @@ describe("ChatResult.usage", () => {
 
 	afterAll(async () => {
 		await runtime.shutdown();
+		if (existsSync(usageTestDir)) rmSync(usageTestDir, { recursive: true });
 	});
 
 	it("is populated with all TurnUsage fields after Runtime.chat()", async () => {
 		runtime = await Runtime.start({
+			workDir: usageTestDir,
 			model: { provider: "custom", adapter: createEchoModel() },
 			noDefaultBundles: true,
 			logging: { disabled: true },

From 0556d83722188878f1e5722aed12502e53e4823f Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Wed, 27 May 2026 12:10:09 -0500
Subject: [PATCH 18/26] perf(conversations): patch list row title in-place
 instead of refetching
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The runtime fired `emitConversationsChanged()` three times on a
first-turn chat: when isNew (sidebar row appears), at .finally (terminal
state), and again when the title resolved. Each broadcast triggered the
conversations-list iframe to refetch the whole list.

The title-resolve refetch is now redundant. The `conversation.title`
SSE event already exists (the chat panel header consumes it for live
title display); the list iframe just didn't have a channel for it.
Add one: the web shell forwards `conversation.title` via postMessage to
matching iframes, and the conversations bundle listens with a raw
`window.addEventListener` (the synapse SDK doesn't know this envelope,
which is fine — its own listener ignores unrecognized methods, no
double-handling). The iframe patches the matching row's title in-place,
no list refetch.

Drop the now-redundant `emitConversationsChanged()` from the
title-resolve handler. Broadcast count drops from 3 to 2 on first turn;
subsequent turns unchanged at 1.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 .../conversations/ui/src/Dashboard.tsx        | 37 +++++++++++++++++++
 src/runtime/runtime.ts                        | 16 +++++---
 web/src/App.tsx                               |  6 ++-
 web/src/lib/forward-conversation-title.ts     | 37 +++++++++++++++++++
 4 files changed, 89 insertions(+), 7 deletions(-)
 create mode 100644 web/src/lib/forward-conversation-title.ts

diff --git a/src/bundles/conversations/ui/src/Dashboard.tsx b/src/bundles/conversations/ui/src/Dashboard.tsx
index 1d597007..7fe48c06 100644
--- a/src/bundles/conversations/ui/src/Dashboard.tsx
+++ b/src/bundles/conversations/ui/src/Dashboard.tsx
@@ -95,6 +95,43 @@ export function Dashboard() {
     }
   });
 
+  // Live conversation-title updates from auto-title generation.
+  //
+  // The host (App.tsx) forwards each `conversation.title` SSE event to this
+  // iframe via a `synapse/conversation-title` postMessage. We patch the
+  // matching row's title in-place instead of refetching the whole list — the
+  // runtime used to fire an extra `data.changed` on title-resolve to force a
+  // refetch, but that triggered a full reload of every row. Listening
+  // directly is cheaper and updates a single row without flicker.
+  //
+  // Raw `window.addEventListener` (not via the synapse SDK) because the SDK
+  // doesn't know this method; the host owns both ends, so the side channel
+  // is safe. The SDK's own `message` listener ignores envelopes whose
+  // `method` it doesn't recognize, so there's no double-handling.
+  useEffect(() => {
+    const handler = (event: MessageEvent) => {
+      const msg = event.data;
+      if (!msg || typeof msg !== "object") return;
+      if (msg.jsonrpc !== "2.0" || msg.method !== "synapse/conversation-title") return;
+      const params = msg.params;
+      if (!params || typeof params !== "object") return;
+      const conversationId = (params as { conversationId?: unknown }).conversationId;
+      const title = (params as { title?: unknown }).title;
+      if (typeof conversationId !== "string" || typeof title !== "string") return;
+      setConversations((prev) => {
+        let changed = false;
+        const next = prev.map((c) => {
+          if (c.id !== conversationId) return c;
+          changed = true;
+          return { ...c, title };
+        });
+        return changed ? next : prev;
+      });
+    };
+    window.addEventListener("message", handler);
+    return () => window.removeEventListener("message", handler);
+  }, []);
+
   const handleSelectFilter = useCallback(
     (key: FilterKey) => {
       setActiveFilter(key);
diff --git a/src/runtime/runtime.ts b/src/runtime/runtime.ts
index 28e4002c..7b78db7e 100644
--- a/src/runtime/runtime.ts
+++ b/src/runtime/runtime.ts
@@ -1436,11 +1436,16 @@ export class Runtime {
 
     // Fire-and-forget title generation on first turn (use "fast" slot for cost
     // savings). Decoupled from the turn lifecycle: when it resolves we persist
-    // the title, then broadcast `conversation.title` on the global SSE so any
-    // live viewer's panel header updates in place, and refresh the
-    // conversations list. The global channel (not the turn stream, which the
-    // client closes on `done`) means delivery is reliable after the turn ends
-    // and across tabs — routed to the right conversation by `conversationId`.
+    // the title and broadcast `conversation.title` on the global SSE.
+    //
+    // No `emitConversationsChanged()` here — the conversation-list iframe
+    // listens for `conversation.title` directly (forwarded via postMessage
+    // by the web shell) and patches the matching row in-place. Firing
+    // `data.changed` on title resolve used to trigger a full list refetch,
+    // which was wasteful and caused row flicker. The global channel (not
+    // the turn stream, which the client closes on `done`) means delivery
+    // is reliable after the turn ends and across tabs — routed to the
+    // right conversation by `conversationId`.
     if (conversation.title === null) {
       const titleModel = this.resolveModelFn(this.getModelSlot("fast"));
       const titleInput =
@@ -1453,7 +1458,6 @@ export class Runtime {
             type: "conversation.title",
             data: { conversationId: conversation.id, title, wsId },
           });
-          this.emitConversationsChanged();
         },
         (err) => console.error("[runtime] title generation failed:", err),
       );
diff --git a/web/src/App.tsx b/web/src/App.tsx
index f9e5e019..eac27cbf 100644
--- a/web/src/App.tsx
+++ b/web/src/App.tsx
@@ -38,6 +38,7 @@ import {
 } from "./context/WorkspaceContext";
 import { chatStore } from "./hooks/chat-store";
 import { useDataSync } from "./hooks/useDataSync";
+import { forwardConversationTitleToIframes } from "./lib/forward-conversation-title";
 import { useEvents } from "./hooks/useEvents";
 import { useShell } from "./hooks/useShell";
 import { bootstrapWorkspacesToInfo } from "./lib/bootstrap";
@@ -229,9 +230,12 @@ function AuthenticatedAppContent({
     onDataChanged,
     onConfigChanged: () => config.refreshConfig(),
     // Auto-title arrived — update the matching conversation's slice so the
-    // chat panel header reflects it live (routed by conversationId).
+    // chat panel header reflects it live (routed by conversationId), and
+    // forward to the conversations-list iframe so its sidebar row updates
+    // in place without a full list refetch.
     onConversationTitle: ({ conversationId, title }) => {
       chatStore.setTitle(conversationId, title);
+      forwardConversationTitleToIframes(conversationId, title);
     },
     // Bundle install / uninstall changes the placement set; refetch
     // the shell so the sidebar's Apps group reflects the new state
diff --git a/web/src/lib/forward-conversation-title.ts b/web/src/lib/forward-conversation-title.ts
new file mode 100644
index 00000000..9f65733b
--- /dev/null
+++ b/web/src/lib/forward-conversation-title.ts
@@ -0,0 +1,37 @@
+const CONVERSATIONS_APP = "@nimblebraininc/conversations";
+
+/**
+ * Forward a live `conversation.title` SSE event to the conversations-list
+ * iframe via postMessage.
+ *
+ * The conversations bundle's Dashboard listens for `synapse/conversation-title`
+ * and patches the matching row's title in-place. This is the cheap path: a
+ * full `data.changed` would force a list refetch, which is what the runtime
+ * used to fire on title resolve. Sending the (conversationId, title) tuple
+ * directly is one postMessage and an in-place state update.
+ *
+ * Targets only iframes whose `data-app` matches the conversations bundle
+ * name (`@nimblebraininc/conversations`). Unrelated iframes never see the
+ * message. No-op when the conversations panel isn't currently mounted —
+ * the next mount loads from disk where the title is already persisted, so
+ * there's no race.
+ *
+ * @param conversationId Conversation whose title was just generated.
+ * @param title          The generated title.
+ */
+export function forwardConversationTitleToIframes(conversationId: string, title: string): void {
+  const iframes = document.querySelectorAll<HTMLIFrameElement>(
+    `iframe[data-app="${CONVERSATIONS_APP}"]`,
+  );
+  if (iframes.length === 0) return;
+  const message = {
+    jsonrpc: "2.0",
+    method: "synapse/conversation-title",
+    params: { conversationId, title },
+  };
+  for (const iframe of iframes) {
+    // Srcdoc iframes have the opaque "null" origin; targetOrigin must be "*"
+    // (matches useDataSync's path — same constraint).
+    iframe.contentWindow?.postMessage(message, "*");
+  }
+}

From d37e54eb962c63ce2804f58fa43a010e1f66ed47 Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Wed, 27 May 2026 12:10:56 -0500
Subject: [PATCH 19/26] chore: drop stale streamChat refs + scope code-style
 check to non-bundle src

Two unrelated cleanups:

- `web/src/api/client.ts`: comments still referenced the deleted
  `streamChat` / `streamChatMultipart` helpers (the `files` field-name
  note and the header-pattern note in `uploadResource`, plus the
  `startChatTurn` docblock). Comment-only cleanup; no behavior change.

- `scripts/check-code-style.ts`: the doc comment says "bundles are out
  of scope" but the glob walked `src/**/*.ts`, which after
  `bun run build:bundles` pulls in `src/bundles/*/ui/node_modules/`
  and surfaces 1625 false-positive inline-type-import violations in
  vendored `.d.ts` files. Skip `node_modules/` and `src/bundles/`
  per the documented scope.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 scripts/check-code-style.ts | 7 +++++++
 web/src/api/client.ts       | 8 ++++----
 2 files changed, 11 insertions(+), 4 deletions(-)

diff --git a/scripts/check-code-style.ts b/scripts/check-code-style.ts
index 5edc7a86..ea499ebb 100644
--- a/scripts/check-code-style.ts
+++ b/scripts/check-code-style.ts
@@ -52,6 +52,13 @@ function checkNoInlineTypeImports(): CheckResult {
 
   for (const file of glob.scanSync({ cwd: SRC_ROOT, absolute: true })) {
     const rel = relative(ROOT, file);
+    // Skip bundle subtrees (their UIs have their own conventions, per the
+    // doc comment) and vendored deps. `bun run build:bundles` installs
+    // node_modules under each bundle's UI, so an unfiltered walk picks
+    // up thousands of vendored `.d.ts` violations that have nothing to
+    // do with our source.
+    if (rel.includes("/node_modules/")) continue;
+    if (rel.startsWith("src/bundles/")) continue;
     const content = readFileSync(file, "utf-8");
     const source = ts.createSourceFile(file, content, ts.ScriptTarget.Latest, true);
 
diff --git a/web/src/api/client.ts b/web/src/api/client.ts
index f0bb414c..c68c38a8 100644
--- a/web/src/api/client.ts
+++ b/web/src/api/client.ts
@@ -290,14 +290,14 @@ export interface UploadResourceResult {
  */
 export async function uploadResource(files: File[]): Promise<UploadResourceResult> {
   const formData = new FormData();
-  // Use `files` (plural) to match `streamChatMultipart`; the server
-  // accepts either, but one canonical spelling avoids surprises.
+  // Use `files` (plural) — the server's multipart route accepts either
+  // `files` or `file`, but one canonical spelling avoids surprises.
   for (const file of files) {
     formData.append("files", file, file.name);
   }
 
   // Build headers WITHOUT Content-Type — let the browser set the
-  // multipart boundary. Same pattern as `streamChatMultipart`.
+  // multipart boundary. Standard pattern for FormData uploads.
   const h: Record<string, string> = {};
   if (authToken && authToken !== "__cookie__") {
     h.Authorization = `Bearer ${authToken}`;
@@ -341,7 +341,7 @@ export async function chat(req: ChatRequest): Promise<ChatResult> {
 /**
  * Start a server-authoritative turn. Returns the conversation id immediately;
  * the turn runs to completion on the server regardless of this client. Watch
- * it via `connectConversationStream`. Replaces the streaming `streamChat` path.
+ * it via `connectConversationStream`.
  */
 export async function startChatTurn(req: ChatRequest): Promise<{ conversationId: string }> {
   const res = await fetchWithRefresh(`${API_BASE}/v1/chat/start`, {

From 8d0a6122b82394d2f95f81c1f6dec75660a8ac26 Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Mon, 1 Jun 2026 11:33:06 -0500
Subject: [PATCH 20/26] refactor(web): consolidate onto the seq-based
 conversation stream
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The upstream merge resurrected the per-conversation SSE chain from PR #325
(conversation-sse.ts + conversation-events-client.ts + useConversationEvents.ts
+ conversation-subscribers.ts). On this branch that chain is dead code: the
ChatContext/useChat rewrite drives chat through chat-store →
conversation-stream.ts (the server-authoritative, seq-based replay path), and
nothing mounts useConversationEvents. The two clients are not interchangeable —
upstream's reconnect does a full reload from disk, which loses an unpersisted
in-flight turn; the whole point of #254 is gapless afterSeq replay.

Rather than keep both, delete the dead chain and fold its one genuinely-better
trait — transport robustness — into the live path:

- Port the stale-stream watchdog + tab-visibility-resume from the deleted
  conversation-sse.ts into conversation-stream.ts. A silently-stalled stream
  (proxy idle-timeout, dead NAT binding, laptop sleep) now force-reconnects;
  the reconnect carries afterSeq=lastSeq so recovery is gapless. Thresholds are
  injectable for deterministic tests.
- Replace App.tsx's pagehide closeAllConversationEvents() with a new
  chatStore.closeAllConnections() that closes per-slice sockets without
  clearing state (bfcache-safe; the heavier reset() is for identity change).
- Delete conversation-sse.ts, conversation-events-client.ts,
  useConversationEvents.ts, conversation-subscribers.ts, and the
  conversation-events-client test. Net −520 lines of dead code.

The workspace /v1/events singleton (events-client.ts) is untouched — it's a
separate, live upstream improvement.

Adds conversation-stream watchdog tests. They import the real module via the
test/setup.ts preload snapshot because the chat-store.test, chatBleed, and
inlineError suites call `mock.module` on this path with a watchdog-less fake,
and bun's mock.module registry is process-global and never unwinds — the same
footgun setup.ts already guards against for api/client.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 web/src/App.tsx                               |   5 +-
 .../conversation-events-client.test.ts        | 195 -------------
 web/src/api/conversation-events-client.ts     | 171 -----------
 web/src/api/conversation-sse.ts               | 275 ------------------
 web/src/api/conversation-stream.test.ts       | 165 +++++++++++
 web/src/api/conversation-stream.ts            |  92 +++++-
 web/src/api/conversation-subscribers.ts       |  37 ---
 web/src/api/sse.ts                            |   5 +-
 web/src/hooks/chat-store.ts                   |  18 ++
 web/src/hooks/useConversationEvents.ts        |  72 -----
 web/test/setup.ts                             |  11 +
 11 files changed, 290 insertions(+), 756 deletions(-)
 delete mode 100644 web/src/__tests__/conversation-events-client.test.ts
 delete mode 100644 web/src/api/conversation-events-client.ts
 delete mode 100644 web/src/api/conversation-sse.ts
 create mode 100644 web/src/api/conversation-stream.test.ts
 delete mode 100644 web/src/api/conversation-subscribers.ts
 delete mode 100644 web/src/hooks/useConversationEvents.ts

diff --git a/web/src/App.tsx b/web/src/App.tsx
index 66180695..4df10029 100644
--- a/web/src/App.tsx
+++ b/web/src/App.tsx
@@ -11,7 +11,6 @@ import {
   setPlatformVersion,
   tryBootstrap,
 } from "./api/client";
-import { closeAllConversationEvents } from "./api/conversation-events-client";
 import { closeEventsClient } from "./api/events-client";
 import { AppWithChat } from "./components/AppWithChat";
 import { ErrorBoundary } from "./components/ErrorBoundary";
@@ -572,7 +571,9 @@ export function App() {
   useEffect(() => {
     const onPageHide = (): void => {
       closeEventsClient();
-      closeAllConversationEvents();
+      // Close per-conversation turn-stream sockets so the server reclaims
+      // SSE slots immediately. Slices stay intact for a bfcache restore.
+      chatStore.closeAllConnections();
     };
     window.addEventListener("pagehide", onPageHide);
     return () => {
diff --git a/web/src/__tests__/conversation-events-client.test.ts b/web/src/__tests__/conversation-events-client.test.ts
deleted file mode 100644
index b66a1c3b..00000000
--- a/web/src/__tests__/conversation-events-client.test.ts
+++ /dev/null
@@ -1,195 +0,0 @@
-// ---------------------------------------------------------------------------
-// conversation-events-client.ts — keyed conversation SSE singleton
-//
-// Mocks `./api/conversation-sse` so the singleton can be driven without
-// touching the network. Verifies the per-conversation ref-counted
-// open/close semantic, which is the contract that prevents the latent
-// "two consumers → two connections" regression even though today only
-// one consumer (ChatContext) subscribes.
-// ---------------------------------------------------------------------------
-
-import { afterEach, beforeEach, describe, expect, mock, test } from "bun:test";
-import type { ConversationSseConnection, ConversationSseOptions } from "../api/conversation-sse";
-
-let connectCalls = 0;
-let closeCalls = 0;
-const optionsByConvId = new Map<string, ConversationSseOptions>();
-
-class FakeConvConnection implements ConversationSseConnection {
-  closed = false;
-  conversationId: string;
-  constructor(conversationId: string) {
-    this.conversationId = conversationId;
-  }
-  close(): void {
-    if (this.closed) return;
-    this.closed = true;
-    closeCalls += 1;
-  }
-}
-
-const liveConnections: FakeConvConnection[] = [];
-
-function fakeConnectConversationEvents(options: ConversationSseOptions): ConversationSseConnection {
-  connectCalls += 1;
-  optionsByConvId.set(options.conversationId, options);
-  const conn = new FakeConvConnection(options.conversationId);
-  liveConnections.push(conn);
-  return conn;
-}
-
-mock.module("../api/conversation-sse", () => ({
-  connectConversationEvents: fakeConnectConversationEvents,
-}));
-
-// Import AFTER mocking so the singleton sees the fake.
-import { setAuthLifecycleHandler, setAuthToken } from "../api/client";
-import {
-  __internal__,
-  closeAllConversationEvents,
-  subscribeConversation,
-} from "../api/conversation-events-client";
-
-function resetCounters(): void {
-  connectCalls = 0;
-  closeCalls = 0;
-  optionsByConvId.clear();
-  liveConnections.length = 0;
-}
-
-beforeEach(() => {
-  resetCounters();
-  setAuthToken("tok-initial");
-  __internal__.resetForTest();
-});
-
-afterEach(() => {
-  __internal__.resetForTest();
-  setAuthLifecycleHandler(null);
-  setAuthToken(null);
-});
-
-describe("conversation-events-client — keyed singleton", () => {
-  test("first subscribe for a conversation opens exactly one connection", () => {
-    subscribeConversation("conv_a", { onEvent: () => {} });
-    expect(connectCalls).toBe(1);
-    expect(__internal__.hasConnection("conv_a")).toBe(true);
-    expect(__internal__.connectionCount()).toBe(1);
-  });
-
-  test("multiple subscribers to the same conversation share one connection", () => {
-    subscribeConversation("conv_a", { onEvent: () => {} });
-    subscribeConversation("conv_a", { onEvent: () => {} });
-    subscribeConversation("conv_a", { onEvent: () => {} });
-    expect(connectCalls).toBe(1);
-    expect(__internal__.connectionCount()).toBe(1);
-  });
-
-  test("different conversations get their own connections", () => {
-    subscribeConversation("conv_a", { onEvent: () => {} });
-    subscribeConversation("conv_b", { onEvent: () => {} });
-    expect(connectCalls).toBe(2);
-    expect(__internal__.connectionCount()).toBe(2);
-    expect(__internal__.hasConnection("conv_a")).toBe(true);
-    expect(__internal__.hasConnection("conv_b")).toBe(true);
-  });
-});
-
-describe("conversation-events-client — event fan-out", () => {
-  test("events route to every subscriber of the same conversation", () => {
-    const a = mock(() => {});
-    const b = mock(() => {});
-    const other = mock(() => {});
-    subscribeConversation("conv_a", { onEvent: a });
-    subscribeConversation("conv_a", { onEvent: b });
-    subscribeConversation("conv_b", { onEvent: other });
-
-    optionsByConvId.get("conv_a")?.onEvent("text.delta", { delta: "hi" });
-
-    expect(a).toHaveBeenCalledTimes(1);
-    expect(b).toHaveBeenCalledTimes(1);
-    expect(other).toHaveBeenCalledTimes(0);
-  });
-
-  test("onReconnect fires for every registered reconnect handler", () => {
-    const a = mock(() => {});
-    const b = mock(() => {});
-    subscribeConversation("conv_a", { onEvent: () => {}, onReconnect: a });
-    subscribeConversation("conv_a", { onEvent: () => {}, onReconnect: b });
-
-    optionsByConvId.get("conv_a")?.onReconnect?.();
-
-    expect(a).toHaveBeenCalledTimes(1);
-    expect(b).toHaveBeenCalledTimes(1);
-  });
-
-  test("a throwing handler does not block siblings", () => {
-    const thrower = mock(() => {
-      throw new Error("boom");
-    });
-    const good = mock(() => {});
-    subscribeConversation("conv_a", { onEvent: thrower });
-    subscribeConversation("conv_a", { onEvent: good });
-
-    optionsByConvId.get("conv_a")?.onEvent("text.delta", {});
-
-    expect(thrower).toHaveBeenCalledTimes(1);
-    expect(good).toHaveBeenCalledTimes(1);
-  });
-});
-
-describe("conversation-events-client — ref-counted teardown", () => {
-  test("last unsubscribe closes the conversation's connection", () => {
-    const unsubA = subscribeConversation("conv_a", { onEvent: () => {} });
-    const unsubB = subscribeConversation("conv_a", { onEvent: () => {} });
-    expect(__internal__.connectionCount()).toBe(1);
-
-    unsubA();
-    // Still one subscriber → connection stays.
-    expect(__internal__.hasConnection("conv_a")).toBe(true);
-    expect(closeCalls).toBe(0);
-
-    unsubB();
-    // No subscribers → close.
-    expect(__internal__.hasConnection("conv_a")).toBe(false);
-    expect(closeCalls).toBe(1);
-  });
-
-  test("unsubscribing one conversation doesn't affect others", () => {
-    const unsubA = subscribeConversation("conv_a", { onEvent: () => {} });
-    subscribeConversation("conv_b", { onEvent: () => {} });
-
-    unsubA();
-    expect(__internal__.hasConnection("conv_a")).toBe(false);
-    expect(__internal__.hasConnection("conv_b")).toBe(true);
-  });
-
-  test("unsubscribe is idempotent (calling twice is safe)", () => {
-    const unsub = subscribeConversation("conv_a", { onEvent: () => {} });
-    unsub();
-    expect(() => unsub()).not.toThrow();
-    expect(closeCalls).toBe(1);
-  });
-});
-
-describe("conversation-events-client — auth lifecycle", () => {
-  test("auth-lifecycle fire closes every active conversation stream", () => {
-    subscribeConversation("conv_a", { onEvent: () => {} });
-    subscribeConversation("conv_b", { onEvent: () => {} });
-    expect(__internal__.connectionCount()).toBe(2);
-
-    setAuthToken(null);
-
-    expect(__internal__.connectionCount()).toBe(0);
-    // No auto-rebuild — conversation streams are user-driven.
-  });
-
-  test("closeAllConversationEvents is idempotent", () => {
-    expect(() => closeAllConversationEvents()).not.toThrow();
-    expect(closeCalls).toBe(0);
-    subscribeConversation("conv_a", { onEvent: () => {} });
-    closeAllConversationEvents();
-    expect(closeCalls).toBe(1);
-    expect(() => closeAllConversationEvents()).not.toThrow();
-  });
-});
diff --git a/web/src/api/conversation-events-client.ts b/web/src/api/conversation-events-client.ts
deleted file mode 100644
index e73d86ac..00000000
--- a/web/src/api/conversation-events-client.ts
+++ /dev/null
@@ -1,171 +0,0 @@
-// ---------------------------------------------------------------------------
-// Per-conversation Event Stream — keyed singleton client
-//
-// One `GET /v1/conversations/:id/events` SSE connection per ACTIVE
-// conversation, fanned out to many subscribers via `subscribeConversation`.
-// Same singleton pattern as `events-client.ts`, but keyed by
-// `conversationId` and ref-counted: when the last subscriber for a
-// conversation unsubscribes, that conversation's connection closes.
-// (Conversations are mounted / unmounted as the user navigates; the
-// workspace stream is tab-life because it always has a consumer.)
-//
-// Why this exists. Today only `ChatContext.tsx:170` calls
-// `useConversationEvents`, so it's a singleton by coincidence. The
-// moment a second component starts subscribing — a preview pane, a
-// notification surface, an embedded view — the per-component
-// connectConversationEvents pattern would silently duplicate the
-// connection per conversation. Building the singleton up-front prevents
-// tomorrow's regression at zero ongoing cost.
-//
-// Auth lifecycle: identity rotation closes every active conversation
-// stream. Existing subscribers may re-subscribe after navigation; we
-// don't auto-rebuild like the workspace stream because conversation
-// streams are user-driven (mounted by ChatContext on conversation
-// focus), not always-on substrate.
-// ---------------------------------------------------------------------------
-
-import { addAuthLifecycleHandler, getAuthToken } from "./client";
-import { type ConversationSseConnection, connectConversationEvents } from "./conversation-sse";
-
-type EventHandler = (type: string, data: unknown) => void;
-type ReconnectHandler = () => void;
-
-interface ConversationEntry {
-  connection: ConversationSseConnection;
-  eventHandlers: Set<EventHandler>;
-  reconnectHandlers: Set<ReconnectHandler>;
-}
-
-const entries = new Map<string, ConversationEntry>();
-
-function ensureEntry(conversationId: string): ConversationEntry {
-  const existing = entries.get(conversationId);
-  if (existing) return existing;
-
-  // Create the entry first so the `onEvent` / `onReconnect` closures
-  // below can reference it directly. Closing over `entries.get(...)`
-  // in each callback would re-look-up every event.
-  const entry: ConversationEntry = {
-    connection: null as unknown as ConversationSseConnection,
-    eventHandlers: new Set(),
-    reconnectHandlers: new Set(),
-  };
-  entries.set(conversationId, entry);
-
-  entry.connection = connectConversationEvents({
-    conversationId,
-    token: getAuthToken() ?? undefined,
-    onEvent: (type, data) => {
-      for (const h of entry.eventHandlers) {
-        try {
-          h(type, data);
-        } catch (err) {
-          console.warn("[conv-events-client] event handler threw:", err);
-        }
-      }
-    },
-    onReconnect: () => {
-      for (const h of entry.reconnectHandlers) {
-        try {
-          h();
-        } catch (err) {
-          console.warn("[conv-events-client] reconnect handler threw:", err);
-        }
-      }
-    },
-    // Surface unrecoverable transport errors (403 after participant
-    // removal, persistent auth failure) the way the pre-singleton hook
-    // did — silent failure makes a dying conversation stream
-    // undiagnosable. Drop the entry so a later subscribe re-attempts.
-    onError: (err) => {
-      console.warn(`[conv-events-client] stream error for ${conversationId}:`, err.message);
-      entries.delete(conversationId);
-    },
-  });
-
-  return entry;
-}
-
-function closeEntry(conversationId: string): void {
-  const entry = entries.get(conversationId);
-  if (!entry) return;
-  entries.delete(conversationId);
-  try {
-    entry.connection.close();
-  } catch (err) {
-    // The transport already swallows close errors internally; logging
-    // here just in case a future implementation throws.
-    console.warn("[conv-events-client] close threw for", conversationId, err);
-  }
-}
-
-/**
- * Close every active conversation stream. Used by the auth lifecycle
- * handler below and by `pagehide` cleanup in `App.tsx`. Idempotent.
- */
-export function closeAllConversationEvents(): void {
-  for (const id of Array.from(entries.keys())) {
-    closeEntry(id);
-  }
-}
-
-// Identity rotation drops every conversation stream. Unlike the
-// workspace events client, we don't auto-rebuild — conversation streams
-// are user-driven (mounted by ChatContext when a conversation is in
-// focus), so the next conversation focus will open a fresh stream
-// under the new identity.
-const authLifecycleHandler = closeAllConversationEvents;
-addAuthLifecycleHandler(authLifecycleHandler);
-
-export interface ConversationSubscription {
-  /** Fires for every SSE event on this conversation's stream. */
-  onEvent: EventHandler;
-  /** Fires after a reconnect — caller should reload missed messages. */
-  onReconnect?: ReconnectHandler;
-}
-
-/**
- * Subscribe to a conversation's SSE event stream. The first subscribe
- * for a given `conversationId` opens the underlying connection; the
- * last unsubscribe closes it. Ref-counted per conversation.
- *
- * Returns an unsubscribe function. Calling it removes this subscription
- * and, if no subscriptions remain for the conversation, tears down the
- * connection.
- */
-export function subscribeConversation(
-  conversationId: string,
-  sub: ConversationSubscription,
-): () => void {
-  const entry = ensureEntry(conversationId);
-  entry.eventHandlers.add(sub.onEvent);
-  if (sub.onReconnect) entry.reconnectHandlers.add(sub.onReconnect);
-
-  return () => {
-    const current = entries.get(conversationId);
-    if (!current) return;
-    current.eventHandlers.delete(sub.onEvent);
-    if (sub.onReconnect) current.reconnectHandlers.delete(sub.onReconnect);
-    if (current.eventHandlers.size === 0 && current.reconnectHandlers.size === 0) {
-      closeEntry(conversationId);
-    }
-  };
-}
-
-// ── Test seams ───────────────────────────────────────────────────────
-
-export const __internal__ = {
-  hasConnection(conversationId: string): boolean {
-    return entries.has(conversationId);
-  },
-  connectionCount(): number {
-    return entries.size;
-  },
-  resetForTest(): void {
-    closeAllConversationEvents();
-    // Other test files may have cleared the global lifecycle Set;
-    // re-register idempotently. See events-client.ts for the same
-    // pattern + rationale.
-    addAuthLifecycleHandler(authLifecycleHandler);
-  },
-};
diff --git a/web/src/api/conversation-sse.ts b/web/src/api/conversation-sse.ts
deleted file mode 100644
index 84d7d8b0..00000000
--- a/web/src/api/conversation-sse.ts
+++ /dev/null
@@ -1,275 +0,0 @@
-/**
- * Per-conversation SSE client.
- *
- * Connects to GET /v1/conversations/:id/events to receive real-time
- * chat events from other participants in a shared conversation.
- *
- * Same pattern and reliability primitives as `sse.ts`:
- *   - fetch + ReadableStream (for custom auth headers — EventSource
- *     doesn't carry them)
- *   - auto-reconnect with jittered exponential backoff
- *   - heartbeat watchdog (force-reconnect on stale stream)
- *   - visibility-resume (immediate reconnect when the tab returns)
- *   - `onReconnect` for state resync (load missed messages)
- */
-
-import { refreshSession } from "./client";
-import {
-  clearConversationSubscriberId,
-  setConversationSubscriberId,
-} from "./conversation-subscribers";
-
-/** Options for connecting to a conversation event stream. */
-export interface ConversationSseOptions {
-  conversationId: string;
-  /** Base URL. Defaults to empty string (same-origin). */
-  apiBase?: string;
-  /** Bearer token for authorization. */
-  token?: string;
-  /** Called when an SSE event is received. */
-  onEvent: (type: string, data: unknown) => void;
-  /** Called on successful reconnection (caller should reload conversation). */
-  onReconnect?: () => void;
-  /** Called when the connection is lost (before reconnect). */
-  onDisconnect?: () => void;
-  /** Called on unrecoverable error (e.g. 403 after participant removal). */
-  onError?: (error: Error) => void;
-}
-
-/** Handle to close the conversation SSE connection. */
-export interface ConversationSseConnection {
-  close(): void;
-}
-
-const INITIAL_BACKOFF_MS = 1_000;
-const MAX_BACKOFF_MS = 30_000;
-const BACKOFF_MULTIPLIER = 2;
-const BACKOFF_JITTER = 0.2;
-const STALE_THRESHOLD_MS = 75_000;
-const WATCHDOG_TICK_MS = 15_000;
-
-export function connectConversationEvents(
-  options: ConversationSseOptions,
-): ConversationSseConnection {
-  const {
-    conversationId,
-    apiBase = "",
-    token,
-    onEvent,
-    onReconnect,
-    onDisconnect,
-    onError,
-  } = options;
-
-  let closed = false;
-  let abortController: AbortController | null = null;
-  let reconnectTimer: ReturnType<typeof setTimeout> | null = null;
-  let watchdogTimer: ReturnType<typeof setInterval> | null = null;
-  let backoff = INITIAL_BACKOFF_MS;
-  let hasConnectedBefore = false;
-  let lastFrameAt = Date.now();
-
-  function markFrame(): void {
-    lastFrameAt = Date.now();
-  }
-
-  function isStale(): boolean {
-    return Date.now() - lastFrameAt > STALE_THRESHOLD_MS;
-  }
-
-  function forceReconnect(): void {
-    abortController?.abort();
-  }
-
-  function startWatchdog(): void {
-    if (watchdogTimer) return;
-    watchdogTimer = setInterval(() => {
-      if (closed) return;
-      if (isStale()) forceReconnect();
-    }, WATCHDOG_TICK_MS);
-  }
-
-  function stopWatchdog(): void {
-    if (watchdogTimer) {
-      clearInterval(watchdogTimer);
-      watchdogTimer = null;
-    }
-  }
-
-  function onVisibilityChange(): void {
-    if (closed) return;
-    if (typeof document === "undefined") return;
-    if (document.visibilityState !== "visible") return;
-    if (isStale()) forceReconnect();
-  }
-
-  if (typeof document !== "undefined") {
-    document.addEventListener("visibilitychange", onVisibilityChange);
-  }
-
-  async function connect(): Promise<void> {
-    if (closed) return;
-
-    abortController = new AbortController();
-    const hdrs: Record<string, string> = {};
-    if (token && token !== "__cookie__") {
-      hdrs.Authorization = `Bearer ${token}`;
-    }
-
-    try {
-      const res = await fetch(
-        `${apiBase}/v1/conversations/${encodeURIComponent(conversationId)}/events`,
-        {
-          headers: hdrs,
-          credentials: "include",
-          signal: abortController.signal,
-        },
-      );
-
-      if (res.status === 401) {
-        // Attempt silent token refresh before giving up
-        const refreshed = await refreshSession();
-        if (refreshed) {
-          scheduleReconnect();
-          return;
-        }
-        onError?.(new Error("Conversation SSE auth failed after token refresh"));
-        return;
-      }
-
-      if (!res.ok) {
-        // 403/404 = access denied or removed — don't reconnect
-        if (res.status === 403 || res.status === 404) {
-          onError?.(new Error(`Conversation access denied: ${res.status}`));
-          return;
-        }
-        throw new Error(`Conversation SSE failed: ${res.status} ${res.statusText}`);
-      }
-
-      // Connected successfully — reset backoff
-      backoff = INITIAL_BACKOFF_MS;
-      markFrame();
-      startWatchdog();
-
-      // If this is a reconnect, notify so caller can reload missed messages
-      if (hasConnectedBefore) {
-        onReconnect?.();
-      }
-      hasConnectedBefore = true;
-
-      const reader = res.body?.getReader();
-      if (!reader) throw new Error("No response body");
-
-      const decoder = new TextDecoder();
-      let buffer = "";
-
-      for (;;) {
-        const { done, value } = await reader.read();
-        if (done || closed) break;
-        markFrame();
-
-        buffer += decoder.decode(value, { stream: true });
-        const lines = buffer.split("\n");
-        buffer = lines.pop() ?? "";
-
-        let currentEvent = "";
-        for (const line of lines) {
-          if (line.startsWith("event: ")) {
-            currentEvent = line.slice(7).trim();
-          } else if (line.startsWith("data: ") && currentEvent) {
-            try {
-              const data = JSON.parse(line.slice(6));
-              if (currentEvent === "subscribed") {
-                // Server-issued subscriber id — record it so the
-                // chat-stream POST can suppress self-echo. We
-                // deliberately don't surface this event to onEvent;
-                // it's plumbing, not a chat event.
-                const subscriberId = (data as { subscriberId?: unknown })?.subscriberId;
-                if (typeof subscriberId === "string") {
-                  setConversationSubscriberId(conversationId, subscriberId);
-                }
-              } else {
-                onEvent(currentEvent, data);
-              }
-            } catch {
-              // Skip malformed data lines
-            }
-            currentEvent = "";
-          }
-        }
-      }
-
-      // Stream ended — reconnect unless closed
-      if (!closed) {
-        stopWatchdog();
-        onDisconnect?.();
-        scheduleReconnect();
-      }
-    } catch (err) {
-      if (closed) return;
-      if (err instanceof DOMException && err.name === "AbortError") {
-        // Self-aborted (watchdog / visibility) — reschedule.
-        stopWatchdog();
-        onDisconnect?.();
-        scheduleReconnect();
-        return;
-      }
-
-      stopWatchdog();
-      onDisconnect?.();
-
-      // 403 is unrecoverable (access denied). 401 — try refresh first.
-      if (err instanceof Error && err.message.includes("401")) {
-        const refreshed = await refreshSession();
-        if (refreshed) {
-          scheduleReconnect();
-          return;
-        }
-        onError?.(err);
-        return;
-      }
-      if (err instanceof Error && err.message.includes("403")) {
-        onError?.(err);
-        return;
-      }
-
-      scheduleReconnect();
-    }
-  }
-
-  function scheduleReconnect(): void {
-    if (closed) return;
-    if (reconnectTimer) return;
-    const jittered = backoff * (1 - BACKOFF_JITTER + Math.random() * 2 * BACKOFF_JITTER);
-    reconnectTimer = setTimeout(() => {
-      reconnectTimer = null;
-      backoff = Math.min(backoff * BACKOFF_MULTIPLIER, MAX_BACKOFF_MS);
-      connect();
-    }, jittered);
-  }
-
-  connect();
-
-  return {
-    close() {
-      closed = true;
-      stopWatchdog();
-      if (typeof document !== "undefined") {
-        document.removeEventListener("visibilitychange", onVisibilityChange);
-      }
-      if (reconnectTimer) {
-        clearTimeout(reconnectTimer);
-        reconnectTimer = null;
-      }
-      if (abortController) {
-        abortController.abort();
-        abortController = null;
-      }
-      // Drop the cached subscriber id — the next subscription gets a
-      // fresh server-issued id, so a stale entry would mislead the
-      // chat-stream POST into excluding a subscriber that no longer
-      // exists.
-      clearConversationSubscriberId(conversationId);
-    },
-  };
-}
diff --git a/web/src/api/conversation-stream.test.ts b/web/src/api/conversation-stream.test.ts
new file mode 100644
index 00000000..f2c33f35
--- /dev/null
+++ b/web/src/api/conversation-stream.test.ts
@@ -0,0 +1,165 @@
+// ---------------------------------------------------------------------------
+// conversation-stream.ts — transport robustness (watchdog + visibility-resume)
+//
+// The seq-based replay path (afterSeq resume) is exercised end-to-end by the
+// chat-store suite. These tests pin the transport-layer behavior ported from
+// the former conversation-sse.ts: a silently-stalled stream (no error, no
+// close — just no frames) must be force-reconnected, and a foregrounded tab
+// must reconnect immediately rather than wait for the next watchdog tick.
+//
+// Determinism: thresholds are injected tiny (stale=30ms, tick=10ms) so the
+// watchdog fires within the test window using real timers. The fetch mock
+// returns a stream that emits the `subscribed` frame then goes silent, which
+// is exactly the stall the watchdog exists to recover from.
+// ---------------------------------------------------------------------------
+
+import { afterEach, beforeEach, describe, expect, test } from "bun:test";
+// Use the real module captured in the preload (test/setup.ts), NOT a direct
+// `import from "./conversation-stream"`: sibling suites (chat-store.test,
+// chatBleed, inlineError) `mock.module` this path with a watchdog-less fake,
+// and that mock is process-global + permanent. Importing directly would
+// resolve to their fake whenever this file runs after them.
+import { realConversationStream } from "../../test/setup";
+
+const { connectConversationStream } = realConversationStream;
+
+let originalFetch: typeof globalThis.fetch;
+
+/** Poll `predicate` every 10ms up to `timeoutMs`. Resolves true as soon as it
+ *  holds, false on timeout. Load-tolerant — the watchdog fires on a real timer
+ *  whose callback can be delayed under a busy event loop (full-suite runs), so
+ *  a fixed sleep races; polling waits exactly as long as needed. */
+async function waitFor(predicate: () => boolean, timeoutMs = 2_000): Promise<boolean> {
+  const deadline = Date.now() + timeoutMs;
+  while (Date.now() < deadline) {
+    if (predicate()) return true;
+    await new Promise((r) => setTimeout(r, 10));
+  }
+  return predicate();
+}
+
+/** Build an SSE Response whose body emits `subscribed` then stays open and
+ *  silent forever (until aborted). Mirrors a proxy that holds the connection
+ *  but stops forwarding bytes. */
+function silentStreamResponse(signal: AbortSignal): Response {
+  const body = new ReadableStream<Uint8Array>({
+    start(controller) {
+      const enc = new TextEncoder();
+      controller.enqueue(
+        enc.encode(
+          `event: subscribed\ndata: ${JSON.stringify({ isActive: false, activeSeq: 0 })}\n\n`,
+        ),
+      );
+      // Never enqueue again. On abort, error the stream with an AbortError —
+      // exactly what a real aborted fetch body does — so the client takes its
+      // immediate-reconnect path (vs the backoff path used for clean EOF).
+      signal.addEventListener("abort", () => {
+        try {
+          controller.error(new DOMException("Aborted", "AbortError"));
+        } catch {
+          // already closed/errored
+        }
+      });
+    },
+  });
+  return new Response(body, { status: 200, headers: { "content-type": "text/event-stream" } });
+}
+
+beforeEach(() => {
+  originalFetch = globalThis.fetch;
+});
+
+afterEach(() => {
+  globalThis.fetch = originalFetch;
+});
+
+describe("conversation-stream watchdog", () => {
+  test("force-reconnects a silently-stalled stream", async () => {
+    const urls: string[] = [];
+    globalThis.fetch = (async (input: string | URL | Request, init?: RequestInit) => {
+      const url = typeof input === "string" ? input : input.toString();
+      urls.push(url);
+      return silentStreamResponse(init?.signal as AbortSignal);
+    }) as typeof fetch;
+
+    const conn = connectConversationStream({
+      conversationId: "conv_abc",
+      onEvent: () => {},
+      staleThresholdMs: 30,
+      watchdogTickMs: 10,
+    });
+
+    // First connect is immediate; the watchdog detects staleness (>30ms with
+    // no frame) and force-reconnects. Poll so a busy event loop doesn't race.
+    const reconnected = await waitFor(() => urls.length >= 2);
+    conn.close();
+
+    expect(reconnected).toBe(true);
+    expect(urls.length).toBeGreaterThanOrEqual(2);
+    // Every (re)connect carries the afterSeq resume param — gapless by design.
+    for (const u of urls) expect(u).toContain("afterSeq=");
+  });
+
+  test("does not reconnect after close()", async () => {
+    let calls = 0;
+    globalThis.fetch = (async (input: string | URL | Request, init?: RequestInit) => {
+      calls++;
+      return silentStreamResponse(init?.signal as AbortSignal);
+    }) as typeof fetch;
+
+    const conn = connectConversationStream({
+      conversationId: "conv_abc",
+      onEvent: () => {},
+      staleThresholdMs: 30,
+      watchdogTickMs: 10,
+    });
+
+    // Wait for the first connect to land (poll, not a fixed sleep), then close.
+    await waitFor(() => calls >= 1);
+    conn.close();
+    const afterClose = calls;
+
+    // Wait well past several watchdog ticks — the count must not grow.
+    await new Promise((r) => setTimeout(r, 120));
+    expect(calls).toBe(afterClose);
+  });
+
+  test("visibility-resume reconnects a stale backgrounded tab on foreground", async () => {
+    const urls: string[] = [];
+    globalThis.fetch = (async (input: string | URL | Request, init?: RequestInit) => {
+      const url = typeof input === "string" ? input : input.toString();
+      urls.push(url);
+      return silentStreamResponse(init?.signal as AbortSignal);
+    }) as typeof fetch;
+
+    // Big watchdog tick so the ONLY thing that can trigger a reconnect within
+    // the window is the visibility handler — isolates the behavior under test.
+    const conn = connectConversationStream({
+      conversationId: "conv_abc",
+      onEvent: () => {},
+      staleThresholdMs: 20,
+      watchdogTickMs: 10_000,
+    });
+
+    // Wait for the first connect to land, then let it go stale (>20ms idle).
+    await waitFor(() => urls.length >= 1);
+    await new Promise((r) => setTimeout(r, 30));
+    const beforeVisibility = urls.length;
+
+    // Simulate tab returning to foreground. Construct the event from the
+    // happy-dom window realm (globalThis.Event is Bun-native and would fail
+    // happy-dom's cross-realm instanceof check in dispatchEvent).
+    Object.defineProperty(document, "visibilityState", {
+      value: "visible",
+      configurable: true,
+    });
+    document.dispatchEvent(new window.Event("visibilitychange"));
+
+    // The big watchdog tick (10s) can't fire in-window, so any reconnect here
+    // is the visibility handler's doing.
+    const resumed = await waitFor(() => urls.length > beforeVisibility);
+    conn.close();
+
+    expect(resumed).toBe(true);
+  });
+});
diff --git a/web/src/api/conversation-stream.ts b/web/src/api/conversation-stream.ts
index 30a44afd..c944a58f 100644
--- a/web/src/api/conversation-stream.ts
+++ b/web/src/api/conversation-stream.ts
@@ -10,6 +10,16 @@
  * highest seq seen and reconnect with `afterSeq=<lastSeq>`, so a dropped
  * connection resumes seamlessly with no gap or duplication — no full reload.
  *
+ * Transport robustness (ported from the former conversation-sse.ts):
+ *   - stale-stream watchdog: a silent connection (proxy idle-timeout, dead
+ *     NAT binding, laptop sleep) stops delivering frames without surfacing an
+ *     error. A periodic watchdog force-reconnects when no frame has arrived
+ *     within `staleThresholdMs`. The reconnect carries `afterSeq=lastSeq`, so
+ *     it's gapless — the seq machinery makes the recovery free.
+ *   - visibility-resume: when a backgrounded tab returns to foreground and the
+ *     stream is stale, reconnect immediately instead of waiting for the next
+ *     watchdog tick.
+ *
  * This viewer assumes the RunBus (seq'd) path. The legacy `/v1/chat` and
  * `/v1/chat/stream` endpoints fan out to the same conversation subscribers via
  * `broadcastToConversation`, which is seq-less (no `id:` line) and not RunBus-
@@ -21,6 +31,12 @@
 
 import { refreshSession } from "./client";
 
+/** No-frame interval after which the watchdog force-reconnects. Set to 2.5x the
+ *  server's 30s heartbeat so a missed heartbeat or two doesn't churn. */
+const DEFAULT_STALE_THRESHOLD_MS = 75_000;
+/** How often the watchdog checks for staleness. */
+const DEFAULT_WATCHDOG_TICK_MS = 15_000;
+
 export interface ConversationStreamOptions {
   conversationId: string;
   apiBase?: string;
@@ -34,6 +50,11 @@ export interface ConversationStreamOptions {
   onSubscribed?: (info: { isActive: boolean; activeSeq: number }) => void;
   /** Called on unrecoverable error (403/404/auth). */
   onError?: (error: Error) => void;
+  /** No-frame interval before the watchdog force-reconnects. Default 75s.
+   *  Exposed for tests to drive staleness deterministically. */
+  staleThresholdMs?: number;
+  /** Watchdog poll interval. Default 15s. Exposed for tests. */
+  watchdogTickMs?: number;
 }
 
 export interface ConversationStreamConnection {
@@ -47,14 +68,67 @@ const BACKOFF_MULTIPLIER = 2;
 export function connectConversationStream(
   options: ConversationStreamOptions,
 ): ConversationStreamConnection {
-  const { conversationId, apiBase = "", token, onEvent, onSubscribed, onError } = options;
+  const {
+    conversationId,
+    apiBase = "",
+    token,
+    onEvent,
+    onSubscribed,
+    onError,
+    staleThresholdMs = DEFAULT_STALE_THRESHOLD_MS,
+    watchdogTickMs = DEFAULT_WATCHDOG_TICK_MS,
+  } = options;
 
   let closed = false;
   let abortController: AbortController | null = null;
   let reconnectTimer: ReturnType<typeof setTimeout> | null = null;
+  let watchdogTimer: ReturnType<typeof setInterval> | null = null;
   let backoff = INITIAL_BACKOFF_MS;
   // Track the resume point so a reconnect picks up exactly where we left off.
   let lastSeq = options.afterSeq ?? 0;
+  // Timestamp of the last chunk received (or successful connect); drives stale detection.
+  let lastFrameAt = Date.now();
+
+  function markFrame(): void {
+    lastFrameAt = Date.now();
+  }
+
+  function isStale(): boolean {
+    return Date.now() - lastFrameAt > staleThresholdMs;
+  }
+
+  /** Abort the live fetch. The read loop's catch path sees the AbortError and
+   *  reconnects immediately (with afterSeq=lastSeq), so this is the single
+   *  "force a fresh stream" lever shared by the watchdog and visibility handler. */
+  function forceReconnect(): void {
+    abortController?.abort();
+  }
+
+  function startWatchdog(): void {
+    if (watchdogTimer) return;
+    watchdogTimer = setInterval(() => {
+      if (closed) return;
+      if (isStale()) forceReconnect();
+    }, watchdogTickMs);
+  }
+
+  function stopWatchdog(): void {
+    if (watchdogTimer) {
+      clearInterval(watchdogTimer);
+      watchdogTimer = null;
+    }
+  }
+
+  function onVisibilityChange(): void {
+    if (closed) return;
+    if (typeof document === "undefined") return;
+    if (document.visibilityState !== "visible") return;
+    if (isStale()) forceReconnect();
+  }
+
+  if (typeof document !== "undefined") {
+    document.addEventListener("visibilitychange", onVisibilityChange);
+  }
 
   async function connect(): Promise<void> {
     if (closed) return;
@@ -85,6 +159,8 @@ export function connectConversationStream(
       }
 
       backoff = INITIAL_BACKOFF_MS;
+      markFrame();
+      startWatchdog();
       const reader = res.body?.getReader();
       if (!reader) throw new Error("No response body");
 
@@ -96,6 +172,7 @@ export function connectConversationStream(
       for (;;) {
         const { done, value } = await reader.read();
         if (done || closed) break;
+        markFrame();
         buffer += decoder.decode(value, { stream: true });
         const lines = buffer.split("\n");
         buffer = lines.pop() ?? "";
@@ -129,10 +206,17 @@ export function connectConversationStream(
         }
       }
 
+      stopWatchdog();
       if (!closed) scheduleReconnect();
     } catch (err) {
+      stopWatchdog();
       if (closed) return;
-      if (err instanceof DOMException && err.name === "AbortError") return;
+      if (err instanceof DOMException && err.name === "AbortError") {
+        // Self-aborted by the watchdog / visibility handler — reconnect
+        // immediately (no backoff; the stream was stale, not erroring).
+        connect();
+        return;
+      }
       if (err instanceof Error && err.message.includes("403")) {
         onError?.(err);
         return;
@@ -158,6 +242,10 @@ export function connectConversationStream(
         clearTimeout(reconnectTimer);
         reconnectTimer = null;
       }
+      stopWatchdog();
+      if (typeof document !== "undefined") {
+        document.removeEventListener("visibilitychange", onVisibilityChange);
+      }
       abortController?.abort();
       abortController = null;
     },
diff --git a/web/src/api/conversation-subscribers.ts b/web/src/api/conversation-subscribers.ts
deleted file mode 100644
index d1175bc4..00000000
--- a/web/src/api/conversation-subscribers.ts
+++ /dev/null
@@ -1,37 +0,0 @@
-/**
- * Per-conversation `subscriberId` registry.
- *
- * The server-issued subscriber id arrives in the first SSE frame
- * (`event: subscribed`) once a conversation event stream opens. We
- * stash it here so the chat-stream POST path can pick it up via
- * `getConversationSubscriberId(convId)` and forward it as
- * `X-Origin-Subscriber-Id` — that makes the broadcast skip this
- * tab's own conv-events subscription and prevents the sender from
- * double-handling every event (once via the chat-stream HTTP
- * response, once via the broadcast hitting its own subscription).
- *
- * Cleared on stream cancel / close to avoid stale ids leaking into
- * a future stream attempt for the same conv.
- *
- * This registry lives in its own module — not in `conversation-sse.ts` —
- * so `client.ts` can read subscriber ids without importing
- * `conversation-sse.ts`, which imports `refreshSession` back from
- * `client.ts`. That was a circular import (`client ↔ conversation-sse`);
- * Bun resolves cycles in module-evaluation order, which is non-deterministic
- * under the parallel test runner and intermittently surfaced client.ts's
- * named exports as "not found". Holding the shared state here breaks the cycle:
- * `client.ts` and `conversation-sse.ts` both depend only on this leaf module.
- */
-const conversationSubscriberIds = new Map<string, string>();
-
-export function getConversationSubscriberId(conversationId: string): string | undefined {
-  return conversationSubscriberIds.get(conversationId);
-}
-
-export function setConversationSubscriberId(conversationId: string, subscriberId: string): void {
-  conversationSubscriberIds.set(conversationId, subscriberId);
-}
-
-export function clearConversationSubscriberId(conversationId: string): void {
-  conversationSubscriberIds.delete(conversationId);
-}
diff --git a/web/src/api/sse.ts b/web/src/api/sse.ts
index 079d1cd8..50de77a7 100644
--- a/web/src/api/sse.ts
+++ b/web/src/api/sse.ts
@@ -23,8 +23,9 @@ export interface ConnectEventsOptions {
   /**
    * Called on successful reconnection (NOT the initial connect). Lets
    * consumers refetch state that may have drifted during the gap —
-   * bundles, config, skills. Mirrors the same hook on
-   * `conversation-sse.ts` so call sites can route both with one pattern.
+   * bundles, config, skills. (The per-conversation turn stream handles its
+   * own gap recovery via seq-based replay in `conversation-stream.ts`; this
+   * hook is the workspace stream's equivalent, which has no seq cursor.)
    */
   onReconnect?: () => void;
   /** Called on unrecoverable error. */
diff --git a/web/src/hooks/chat-store.ts b/web/src/hooks/chat-store.ts
index 429d0445..be41b7d9 100644
--- a/web/src/hooks/chat-store.ts
+++ b/web/src/hooks/chat-store.ts
@@ -287,6 +287,13 @@ export interface ChatStore {
   retryLastMessage(key: string): string | null;
   simulateError(key: string, message: string): void;
   reset(): void;
+  /** Close every per-slice SSE socket WITHOUT clearing slice state. For
+   *  `pagehide` (tab close / bfcache enter): lets the server reclaim SSE
+   *  slots immediately instead of waiting on TCP teardown, while leaving
+   *  the in-memory slices intact so a bfcache restore can re-attach. The
+   *  heavier {@link reset} (which also clears all state) is for identity
+   *  change, not tab lifecycle. */
+  closeAllConnections(): void;
   sliceCount(): number;
 }
 
@@ -957,6 +964,16 @@ export function createChatStore(): ChatStore {
     for (const cb of streamingListeners) cb();
   }
 
+  function closeAllConnections(): void {
+    // Close sockets only — keep slices so a bfcache restore re-attaches.
+    // No listener notify: the snapshot is unchanged (we're not mutating
+    // isStreaming/state here; the socket close is invisible to render).
+    for (const slice of allSlices) {
+      slice.connection?.close();
+      slice.connection = null;
+    }
+  }
+
   return {
     ensureSlice,
     getSnapshot(key) {
@@ -1006,6 +1023,7 @@ export function createChatStore(): ChatStore {
     retryLastMessage,
     simulateError,
     reset,
+    closeAllConnections,
     sliceCount() {
       return allSlices.size;
     },
diff --git a/web/src/hooks/useConversationEvents.ts b/web/src/hooks/useConversationEvents.ts
deleted file mode 100644
index 09e21363..00000000
--- a/web/src/hooks/useConversationEvents.ts
+++ /dev/null
@@ -1,72 +0,0 @@
-/**
- * React hook for subscribing to per-conversation SSE events.
- *
- * Stage 1: conversations are single-owner; the broadcast still fires
- * server-side so this subscription is the same-user cross-tab sync
- * path (one user, multiple browser tabs/devices on the same
- * conversation). Stage 4 reintroduces multi-user sharing and this
- * hook's audience widens.
- *
- * Transport ownership lives in the keyed singleton at
- * `api/conversation-events-client.ts`. This hook is a thin subscriber:
- * the first mount for a given `conversationId` opens the underlying
- * connection, additional mounts share it, and the last unmount tears
- * it down. On reconnect, the hook fires `onReconnect` so the caller can
- * reload the full conversation to catch missed messages.
- */
-
-import { useEffect, useRef } from "react";
-import { subscribeConversation } from "../api/conversation-events-client";
-
-export interface ConversationEventCallbacks {
-  /** A user message arrived from another participant. */
-  onRemoteUserMessage: (data: {
-    userId: string;
-    displayName: string;
-    content: string;
-    timestamp: string;
-  }) => void;
-  /** A streaming event arrived from the assistant (responding to another user's message). */
-  onRemoteStreamEvent: (type: string, data: unknown) => void;
-  /** Connection was re-established — reload the conversation to catch missed messages. */
-  onReconnect: () => void;
-}
-
-export function useConversationEvents(
-  conversationId: string | null,
-  callbacks: ConversationEventCallbacks,
-): void {
-  // Keep callbacks in a ref so consumers can re-render without churning
-  // the subscription. The effect re-runs only on conversationId change.
-  const callbacksRef = useRef(callbacks);
-  callbacksRef.current = callbacks;
-
-  useEffect(() => {
-    if (!conversationId) return;
-
-    const unsubscribe = subscribeConversation(conversationId, {
-      onEvent: (type, data) => {
-        if (type === "user.message") {
-          callbacksRef.current.onRemoteUserMessage(
-            data as {
-              userId: string;
-              displayName: string;
-              content: string;
-              timestamp: string;
-            },
-          );
-        } else if (type === "heartbeat") {
-          // Ignore heartbeats — they're keep-alive frames, not chat events.
-        } else {
-          // text.delta, tool.start, tool.done, llm.done, done
-          callbacksRef.current.onRemoteStreamEvent(type, data);
-        }
-      },
-      onReconnect: () => {
-        callbacksRef.current.onReconnect();
-      },
-    });
-
-    return unsubscribe;
-  }, [conversationId]);
-}
diff --git a/web/test/setup.ts b/web/test/setup.ts
index 04a64003..f8e5d1e6 100644
--- a/web/test/setup.ts
+++ b/web/test/setup.ts
@@ -20,6 +20,17 @@ import * as realApiClient from "../src/api/client";
 
 export const realClient = { ...realApiClient };
 
+// Same defense for `conversation-stream`. chat-store.test / chatBleed /
+// inlineError all `mock.module("../api/conversation-stream", ...)` with a
+// fake `connectConversationStream` (they test chat-store without real SSE).
+// That mock is process-global and never unwinds, so conversation-stream's
+// OWN test — which needs the real watchdog/visibility implementation — gets
+// the fake if it runs after any of them. Capturing the real module here, in
+// the preload before any mock exists, gives that test a stable handle.
+import * as realConversationStreamMod from "../src/api/conversation-stream";
+
+export const realConversationStream = { ...realConversationStreamMod };
+
 const window = new Window({ url: "http://localhost" });
 
 // Register DOM globals that React and testing-library need

From 92f67b6b0c9bc04870fac4917dffc8a518d99396 Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Tue, 2 Jun 2026 16:52:00 -0500
Subject: [PATCH 21/26] fix(web): live-update the conversation list title via
 the correct iframe data-app
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The auto-title `conversation.title` SSE event reached the shell, but the
conversations-list iframe never updated until a refresh. `forwardConversationTitleToIframes`
targeted `iframe[data-app="@nimblebraininc/conversations"]` — the SDK
SynapseProvider app name — whereas `SlotRenderer` sets `data-app` to the
placement's serverName (`conversations`). The selector matched zero iframes,
so the in-place row patch never fired; only a refetch-from-disk (refresh)
surfaced the title.

Target `data-app="conversations"` — the same `data-app === serverName`
contract `useDataSync` relies on. Adds a regression test pinning the selector.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 .../lib/forward-conversation-title.test.ts    | 82 +++++++++++++++++++
 web/src/lib/forward-conversation-title.ts     | 17 ++--
 2 files changed, 93 insertions(+), 6 deletions(-)
 create mode 100644 web/src/lib/forward-conversation-title.test.ts

diff --git a/web/src/lib/forward-conversation-title.test.ts b/web/src/lib/forward-conversation-title.test.ts
new file mode 100644
index 00000000..5195813f
--- /dev/null
+++ b/web/src/lib/forward-conversation-title.test.ts
@@ -0,0 +1,82 @@
+// ---------------------------------------------------------------------------
+// forward-conversation-title — iframe targeting regression
+//
+// The live `conversation.title` SSE event is forwarded to the conversations
+// list iframe via postMessage so the row title updates without a refetch. The
+// iframe is addressed by its `data-app` attribute, which `SlotRenderer` sets to
+// the placement's *serverName* (`conversations`) — NOT the SDK SynapseProvider
+// app name (`@nimblebraininc/conversations`). Targeting the wrong value matches
+// zero iframes and the title silently never reaches the list (only a refresh,
+// which refetches from disk, then shows it). Pin the selector to serverName.
+// ---------------------------------------------------------------------------
+
+import { afterEach, describe, expect, test } from "bun:test";
+import { forwardConversationTitleToIframes } from "./forward-conversation-title";
+
+interface CapturedPost {
+  data: unknown;
+  targetOrigin: string;
+}
+
+let originalQSA: typeof document.querySelectorAll;
+
+afterEach(() => {
+  if (originalQSA) document.querySelectorAll = originalQSA;
+});
+
+/** Stub querySelectorAll to return a single fake iframe ONLY for the exact
+ *  selector the caller is expected to use. A mismatched selector (the bug)
+ *  falls through to the real (empty) DOM, so the post count stays 0. */
+function installIframeStub(expectedSelector: string): CapturedPost[] {
+  const posts: CapturedPost[] = [];
+  const iframe = {
+    contentWindow: {
+      postMessage(data: unknown, targetOrigin: string) {
+        posts.push({ data, targetOrigin });
+      },
+    },
+  } as unknown as HTMLIFrameElement;
+
+  originalQSA = document.querySelectorAll.bind(document);
+  document.querySelectorAll = ((selector: string) => {
+    if (selector === expectedSelector) {
+      return [iframe] as unknown as NodeListOf<Element>;
+    }
+    return originalQSA(selector);
+  }) as typeof document.querySelectorAll;
+
+  return posts;
+}
+
+describe("forwardConversationTitleToIframes", () => {
+  test("targets the conversations iframe by serverName data-app", () => {
+    const posts = installIframeStub('iframe[data-app="conversations"]');
+
+    forwardConversationTitleToIframes("conv_abc", "The Importance of Sleep");
+
+    expect(posts.length).toBe(1);
+    expect(posts[0]?.targetOrigin).toBe("*");
+    const data = posts[0]?.data as {
+      jsonrpc?: string;
+      method?: string;
+      params?: { conversationId?: string; title?: string };
+    };
+    expect(data?.jsonrpc).toBe("2.0");
+    expect(data?.method).toBe("synapse/conversation-title");
+    expect(data?.params?.conversationId).toBe("conv_abc");
+    expect(data?.params?.title).toBe("The Importance of Sleep");
+  });
+
+  test("no-op when no conversations iframe is mounted", () => {
+    // No matching iframe in the DOM — querySelectorAll returns empty for any
+    // selector. Forward must still perform its lookup, and must not throw.
+    originalQSA = document.querySelectorAll.bind(document);
+    const selectors: string[] = [];
+    document.querySelectorAll = ((selector: string) => {
+      selectors.push(selector);
+      return [] as unknown as NodeListOf<Element>;
+    }) as typeof document.querySelectorAll;
+    expect(() => forwardConversationTitleToIframes("conv_abc", "Title")).not.toThrow();
+    expect(selectors).toContain('iframe[data-app="conversations"]');
+  });
+});
diff --git a/web/src/lib/forward-conversation-title.ts b/web/src/lib/forward-conversation-title.ts
index 9f65733b..f75711e3 100644
--- a/web/src/lib/forward-conversation-title.ts
+++ b/web/src/lib/forward-conversation-title.ts
@@ -8,16 +8,21 @@
  * used to fire on title resolve. Sending the (conversationId, title) tuple
  * directly is one postMessage and an in-place state update.
  *
- * Targets only iframes whose `data-app` matches the conversations bundle
- * name (`@nimblebraininc/conversations`). Unrelated iframes never see the
- * message. No-op when the conversations panel isn't currently mounted —
- * the next mount loads from disk where the title is already persisted, so
- * there's no race.
+ * Targets the conversations iframe by its `data-app` attribute. That attribute
+ * is set by `SlotRenderer` to the placement's *serverName* (`conversations`) —
+ * NOT the SDK SynapseProvider app name (`@nimblebraininc/conversations`). Using
+ * the SDK name matches zero iframes and the title silently never reaches the
+ * list (only a refresh, which refetches from disk, surfaces it). This is the
+ * same `data-app === serverName` contract `useDataSync` relies on.
+ *
+ * Unrelated iframes never see the message. No-op when the conversations panel
+ * isn't currently mounted — the next mount loads from disk where the title is
+ * already persisted, so there's no race.
  *
  * @param conversationId Conversation whose title was just generated.
  * @param title          The generated title.
  */
-const CONVERSATIONS_APP = "@nimblebraininc/conversations";
+const CONVERSATIONS_APP = "conversations";
 
 export function forwardConversationTitleToIframes(conversationId: string, title: string): void {
   const iframes = document.querySelectorAll<HTMLIFrameElement>(

From 6b82c93bcbaef35d63fb726efad50510f468afd2 Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Tue, 2 Jun 2026 16:52:00 -0500
Subject: [PATCH 22/26] fix(web): recover from an unwatchable turn instead of
 hanging the spinner
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

When `startChatTurn` succeeds but the event stream then fails unrecoverably
(events route 403/404 or auth-fail after refresh — transient/5xx reconnect via
backoff and never reach here), the chat-store's stream `onError` was a no-op.
The fresh turn's optimistic assistant placeholder spun forever with no feed
and no error surfaced.

`onError` now stops the spinner and stamps a recoverable error on the empty
placeholder, keeping both the user message and placeholder (the turn ran
server-side and persists — this is a failure to WATCH it, not to run it; the
result is on disk and a reload surfaces it). Idle resumes (no live turn) are
left intact. Not reusing `handleTurnError`, which drops both placeholders —
correct only for a start failure.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 web/src/hooks/chat-store.ts | 31 ++++++++++++++++++++++++++++++-
 web/test/chat-store.test.ts | 26 ++++++++++++++++++++++++++
 2 files changed, 56 insertions(+), 1 deletion(-)

diff --git a/web/src/hooks/chat-store.ts b/web/src/hooks/chat-store.ts
index be41b7d9..b2b9f2c8 100644
--- a/web/src/hooks/chat-store.ts
+++ b/web/src/hooks/chat-store.ts
@@ -546,7 +546,36 @@ export function createChatStore(): ChatStore {
         applyStreamEvent(slice, type, data);
       },
       onError: () => {
-        // Leave the slice intact; the persisted history still renders.
+        // The stream gave up unrecoverably (events route 403/404 or auth fail
+        // after refresh; transient network / 5xx reconnect via backoff instead
+        // and never reach here). The turn itself runs to completion
+        // server-side and persists — this is a failure to WATCH it, not to run
+        // it, so we must NOT drop the optimistic placeholder pair the way a
+        // start-failure does (the user's message really was sent).
+        //
+        // For an idle resume (no live turn) there's nothing to clean up — the
+        // loaded disk history renders fine; leave it intact.
+        if (!slice.isStreaming) return;
+        // A fresh/active turn was being watched: without this the optimistic
+        // assistant placeholder spins forever with no feed and no error.
+        // Stop the spinner and stamp a recoverable error; the result is on
+        // disk, so reopening / reloading the conversation surfaces it.
+        slice.isStreaming = false;
+        slice.streamingState = null;
+        slice.preparingTool = null;
+        slice.pendingEcho = false;
+        const updated = [...slice.messages];
+        const last = updated[updated.length - 1];
+        if (last?.role === "assistant" && !last.content && (last.blocks?.length ?? 0) === 0) {
+          updated[updated.length - 1] = {
+            ...last,
+            error: "Lost the connection to this response. Reload to view it.",
+          };
+          slice.messages = updated;
+        } else {
+          slice.error = "Lost the connection to this response.";
+        }
+        commit(slice);
       },
     });
   }
diff --git a/web/test/chat-store.test.ts b/web/test/chat-store.test.ts
index dca8a29b..60ab9904 100644
--- a/web/test/chat-store.test.ts
+++ b/web/test/chat-store.test.ts
@@ -15,6 +15,7 @@ interface CapturedStream {
   conversationId: string;
   onEvent: (type: string, data: unknown, seq: number) => void;
   onSubscribed?: (info: { isActive: boolean; activeSeq: number }) => void;
+  onError?: (error: Error) => void;
   closed: boolean;
 }
 let streams: CapturedStream[] = [];
@@ -36,11 +37,13 @@ mock.module("../src/api/conversation-stream", () => ({
     conversationId: string;
     onEvent: (type: string, data: unknown, seq: number) => void;
     onSubscribed?: (info: { isActive: boolean; activeSeq: number }) => void;
+    onError?: (error: Error) => void;
   }) => {
     const entry: CapturedStream = {
       conversationId: opts.conversationId,
       onEvent: opts.onEvent,
       onSubscribed: opts.onSubscribed,
+      onError: opts.onError,
       closed: false,
     };
     streams.push(entry);
@@ -165,6 +168,29 @@ describe("chat-store viewer", () => {
     expect(s.closed).toBe(true);
   });
 
+  it("recovers from an unwatchable turn: stops the spinner, keeps the sent message, stamps a recoverable error", async () => {
+    const store = createChatStore();
+    await store.sendTurn("kA", { text: "go" });
+    const s = latestStream();
+    expect(store.getSnapshot("kA").isStreaming).toBe(true);
+
+    // The turn started server-side (startChatTurn resolved), but the event
+    // stream fails unrecoverably (events route 403/404/auth) before any frame.
+    s.onError?.(new Error("Conversation stream access denied: 403"));
+
+    const snap = store.getSnapshot("kA");
+    // Spinner cleared — no infinite hang.
+    expect(snap.isStreaming).toBe(false);
+    expect(snap.streamingState).toBeNull();
+    // The user's message is NOT dropped (the turn really ran + persisted).
+    const users = snap.messages.filter((m) => m.role === "user");
+    expect(users).toHaveLength(1);
+    expect(users[0].content).toBe("go");
+    // The empty assistant placeholder carries a recoverable error.
+    const assistant = lastAssistant(snap.messages);
+    expect(assistant?.error).toContain("Reload");
+  });
+
   it("does not clobber a slice that is streaming on loadConversation", async () => {
     const store = createChatStore();
     await store.sendTurn("conv_1", { text: "go" });

From c3a98d8a69a86ce6294bbbe9b4c457a40915af03 Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Tue, 2 Jun 2026 16:53:14 -0500
Subject: [PATCH 23/26] fix(runtime): allow identity-level chat-start instead
 of 500 on missing workspaceId

`startTurn` hard-threw when `request.workspaceId` was absent, but the sync
`chat()` it delegates to treats workspace as optional (Stage 2: chat is
identity-bound; the focused workspace is briefing context, not a requirement).
A `/v1/chat/start` from a home / identity route with no focused workspace hit
the throw and surfaced as a raw 500.

Fall back to the caller's personal workspace (`personalWorkspaceIdFor(ownerId)`)
for the conversation-metadata breadcrumb, matching `chat()`'s `sessionWsId`
resolution. Parity with `/v1/chat` and `/v1/chat/stream`; latent 500 gone.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 src/runtime/runtime.ts                 | 14 ++++++++++----
 test/integration/detached-turn.test.ts | 17 +++++++++++++++++
 2 files changed, 27 insertions(+), 4 deletions(-)

diff --git a/src/runtime/runtime.ts b/src/runtime/runtime.ts
index 2bfe22e3..a5751aea 100644
--- a/src/runtime/runtime.ts
+++ b/src/runtime/runtime.ts
@@ -968,14 +968,20 @@ export class Runtime {
    * {@link RunInProgressError} if a turn is already active for the conversation.
    */
   async startTurn(request: ChatRequest): Promise<{ conversationId: string }> {
-    if (!request.workspaceId) {
-      throw new Error("workspaceId is required. Every chat request must be workspace-scoped.");
-    }
     const store = this.findConversationStore();
     const ownerId = this.resolveOwnerId(request);
+    // `workspaceId` is the FOCUSED workspace (the `/w/:slug` the user is
+    // viewing), optional — exactly as the sync `chat()` path treats it. On a
+    // home / identity route there's no focus, so the turn is identity-level;
+    // fall back to the caller's personal workspace for the conversation
+    // metadata breadcrumb, matching `chat()`'s `sessionWsId` resolution. The
+    // turn itself is delegated to `chat()` below, which re-resolves the same
+    // fallback for tool scope. (Pre-Stage-2 this hard-threw; that surfaced as
+    // a raw 500 on a legitimate workspaceless chat-start.)
+    const wsId = request.workspaceId ?? personalWorkspaceIdFor(ownerId);
     const createOpts: CreateConversationOptions = {
       ownerId,
-      workspaceId: request.workspaceId,
+      workspaceId: wsId,
       ...(request.metadata ? { metadata: request.metadata } : {}),
     };
 
diff --git a/test/integration/detached-turn.test.ts b/test/integration/detached-turn.test.ts
index c3ccd5b5..dc761b3a 100644
--- a/test/integration/detached-turn.test.ts
+++ b/test/integration/detached-turn.test.ts
@@ -136,6 +136,23 @@ describe("detached turns (server-authoritative streaming)", () => {
     expect(again.conversationId).toBe(conversationId);
     await awaitTurn(conversationId);
   });
+
+  it("starts an identity-level turn with no workspaceId (personal-workspace fallback)", async () => {
+    // Parity with the sync `chat()` path and `/v1/chat`: a chat-start with no
+    // focused workspace (home / identity route) is identity-level, not an
+    // error. startTurn must fall back to the caller's personal workspace
+    // instead of throwing (which surfaced as a raw 500 via handleChatStart).
+    const { conversationId } = await runtime.startTurn({ message: "no workspace here" });
+    expect(conversationId).toMatch(/^conv_/);
+
+    const { status } = await awaitTurn(conversationId);
+    expect(status).toBe("done");
+
+    // Conversation persisted with the personal-workspace breadcrumb.
+    const conv = await runtime.findConversation(conversationId, { userId: "usr_default" });
+    expect(conv).not.toBeNull();
+    expect(conv?.workspaceId).toBe("ws_user_usr_default");
+  });
 });
 
 describe("cancel delivers a terminal frame to live viewers (Stop button)", () => {

From bac91a2da32e52c584cf6a8cc64be713eca790ca Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Tue, 2 Jun 2026 16:53:35 -0500
Subject: [PATCH 24/26] fix(api): reject a malformed conversationId with 400
 instead of 500
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

A chat request with a conversationId that doesn't match `conv_<16 hex>` (e.g.
a path-traversal probe like `../../foo`) bubbled a raw Error out of
`validateConversationId` → 500.

Two surfaces, two guards:
- JSON: add `pattern: CONVERSATION_ID_RE.source` to the `conversationId` field
  in `ChatRequestBody`, so `validateAgainst` rejects it as 400 at every JSON
  chat surface (`/v1/chat`, `/v1/chat/stream`, `/v1/chat/start`).
- multipart: `parseMultipartChatBody` parses raw (bypasses the schema), so
  validate the same regex there. Also guards the value before it reaches
  `ingestFiles`, which feeds it into file-store path building.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 src/api/handlers.ts                         | 12 +++++++++
 src/api/schemas/rest.ts                     | 11 +++++++-
 test/integration/detached-turn-http.test.ts | 29 +++++++++++++++++++++
 3 files changed, 51 insertions(+), 1 deletion(-)

diff --git a/src/api/handlers.ts b/src/api/handlers.ts
index b8f0eeb5..cb8467ea 100644
--- a/src/api/handlers.ts
+++ b/src/api/handlers.ts
@@ -9,6 +9,7 @@ import { resolveMimeType } from "../files/mime.ts";
 import type { FileEntry } from "../files/types.ts";
 import type { IdentityProvider, UserIdentity } from "../identity/provider.ts";
 import { DEV_IDENTITY } from "../identity/providers/dev.ts";
+import { CONVERSATION_ID_RE } from "../conversation/types.ts";
 import {
   ConversationAccessDeniedError,
   ConversationCorruptedError,
@@ -1598,6 +1599,17 @@ async function parseMultipartChatBody(
   const message = typeof messageRaw === "string" ? messageRaw : "";
 
   const conversationId = formData.get("conversationId");
+  // Reject a malformed conversationId before it reaches store path-building
+  // / ingestFiles (convId feeds the file-store path). The JSON surface gets
+  // this from the ChatRequestBody schema pattern; multipart parses raw, so
+  // validate the same shape here using the canonical conv_<16 hex> regex.
+  if (
+    typeof conversationId === "string" &&
+    conversationId &&
+    !CONVERSATION_ID_RE.test(conversationId)
+  ) {
+    return apiError(400, "bad_request", "Invalid conversationId format");
+  }
   const model = formData.get("model");
 
   let appContext: { appName: string; serverName: string } | undefined;
diff --git a/src/api/schemas/rest.ts b/src/api/schemas/rest.ts
index d2d9bd45..a2a5511a 100644
--- a/src/api/schemas/rest.ts
+++ b/src/api/schemas/rest.ts
@@ -21,6 +21,7 @@
 // ---------------------------------------------------------------------------
 
 import { type Static, Type } from "@sinclair/typebox";
+import { CONVERSATION_ID_RE } from "../../conversation/types.ts";
 
 // ── /v1/tools/call ───────────────────────────────────────────────────────
 
@@ -66,7 +67,15 @@ export const ChatRequestBody = Type.Object(
       description: "The user's message. Must be non-empty.",
     }),
     conversationId: Type.Optional(
-      Type.String({ description: "Existing conversation id; omit to start a new one." }),
+      Type.String({
+        // Constrain to the canonical `conv_<16 hex>` shape at the schema
+        // boundary so a malformed id (e.g. a path-traversal probe like
+        // `../../foo`) is a 400 at every JSON chat surface, rather than
+        // bubbling a raw Error out of `validateConversationId` → 500. The
+        // multipart path validates the same regex in parseMultipartChatBody.
+        pattern: CONVERSATION_ID_RE.source,
+        description: "Existing conversation id; omit to start a new one.",
+      }),
     ),
     model: Type.Optional(
       Type.String({ description: "Model override; omit to use the workspace default." }),
diff --git a/test/integration/detached-turn-http.test.ts b/test/integration/detached-turn-http.test.ts
index 95645623..e08d40b0 100644
--- a/test/integration/detached-turn-http.test.ts
+++ b/test/integration/detached-turn-http.test.ts
@@ -146,4 +146,33 @@ describe("detached turn HTTP surface", () => {
     const body = await res.json();
     expect(body.error).toBe("conversation_corrupted");
   });
+
+  it("start with a malformed conversationId is 400, not 500 (JSON)", async () => {
+    const res = await fetch(`${baseUrl}/v1/chat/start`, {
+      method: "POST",
+      headers: { "Content-Type": "application/json", "X-Workspace-Id": TEST_WORKSPACE_ID },
+      body: JSON.stringify({
+        message: "traversal attempt",
+        conversationId: "../../foo",
+        workspaceId: TEST_WORKSPACE_ID,
+      }),
+    });
+    expect(res.status).toBe(400);
+    const body = await res.json();
+    expect(body.error).toBe("bad_request");
+  });
+
+  it("start with a malformed conversationId is 400, not 500 (multipart)", async () => {
+    const form = new FormData();
+    form.set("message", "traversal attempt");
+    form.set("conversationId", "../../foo");
+    const res = await fetch(`${baseUrl}/v1/chat/start`, {
+      method: "POST",
+      headers: { "X-Workspace-Id": TEST_WORKSPACE_ID },
+      body: form,
+    });
+    expect(res.status).toBe(400);
+    const body = await res.json();
+    expect(body.error).toBe("bad_request");
+  });
 });

From c856b0a30d39a4c6911b537696079a66b7e0e0ab Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Tue, 2 Jun 2026 16:53:53 -0500
Subject: [PATCH 25/26] fix(runtime): abort in-flight detached turns on
 shutdown
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

`shutdown()` removed workspace sources and disposed the tool-list aggregator
but never tore down the RunBus. A detached turn's lifecycle is decoupled from
any HTTP request, so a turn mid-`doStream()` kept issuing tool calls into
sources the shutdown loop was concurrently removing — late calls hit removed
sources.

Call `this.runBus.reset()` BEFORE the source-removal loop: it aborts every
active run's signal (the engine stops cooperatively) so turns stop issuing
calls first, then their dependencies are dismantled. Order matters — calling
reset after the loop would leave a window where still-running turns fire
tool calls at already-removed sources.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 src/runtime/runtime.ts                 |  9 +++++
 test/integration/detached-turn.test.ts | 53 ++++++++++++++++++++++++++
 2 files changed, 62 insertions(+)

diff --git a/src/runtime/runtime.ts b/src/runtime/runtime.ts
index a5751aea..7b16015c 100644
--- a/src/runtime/runtime.ts
+++ b/src/runtime/runtime.ts
@@ -3529,6 +3529,15 @@ export class Runtime {
 
   async shutdown(): Promise<void> {
     await this.telemetryManager.shutdown();
+    // Abort every in-flight detached turn BEFORE removing the sources they
+    // depend on. A detached turn's lifecycle is decoupled from any HTTP
+    // request (it runs to completion server-side), so without this a turn
+    // mid-`doStream()` keeps issuing tool calls into workspace sources that
+    // the loop below is concurrently tearing down — late calls hit removed
+    // sources. RunBus.reset() aborts each run's signal (the engine stops
+    // cooperatively) and clears the run map. Order matters: stop the
+    // producers first, then dismantle their dependencies.
+    this.runBus.reset();
     // Stop all sources across all workspace registries
     for (const [_wsId, reg] of this._workspaceRegistries) {
       for (const name of reg.sourceNames()) {
diff --git a/test/integration/detached-turn.test.ts b/test/integration/detached-turn.test.ts
index dc761b3a..57a9ee9e 100644
--- a/test/integration/detached-turn.test.ts
+++ b/test/integration/detached-turn.test.ts
@@ -207,3 +207,56 @@ describe("cancel delivers a terminal frame to live viewers (Stop button)", () =>
     expect(rt.isTurnActive(conversationId)).toBe(false);
   });
 });
+
+describe("shutdown aborts in-flight detached turns (RunBus teardown)", () => {
+  it("aborts active turn signals before tearing down workspace sources", async () => {
+    const dir = join(tmpdir(), `nimblebrain-shutdown-runbus-${Date.now()}`);
+    mkdirSync(dir, { recursive: true });
+
+    // Gate the model so the turn is genuinely mid-flight when shutdown runs.
+    // Capture the run's abort signal so we can prove shutdown aborted it.
+    let release!: () => void;
+    const gate = new Promise<void>((r) => {
+      release = r;
+    });
+    let capturedSignal: AbortSignal | undefined;
+
+    const rt = await Runtime.start({
+      model: {
+        provider: "custom",
+        adapter: createMockModel(async (options) => {
+          capturedSignal = options.abortSignal;
+          await gate;
+          return { content: [{ type: "text", text: "unreached" }] };
+        }),
+      },
+      noDefaultBundles: true,
+      logging: { disabled: true },
+      workDir: dir,
+    });
+    await provisionTestWorkspace(rt);
+
+    try {
+      const { conversationId } = await rt.startTurn({
+        message: "hang until shutdown",
+        workspaceId: TEST_WORKSPACE_ID,
+      });
+      // Wait until the engine has actually entered the model call (signal
+      // captured) — `isTurnActive` flips true on `runBus.begin()`, before
+      // `doStream`, so it alone would race the capture.
+      await waitFor(() => capturedSignal !== undefined);
+      expect(rt.isTurnActive(conversationId)).toBe(true);
+      expect(capturedSignal?.aborted).toBe(false);
+
+      // Shutdown must abort the in-flight turn (RunBus.reset) so it stops
+      // issuing tool calls BEFORE its workspace sources are removed.
+      await rt.shutdown();
+
+      expect(capturedSignal?.aborted).toBe(true);
+      expect(rt.isTurnActive(conversationId)).toBe(false);
+    } finally {
+      release(); // let the parked engine task unwind
+      rmSync(dir, { recursive: true, force: true });
+    }
+  });
+});

From 7decc8e5b90659f7dd122bde1ef85e2fe652bd9b Mon Sep 17 00:00:00 2001
From: Mason <31372737+Ovaculos@users.noreply.github.com>
Date: Tue, 2 Jun 2026 16:54:23 -0500
Subject: [PATCH 26/26] docs+chore: clarify conversation.title wsId scoping;
 trim bug-archaeology comments
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- runtime.ts: document why `conversation.title` is scoped to the owner's
  personal workspace (`sessionWsId`), not the conversation's workspaceId —
  the latter would leak the title to co-members of a focused team workspace.
  Flag Stage 4 sharing as the point to revisit (route by conversation ACL).
- Trim historical narration that rationalized past bugs (round-3/round-4
  self-echo iterations in conversation-events.ts; PR #251 connection-binding
  regression in handlers.ts; stale "Task 005 collapses" future-tense in
  runtime.ts) down to the current-behavior rationale.
- Sort handlers.ts imports after the CONVERSATION_ID_RE addition. No behavior
  change.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
---
 src/api/conversation-events.ts | 27 +++++++++------------------
 src/api/handlers.ts            | 17 +++++++----------
 src/runtime/runtime.ts         | 27 +++++++++++++++++++--------
 3 files changed, 35 insertions(+), 36 deletions(-)

diff --git a/src/api/conversation-events.ts b/src/api/conversation-events.ts
index 95b41aa2..187873e5 100644
--- a/src/api/conversation-events.ts
+++ b/src/api/conversation-events.ts
@@ -153,22 +153,14 @@ export class ConversationEventManager {
   /**
    * Broadcast an event to all subscribers of a specific conversation.
    *
-   * Stage 1 single-owner: every legitimate subscriber to a given
-   * conversation is the same user (the owner) connected from another
-   * tab/device. Filtering on `userId` would skip every subscriber
-   * (round-3 had this bug); not filtering at all double-delivers to
-   * the sender's own tab (round-4 had this bug — the sender's tab
-   * receives via both `/v1/chat/stream` and its own
-   * `/v1/conversations/:id/events` subscription).
-   *
-   * The correct filter key is the **subscriber id**: the sender
-   * passes its current conv-events subscriber id as
-   * `excludeSubscriberId`, so its own subscription is skipped while
-   * peer tabs (different subscriber ids, same userId) still receive.
-   *
-   * Stage 4 will reintroduce multi-participant semantics with
-   * explicit policy gates; until then, this is the only exclusion
-   * shape needed.
+   * Conversations are single-owner (Stage 1): every subscriber is the same
+   * user on another tab/device. The exclusion key is the **subscriber id**,
+   * not `userId` — filtering by `userId` would skip every tab; not filtering
+   * double-delivers to the sender (it receives via both `/v1/chat/stream` and
+   * its own `/v1/conversations/:id/events` subscription). The sender passes
+   * its conv-events subscriber id as `excludeSubscriberId` so its own
+   * subscription is skipped while peer tabs still receive. (Stage 4
+   * multi-participant semantics will need explicit policy gates here.)
    *
    * Seq-less: unlike {@link publishEvent} (the RunBus path), these frames carry
    * no `id:` sequence. A seq-tracking `conversation-stream` viewer applies them
@@ -179,8 +171,7 @@ export class ConversationEventManager {
    * @param eventType - SSE event type (e.g. "text.delta", "user.message")
    * @param data - Event data payload
    * @param excludeSubscriberId - Optional subscriber id to skip
-   *   (typically the sender's own subscriber id, to prevent
-   *   self-echo on chat-stream-originated broadcasts).
+   *   (typically the sender's own, to prevent self-echo).
    */
   broadcastToConversation(
     conversationId: string,
diff --git a/src/api/handlers.ts b/src/api/handlers.ts
index cb8467ea..2cacf144 100644
--- a/src/api/handlers.ts
+++ b/src/api/handlers.ts
@@ -3,13 +3,13 @@ import { resolve } from "node:path";
 import { CallbackEventSink } from "../adapters/callback-events.ts";
 import { log } from "../cli/log.ts";
 import { isToolEnabled, isToolVisibleToRole, type ResolvedFeatures } from "../config/features.ts";
+import { CONVERSATION_ID_RE } from "../conversation/types.ts";
 import type { EngineEvent, EventSink } from "../engine/types.ts";
 import { ingestFiles, isAllowedMime, type UploadedFile } from "../files/ingest.ts";
 import { resolveMimeType } from "../files/mime.ts";
 import type { FileEntry } from "../files/types.ts";
 import type { IdentityProvider, UserIdentity } from "../identity/provider.ts";
 import { DEV_IDENTITY } from "../identity/providers/dev.ts";
-import { CONVERSATION_ID_RE } from "../conversation/types.ts";
 import {
   ConversationAccessDeniedError,
   ConversationCorruptedError,
@@ -80,10 +80,8 @@ export async function handleChat(
     // backgrounded tab, network blip) must not cancel the in-flight
     // engine loop; the run completes server-side, persists, and is
     // replayed to any reconnecting /v1/conversations/:id/events
-    // subscriber. See the detached `.chat(parsed, sink)` in
-    // handleChatStream for the full rationale (PR #251 regression). The
-    // automations executor's deadline cancellation is unaffected — that
-    // path supplies its own AbortController.
+    // subscriber. (The automations executor's deadline cancellation is
+    // unaffected — that path supplies its own AbortController.)
     const result = await runtime.chat(parsed);
     // Cost is derived at the boundary, never stored. Same wire shape as
     // the streaming `done` event so clients see one consistent contract.
@@ -441,11 +439,10 @@ export async function handleChatStream(
         // engine loop. The run completes server-side, persists to the
         // conversation store, and replays to any reconnecting
         // /v1/conversations/:id/events subscriber — the "leave and come
-        // back" contract. PR #251 bound the run to the connection and
-        // silently abandoned prompts the moment a mobile client dropped
-        // (run.error "The connection was closed"). The one caller that
-        // must cancel on a deadline — the automations executor — owns its
-        // own AbortController in bundles/automations/src/executor.ts.
+        // back" contract. Binding the run to the connection would silently
+        // abandon a prompt the moment a mobile client dropped. The one
+        // caller that must cancel on a deadline — the automations executor —
+        // owns its own AbortController in bundles/automations/src/executor.ts.
         .chat(parsed, sink)
         .then((result) => {
           // Cost is computed at the API boundary — never stored. The
diff --git a/src/runtime/runtime.ts b/src/runtime/runtime.ts
index 7b16015c..e7d17ad8 100644
--- a/src/runtime/runtime.ts
+++ b/src/runtime/runtime.ts
@@ -1189,14 +1189,10 @@ export class Runtime {
     };
 
     // Resume an existing conversation only if the caller owns it.
-    // Stage 1 single-owner invariant: a conversation's ownerId must
-    // match the requesting identity. Today this is implicitly
-    // workspace-bounded because the store dir is per-wsId, but Task 005
-    // collapses every conversation onto a top-level store — at which
-    // point this owner check is the ONLY barrier between users and
-    // each other's conversations. Enforce it now, in the load-bearing
-    // chat path, so the invariant doesn't have a window of being
-    // workspace-discipline-only.
+    // Conversations live on a single top-level store (not per-workspace),
+    // so this ownerId check is the ONLY barrier between users and each
+    // other's conversations — it runs in the load-bearing chat path, not
+    // just at a higher layer.
     //
     // The disambiguation between "doesn't exist" (→ create new) and
     // "exists but isn't yours" (→ throw) matters: silently creating a
@@ -1772,6 +1768,21 @@ export class Runtime {
       void generateTitle(titleModel, titleInput, result.output)
         .then(async (title) => {
           await store.update(conversation.id, { title });
+          // `wsId: sessionWsId` (the owner's personal workspace) — NOT
+          // `conversation.workspaceId`. The SSE layer (events.ts) scopes
+          // `scope: "workspace"` events to clients whose membership set
+          // contains this wsId. Conversations are owner-scoped, and the owner
+          // is always a member of their own personal workspace, so this
+          // reaches exactly the owner's tabs. Using the conversation's
+          // workspaceId would be WRONG here: when the chat was focused on a
+          // team workspace, that id fans the title out to every member of the
+          // team — none of whom can see this owner-scoped conversation, so it
+          // leaks the title string to their browsers for no benefit.
+          // (The iframe list patch is routed by `conversationId`, not wsId, so
+          // it's unaffected either way.) Stage 4 cross-user sharing must
+          // revisit this — route by the conversation's ACL, not the owner's
+          // personal ws — so an org-admin viewing another user's conversation
+          // receives the live title.
           this.defaultEvents.emit({
             type: "conversation.title",
             data: { conversationId: conversation.id, title, wsId: sessionWsId },