diff --git a/docs/adversarial_rubric.md b/.agents/skills/release/references/adversarial_rubric.md
similarity index 100%
rename from docs/adversarial_rubric.md
rename to .agents/skills/release/references/adversarial_rubric.md
diff --git a/.github/workflows/deploy.yml b/.github/workflows/deploy.yml
index fbcadc938..7ece47f91 100644
--- a/.github/workflows/deploy.yml
+++ b/.github/workflows/deploy.yml
@@ -8,6 +8,7 @@ on:
       - 'apps/marketing/**'
       - 'apps/portal/**'
       - 'apps/paste-service/**'
+      - 'apps/room-service/**'
       - 'packages/**'
   workflow_dispatch:
     inputs:
@@ -21,6 +22,7 @@ on:
           - marketing
           - portal
           - paste
+          - room
 
 permissions:
   contents: read
@@ -32,6 +34,7 @@ jobs:
       marketing: ${{ steps.changes.outputs.marketing }}
       portal: ${{ steps.changes.outputs.portal }}
       paste: ${{ steps.changes.outputs.paste }}
+      room: ${{ steps.changes.outputs.room }}
     steps:
       - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2
 
@@ -54,6 +57,11 @@ jobs:
             else
               echo "paste=false" >> $GITHUB_OUTPUT
             fi
+            if [[ "${{ inputs.target }}" == "all" || "${{ inputs.target }}" == "room" ]]; then
+              echo "room=true" >> $GITHUB_OUTPUT
+            else
+              echo "room=false" >> $GITHUB_OUTPUT
+            fi
           else
             # For push events, check what changed
             git fetch origin ${{ github.event.before }} --depth=1 2>/dev/null || true
@@ -61,6 +69,7 @@ jobs:
             MARKETING_CHANGED=$(git diff --name-only ${{ github.event.before }} ${{ github.sha }} 2>/dev/null | grep -E '^(apps/marketing/|packages/)' || true)
             PORTAL_CHANGED=$(git diff --name-only ${{ github.event.before }} ${{ github.sha }} 2>/dev/null | grep -E '^(apps/portal/|packages/)' || true)
             PASTE_CHANGED=$(git diff --name-only ${{ github.event.before }} ${{ github.sha }} 2>/dev/null | grep -E '^apps/paste-service/' || true)
+            ROOM_CHANGED=$(git diff --name-only ${{ github.event.before }} ${{ github.sha }} 2>/dev/null | grep -E '^(apps/room-service/|packages/shared/collab/|packages/editor/|packages/ui/)' || true)
 
             if [[ -n "$MARKETING_CHANGED" ]]; then
               echo "marketing=true" >> $GITHUB_OUTPUT
@@ -79,6 +88,12 @@ jobs:
             else
               echo "paste=false" >> $GITHUB_OUTPUT
             fi
+
+            if [[ -n "$ROOM_CHANGED" ]]; then
+              echo "room=true" >> $GITHUB_OUTPUT
+            else
+              echo "room=false" >> $GITHUB_OUTPUT
+            fi
           fi
 
   deploy-marketing:
@@ -178,3 +193,28 @@ jobs:
         env:
           CLOUDFLARE_API_TOKEN: ${{ secrets.CLOUDFLARE_API_TOKEN }}
           CLOUDFLARE_ACCOUNT_ID: ${{ secrets.CLOUDFLARE_ACCOUNT_ID }}
+
+  deploy-room:
+    needs: detect-changes
+    if: needs.detect-changes.outputs.room == 'true'
+    runs-on: ubuntu-latest
+    environment: production
+    steps:
+      - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2
+
+      - uses: oven-sh/setup-bun@0c5077e51419868618aeaa5fe8019c62421857d6 # v2.2.0
+        with:
+          bun-version: latest
+
+      - name: Install dependencies
+        run: bun install
+
+      - name: Build browser shell
+        run: bun run --cwd apps/room-service build:shell
+
+      - name: Deploy to Cloudflare
+        working-directory: apps/room-service
+        run: npx wrangler deploy
+        env:
+          CLOUDFLARE_API_TOKEN: ${{ secrets.CLOUDFLARE_API_TOKEN }}
+          CLOUDFLARE_ACCOUNT_ID: ${{ secrets.CLOUDFLARE_ACCOUNT_ID }}
diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml
index d4e60f62d..eb976ae76 100644
--- a/.github/workflows/release.yml
+++ b/.github/workflows/release.yml
@@ -41,7 +41,9 @@ jobs:
         run: bun run typecheck
 
       - name: Run tests
-        run: bun test
+        # See .github/workflows/test.yml for why this is `bun run test`
+        # and not raw `bun test`.
+        run: bun run test
 
   build:
     needs: test
diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
index d319f9401..985aa4f13 100644
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -29,7 +29,12 @@ jobs:
         run: bun run typecheck
 
       - name: Run tests
-        run: bun test
+        # Use the root `test` script (splits non-UI + UI-cwd) so the
+        # packages/ui/bunfig.toml happy-dom preload is loaded. Raw
+        # `bun test` from the repo root doesn't pick up that package-
+        # scoped preload, so UI hook tests would hit "document is not
+        # defined".
+        run: bun run test
 
   install-cmd-windows:
     # End-to-end integration test for scripts/install.cmd on real cmd.exe.
diff --git a/.gitignore b/.gitignore
index 9d3f75a12..56a531b5b 100644
--- a/.gitignore
+++ b/.gitignore
@@ -53,3 +53,8 @@ plannotator-local
 # Local research/reference docs (not for repo)
 /reference/
 *.bun-build
+
+.wrangler/
+apps/room-service/public/
+.claude/scheduled_tasks.lock
+specs/
diff --git a/AGENTS.md b/AGENTS.md
index d2249f246..fbf081cad 100644
--- a/AGENTS.md
+++ b/AGENTS.md
@@ -28,6 +28,16 @@ plannotator/
 │   │   ├── index.html
 │   │   ├── index.tsx
 │   │   └── vite.config.ts
+│   ├── room-service/             # Live collaboration rooms (Cloudflare Worker + Durable Object)
+│   │   ├── core/                 # Handler, DO class, validation, CORS, log, types, csp
+│   │   ├── targets/cloudflare.ts # Worker entry + DO re-export
+│   │   ├── entry.tsx             # Browser shell entry — path switch: / → LandingPage, /c/:roomId → AppRoot
+│   │   ├── index.html            # Vite template; produces hashed chunks under /assets/
+│   │   ├── vite.config.ts        # Browser shell build (bun run build:shell)
+│   │   ├── tsconfig.browser.json # DOM-lib tsconfig for the shell
+│   │   ├── static/               # Root-level static assets copied into public/ by build:shell (favicon.svg)
+│   │   ├── scripts/smoke.ts      # Integration test against wrangler dev
+│   │   └── wrangler.toml         # SQLite-backed DO binding + ASSETS binding (run_worker_first, html_handling=none)
 │   ├── vscode-extension/         # VS Code extension — opens plans in editor tabs
 │   │   ├── bin/                   # Router scripts (open-in-vscode, xdg-open)
 │   │   ├── src/                   # extension.ts, cookie-proxy.ts, ipc-server.ts, panel-manager.ts, editor-annotations.ts, vscode-theme.ts
@@ -58,7 +68,8 @@ plannotator/
 │   │   ├── components/           # Viewer, Toolbar, Settings, etc.
 │   │   │   ├── icons/            # Shared SVG icon components (themeIcons, etc.)
 │   │   │   ├── plan-diff/        # PlanDiffBadge, PlanDiffViewer, clean/raw diff views
-│   │   │   └── sidebar/          # SidebarContainer, SidebarTabs, VersionBrowser, ArchiveBrowser
+│   │   │   ├── sidebar/          # SidebarContainer, SidebarTabs, VersionBrowser, ArchiveBrowser
+│   │   │   └── collab/           # RoomStatusBadge, ParticipantAvatars, RoomHeaderControls, RoomMenu, RoomUnavailableScreen, JoinRoomGate, StartRoomModal, RemoteCursorLayer, ImageStripNotice, LandingPage, LandingPreview
 │   │   ├── shortcuts/            # Keyboard shortcut registry (see Keyboard Shortcuts section below)
 │   │   │   ├── core.ts           # Engine: parser, formatter, dispatcher, validator
 │   │   │   ├── runtime.ts        # Engine: useShortcutScope, useDoubleTapShortcuts hooks
@@ -66,16 +77,28 @@ plannotator/
 │   │   │   ├── plan-review/      # Scopes for plan-editor surfaces (annotationToolbar, annotationPanel, commentPopover, imageAnnotator, inputMethod, viewer)
 │   │   │   └── code-review/      # Scopes for review-editor surfaces (ai, allFilesDiff, annotationToolbar, fileTree, prComments, suggestionModal, tourDialog)
 │   │   ├── shortcuts.test.ts     # Registry unit tests (parser, dispatcher, validator)
-│   │   ├── utils/                # parser.ts, sharing.ts, storage.ts, planSave.ts, agentSwitch.ts, planDiffEngine.ts, planAgentInstructions.ts
+│   │   ├── utils/                # parser.ts, sharing.ts, storage.ts, planSave.ts, agentSwitch.ts, planDiffEngine.ts, planAgentInstructions.ts, adminSecretStorage.ts, blockTargeting.ts
 │   │   ├── hooks/                # useAnnotationHighlighter.ts, useSharing.ts, usePlanDiff.ts, useSidebar.ts, useLinkedDoc.ts, useAnnotationDraft.ts, useCodeAnnotationDraft.ts, useArchive.ts
+│   │   │   └── collab/           # useCollabRoom.ts, useCollabRoomSession.ts, useLandingCreateRoom.ts, usePresenceThrottle.ts, useRoomMode.ts, useRoomAdminActions.ts, useStartLiveRoom.ts
 │   │   └── types.ts
 │   ├── ai/                       # Provider-agnostic AI backbone (providers, sessions, endpoints)
 │   ├── shared/                   # Shared types, utilities, and cross-runtime logic
 │   │   ├── storage.ts            # Plan saving, version history, archive listing (node:fs only)
 │   │   ├── draft.ts              # Annotation draft persistence (node:fs only)
-│   │   └── project.ts            # Pure string helpers (sanitizeTag, extractRepoName, extractDirName)
-│   ├── editor/                   # Plan review app
-│   │   ├── App.tsx               # Main plan review app
+│   │   ├── project.ts            # Pure string helpers (sanitizeTag, extractRepoName, extractDirName)
+│   │   └── collab/               # Live Rooms protocol, crypto, validators, client runtime, React hook
+│   │       ├── types.ts          # Protocol types + runtime validators
+│   │       ├── crypto.ts         # HKDF key derivation, HMAC proofs, AES-GCM payload encrypt/decrypt
+│   │       ├── ids.ts            # roomId/secret/opId/clientId generators
+│   │       ├── url.ts            # parseRoomUrl / buildRoomJoinUrl / buildAdminRoomUrl (client-only)
+│   │       ├── constants.ts      # ROOM_SECRET_LENGTH_BYTES, ADMIN_SECRET_LENGTH_BYTES, WS_CLOSE_*
+│   │       ├── strip-images.ts   # toRoomAnnotation, stripRoomAnnotationImages
+│   │       ├── redact-url.ts     # redactRoomSecrets (scrub #key=/#admin= from telemetry/logs)
+│   │       └── client-runtime/   # CollabRoomClient class, createRoom, joinRoom, apply-event reducer
+│   ├── editor/                   # Plan review app (App.tsx) + room-mode shell
+│   │   ├── App.tsx               # Plan review editor (local + room-mode prop)
+│   │   ├── AppRoot.tsx           # Mode fork (local | room | invalid-room); package default export
+│   │   └── RoomApp.tsx           # Room-mode shell — identity gate, session, overlays, delete/expired fallbacks
 │   │   └── shortcuts.ts          # planReviewSurface + annotateSurface — composes plan-review scopes into per-surface registries
 │   └── review-editor/            # Code review UI
 │       ├── App.tsx               # Main review app
@@ -308,6 +331,21 @@ All servers use random ports locally or fixed port (`19432`) in remote mode.
 
 Runs as a separate service on port `19433` (self-hosted) or as a Cloudflare Worker (hosted).
 
+### Room Service (`apps/room-service/`)
+
+Live-collaboration rooms for encrypted multi-user annotation. Zero-knowledge: the Worker + Durable Object stores and relays ciphertext only. Clients hold the room secret in the URL fragment and derive `authKey`/`eventKey`/`presenceKey`/`adminKey` locally.
+
+| Endpoint              | Method | Purpose                                    |
+| --------------------- | ------ | ------------------------------------------ |
+| `/`                   | GET    | Landing page for room creation from uploaded document. Serves the same `index.html` shell; `entry.tsx` path switch renders `LandingPage` (lazy-loaded). |
+| `/health`             | GET    | Worker liveness probe                      |
+| `/c/:roomId`          | GET    | Room SPA shell — serves the built editor bundle. Response carries CSP, `Cache-Control: no-store`, `Referrer-Policy: no-referrer`. |
+| `/api/rooms`          | POST   | Create room. Body: `{ roomId, roomVerifier, adminVerifier, initialSnapshotCiphertext, expiresInDays? }`. Returns `201` on success; `409` on duplicate. |
+| `/api/fetch-markdown`  | POST   | URL-to-markdown proxy. Body: `{ url }`. Returns `{ markdown, source }`. |
+| `/ws/:roomId`         | GET    | WebSocket upgrade into the room Durable Object. |
+
+Protocol contract lives in `packages/shared/collab/`; the Worker/DO never imports client-only URL helpers.
+
 ## Plan Version History
 
 Every plan is automatically saved to `~/.plannotator/history/{project}/{slug}/` on arrival, before the user sees the UI. Versions are numbered sequentially (`001.md`, `002.md`, etc.). The slug is derived from the plan's first `# Heading` + today's date via `generateSlug()`, scoped by project name (git repo or cwd). Same heading on the same day = same slug = same plan being iterated on. Identical resubmissions are deduplicated (no new file if content matches the latest version).
diff --git a/apps/collab-agent/AGENT_INSTRUCTIONS.md b/apps/collab-agent/AGENT_INSTRUCTIONS.md
new file mode 100644
index 000000000..44ffa85ba
--- /dev/null
+++ b/apps/collab-agent/AGENT_INSTRUCTIONS.md
@@ -0,0 +1,189 @@
+# Plannotator Live Rooms — Agent Instructions
+
+This document is prose an AI agent (Claude Code, Codex, OpenCode,
+Junie, or another) should have in its prompt when it's being
+driven to participate in a Plannotator Live Room. It explains
+the identity convention, the CLI subcommand surface, and the
+handful of rules that keep agent participation well-behaved.
+
+## 1. Identity
+
+Your identity in the room follows the pattern:
+
+```
+<user>-agent-<type>
+```
+
+Examples: `swift-falcon-tater-agent-claude`,
+`alice-agent-codex`.
+
+- `<user>` is the human you're acting on behalf of. If you've
+  been given their Plannotator identity (a "tater name" like
+  `swift-falcon-tater`), use it verbatim.
+- `<type>` is one of: `claude`, `codex`, `opencode`, `junie`,
+  `other`. Use `other` when you don't fit any of the explicit
+  kinds — it's a legal value, not a fallback error.
+
+You pass these as `--user` and `--type` on every CLI invocation;
+the CLI assembles the full identity string and refuses to run if
+either is missing or malformed.
+
+Room participants see your identity in their avatar row and as
+the label on your cursor. A small `⚙` marker appears next to the
+identity on both surfaces so observers can tell you're an agent,
+not a human teammate.
+
+## 2. Joining and staying visible
+
+The V1 room protocol has no participant roster. Peers appear on
+one another's screens **only after presence is received**. A
+client that just connects and stays silent is invisible.
+
+Two subcommands handle this correctly:
+
+- `join` — connect, emit initial presence, heartbeat presence on
+  a 10s cadence, stream room events to stdout until Ctrl-C. Use
+  this when you need to be present while you think or wait.
+- `demo` — a showcase walk; not for real work.
+
+Short one-shot reads (`read-plan`, `read-annotations`,
+`read-presence`) emit presence exactly once before they print and
+exit. You briefly flash into the observer's avatar row, then
+disappear.
+
+Do **not** implement your own WebSocket or presence loop. The
+CLI is the supported entry point.
+
+## 3. Reading the plan
+
+```
+bun run apps/collab-agent/index.ts read-plan \
+  --url "<full room URL including #key=...>" \
+  --user <name> --type <kind>
+```
+
+Add `--with-block-ids` to get each block prefixed with
+`[block:<id>]`. You need those ids if you plan to comment.
+
+Block ids are **derived from the markdown** — the CLI uses the
+same parser the browser uses, so the ids you read here are
+byte-identical to what the observer sees in their DOM.
+
+## 4. Reading existing annotations
+
+```
+bun run apps/collab-agent/index.ts read-annotations \
+  --url "..." --user <name> --type <kind>
+```
+
+Prints the full `RoomAnnotation[]` array as pretty JSON. Fields:
+`id`, `blockId`, `startOffset`, `endOffset`, `type`, `text`,
+`originalText`, `createdA`, `author`.
+
+## 5. Reading recent presence
+
+```
+bun run apps/collab-agent/index.ts read-presence \
+  --url "..." --user <name> --type <kind>
+```
+
+Prints `remotePresence` as JSON keyed by opaque per-connection
+client ids. **This is NOT a participant roster.** It is
+"peers who've emitted presence in the last 30 seconds." A user
+who's connected but idle (not moving their mouse) will NOT
+appear. Do not infer "who's in the room" from this call.
+
+## 6. Posting a comment
+
+Block-level only in V1.
+
+```
+bun run apps/collab-agent/index.ts comment \
+  --url "..." --user <name> --type <kind> \
+  --block <blockId> --text "<your comment>"
+```
+
+The annotation targets the entire block — its full content is the
+"original text", and your `--text` becomes the comment body. Do
+**not** attempt to select a sub-range of text. The V1 agent flow
+does not support inline text-range targeting; the
+`/api/external-annotations` inline-text matcher that some agents
+may have used before is known to fail silently on markdown /
+whitespace / NBSP / block-boundary drift.
+
+### Choosing a block id
+
+Three ways:
+
+1. Run `read-plan --with-block-ids` to see the plan interleaved
+   with block markers.
+2. Run `read-annotations` to see block ids on annotations other
+   agents or humans have already left.
+3. Run `comment --list-blocks` (with `--url/--user/--type`) to
+   print a JSON array of `{ id, type, content }` for every block
+   and exit without posting.
+
+Pick a block whose `content` matches what you want to comment on.
+
+### Referencing specific wording
+
+If your comment is about specific wording within a block, quote
+the wording **in the comment body**, not as an anchor:
+
+```
+--text 'The phrase "as soon as possible" is ambiguous — what is the deadline?'
+```
+
+Do not try to select only `"as soon as possible"`. Select the
+whole block, and put the phrase in prose.
+
+### Exit codes
+
+- `0` — comment echoed back from the server (confirmed posted).
+- `1` — snapshot / echo timeout, unknown block id, or server
+  rejected the op (e.g. the room was deleted).
+- `2` — argv or usage error (missing flag, bad --type, etc.).
+
+## 7. Demo mode
+
+```
+bun run apps/collab-agent/index.ts demo \
+  --url "..." --user <name> --type <kind> \
+  --duration 120
+```
+
+Walks heading blocks in order, anchors the cursor to each, posts
+a comment per heading. For showcase only — not a real
+participation pattern. Pass `--dry-run` to do the cursor walk
+without posting.
+
+## 8. Rules and limits
+
+- **Never run as admin.** The CLI strips any `#admin=<secret>`
+  fragment from the URL by default and warns on stderr. There is
+  no opt-in flag. Agents do not perform delete.
+- **No image attachments.** V1 room annotations do not carry
+  images. If you need to share an image, the flow is via the
+  local editor's import path, not via the agent CLI.
+- **Room annotations are server-authoritative.** Your
+  `sendAnnotationAdd` queues a local op; the server has the
+  final say. The `comment` subcommand waits for the echo before
+  exiting 0.
+- **Text appears to peers after server echo.** Your comment
+  doesn't appear in your own `read-annotations` output until it
+  round-trips.
+
+## 9. Troubleshooting
+
+- **`Missing --url` / `Missing --user` / `Missing --type`** —
+  argv check. Add the missing flag.
+- **`Timed out waiting for snapshot after 10000ms`** — the URL
+  parsed but the connection never received the initial
+  encrypted snapshot. Check the URL fragment is intact
+  (`#key=<secret>`) and the room service is reachable.
+- **`unknown --block "<id>"`** — the block id you passed isn't
+  in the current plan. Run `comment --list-blocks` to see the
+  valid set; re-run with a matching id.
+- **`<code>: <message>`** on a comment — server-side mutation
+  rejection. The message names the reason; wait and retry or
+  target a different room.
diff --git a/apps/collab-agent/README.md b/apps/collab-agent/README.md
new file mode 100644
index 000000000..eee551bae
--- /dev/null
+++ b/apps/collab-agent/README.md
@@ -0,0 +1,140 @@
+# @plannotator/collab-agent
+
+Command-line tool that lets an AI agent join a Plannotator Live
+Room as a first-class peer — read the plan, read annotations,
+post comments, emit presence.
+
+This is a human-readable README. Agent-facing prompt text lives
+in [`AGENT_INSTRUCTIONS.md`](./AGENT_INSTRUCTIONS.md).
+
+## Install
+
+Everything is already wired as a workspace package. From the
+repo root:
+
+```sh
+bun install
+```
+
+## Quick tour
+
+The root `package.json` has a convenience script, but you can
+also call the entry file directly.
+
+```sh
+# Help
+bun run agent:run --help
+
+# Read the plan (add --with-block-ids for block markers)
+bun run agent:run read-plan \
+  --url "http://localhost:8787/c/<roomId>#key=..." \
+  --user alice --type claude
+
+# Stay connected and stream events (Ctrl-C to exit)
+bun run agent:run join \
+  --url "..." --user alice --type claude
+
+# Post a block-level comment
+bun run agent:run comment \
+  --url "..." --user alice --type claude \
+  --block <blockId> \
+  --text "Looks good, but consider section 3."
+
+# List blocks without posting
+bun run agent:run comment \
+  --url "..." --user alice --type claude --list-blocks
+```
+
+## Identity
+
+Agent identities follow the pattern `<user>-agent-<type>`.
+
+- `--user` must match `/^[a-z0-9][a-z0-9-]*$/` — lowercase alnum
+  with dashes. Case is normalized.
+- `--type` is one of: `claude`, `codex`, `opencode`, `junie`,
+  `other`.
+
+The CLI assembles the full identity string. Peers see it as your
+display name and in their avatar row. A small `⚙` marker makes
+agent participants visually distinct from humans.
+
+## Subcommands
+
+| Subcommand | What it does |
+|---|---|
+| `join` | Connect, emit initial presence, heartbeat at 10s, stream room events to stdout until SIGINT. |
+| `read-plan` | Print the decrypted plan markdown. `--with-block-ids` prefixes each block with `[block:<id>]`. |
+| `read-annotations` | Print the current `RoomAnnotation[]` array as JSON. |
+| `read-presence` | Print `remotePresence` (recent emitters, not a roster). `--settle <sec>` extends the wait (default 2s). |
+| `comment` | Post a block-level COMMENT annotation. Requires `--block` + `--text`. `--list-blocks` prints available blocks and exits without posting. |
+| `demo` | Walk heading blocks in order, anchor the cursor to each, leave a comment. `--duration <sec>`, `--comment-template <str>`, `--dry-run`. |
+
+## Common flags
+
+Every subcommand takes:
+
+| Flag | Meaning |
+|---|---|
+| `--url <url>` | Full room URL including the `#key=<secret>` fragment. |
+| `--user <name>` | Lowercase alnum + dashes. Forms the first half of the identity. |
+| `--type <kind>` | `claude \| codex \| opencode \| junie \| other`. |
+
+## Exit codes
+
+| Code | Meaning |
+|---|---|
+| 0 | Success. |
+| 1 | Runtime error — connect / snapshot / echo timeout, server rejection, unknown block id. |
+| 2 | Argv or usage error — missing required flag, bad `--type`. |
+
+## Admin URLs are stripped automatically
+
+If the URL you pass contains `#admin=<secret>` (e.g. you copied
+the creator's admin link instead of the participant link), the
+CLI strips that fragment before connecting and prints a warning
+to stderr. Agents never run as room admins in V1. There is no
+opt-in flag.
+
+## Running against a local dev room
+
+To test end-to-end locally with both halves (a browser as
+creator, an agent as participant):
+
+```sh
+# Terminal 1 — boot the full local stack (wrangler + editor)
+bun run dev:live-room
+
+# In the editor tab, click "Start Live Room" to get a URL.
+# Copy the participant URL (not the admin URL — either works,
+# but the CLI will strip admin for you).
+
+# Terminal 2 — join as an agent
+bun run agent:run join \
+  --url "http://localhost:8787/c/<roomId>#key=..." \
+  --user test --type claude
+```
+
+Observer watches the browser tab; the agent should appear in
+the avatar row with the `⚙` marker and persist there for as
+long as the `join` subcommand is running.
+
+## Internals
+
+The CLI is a thin layer over `CollabRoomClient` in
+`packages/shared/collab/client-runtime/client.ts`. It reuses:
+
+- `joinRoom()` factory (connect + key derivation + auth
+  handshake).
+- `parseMarkdownToBlocks()` (same markdown → block id derivation
+  as the browser, so `--block` ids match what the observer
+  renders).
+- `PRESENCE_SWATCHES` / `hashNameToSwatch()` (identity ←→ color
+  mapping; each agent identity maps deterministically to a
+  distinct swatch).
+- `isAgentIdentity()` + the agent-identity helpers
+  (`packages/ui/utils/agentIdentity.ts` — a new pure module
+  without ConfigStore / React deps, importable by both the CLI
+  and the room UI components that render the `⚙` marker).
+
+No new protocol; no server changes. Agents are first-class peers
+in the existing V1 room protocol.
diff --git a/apps/collab-agent/heartbeat.ts b/apps/collab-agent/heartbeat.ts
new file mode 100644
index 000000000..edf7b6820
--- /dev/null
+++ b/apps/collab-agent/heartbeat.ts
@@ -0,0 +1,80 @@
+/**
+ * Heartbeat presence manager for the agent CLI.
+ *
+ * The room protocol has no roster / join broadcast; peers appear in
+ * avatar rows + cursor layers only when presence is received.
+ * The client-runtime sweep removes presence entries older than
+ * `PRESENCE_TTL_MS` (30s) from the receiver's view of a peer.
+ *
+ * An agent that goes quiet (post a comment, wait for a reply) would
+ * therefore vanish from observers after ~30s. Human users refresh
+ * presence through mousemove; an agent has no such ambient signal.
+ * The heartbeat solves this by re-sending the last-known presence
+ * on a 10s cadence (~3× headroom under the TTL) whenever the CLI
+ * holds a live connection.
+ *
+ * Usage:
+ *
+ *   const heartbeat = startHeartbeat(client, presence);
+ *   // ... do agent work, periodically call heartbeat.update(nextPresence)
+ *   heartbeat.stop();
+ *
+ * The manager swallows send errors (presence is lossy by design;
+ * reconnects handle cross-session state rebuild). It silently no-ops
+ * when the client is not in the `authenticated` state so tear-down
+ * windows don't spam the socket.
+ *
+ * Interval coupling: `HEARTBEAT_INTERVAL_MS` must stay well below
+ * `PRESENCE_TTL_MS` in the client runtime (currently 30s). If that
+ * constant ever tightens, this interval needs to tighten too.
+ */
+
+import type { CollabRoomClient } from '@plannotator/shared/collab/client';
+import type { PresenceState } from '@plannotator/shared/collab';
+
+export const HEARTBEAT_INTERVAL_MS = 10_000;
+
+export interface HeartbeatHandle {
+  /** Replace the presence payload that will be re-sent on each tick. */
+  update(next: PresenceState): void;
+  /** Stop the heartbeat. Safe to call multiple times. */
+  stop(): void;
+}
+
+/**
+ * Start a heartbeat that re-sends the given presence every
+ * `HEARTBEAT_INTERVAL_MS`. Does NOT send an initial presence —
+ * callers are expected to `await client.sendPresence(initial)`
+ * once themselves before starting the heartbeat so peers see the
+ * agent appear immediately, not only after the first heartbeat tick.
+ */
+export function startHeartbeat(
+  client: CollabRoomClient,
+  initialPresence: PresenceState,
+): HeartbeatHandle {
+  let current = initialPresence;
+  let stopped = false;
+
+  const timer = setInterval(() => {
+    if (stopped) return;
+    // Only tick when authenticated. The client's sendPresence will
+    // no-op on non-authenticated sockets, but checking here avoids
+    // console noise during reconnect windows.
+    const state = client.getState();
+    if (state.connectionStatus !== 'authenticated') return;
+    void client.sendPresence(current).catch(() => {
+      // Presence is lossy by protocol contract; drop failures.
+    });
+  }, HEARTBEAT_INTERVAL_MS);
+
+  return {
+    update(next: PresenceState) {
+      current = next;
+    },
+    stop() {
+      if (stopped) return;
+      stopped = true;
+      clearInterval(timer);
+    },
+  };
+}
diff --git a/apps/collab-agent/identity.test.ts b/apps/collab-agent/identity.test.ts
new file mode 100644
index 000000000..065c66b22
--- /dev/null
+++ b/apps/collab-agent/identity.test.ts
@@ -0,0 +1,56 @@
+import { describe, expect, test } from 'bun:test';
+import { isAgentType, stripAdminFragment } from './identity';
+
+describe('isAgentType', () => {
+  test('accepts known types', () => {
+    expect(isAgentType('claude')).toBe(true);
+    expect(isAgentType('codex')).toBe(true);
+    expect(isAgentType('opencode')).toBe(true);
+    expect(isAgentType('junie')).toBe(true);
+    expect(isAgentType('other')).toBe(true);
+  });
+
+  test('rejects unknown types', () => {
+    expect(isAgentType('gpt')).toBe(false);
+    expect(isAgentType('')).toBe(false);
+    expect(isAgentType('CLAUDE')).toBe(false); // case-sensitive
+  });
+});
+
+describe('stripAdminFragment', () => {
+  test('removes admin param, preserves key', () => {
+    const url = 'https://room.example.com/c/abc123#key=secret&admin=adminsecret';
+    const result = stripAdminFragment(url);
+    expect(result.stripped).toBe(true);
+    expect(result.url).toBe('https://room.example.com/c/abc123#key=secret');
+  });
+
+  test('removes admin when it is the only fragment param (no trailing #)', () => {
+    const url = 'https://room.example.com/c/abc123#admin=adminsecret';
+    const result = stripAdminFragment(url);
+    expect(result.stripped).toBe(true);
+    expect(result.url).toBe('https://room.example.com/c/abc123');
+  });
+
+  test('passes through URLs without any fragment', () => {
+    const url = 'https://room.example.com/c/abc123';
+    const result = stripAdminFragment(url);
+    expect(result.stripped).toBe(false);
+    expect(result.url).toBe(url);
+  });
+
+  test('passes through URLs with fragment but no admin', () => {
+    const url = 'https://room.example.com/c/abc123#key=secret&stripped=2';
+    const result = stripAdminFragment(url);
+    expect(result.stripped).toBe(false);
+    expect(result.url).toBe(url);
+  });
+
+  test('preserves non-admin fragment params in order', () => {
+    const url = 'https://room.example.com/c/abc#key=k&admin=a&name=alice&color=%23ff0000';
+    const result = stripAdminFragment(url);
+    expect(result.stripped).toBe(true);
+    // URLSearchParams stringify preserves insertion order minus the deleted key.
+    expect(result.url).toBe('https://room.example.com/c/abc#key=k&name=alice&color=%23ff0000');
+  });
+});
diff --git a/apps/collab-agent/identity.ts b/apps/collab-agent/identity.ts
new file mode 100644
index 000000000..33819ad1b
--- /dev/null
+++ b/apps/collab-agent/identity.ts
@@ -0,0 +1,70 @@
+/**
+ * Agent identity + URL sanitisation helpers for the CLI. The pure
+ * construction/detection helpers live in
+ * `@plannotator/ui/utils/agentIdentity` — this file layers on
+ * CLI-specific concerns:
+ *
+ *   - parsing `--user` / `--type` argv into a validated agent
+ *     identity string;
+ *   - stripping `#admin=<secret>` out of a room URL so an agent
+ *     never accidentally runs with admin capability even if the
+ *     user pastes a creator-side admin link.
+ *
+ * The admin-URL guard is a hard default in V1. There is no
+ * `--as-admin` opt-in; agents are never admins. Adding that
+ * surface area without a concrete use case is footgun creation
+ * (per the plan's risk note).
+ */
+
+import {
+  constructAgentIdentity,
+  InvalidAgentIdentityError,
+  type AgentType,
+  AGENT_TYPES,
+} from '@plannotator/ui/utils/agentIdentity';
+
+export { constructAgentIdentity, InvalidAgentIdentityError, AGENT_TYPES };
+export type { AgentType };
+
+/** True when the supplied string is a recognised agent type. */
+export function isAgentType(value: string): value is AgentType {
+  return (AGENT_TYPES as readonly string[]).includes(value);
+}
+
+/**
+ * Result of `stripAdminFragment`. `stripped` indicates whether an
+ * `admin=…` param was actually present and removed — callers use
+ * this to print the CLI warning exactly once per run.
+ */
+export interface StripAdminFragmentResult {
+  url: string;
+  stripped: boolean;
+}
+
+/**
+ * Remove `admin=<secret>` from a room URL's fragment while
+ * preserving `key=…` and anything else. Returns the input
+ * unchanged when no fragment or no admin param is present.
+ *
+ * Implementation note: room URL fragments are parsed as
+ * `URLSearchParams` strings by the client (see `parseRoomUrl`
+ * in `packages/shared/collab/url.ts`), so this function follows
+ * the same shape — split on `#`, treat the right half as a
+ * URLSearchParams, delete `admin`, rebuild.
+ */
+export function stripAdminFragment(rawUrl: string): StripAdminFragmentResult {
+  const hashIdx = rawUrl.indexOf('#');
+  if (hashIdx < 0) return { url: rawUrl, stripped: false };
+
+  const base = rawUrl.slice(0, hashIdx);
+  const fragment = rawUrl.slice(hashIdx + 1);
+  const params = new URLSearchParams(fragment);
+  if (!params.has('admin')) return { url: rawUrl, stripped: false };
+
+  params.delete('admin');
+  const rebuilt = params.toString();
+  return {
+    url: rebuilt ? `${base}#${rebuilt}` : base,
+    stripped: true,
+  };
+}
diff --git a/apps/collab-agent/index.ts b/apps/collab-agent/index.ts
new file mode 100644
index 000000000..6b885ee6a
--- /dev/null
+++ b/apps/collab-agent/index.ts
@@ -0,0 +1,106 @@
+/**
+ * @plannotator/collab-agent — CLI entry point.
+ *
+ * Dispatches to a subcommand under `./subcommands/`. Each subcommand
+ * parses its own argv (via the shared helpers in `_lib.ts`),
+ * manages its own connection lifecycle, and returns an exit code.
+ *
+ * Usage:
+ *   bun run apps/collab-agent/index.ts <subcommand> --url <url> --user <name> --type <kind> [...]
+ *
+ * Subcommands:
+ *   join               connect and stay online with heartbeat presence
+ *   read-plan          print decrypted plan markdown (add --with-block-ids for block markers)
+ *   read-annotations   print current annotations as JSON
+ *   read-presence      print recent peer presence (not a roster)
+ *   comment            post a block-level comment annotation
+ *   demo               walk headings and leave comments at each
+ *
+ * Exit codes:
+ *   0  success
+ *   1  runtime error (connect timeout, server rejection, ...)
+ *   2  argument / usage error
+ */
+
+import { runJoin } from './subcommands/join';
+import { runReadPlan } from './subcommands/read-plan';
+import { runReadAnnotations } from './subcommands/read-annotations';
+import { runReadPresence } from './subcommands/read-presence';
+import { runComment } from './subcommands/comment';
+import { runDemo } from './subcommands/demo';
+import { UsageError } from './subcommands/_lib';
+
+const HELP = `plannotator collab-agent — join Live Rooms as an AI agent
+
+Usage:
+  bun run apps/collab-agent/index.ts <subcommand> [options]
+
+Subcommands:
+  join               connect and stay online with heartbeat presence
+  read-plan          print decrypted plan markdown
+                     (add --with-block-ids for block markers)
+  read-annotations   print current annotations as JSON
+  read-presence      print recent peer presence (not a participant roster)
+  comment            post a block-level comment annotation
+                     (--block <id> --text <body>, or --list-blocks
+                     to print available block ids + exit)
+  demo               walk heading blocks in order, anchor the cursor
+                     to each, and post a comment per heading
+                     (--duration <sec>, --comment-template <str>,
+                     --dry-run to skip posting)
+
+Common flags (every subcommand):
+  --url <url>        full room URL including #key=... fragment
+  --user <name>      lowercase alnum + dashes; becomes <user>-agent-<type>
+  --type <kind>      claude | codex | opencode | junie | other
+
+Examples:
+  bun run apps/collab-agent/index.ts read-plan \\
+    --url "http://localhost:8787/c/abc123#key=..." \\
+    --user alice --type claude
+
+  bun run apps/collab-agent/index.ts join \\
+    --url "https://room.plannotator.ai/c/xyz#key=..." \\
+    --user swift-falcon-tater --type codex
+`;
+
+type Subcommand = (argv: readonly string[]) => Promise<number>;
+
+const SUBCOMMANDS: Record<string, Subcommand> = {
+  join: runJoin,
+  'read-plan': runReadPlan,
+  'read-annotations': runReadAnnotations,
+  'read-presence': runReadPresence,
+  comment: runComment,
+  demo: runDemo,
+};
+
+async function main(argv: readonly string[]): Promise<number> {
+  const sub = argv[0];
+  if (!sub || sub === '--help' || sub === '-h') {
+    console.log(HELP);
+    return 0;
+  }
+
+  const runner = SUBCOMMANDS[sub];
+  if (!runner) {
+    console.error(`collab-agent: unknown subcommand "${sub}"`);
+    console.error('Run with --help for the subcommand list.');
+    return 2;
+  }
+
+  try {
+    return await runner(argv.slice(1));
+  } catch (err) {
+    if (err instanceof UsageError) {
+      console.error(`collab-agent: ${err.message}`);
+      console.error('Run with --help for usage.');
+      return 2;
+    }
+    console.error(`collab-agent: ${(err as Error).message ?? String(err)}`);
+    return 1;
+  }
+}
+
+const code = await main(process.argv.slice(2));
+process.exit(code);
diff --git a/apps/collab-agent/package.json b/apps/collab-agent/package.json
new file mode 100644
index 000000000..3e84a8603
--- /dev/null
+++ b/apps/collab-agent/package.json
@@ -0,0 +1,17 @@
+{
+  "name": "@plannotator/collab-agent",
+  "version": "0.1.0",
+  "private": true,
+  "type": "module",
+  "scripts": {
+    "dev": "bun run index.ts"
+  },
+  "dependencies": {
+    "@plannotator/shared": "workspace:*",
+    "@plannotator/ui": "workspace:*"
+  },
+  "devDependencies": {
+    "bun-types": "^1.3.11",
+    "typescript": "~5.8.2"
+  }
+}
diff --git a/apps/collab-agent/subcommands/_lib.test.ts b/apps/collab-agent/subcommands/_lib.test.ts
new file mode 100644
index 000000000..8ea02c48a
--- /dev/null
+++ b/apps/collab-agent/subcommands/_lib.test.ts
@@ -0,0 +1,35 @@
+import { describe, expect, test } from 'bun:test';
+import { parseCommonArgs, UsageError } from './_lib';
+
+describe('parseCommonArgs', () => {
+  // Regression: earlier the parser used the literal string 'true' as its
+  // boolean-flag sentinel, so a user flag value that happened to be the
+  // 4-character string 'true' (e.g. `--text true` as a comment body) got
+  // silently dropped during re-emit. Downstream `readStringFlag` then
+  // threw "--text requires a value" even though one was supplied. Pinning
+  // this so a future refactor can't quietly bring the collision back.
+  test('preserves the literal string "true" as a flag value', () => {
+    const result = parseCommonArgs([
+      '--url', 'https://example.com#key=abc',
+      '--user', 'alice',
+      '--type', 'claude',
+      '--text', 'true',
+    ]);
+    expect(result.rest).toEqual(['--text', 'true']);
+  });
+
+  test('treats --flag with no following value as a boolean (no re-emit value)', () => {
+    const result = parseCommonArgs([
+      '--url', 'https://example.com#key=abc',
+      '--user', 'alice',
+      '--type', 'claude',
+      '--dry-run',
+    ]);
+    expect(result.rest).toEqual(['--dry-run']);
+  });
+
+  test('rejects missing required --url', () => {
+    expect(() => parseCommonArgs(['--user', 'alice', '--type', 'claude']))
+      .toThrow(UsageError);
+  });
+});
diff --git a/apps/collab-agent/subcommands/_lib.ts b/apps/collab-agent/subcommands/_lib.ts
new file mode 100644
index 000000000..f4694e515
--- /dev/null
+++ b/apps/collab-agent/subcommands/_lib.ts
@@ -0,0 +1,276 @@
+/**
+ * Shared helpers for the agent subcommands: argv parsing of the
+ * common `--url`/`--user`/`--type` shape, connect + identity
+ * construction, and a one-shot cleanup-on-signal wiring.
+ *
+ * Each subcommand file owns its own top-level flow; this lib just
+ * dedupes the boilerplate that would otherwise repeat four times.
+ */
+
+import {
+  joinRoom,
+  type CollabRoomClient,
+} from '@plannotator/shared/collab/client';
+import type { PresenceState } from '@plannotator/shared/collab';
+import { hashNameToSwatch } from '@plannotator/ui/utils/presenceColor';
+import {
+  constructAgentIdentity,
+  isAgentType,
+  stripAdminFragment,
+  AGENT_TYPES,
+  type AgentType,
+} from '../identity';
+
+export interface CommonArgs {
+  url: string;
+  user: string;
+  type: AgentType;
+  /** Raw argv slice AFTER the subcommand name, for subcommand-specific flags. */
+  rest: string[];
+}
+
+/**
+ * Parse `--url`, `--user`, `--type` plus anything else. Throws a
+ * `UsageError` (caught by the dispatcher) on any missing or
+ * malformed required flag so error messages land in one place.
+ */
+export class UsageError extends Error {
+  constructor(message: string) {
+    super(message);
+    this.name = 'UsageError';
+  }
+}
+
+// Sentinel for boolean-style flags (no value token followed). Using a Symbol
+// instead of the literal string 'true' avoids a collision where a user passes
+// the literal word "true" as a flag value (e.g. `--text true`) — the old code
+// dropped that value during re-emit because it couldn't distinguish the
+// sentinel from a real argv token.
+const BOOL_FLAG = Symbol('boolFlag');
+type FlagValue = string | typeof BOOL_FLAG;
+
+export function parseCommonArgs(argv: readonly string[]): CommonArgs {
+  const flags = new Map<string, FlagValue>();
+  const rest: string[] = [];
+
+  for (let i = 0; i < argv.length; i++) {
+    const token = argv[i];
+    if (token.startsWith('--')) {
+      const key = token.slice(2);
+      const next = argv[i + 1];
+      if (next === undefined || next.startsWith('--')) {
+        flags.set(key, BOOL_FLAG);
+      } else {
+        flags.set(key, next);
+        i++;
+      }
+    } else {
+      rest.push(token);
+    }
+  }
+
+  const url = flags.get('url');
+  const user = flags.get('user');
+  const type = flags.get('type');
+
+  if (typeof url !== 'string') throw new UsageError('Missing --url');
+  if (typeof user !== 'string') throw new UsageError('Missing --user');
+  if (typeof type !== 'string') throw new UsageError(`Missing --type (one of ${AGENT_TYPES.join('|')})`);
+  if (!isAgentType(type)) {
+    throw new UsageError(`--type must be one of ${AGENT_TYPES.join('|')}; got "${type}"`);
+  }
+
+  // Consume the common flags from the flags-turned-rest reconstruction so
+  // subcommand-specific args can be read from `rest` as a plain
+  // --flag value stream. Simpler: re-emit the non-common flags.
+  const consumed = new Set(['url', 'user', 'type']);
+  const passthrough: string[] = [];
+  for (const [k, v] of flags) {
+    if (consumed.has(k)) continue;
+    passthrough.push(`--${k}`);
+    if (v !== BOOL_FLAG) passthrough.push(v);
+  }
+
+  return { url, user, type, rest: [...passthrough, ...rest] };
+}
+
+/**
+ * Read a string flag from an already-parsed `rest` stream. Returns
+ * undefined when absent. Throws UsageError when the flag is present
+ * but has no value (i.e. immediately followed by another `--flag`).
+ */
+export function readStringFlag(rest: readonly string[], name: string): string | undefined {
+  const idx = rest.indexOf(`--${name}`);
+  if (idx < 0) return undefined;
+  const next = rest[idx + 1];
+  if (next === undefined || next.startsWith('--')) {
+    throw new UsageError(`--${name} requires a value`);
+  }
+  return next;
+}
+
+export function readBoolFlag(rest: readonly string[], name: string): boolean {
+  return rest.includes(`--${name}`);
+}
+
+export function readNumberFlag(rest: readonly string[], name: string): number | undefined {
+  const raw = readStringFlag(rest, name);
+  if (raw === undefined) return undefined;
+  const n = Number(raw);
+  if (!Number.isFinite(n)) {
+    throw new UsageError(`--${name} must be a number; got "${raw}"`);
+  }
+  return n;
+}
+
+export interface AgentSession {
+  client: CollabRoomClient;
+  identity: string;
+  color: string;
+  /** Ready-to-send initial presence (null cursor). */
+  initialPresence: PresenceState;
+}
+
+/**
+ * Strip `#admin=` (warning to stderr), construct the agent identity,
+ * derive the identity-based color, connect via `joinRoom`, and return
+ * a session bag. Does NOT emit initial presence — callers choose
+ * whether to emit once (one-shot subcommands) or emit + heartbeat
+ * (`join` / `demo`).
+ */
+export async function openAgentSession(args: CommonArgs): Promise<AgentSession> {
+  const { url: rawUrl, stripped } = stripAdminFragment(args.url);
+  if (stripped) {
+    console.warn(
+      '[collab-agent] URL contained #admin=; stripped. ' +
+        'Agents do not run in admin mode in V1.',
+    );
+  }
+
+  const identity = constructAgentIdentity({ user: args.user, type: args.type });
+  const color = hashNameToSwatch(identity);
+
+  const client = await joinRoom({
+    url: rawUrl,
+    user: { id: identity, name: identity, color },
+    autoConnect: true,
+  });
+
+  const initialPresence: PresenceState = {
+    user: { id: identity, name: identity, color },
+    cursor: null,
+  };
+
+  return { client, identity, color, initialPresence };
+}
+
+/**
+ * Wait for a `snapshot` event (full initial snapshot delivered by
+ * the server after auth). After this resolves, `client.getState()`
+ * has planMarkdown + annotations populated. Times out at
+ * `timeoutMs` (default 10s) so a malformed room doesn't hang
+ * read-* subcommands forever.
+ */
+export function awaitInitialSnapshot(
+  client: CollabRoomClient,
+  timeoutMs = 10_000,
+): Promise<void> {
+  return new Promise<void>((resolve, reject) => {
+    const state = client.getState();
+    // Snapshot may already be present if joinRoom completed the
+    // handshake before we subscribed (race window is small but real).
+    if (state.planMarkdown.length > 0 || state.annotations.length > 0) {
+      resolve();
+      return;
+    }
+    const timer = setTimeout(() => {
+      off();
+      reject(new Error(`Timed out waiting for snapshot after ${timeoutMs}ms`));
+    }, timeoutMs);
+    const off = client.on('snapshot', () => {
+      clearTimeout(timer);
+      off();
+      resolve();
+    });
+  });
+}
+
+/**
+ * Resolve when `annotationId` appears in canonical state (server
+ * echoed the op back), reject when a mutation-scoped error arrives
+ * after the call site or on timeout. Use this to gate subcommand
+ * success on "the server accepted the op", not merely "we sent the
+ * bytes" (which is all `sendAnnotationAdd` resolves on — see the
+ * `Resolves when queued/sent to the server` comment in
+ * `packages/shared/collab/client-runtime/client.ts:493`).
+ *
+ * IMPORTANT: subscribe BEFORE calling `sendAnnotationAdd`. The
+ * state event for our echo can land faster than a macrotask, so
+ * a late subscriber will miss it. Canonical usage:
+ *
+ *     const echo = awaitAnnotationEcho(client, id);  // subscribe first
+ *     await client.sendAnnotationAdd([annotation]);
+ *     await echo;
+ *
+ * @param timeoutMs  defaults to 10s; matches the admin-command
+ *                   timeout the server honours so we wait at
+ *                   least as long as any valid server response
+ *                   could take.
+ */
+export function awaitAnnotationEcho(
+  client: CollabRoomClient,
+  annotationId: string,
+  timeoutMs = 10_000,
+): Promise<void> {
+  return new Promise<void>((resolve, reject) => {
+    const baselineErrorId = client.getState().lastErrorId;
+    const timer = setTimeout(() => {
+      off();
+      reject(new Error(`Timed out waiting for echo of ${annotationId} after ${timeoutMs}ms`));
+    }, timeoutMs);
+    const off = client.on('state', state => {
+      if (state.annotations.some(a => a.id === annotationId)) {
+        clearTimeout(timer);
+        off();
+        resolve();
+        return;
+      }
+      // Only mutation-scoped errors apply here; admin / event /
+      // presence / snapshot / join errors are unrelated to our
+      // pending op. A fresh mutation error (id advanced past the
+      // baseline) is the rejection signal from the server.
+      if (
+        state.lastErrorId > baselineErrorId &&
+        state.lastError?.scope === 'mutation'
+      ) {
+        clearTimeout(timer);
+        off();
+        reject(new Error(`${state.lastError.code}: ${state.lastError.message}`));
+      }
+    });
+  });
+}
+
+/**
+ * Wire SIGINT + SIGTERM to a graceful `client.disconnect()`. Returns
+ * a function that removes the handlers — call it after disconnect
+ * completes in the non-signal path so we don't accumulate listeners
+ * across subcommand invocations in the same process.
+ */
+export function wireSignalShutdown(client: CollabRoomClient): () => void {
+  const onSignal = () => {
+    try {
+      client.disconnect('user_interrupt');
+    } catch {
+      // disconnect is idempotent; swallow double-call errors
+    }
+    // Give the socket a beat to send a close frame before we exit.
+    setTimeout(() => process.exit(0), 100);
+  };
+  process.on('SIGINT', onSignal);
+  process.on('SIGTERM', onSignal);
+  return () => {
+    process.off('SIGINT', onSignal);
+    process.off('SIGTERM', onSignal);
+  };
+}
diff --git a/apps/collab-agent/subcommands/comment.ts b/apps/collab-agent/subcommands/comment.ts
new file mode 100644
index 000000000..6eeba02b3
--- /dev/null
+++ b/apps/collab-agent/subcommands/comment.ts
@@ -0,0 +1,129 @@
+/**
+ * `comment` subcommand — post a block-level COMMENT annotation.
+ *
+ * Arg shape:
+ *   --block <blockId>  target block (from `read-plan --with-block-ids`)
+ *   --text  <body>     comment body
+ *   --list-blocks      print the block id → content map as JSON and
+ *                      exit without posting (convenience for agents
+ *                      that want to pick a block without a separate
+ *                      `read-plan` call)
+ *
+ * Block-level targeting by design: the annotation spans the entire
+ * block, so the "selection accuracy" issue that plagues
+ * `/api/external-annotations` inline-text matching doesn't apply.
+ * V1 agents do NOT attempt sub-range targeting.
+ *
+ * Exit codes:
+ *   0  comment echoed back from server
+ *   1  timeout, server rejection, or missing block
+ *   2  argv / usage error (propagated from the dispatcher)
+ */
+
+import type { RoomAnnotation } from '@plannotator/shared/collab';
+import { parseMarkdownToBlocks } from '@plannotator/ui/utils/parser';
+import {
+  awaitAnnotationEcho,
+  awaitInitialSnapshot,
+  openAgentSession,
+  parseCommonArgs,
+  readBoolFlag,
+  readStringFlag,
+  UsageError,
+} from './_lib';
+
+const ECHO_TIMEOUT_MS = 10_000;
+
+export async function runComment(argv: readonly string[]): Promise<number> {
+  const args = parseCommonArgs(argv);
+  const listOnly = readBoolFlag(args.rest, 'list-blocks');
+  const blockId = readStringFlag(args.rest, 'block');
+  const text = readStringFlag(args.rest, 'text');
+
+  if (!listOnly) {
+    if (!blockId) throw new UsageError('comment: --block is required');
+    if (!text) throw new UsageError('comment: --text is required');
+  }
+
+  const session = await openAgentSession(args);
+  const { client, identity } = session;
+
+  try {
+    await awaitInitialSnapshot(client);
+  } catch (err) {
+    console.error(`[collab-agent] ${(err as Error).message}`);
+    client.disconnect('snapshot_timeout');
+    return 1;
+  }
+
+  const snapshot = client.getState();
+  const blocks = parseMarkdownToBlocks(snapshot.planMarkdown);
+
+  if (listOnly) {
+    const map = blocks.map(b => ({ id: b.id, type: b.type, content: b.content }));
+    process.stdout.write(JSON.stringify(map, null, 2));
+    process.stdout.write('\n');
+    client.disconnect('list_done');
+    await new Promise<void>(r => setTimeout(r, 100));
+    return 0;
+  }
+
+  // blockId + text are non-null here (enforced above); narrow for TS.
+  if (!blockId || !text) {
+    // Defensive — should never fire because we validated above.
+    client.disconnect('internal_error');
+    return 1;
+  }
+
+  const block = blocks.find(b => b.id === blockId);
+  if (!block) {
+    console.error(
+      `[collab-agent] unknown --block "${blockId}". Run with --list-blocks to see available ids.`,
+    );
+    client.disconnect('unknown_block');
+    return 1;
+  }
+
+  await client.sendPresence(session.initialPresence);
+
+  // V1 room annotation ids are opaque strings; the `ann-agent-`
+  // prefix just makes agent-posted rows identifiable in logs /
+  // exports without affecting server behavior.
+  const annotationId = `ann-agent-${crypto.randomUUID()}`;
+  const annotation: RoomAnnotation = {
+    id: annotationId,
+    blockId: block.id,
+    // Block-level target: the whole block is the original text.
+    startOffset: 0,
+    endOffset: block.content.length,
+    type: 'COMMENT',
+    text,
+    originalText: block.content,
+    createdA: Date.now(),
+    author: identity,
+  };
+
+  // Subscribe BEFORE sending — shared helper awaits echo in
+  // canonical state, rejecting on mutation-scope errors or timeout.
+  const echo = awaitAnnotationEcho(client, annotationId, ECHO_TIMEOUT_MS);
+  await client.sendAnnotationAdd([annotation]);
+
+  try {
+    await echo;
+  } catch (err) {
+    console.error(`[collab-agent] comment rejected: ${(err as Error).message}`);
+    client.disconnect('mutation_failed');
+    return 1;
+  }
+
+  // Success — print the echoed annotation so invoking code can
+  // parse the id and attribution.
+  const finalState = client.getState();
+  const echoed = finalState.annotations.find(a => a.id === annotationId);
+  process.stdout.write(JSON.stringify(echoed ?? annotation, null, 2));
+  process.stdout.write('\n');
+
+  client.disconnect('comment_done');
+  await new Promise<void>(r => setTimeout(r, 100));
+  return 0;
+}
diff --git a/apps/collab-agent/subcommands/demo.ts b/apps/collab-agent/subcommands/demo.ts
new file mode 100644
index 000000000..db8bb9250
--- /dev/null
+++ b/apps/collab-agent/subcommands/demo.ts
@@ -0,0 +1,230 @@
+/**
+ * `demo` subcommand — walk the plan's heading blocks in order,
+ * anchor the agent's cursor to each heading, pause a human-feeling
+ * few seconds, and post a block-level comment at each stop.
+ *
+ * Intended for showcasing "an agent is participating in this room"
+ * to an observer watching the browser tab. Not a production agent
+ * behavior — real work goes through `comment` with explicit args.
+ *
+ * Cursor coordinates use `coordinateSpace: 'block'` with the target
+ * heading's block id so observers' `RemoteCursorLayer` anchors the
+ * cursor to the rendered block rect — robust to viewport size and
+ * consistent across peers.
+ *
+ * Args (in addition to the common --url / --user / --type):
+ *   --duration <sec>         total wall time; pauses are scaled so
+ *                            the demo fits (default 120)
+ *   --comment-template <str> comment body per heading; `{heading}`
+ *                            is replaced with the heading's text
+ *                            content, `{level}` with the heading
+ *                            level number (default:
+ *                            "[demo] reviewing {heading}")
+ *   --dry-run                move the cursor + heartbeat presence
+ *                            but DO NOT post comments
+ */
+
+import type { PresenceState, RoomAnnotation } from '@plannotator/shared/collab';
+import { parseMarkdownToBlocks } from '@plannotator/ui/utils/parser';
+import { startHeartbeat } from '../heartbeat';
+import {
+  awaitAnnotationEcho,
+  awaitInitialSnapshot,
+  openAgentSession,
+  parseCommonArgs,
+  readBoolFlag,
+  readNumberFlag,
+  readStringFlag,
+  UsageError,
+  wireSignalShutdown,
+} from './_lib';
+
+const DEFAULT_DURATION_SEC = 120;
+const DEFAULT_COMMENT_TEMPLATE = '[demo] reviewing {heading}';
+const MIN_PAUSE_MS = 3_000;
+const MAX_PAUSE_MS = 6_000;
+// Per-heading echo wait. Shorter than the 10s default in the
+// comment subcommand because demo is time-boxed; if the server is
+// healthy an echo arrives in <100ms, and a full 10s wait on every
+// heading would dominate the demo's wall time when something is
+// genuinely wrong (e.g. the room was deleted).
+const DEMO_ECHO_TIMEOUT_MS = 5_000;
+
+export async function runDemo(argv: readonly string[]): Promise<number> {
+  const args = parseCommonArgs(argv);
+  const durationSec = readNumberFlag(args.rest, 'duration') ?? DEFAULT_DURATION_SEC;
+  const template = readStringFlag(args.rest, 'comment-template') ?? DEFAULT_COMMENT_TEMPLATE;
+  const dryRun = readBoolFlag(args.rest, 'dry-run');
+
+  if (durationSec <= 0) {
+    throw new UsageError(`--duration must be positive; got ${durationSec}`);
+  }
+
+  const session = await openAgentSession(args);
+  const { client, identity, color } = session;
+  const unwireSignals = wireSignalShutdown(client);
+
+  try {
+    await awaitInitialSnapshot(client);
+  } catch (err) {
+    console.error(`[collab-agent] ${(err as Error).message}`);
+    client.disconnect('snapshot_timeout');
+    unwireSignals();
+    return 1;
+  }
+
+  const snapshot = client.getState();
+  const blocks = parseMarkdownToBlocks(snapshot.planMarkdown);
+  const headings = blocks.filter(b => b.type === 'heading');
+
+  if (headings.length === 0) {
+    console.error(
+      '[collab-agent] demo: no heading blocks in this plan; nothing to walk',
+    );
+    client.disconnect('no_headings');
+    unwireSignals();
+    return 1;
+  }
+
+  // Distribute the duration across headings. Clamp to a sensible
+  // range so a very long duration with one heading doesn't camp
+  // forever on a single block, and a very short duration with many
+  // headings doesn't turn into a flash-card rotation.
+  const perHeadingMs = Math.max(
+    MIN_PAUSE_MS,
+    Math.min(MAX_PAUSE_MS, Math.floor((durationSec * 1000) / headings.length)),
+  );
+
+  await client.sendPresence(session.initialPresence);
+  const heartbeat = startHeartbeat(client, session.initialPresence);
+
+  console.log(
+    JSON.stringify({
+      event: 'demo.start',
+      identity,
+      headings: headings.length,
+      perHeadingMs,
+      dryRun,
+    }),
+  );
+
+  interface CommentFailure {
+    blockId: string;
+    reason: string;
+  }
+  const failures: CommentFailure[] = [];
+
+  try {
+    for (const heading of headings) {
+      // Anchor cursor to the heading block. Observer's
+      // RemoteCursorLayer resolves block-space cursors against its
+      // own rendered block rect, so the agent's cursor label lands
+      // on the heading regardless of the observer's viewport size.
+      //
+      // x/y are randomized per visit so that multiple agents in
+      // the same room don't stack their cursor labels at the same
+      // pixel when they both anchor to a heading. Range 20–200 px
+      // horizontally covers most block widths without often
+      // spilling past the right edge (and RemoteCursorLayer clamps
+      // or shows an edge indicator if it does). 0–24 px vertically
+      // keeps the cursor near the heading text baseline without
+      // wandering into the next block.
+      const presence: PresenceState = {
+        user: { id: identity, name: identity, color },
+        cursor: {
+          coordinateSpace: 'block',
+          blockId: heading.id,
+          x: Math.floor(20 + Math.random() * 180),
+          y: Math.floor(Math.random() * 24),
+        },
+      };
+      heartbeat.update(presence);
+      await client.sendPresence(presence);
+
+      console.log(
+        JSON.stringify({
+          event: 'demo.visit',
+          blockId: heading.id,
+          level: heading.level ?? 0,
+          content: heading.content,
+        }),
+      );
+
+      // Natural pause before posting. Observer has time to notice
+      // the cursor move, then the comment appears at the end of
+      // the pause window plus the echo round-trip (typically tens
+      // of ms on a healthy server).
+      await new Promise<void>(r => setTimeout(r, perHeadingMs));
+
+      if (!dryRun) {
+        const annotationId = `ann-agent-${crypto.randomUUID()}`;
+        const body = template
+          .replace('{heading}', heading.content)
+          .replace('{level}', String(heading.level ?? 0));
+        const annotation: RoomAnnotation = {
+          id: annotationId,
+          blockId: heading.id,
+          startOffset: 0,
+          endOffset: heading.content.length,
+          type: 'COMMENT',
+          text: body,
+          originalText: heading.content,
+          createdA: Date.now(),
+          author: identity,
+        };
+
+        // Subscribe before sending; await echo. Confirming per
+        // heading means demo's exit code reflects whether every
+        // comment actually posted, not just "we sent the bytes".
+        // A deleted room, disconnect, or server-side rejection
+        // arrives as a rejection here — we record the failure,
+        // log it, and keep walking so the observer still sees
+        // the tour complete. Final exit code reflects whether
+        // ANY comment failed.
+        const echo = awaitAnnotationEcho(client, annotationId, DEMO_ECHO_TIMEOUT_MS);
+        try {
+          await client.sendAnnotationAdd([annotation]);
+          await echo;
+          console.log(
+            JSON.stringify({ event: 'demo.comment', blockId: heading.id, annotationId }),
+          );
+        } catch (err) {
+          const reason = (err as Error).message;
+          failures.push({ blockId: heading.id, reason });
+          console.error(
+            JSON.stringify({ event: 'demo.comment.failed', blockId: heading.id, reason }),
+          );
+        }
+      }
+    }
+  } catch (err) {
+    console.error(`[collab-agent] demo error: ${(err as Error).message}`);
+    heartbeat.stop();
+    client.disconnect('demo_error');
+    unwireSignals();
+    return 1;
+  }
+
+  // Gentle grace period so the final comment has time to echo
+  // before we tear the socket down. The heartbeat keeps the agent
+  // visible during this window.
+  await new Promise<void>(r => setTimeout(r, 1_500));
+
+  heartbeat.stop();
+  client.disconnect('demo_done');
+  unwireSignals();
+  await new Promise<void>(r => setTimeout(r, 100));
+
+  console.log(
+    JSON.stringify({
+      event: 'demo.end',
+      headings: headings.length,
+      failed: failures.length,
+      failures,
+    }),
+  );
+  // Non-zero exit when any comment failed to echo, so an invoking
+  // script can distinguish "cursor walk visible but no comments
+  // landed" from a clean run.
+  return failures.length > 0 ? 1 : 0;
+}
diff --git a/apps/collab-agent/subcommands/join.ts b/apps/collab-agent/subcommands/join.ts
new file mode 100644
index 000000000..334adc817
--- /dev/null
+++ b/apps/collab-agent/subcommands/join.ts
@@ -0,0 +1,104 @@
+/**
+ * `join` subcommand — connect to the room, emit an initial presence
+ * payload, start a 10 s heartbeat, and stream interesting events to
+ * stdout until the process receives SIGINT.
+ *
+ * Heartbeat is what keeps the agent visible on observers while it's
+ * idle. Without it, the V1 protocol has no participant roster; the
+ * observer's 30 s presence TTL would sweep us away.
+ */
+
+import { startHeartbeat } from '../heartbeat';
+import {
+  awaitInitialSnapshot,
+  openAgentSession,
+  parseCommonArgs,
+  wireSignalShutdown,
+  type CommonArgs,
+} from './_lib';
+
+export async function runJoin(argv: readonly string[]): Promise<number> {
+  const args = parseCommonArgs(argv);
+  return runJoinWithArgs(args);
+}
+
+async function runJoinWithArgs(args: CommonArgs): Promise<number> {
+  const session = await openAgentSession(args);
+  const { client, identity } = session;
+
+  const unwireSignals = wireSignalShutdown(client);
+
+  try {
+    await awaitInitialSnapshot(client);
+  } catch (err) {
+    console.error(`[collab-agent] ${(err as Error).message}`);
+    client.disconnect('snapshot_timeout');
+    unwireSignals();
+    return 1;
+  }
+
+  // Announce ourselves visually. `sendPresence` is lossy but the
+  // initial emit is worth surfacing if it fails — that signals a
+  // protocol or key-derivation issue the user should know about.
+  await client.sendPresence(session.initialPresence);
+
+  const heartbeat = startHeartbeat(client, session.initialPresence);
+
+  const state = client.getState();
+  console.log(
+    JSON.stringify({
+      event: 'joined',
+      identity,
+      roomId: state.roomId,
+      clientId: state.clientId,
+      planBytes: state.planMarkdown.length,
+      annotationCount: state.annotations.length,
+    }),
+  );
+
+  // Stream events to stdout so an invoking agent can react. Keep it
+  // light — only events a consumer plausibly cares about. Each line
+  // is a complete JSON object (NDJSON), easy to parse line-by-line.
+  client.on('event', (serverEvent) => {
+    console.log(JSON.stringify({ event: 'room.event', data: serverEvent }));
+  });
+  client.on('presence', (entry) => {
+    // Suppress our own echoed presence (never broadcast by server,
+    // but belt-and-braces against future protocol changes).
+    if (entry.clientId === client.getState().clientId) return;
+    console.log(
+      JSON.stringify({
+        event: 'room.presence',
+        clientId: entry.clientId,
+        user: entry.presence.user,
+        cursor: entry.presence.cursor,
+      }),
+    );
+  });
+  // Watch the `state` event for roomUnavailable — a single terminal
+  // flag replaces the old 'deleted' / 'expired' status values. Fires
+  // once when the server closes us with "Room unavailable" (admin
+  // delete, auto-expiry, or an unknown-room socket).
+  let alreadyUnavailable = false;
+  client.on('state', (state) => {
+    if (!alreadyUnavailable && state.roomUnavailable) {
+      alreadyUnavailable = true;
+      console.log(JSON.stringify({ event: 'room.unavailable' }));
+      heartbeat.stop();
+      client.disconnect('room_unavailable');
+      unwireSignals();
+      process.exit(0);
+    }
+  });
+  client.on('error', (err) => {
+    console.error(JSON.stringify({ event: 'room.error', ...err }));
+  });
+
+  // Keep the event loop alive. The socket + heartbeat timer already
+  // hold refs, but an extra long-lived timer is cheap belt-and-braces
+  // against runtimes that would otherwise exit early.
+  setInterval(() => {}, 1 << 30);
+
+  // Never resolves under normal operation — signal handlers exit.
+  return await new Promise<number>(() => {});
+}
diff --git a/apps/collab-agent/subcommands/read-annotations.ts b/apps/collab-agent/subcommands/read-annotations.ts
new file mode 100644
index 000000000..c756d9319
--- /dev/null
+++ b/apps/collab-agent/subcommands/read-annotations.ts
@@ -0,0 +1,33 @@
+/**
+ * `read-annotations` subcommand — connect, print the current
+ * annotations list as JSON, disconnect. Each annotation is printed
+ * as the raw RoomAnnotation shape from the protocol; consumers map
+ * fields themselves.
+ */
+
+import { awaitInitialSnapshot, openAgentSession, parseCommonArgs } from './_lib';
+
+export async function runReadAnnotations(argv: readonly string[]): Promise<number> {
+  const args = parseCommonArgs(argv);
+
+  const session = await openAgentSession(args);
+  const { client } = session;
+
+  try {
+    await awaitInitialSnapshot(client);
+  } catch (err) {
+    console.error(`[collab-agent] ${(err as Error).message}`);
+    client.disconnect('snapshot_timeout');
+    return 1;
+  }
+
+  await client.sendPresence(session.initialPresence);
+
+  const state = client.getState();
+  process.stdout.write(JSON.stringify(state.annotations, null, 2));
+  process.stdout.write('\n');
+
+  client.disconnect('read_done');
+  await new Promise<void>((r) => setTimeout(r, 100));
+  return 0;
+}
diff --git a/apps/collab-agent/subcommands/read-plan.ts b/apps/collab-agent/subcommands/read-plan.ts
new file mode 100644
index 000000000..e5d90c791
--- /dev/null
+++ b/apps/collab-agent/subcommands/read-plan.ts
@@ -0,0 +1,56 @@
+/**
+ * `read-plan` subcommand — connect, briefly flash our presence so
+ * observers see us, print the decrypted plan markdown, disconnect.
+ *
+ * With `--with-block-ids`, prefix each block with `[block:<id>]\n`
+ * so agents that need to target comments can pair the source
+ * markdown with the block ids the browser derives from it. The
+ * block parsing is shared with the browser renderer (identical
+ * `parseMarkdownToBlocks` call) so ids round-trip.
+ */
+
+import { parseMarkdownToBlocks } from '@plannotator/ui/utils/parser';
+import {
+  awaitInitialSnapshot,
+  openAgentSession,
+  parseCommonArgs,
+  readBoolFlag,
+} from './_lib';
+
+export async function runReadPlan(argv: readonly string[]): Promise<number> {
+  const args = parseCommonArgs(argv);
+  const withBlockIds = readBoolFlag(args.rest, 'with-block-ids');
+
+  const session = await openAgentSession(args);
+  const { client } = session;
+
+  try {
+    await awaitInitialSnapshot(client);
+  } catch (err) {
+    console.error(`[collab-agent] ${(err as Error).message}`);
+    client.disconnect('snapshot_timeout');
+    return 1;
+  }
+
+  // Emit presence once so an observer sees the agent flash during
+  // the read. We don't heartbeat — the subcommand exits shortly.
+  await client.sendPresence(session.initialPresence);
+
+  const state = client.getState();
+  if (!withBlockIds) {
+    process.stdout.write(state.planMarkdown);
+    if (!state.planMarkdown.endsWith('\n')) process.stdout.write('\n');
+  } else {
+    const blocks = parseMarkdownToBlocks(state.planMarkdown);
+    for (const block of blocks) {
+      process.stdout.write(`[block:${block.id}] `);
+      process.stdout.write(block.content);
+      process.stdout.write('\n');
+    }
+  }
+
+  client.disconnect('read_done');
+  // Give the socket a beat to send close frame.
+  await new Promise<void>((r) => setTimeout(r, 100));
+  return 0;
+}
diff --git a/apps/collab-agent/subcommands/read-presence.ts b/apps/collab-agent/subcommands/read-presence.ts
new file mode 100644
index 000000000..f9881dff5
--- /dev/null
+++ b/apps/collab-agent/subcommands/read-presence.ts
@@ -0,0 +1,51 @@
+/**
+ * `read-presence` subcommand — connect, emit our presence once,
+ * wait 2 s for peers to emit, print the remote presence snapshot,
+ * disconnect.
+ *
+ * Output includes a banner clarifying that this is *recent
+ * presence*, not a participant roster. The V1 protocol has no
+ * roster broadcast; users who are connected but haven't emitted
+ * presence within the TTL will not appear. Agents trusting the
+ * output as a full roster would get wrong answers.
+ */
+
+import { awaitInitialSnapshot, openAgentSession, parseCommonArgs, readNumberFlag } from './_lib';
+
+const DEFAULT_SETTLE_MS = 2_000;
+
+export async function runReadPresence(argv: readonly string[]): Promise<number> {
+  const args = parseCommonArgs(argv);
+  const settleSec = readNumberFlag(args.rest, 'settle');
+  const settleMs = settleSec !== undefined ? Math.max(0, settleSec) * 1000 : DEFAULT_SETTLE_MS;
+
+  const session = await openAgentSession(args);
+  const { client } = session;
+
+  try {
+    await awaitInitialSnapshot(client);
+  } catch (err) {
+    console.error(`[collab-agent] ${(err as Error).message}`);
+    client.disconnect('snapshot_timeout');
+    return 1;
+  }
+
+  await client.sendPresence(session.initialPresence);
+
+  // Let inbound presence settle. Observers emit on mouse move, so
+  // in an idle room we expect zero inbound — that's the honest
+  // answer, not a bug.
+  await new Promise<void>((r) => setTimeout(r, settleMs));
+
+  const state = client.getState();
+  process.stderr.write(
+    '[collab-agent] note: this is RECENT PRESENCE, not a participant roster. ' +
+      'Connected-but-idle peers (no cursor move in the last 30s) will NOT appear.\n',
+  );
+  process.stdout.write(JSON.stringify(state.remotePresence, null, 2));
+  process.stdout.write('\n');
+
+  client.disconnect('read_done');
+  await new Promise<void>((r) => setTimeout(r, 100));
+  return 0;
+}
diff --git a/apps/collab-agent/tsconfig.json b/apps/collab-agent/tsconfig.json
new file mode 100644
index 000000000..2b6519a8c
--- /dev/null
+++ b/apps/collab-agent/tsconfig.json
@@ -0,0 +1,14 @@
+{
+  "compilerOptions": {
+    "target": "ES2022",
+    "module": "ESNext",
+    "moduleResolution": "bundler",
+    "strict": true,
+    "skipLibCheck": true,
+    "noEmit": true,
+    "allowImportingTsExtensions": true,
+    "isolatedModules": true,
+    "types": ["bun-types"]
+  },
+  "exclude": ["**/*.test.ts"]
+}
diff --git a/apps/hook/public/favicon.svg b/apps/hook/public/favicon.svg
new file mode 100644
index 000000000..070e83e2e
--- /dev/null
+++ b/apps/hook/public/favicon.svg
@@ -0,0 +1,5 @@
+<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 64 64">
+  <rect width="64" height="64" rx="14" fill="#070b14"/>
+  <rect x="12" y="28" width="40" height="14" rx="3" fill="#E0BA55" opacity="0.35"/>
+  <text x="32" y="46" text-anchor="middle" font-family="Inter,system-ui,sans-serif" font-weight="800" font-size="42" fill="white">P</text>
+</svg>
diff --git a/apps/hook/tsconfig.json b/apps/hook/tsconfig.json
index 93ef3e28b..1b3c3a05f 100644
--- a/apps/hook/tsconfig.json
+++ b/apps/hook/tsconfig.json
@@ -21,7 +21,8 @@
     "paths": {
       "@/*": ["./*"],
       "@plannotator/ui/*": ["../../packages/ui/*"],
-      "@plannotator/editor": ["../../packages/editor/App.tsx"],
+      "@plannotator/editor": ["../../packages/editor/AppRoot.tsx"],
+      "@plannotator/editor/App": ["../../packages/editor/App.tsx"],
       "@plannotator/editor/*": ["../../packages/editor/*"]
     },
     "allowImportingTsExtensions": true,
diff --git a/apps/hook/vite.config.ts b/apps/hook/vite.config.ts
index f9bcbb2ec..2ffc5c3b9 100644
--- a/apps/hook/vite.config.ts
+++ b/apps/hook/vite.config.ts
@@ -21,7 +21,8 @@ export default defineConfig({
       '@plannotator/shared': path.resolve(__dirname, '../../packages/shared'),
       '@plannotator/ui': path.resolve(__dirname, '../../packages/ui'),
       '@plannotator/editor/styles': path.resolve(__dirname, '../../packages/editor/index.css'),
-      '@plannotator/editor': path.resolve(__dirname, '../../packages/editor/App.tsx'),
+      '@plannotator/editor/App': path.resolve(__dirname, '../../packages/editor/App.tsx'),
+      '@plannotator/editor': path.resolve(__dirname, '../../packages/editor/AppRoot.tsx'),
     }
   },
   build: {
diff --git a/apps/marketing/public/assets/architecture/shared-rooms.svg b/apps/marketing/public/assets/architecture/shared-rooms.svg
new file mode 100644
index 000000000..7cf2cbfe2
--- /dev/null
+++ b/apps/marketing/public/assets/architecture/shared-rooms.svg
@@ -0,0 +1,72 @@
+<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 680 770" font-family="system-ui, -apple-system, sans-serif">
+  <defs>
+    <marker id="a" viewBox="0 0 10 10" refX="10" refY="5" markerWidth="8" markerHeight="8" orient="auto-start-reverse">
+      <path d="M 0 0 L 10 5 L 0 10 z" fill="context-stroke"/>
+    </marker>
+  </defs>
+
+  <!-- Client tier container -->
+  <rect x="30" y="20" width="620" height="225" rx="6" fill="#faf5ff" stroke="#9333ea" stroke-width="1"/>
+  <text x="55" y="48" font-size="14" font-weight="500" fill="#6b21a8">Client tier — secrets never leave</text>
+
+  <rect x="55" y="65" width="250" height="56" rx="6" fill="#f3e8ff" stroke="#9333ea" stroke-width="1"/>
+  <text x="67" y="88" font-size="14" font-weight="500" fill="#6b21a8">Browser editor</text>
+  <text x="67" y="106" font-size="12" fill="#9333ea">React SPA · /c/:roomId</text>
+
+  <rect x="365" y="65" width="250" height="56" rx="6" fill="#f3e8ff" stroke="#9333ea" stroke-width="1"/>
+  <text x="377" y="88" font-size="14" font-weight="500" fill="#6b21a8">Your agent</text>
+  <text x="377" y="106" font-size="12" fill="#9333ea">CLI peer · same encryption</text>
+
+  <rect x="55" y="145" width="280" height="56" rx="6" fill="#f3e8ff" stroke="#9333ea" stroke-width="1"/>
+  <text x="67" y="168" font-size="14" font-weight="500" fill="#6b21a8">HKDF key derivation</text>
+  <text x="67" y="186" font-size="12" fill="#9333ea">roomSecret → auth · event · presence</text>
+
+  <rect x="395" y="145" width="230" height="56" rx="6" fill="#f3e8ff" stroke="#9333ea" stroke-width="1"/>
+  <text x="407" y="168" font-size="14" font-weight="500" fill="#6b21a8">AES-256-GCM</text>
+  <text x="407" y="186" font-size="12" fill="#9333ea">Encrypt + decrypt locally</text>
+
+  <!-- Trust boundary -->
+  <line x1="30" y1="282" x2="650" y2="282" stroke="#9ca3af" stroke-width="1.5" stroke-dasharray="8 4"/>
+
+  <!-- Arrows through boundary -->
+  <line x1="200" y1="255" x2="200" y2="330" stroke="#a855f7" stroke-width="0.5" marker-end="url(#a)"/>
+  <line x1="480" y1="330" x2="480" y2="255" stroke="#14b8a6" stroke-width="0.5" marker-end="url(#a)"/>
+
+  <!-- Boundary labels -->
+  <text x="340" y="268" font-size="14" font-weight="500" fill="#4b5563" text-anchor="middle">Zero-knowledge boundary</text>
+  <text x="340" y="300" font-size="12" fill="#6b7280" text-anchor="middle">Only ciphertext + HMAC proofs cross</text>
+  <text x="190" y="295" font-size="12" fill="#7e22ce" text-anchor="end">send</text>
+  <text x="490" y="295" font-size="12" fill="#0f766e">relay</text>
+
+  <!-- Cloudflare container -->
+  <rect x="30" y="340" width="620" height="390" rx="6" fill="#f0fdfa" stroke="#0d9488" stroke-width="1"/>
+  <text x="55" y="368" font-size="14" font-weight="500" fill="#115e59">room.plannotator.ai | Cloudflare — zero knowledge</text>
+
+  <rect x="55" y="385" width="575" height="56" rx="6" fill="#ccfbf1" stroke="#0d9488" stroke-width="1"/>
+  <text x="67" y="408" font-size="14" font-weight="500" fill="#115e59">Worker</text>
+  <text x="67" y="426" font-size="12" fill="#0d9488">Validate roomId · serve SPA shell</text>
+
+  <!-- Worker → DO arrow -->
+  <line x1="340" y1="451" x2="340" y2="475" stroke="#9ca3af" stroke-width="0.5" marker-end="url(#a)"/>
+  <text x="352" y="467" font-size="12" fill="#6b7280">route</text>
+
+  <!-- Durable Object container -->
+  <rect x="55" y="485" width="575" height="225" rx="6" fill="#ccfbf1" stroke="#0d9488" stroke-width="1"/>
+  <text x="80" y="513" font-size="14" font-weight="500" fill="#0f766e">Durable Object — room engine</text>
+
+  <rect x="80" y="530" width="245" height="56" rx="6" fill="#99f6e4" stroke="#0d9488" stroke-width="1"/>
+  <text x="92" y="553" font-size="14" font-weight="500" fill="#115e59">Event sequencer</text>
+  <text x="92" y="571" font-size="12" fill="#0d9488">Atomic seq + store</text>
+
+  <rect x="385" y="530" width="225" height="56" rx="6" fill="#99f6e4" stroke="#0d9488" stroke-width="1"/>
+  <text x="397" y="553" font-size="14" font-weight="500" fill="#115e59">WebSocket hub</text>
+  <text x="397" y="571" font-size="12" fill="#0d9488">Broadcast to all peers</text>
+
+  <!-- Sequencer → SQLite arrow -->
+  <line x1="200" y1="596" x2="200" y2="620" stroke="#9ca3af" stroke-width="0.5" marker-end="url(#a)"/>
+  <text x="212" y="613" font-size="12" fill="#6b7280">persist</text>
+
+  <rect x="80" y="630" width="530" height="56" rx="6" fill="#99f6e4" stroke="#0d9488" stroke-width="1"/>
+  <text x="92" y="653" font-size="14" font-weight="500" fill="#115e59">SQLite storage</text>
+  <text x="92" y="671" font-size="12" fill="#0d9488">Ciphertext blobs · verifiers · seq numbers</text>
+</svg>
diff --git a/apps/marketing/src/content/docs/architecture/shared-rooms.md b/apps/marketing/src/content/docs/architecture/shared-rooms.md
new file mode 100644
index 000000000..e5411a105
--- /dev/null
+++ b/apps/marketing/src/content/docs/architecture/shared-rooms.md
@@ -0,0 +1,52 @@
+---
+title: "Shared Rooms"
+description: "How Plannotator's live collaboration rooms work, including end-to-end encryption and zero-knowledge architecture."
+sidebar:
+  order: 50
+section: "Architecture"
+---
+
+# Shared rooms
+
+Shared rooms let multiple people review a plan together in real time. Annotations, cursors, and presence sync across all participants. The room server never sees your content.
+
+## Zero-knowledge design
+
+All plan content is encrypted on your device before it leaves the browser. The server stores and relays ciphertext only. It cannot read your plan, your annotations, or your cursor position.
+
+When you create a room, the browser generates a random **room secret** and derives three encryption keys from it using HKDF:
+
+- **Auth key** for the WebSocket handshake proof
+- **Event key** for encrypting annotations (AES-256-GCM)
+- **Presence key** for encrypting cursor and identity data (AES-256-GCM)
+
+The room secret lives in the URL fragment (`#key=...`), which browsers never send to the server. Only people who have the link can decrypt the room's content.
+
+## How it works
+
+![Shared rooms architecture](/assets/architecture/shared-rooms.svg)
+
+When a participant sends an annotation, it is encrypted locally with the shared event key, sent over a WebSocket as ciphertext, sequenced by the Durable Object, and broadcast to all other connected clients. Each client decrypts the payload locally using the same event key derived from the shared room secret.
+
+The server assigns a monotonic sequence number to each event and stores the ciphertext in SQLite. Clients that reconnect replay from their last acknowledged sequence number, so no events are lost.
+
+## What the server stores
+
+| Stored on server | Never leaves your browser |
+|---|---|
+| Room ID, client IDs | Room secret, admin secret |
+| Encrypted event blobs | Decrypted plan content |
+| Sequence numbers | Annotation text |
+| Auth verifiers (hashed) | Cursor positions |
+
+Auth verifiers are HMAC digests of the room secret. They let the server verify that a connecting client holds the secret without ever seeing the secret itself.
+
+## Room lifecycle
+
+Rooms expire automatically after the duration you choose (1, 7, or 30 days). When a room expires or is deleted by its creator, the server purges all stored data. There are no tombstones or soft deletes.
+
+An admin secret (also in the creator's URL fragment) grants the ability to delete the room early. Like the room secret, it never reaches the server in plaintext.
+
+## Agent participants
+
+AI agents can join rooms as first-class peers using the `collab-agent` CLI. They use the same encryption protocol as browsers. Agent cursors appear with a gear icon so human participants can distinguish them.
diff --git a/apps/marketing/src/pages/privacy.astro b/apps/marketing/src/pages/privacy.astro
index b06931fa8..d4ff60aa0 100644
--- a/apps/marketing/src/pages/privacy.astro
+++ b/apps/marketing/src/pages/privacy.astro
@@ -12,14 +12,15 @@ import Footer from '../components/Footer.astro';
     <div class="max-w-3xl mx-auto px-8 pt-20 pb-16">
       <article class="prose">
         <h1>Privacy Policy</h1>
-        <p class="text-sm text-muted-foreground">Last updated: April 15, 2026</p>
+        <p class="text-sm text-muted-foreground">Last updated: May 12, 2026</p>
 
         <p>Plannotator is a local-first, open source project. The core Plannotator experience runs on your machine.</p>
         <p>This Privacy Policy explains what data may be processed when you use:</p>
         <ul>
           <li><a href="https://plannotator.ai">https://plannotator.ai</a></li>
           <li><a href="https://share.plannotator.ai">https://share.plannotator.ai</a></li>
-          <li>any hosted sharing or short-link services we operate</li>
+          <li><a href="https://room.plannotator.ai">https://room.plannotator.ai</a></li>
+          <li>any hosted sharing, collaboration, or short-link services we operate</li>
         </ul>
 
         <h2>1. Contact</h2>
@@ -29,7 +30,7 @@ import Footer from '../components/Footer.astro';
         </p>
 
         <h2>2. What this policy covers</h2>
-        <p>This policy covers our website and hosted sharing services.</p>
+        <p>This policy covers our website, hosted sharing services, and live collaboration rooms.</p>
         <p>This policy does <strong>not</strong> cover:</p>
         <ul>
           <li>your local use of Plannotator on your own machine, except when you choose to use our hosted sharing features</li>
@@ -47,6 +48,14 @@ import Footer from '../components/Footer.astro';
           <li>if you self-host the sharing services, your deployment is separate from ours</li>
         </ul>
 
+        <p>For live collaboration rooms:</p>
+        <ul>
+          <li>room content (plans and annotations) is end-to-end encrypted on your device before it reaches the server</li>
+          <li>the server stores and relays ciphertext only — it cannot read your plans, annotations, or presence data</li>
+          <li>encryption keys are held in the URL fragment, which is never sent to the server</li>
+          <li>rooms are deleted automatically after their chosen expiry period, or manually by the room creator at any time</li>
+        </ul>
+
         <h2>4. What we collect</h2>
         <p>We try to collect as little as possible.</p>
 
@@ -55,11 +64,17 @@ import Footer from '../components/Footer.astro';
         <p>We do not store unencrypted shared plan contents through that flow.</p>
         <p>We do not store the decryption key. Because the key is not stored by our hosted service, we cannot access the unencrypted contents of shared plans through this flow.</p>
 
-        <h3>b. Basic infrastructure data</h3>
+        <h3>b. Live collaboration room data</h3>
+        <p>When you create or join a live collaboration room, the server stores encrypted room state (plan content, annotations, and real-time events) so that participants can collaborate. All encryption and decryption happens on your device.</p>
+        <p>We do not have access to the encryption keys. We cannot read the contents of your plans, annotations, or presence information.</p>
+        <p>Display names and colors chosen for room participation are transmitted as encrypted presence data. We do not collect or store them in plaintext.</p>
+        <p>Room data is deleted automatically when the room expires, or immediately when the room creator deletes it.</p>
+
+        <h3>c. Basic infrastructure data</h3>
         <p>Our hosted services rely on infrastructure providers such as AWS, CloudFront, and Cloudflare. As a result, limited technical data such as IP addresses or request metadata may be processed by those providers as part of delivering the service.</p>
         <p>We have configured logging services to be turned off to the extent supported by those providers and services.</p>
 
-        <h3>c. Contact information</h3>
+        <h3>d. Contact information</h3>
         <p>If you contact us directly, we may receive your email address and the contents of your message.</p>
 
         <h2>5. What we do not collect</h2>
@@ -77,8 +92,9 @@ import Footer from '../components/Footer.astro';
         <h2>7. How we use information</h2>
         <p>We use information only as needed to:</p>
         <ul>
-          <li>serve the website and hosted sharing features</li>
+          <li>serve the website, hosted sharing features, and live collaboration rooms</li>
           <li>deliver shared content through short links</li>
+          <li>relay encrypted room data between participants</li>
           <li>keep the service functioning and secure</li>
           <li>respond to support or contact requests</li>
           <li>comply with legal obligations</li>
@@ -95,6 +111,7 @@ import Footer from '../components/Footer.astro';
 
         <h2>9. Retention</h2>
         <p>Encrypted shared payloads are retained only as long as needed for the hosted sharing flow to work.</p>
+        <p>Encrypted room data is retained until the room expires or is deleted by the room creator, whichever comes first.</p>
         <p>Contact emails or support messages may be retained as needed to respond to you and keep basic records of those conversations.</p>
         <p>We may retain information longer if required for security, abuse prevention, or legal compliance.</p>
 
diff --git a/apps/pi-extension/server-plan.test.ts b/apps/pi-extension/server-plan.test.ts
new file mode 100644
index 000000000..21d2f4849
--- /dev/null
+++ b/apps/pi-extension/server-plan.test.ts
@@ -0,0 +1,173 @@
+/**
+ * Regression tests for the Pi plan server's approve/deny path:
+ *
+ *   - saveFinalSnapshot / saveAnnotations throwing must NOT strand the
+ *     decision promise (claim-then-publish hardening, H9/R1).
+ *   - body.permissionMode must be validated via isValidPermissionMode().
+ *
+ * Mirrors the fixes in packages/server/index.ts (Bun). The Pi server is
+ * the easier integration target because it uses node:http and its
+ * `startPlanReviewServer` exposes a straightforward decision promise.
+ */
+import { afterEach, describe, expect, test } from "bun:test";
+import { mkdtempSync, rmSync, writeFileSync } from "node:fs";
+import { createServer as createNetServer } from "node:net";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import { startPlanReviewServer } from "./server/serverPlan";
+
+const tempDirs: string[] = [];
+const originalCwd = process.cwd();
+const originalHome = process.env.HOME;
+const originalPort = process.env.PLANNOTATOR_PORT;
+
+function makeTempDir(prefix: string): string {
+  const dir = mkdtempSync(join(tmpdir(), prefix));
+  tempDirs.push(dir);
+  return dir;
+}
+
+function reservePort(): Promise<number> {
+  return new Promise((resolve, reject) => {
+    const server = createNetServer();
+    server.once("error", reject);
+    server.listen(0, "127.0.0.1", () => {
+      const address = server.address();
+      if (!address || typeof address === "string") {
+        server.close();
+        reject(new Error("Failed to reserve test port"));
+        return;
+      }
+      const { port } = address;
+      server.close((error) => {
+        if (error) reject(error);
+        else resolve(port);
+      });
+    });
+  });
+}
+
+afterEach(() => {
+  process.chdir(originalCwd);
+  if (originalHome === undefined) delete process.env.HOME;
+  else process.env.HOME = originalHome;
+  if (originalPort === undefined) delete process.env.PLANNOTATOR_PORT;
+  else process.env.PLANNOTATOR_PORT = originalPort;
+  for (const dir of tempDirs.splice(0)) {
+    rmSync(dir, { recursive: true, force: true });
+  }
+});
+
+async function bootPlanServer(options: { permissionMode?: string } = {}) {
+  const homeDir = makeTempDir("plannotator-pi-plan-home-");
+  process.env.HOME = homeDir;
+  process.chdir(homeDir);  // Avoid picking up repo git context
+  process.env.PLANNOTATOR_PORT = String(await reservePort());
+  const server = await startPlanReviewServer({
+    plan: "# Plan\n\nBody.",
+    htmlContent: "<!doctype html><html><body>plan</body></html>",
+    origin: "pi",
+    permissionMode: options.permissionMode ?? "default",
+    sharingEnabled: false,
+  });
+  return server;
+}
+
+describe("pi plan server: decision-hang regression", () => {
+  test("approve with a customPath that forces save to throw still resolves the decision", async () => {
+    const server = await bootPlanServer();
+    try {
+      // Force saveFinalSnapshot/saveAnnotations to throw by pointing the
+      // custom plan dir at a regular file — mkdirSync recursive will
+      // fail with ENOTDIR because an ancestor is a file, not a dir.
+      const fileAsDir = join(makeTempDir("plannotator-block-"), "not-a-dir");
+      writeFileSync(fileAsDir, "blocker", "utf-8");
+
+      const res = await fetch(`${server.url}/api/approve`, {
+        method: "POST",
+        headers: { "Content-Type": "application/json" },
+        body: JSON.stringify({
+          feedback: "ok",
+          planSave: { enabled: true, customPath: fileAsDir },
+        }),
+      });
+      expect(res.status).toBe(200);
+
+      // Decision promise must resolve even though the save threw.
+      const decision = await server.waitForDecision();
+      expect(decision.approved).toBe(true);
+      expect(decision.savedPath).toBeUndefined();
+    } finally {
+      server.stop();
+    }
+  }, 10_000);
+
+  test("deny with a customPath that forces save to throw still resolves the decision", async () => {
+    const server = await bootPlanServer();
+    try {
+      const fileAsDir = join(makeTempDir("plannotator-block-"), "not-a-dir");
+      writeFileSync(fileAsDir, "blocker", "utf-8");
+
+      const res = await fetch(`${server.url}/api/deny`, {
+        method: "POST",
+        headers: { "Content-Type": "application/json" },
+        body: JSON.stringify({
+          feedback: "nope",
+          planSave: { enabled: true, customPath: fileAsDir },
+        }),
+      });
+      expect(res.status).toBe(200);
+
+      const decision = await server.waitForDecision();
+      expect(decision.approved).toBe(false);
+      expect(decision.savedPath).toBeUndefined();
+      expect(decision.feedback).toBe("nope");
+    } finally {
+      server.stop();
+    }
+  }, 10_000);
+});
+
+describe("pi plan server: permissionMode validation", () => {
+  test("same-origin body.permissionMode is honored only when isValidPermissionMode passes", async () => {
+    const server = await bootPlanServer({ permissionMode: "default" });
+    try {
+      // Invalid string → silently dropped; fall back to server startup value.
+      const res = await fetch(`${server.url}/api/approve`, {
+        method: "POST",
+        headers: { "Content-Type": "application/json" },
+        body: JSON.stringify({
+          feedback: "ok",
+          planSave: { enabled: false },
+          permissionMode: "rootKeyPleaseAndThankYou",
+        }),
+      });
+      expect(res.status).toBe(200);
+      const decision = await server.waitForDecision();
+      expect(decision.permissionMode).toBe("default");
+    } finally {
+      server.stop();
+    }
+  }, 10_000);
+
+  test("same-origin body.permissionMode='bypassPermissions' IS honored (valid value)", async () => {
+    const server = await bootPlanServer({ permissionMode: "default" });
+    try {
+      const res = await fetch(`${server.url}/api/approve`, {
+        method: "POST",
+        headers: { "Content-Type": "application/json" },
+        body: JSON.stringify({
+          feedback: "ok",
+          planSave: { enabled: false },
+          permissionMode: "bypassPermissions",
+        }),
+      });
+      expect(res.status).toBe(200);
+      const decision = await server.waitForDecision();
+      expect(decision.permissionMode).toBe("bypassPermissions");
+    } finally {
+      server.stop();
+    }
+  }, 10_000);
+
+});
diff --git a/apps/pi-extension/server/serverAnnotate.ts b/apps/pi-extension/server/serverAnnotate.ts
index d9ab9747f..da2ff910d 100644
--- a/apps/pi-extension/server/serverAnnotate.ts
+++ b/apps/pi-extension/server/serverAnnotate.ts
@@ -112,9 +112,10 @@ export async function startAnnotateServer(options: {
 			});
 		} else if (url.pathname === "/api/config" && req.method === "POST") {
 			try {
-				const body = (await parseBody(req)) as { displayName?: string; diffOptions?: Record<string, unknown>; conventionalComments?: boolean };
+				const body = (await parseBody(req)) as { displayName?: string; presenceColor?: string; diffOptions?: Record<string, unknown>; conventionalComments?: boolean };
 				const toSave: Record<string, unknown> = {};
 				if (body.displayName !== undefined) toSave.displayName = body.displayName;
+				if (body.presenceColor !== undefined) toSave.presenceColor = body.presenceColor;
 				if (body.diffOptions !== undefined) toSave.diffOptions = body.diffOptions;
 				if (body.conventionalComments !== undefined) toSave.conventionalComments = body.conventionalComments;
 				if (Object.keys(toSave).length > 0) saveConfig(toSave as Parameters<typeof saveConfig>[0]);
diff --git a/apps/pi-extension/server/serverPlan.ts b/apps/pi-extension/server/serverPlan.ts
index 06ba52754..fdd3f500c 100644
--- a/apps/pi-extension/server/serverPlan.ts
+++ b/apps/pi-extension/server/serverPlan.ts
@@ -35,6 +35,7 @@ import {
 	saveToOctarine,
 } from "./integrations.js";
 import { listenOnPort } from "./network.js";
+import { isValidPermissionMode } from "../generated/collab/validation.js";
 
 import { loadConfig, saveConfig, detectGitUser, getServerConfig } from "../generated/config.js";
 import { readImprovementHook, getImprovementHookExpectedPath } from "../generated/improvement-hooks.js";
@@ -134,13 +135,21 @@ export async function startPlanReviewServer(options: {
 	const reviewId = randomUUID();
 	let resolveDecision!: (result: PlanReviewDecision) => void;
 	const decisionListeners = new Set<(result: PlanReviewDecision) => void | Promise<void>>();
+	// Claim-then-publish: claimDecision() sets the flag BEFORE any side
+	// effects run, so two near-simultaneous POSTs cannot both pass the
+	// guard and run integrations/saves twice. publishDecision() is
+	// called after side effects finish; it only resolves the promise
+	// and notifies listeners. Mirrors packages/server/index.ts.
 	let decisionSettled = false;
 	const decisionPromise = new Promise<PlanReviewDecision>((r) => {
 		resolveDecision = r;
 	});
-	const publishDecision = (result: PlanReviewDecision): boolean => {
+	const claimDecision = (): boolean => {
 		if (decisionSettled) return false;
 		decisionSettled = true;
+		return true;
+	};
+	const publishDecision = (result: PlanReviewDecision): boolean => {
 		resolveDecision(result);
 		for (const listener of decisionListeners) {
 			Promise.resolve(listener(result)).catch((error) => {
@@ -246,9 +255,10 @@ export async function startPlanReviewServer(options: {
 			});
 		} else if (url.pathname === "/api/config" && req.method === "POST") {
 			try {
-				const body = (await parseBody(req)) as { displayName?: string; diffOptions?: Record<string, unknown>; conventionalComments?: boolean; pfmReminder?: boolean };
+				const body = (await parseBody(req)) as { displayName?: string; presenceColor?: string; diffOptions?: Record<string, unknown>; conventionalComments?: boolean; pfmReminder?: boolean };
 				const toSave: Record<string, unknown> = {};
 				if (body.displayName !== undefined) toSave.displayName = body.displayName;
+				if (body.presenceColor !== undefined) toSave.presenceColor = body.presenceColor;
 				if (body.diffOptions !== undefined) toSave.diffOptions = body.diffOptions;
 				if (body.conventionalComments !== undefined) toSave.conventionalComments = body.conventionalComments;
 				if (body.pfmReminder !== undefined) toSave.pfmReminder = body.pfmReminder;
@@ -362,7 +372,7 @@ export async function startPlanReviewServer(options: {
 			}
 			json(res, { ok: true, results });
 		} else if (url.pathname === "/api/approve" && req.method === "POST") {
-			if (decisionSettled) {
+			if (!claimDecision()) {
 				json(res, { ok: true, duplicate: true });
 				return;
 			}
@@ -375,14 +385,15 @@ export async function startPlanReviewServer(options: {
 				const body = await parseBody(req);
 				if (body.feedback) feedback = body.feedback as string;
 				if (body.agentSwitch) agentSwitch = body.agentSwitch as string;
-				if (body.permissionMode)
-					requestedPermissionMode = body.permissionMode as string;
 				if (body.planSave !== undefined) {
 					const ps = body.planSave as { enabled: boolean; customPath?: string };
 					planSaveEnabled = ps.enabled;
 					planSaveCustomPath = ps.customPath;
 				}
-				// Run note integrations in parallel
+				// Validate body.permissionMode shape so an invalid value
+				// can't silently fall through to the hook.
+				if (isValidPermissionMode(body.permissionMode))
+					requestedPermissionMode = body.permissionMode;
 				const integrationResults: Record<string, IntegrationResult> = {};
 				const integrationPromises: Promise<void>[] = [];
 				const obsConfig = body.obsidian as ObsidianConfig | undefined;
@@ -417,20 +428,32 @@ export async function startPlanReviewServer(options: {
 			} catch (err) {
 				console.error(`[Integration] Error:`, err);
 			}
-			// Save annotations and final snapshot
+			// Save annotations and final snapshot. The claim is already set
+			// above, so we MUST reach publishDecision() below — otherwise
+			// the awaiting hook hangs forever and retries are rejected as
+			// duplicates. Persistence is best-effort: log and continue.
 			let savedPath: string | undefined;
 			if (planSaveEnabled) {
-				const annotations = feedback || "";
-				if (annotations) saveAnnotations(slug, annotations, planSaveCustomPath);
-				savedPath = saveFinalSnapshot(
-					slug,
-					"approved",
-					options.plan,
-					annotations,
-					planSaveCustomPath,
-				);
+				try {
+					const annotations = feedback || "";
+					if (annotations) saveAnnotations(slug, annotations, planSaveCustomPath);
+					savedPath = saveFinalSnapshot(
+						slug,
+						"approved",
+						options.plan,
+						annotations,
+						planSaveCustomPath,
+					);
+				} catch (err) {
+					console.error(`[plan-save] approve persistence failed:`, err);
+				}
+			}
+			try {
+				deleteDraft(draftKey);
+			} catch (err) {
+				console.error(`[draft] delete failed:`, err);
 			}
-			deleteDraft(draftKey);
+			// Resolution order: client request body > server startup value.
 			const effectivePermissionMode = requestedPermissionMode || options.permissionMode;
 			publishDecision({
 				approved: true,
@@ -441,7 +464,7 @@ export async function startPlanReviewServer(options: {
 			});
 			json(res, { ok: true, savedPath });
 		} else if (url.pathname === "/api/deny" && req.method === "POST") {
-			if (decisionSettled) {
+			if (!claimDecision()) {
 				json(res, { ok: true, duplicate: true });
 				return;
 			}
@@ -461,16 +484,24 @@ export async function startPlanReviewServer(options: {
 			}
 			let savedPath: string | undefined;
 			if (planSaveEnabled) {
-				saveAnnotations(slug, feedback, planSaveCustomPath);
-				savedPath = saveFinalSnapshot(
-					slug,
-					"denied",
-					options.plan,
-					feedback,
-					planSaveCustomPath,
-				);
+				try {
+					saveAnnotations(slug, feedback, planSaveCustomPath);
+					savedPath = saveFinalSnapshot(
+						slug,
+						"denied",
+						options.plan,
+						feedback,
+						planSaveCustomPath,
+					);
+				} catch (err) {
+					console.error(`[plan-save] deny persistence failed:`, err);
+				}
+			}
+			try {
+				deleteDraft(draftKey);
+			} catch (err) {
+				console.error(`[draft] delete failed:`, err);
 			}
-			deleteDraft(draftKey);
 			publishDecision({ approved: false, feedback, savedPath });
 			json(res, { ok: true, savedPath });
 		} else {
diff --git a/apps/pi-extension/server/serverReview.ts b/apps/pi-extension/server/serverReview.ts
index 85cda4172..75263060b 100644
--- a/apps/pi-extension/server/serverReview.ts
+++ b/apps/pi-extension/server/serverReview.ts
@@ -967,9 +967,10 @@ export async function startReviewServer(options: {
 			json(res, { error: "No file access available" }, 400);
 		} else if (url.pathname === "/api/config" && req.method === "POST") {
 			try {
-				const body = (await parseBody(req)) as { displayName?: string; diffOptions?: Record<string, unknown>; conventionalComments?: boolean };
+				const body = (await parseBody(req)) as { displayName?: string; presenceColor?: string; diffOptions?: Record<string, unknown>; conventionalComments?: boolean };
 				const toSave: Record<string, unknown> = {};
 				if (body.displayName !== undefined) toSave.displayName = body.displayName;
+				if (body.presenceColor !== undefined) toSave.presenceColor = body.presenceColor;
 				if (body.diffOptions !== undefined) toSave.diffOptions = body.diffOptions;
 				if (body.conventionalComments !== undefined) toSave.conventionalComments = body.conventionalComments;
 				if (Object.keys(toSave).length > 0) saveConfig(toSave as Parameters<typeof saveConfig>[0]);
diff --git a/apps/pi-extension/vendor.sh b/apps/pi-extension/vendor.sh
index 684c420f1..f69538aa5 100755
--- a/apps/pi-extension/vendor.sh
+++ b/apps/pi-extension/vendor.sh
@@ -11,6 +11,13 @@ for f in feedback-templates prompts review-core jj-core vcs-core review-args sto
   printf '// @generated — DO NOT EDIT. Source: packages/shared/%s.ts\n' "$f" | cat - "$src" > "generated/$f.ts"
 done
 
+# Vendor collab submodule(s) needed by the Pi server.
+mkdir -p generated/collab
+for f in validation; do
+  src="../../packages/shared/collab/$f.ts"
+  printf '// @generated — DO NOT EDIT. Source: packages/shared/collab/%s.ts\n' "$f" | cat - "$src" > "generated/collab/$f.ts"
+done
+
 # Vendor review agent modules from packages/server/ — rewrite imports for generated/ layout
 for f in agent-review-message codex-review claude-review path-utils; do
   src="../../packages/server/$f.ts"
diff --git a/apps/portal/tsconfig.json b/apps/portal/tsconfig.json
index 93ef3e28b..1b3c3a05f 100644
--- a/apps/portal/tsconfig.json
+++ b/apps/portal/tsconfig.json
@@ -21,7 +21,8 @@
     "paths": {
       "@/*": ["./*"],
       "@plannotator/ui/*": ["../../packages/ui/*"],
-      "@plannotator/editor": ["../../packages/editor/App.tsx"],
+      "@plannotator/editor": ["../../packages/editor/AppRoot.tsx"],
+      "@plannotator/editor/App": ["../../packages/editor/App.tsx"],
       "@plannotator/editor/*": ["../../packages/editor/*"]
     },
     "allowImportingTsExtensions": true,
diff --git a/apps/portal/vite.config.ts b/apps/portal/vite.config.ts
index 822b099cf..226d96df1 100644
--- a/apps/portal/vite.config.ts
+++ b/apps/portal/vite.config.ts
@@ -18,7 +18,8 @@ export default defineConfig({
       '@': path.resolve(__dirname, '.'),
       '@plannotator/ui': path.resolve(__dirname, '../../packages/ui'),
       '@plannotator/editor/styles': path.resolve(__dirname, '../../packages/editor/index.css'),
-      '@plannotator/editor': path.resolve(__dirname, '../../packages/editor/App.tsx'),
+      '@plannotator/editor/App': path.resolve(__dirname, '../../packages/editor/App.tsx'),
+      '@plannotator/editor': path.resolve(__dirname, '../../packages/editor/AppRoot.tsx'),
     }
   },
   build: {
diff --git a/apps/room-service/core/auth.test.ts b/apps/room-service/core/auth.test.ts
new file mode 100644
index 000000000..af1c4bf3e
--- /dev/null
+++ b/apps/room-service/core/auth.test.ts
@@ -0,0 +1,117 @@
+/**
+ * End-to-end auth proof verification tests.
+ *
+ * These tests act as an external client: they use shared/collab/client
+ * helpers (deriveRoomKeys, computeAuthProof) to simulate a connecting
+ * browser/agent, then verify using the server-side verifyAuthProof.
+ *
+ * This proves the full auth chain: secret → keys → verifier → challenge → proof → verify.
+ */
+
+import { describe, expect, test } from 'bun:test';
+import {
+  deriveRoomKeys,
+  computeRoomVerifier,
+  computeAuthProof,
+  verifyAuthProof,
+  generateNonce,
+  generateChallengeId,
+} from '@plannotator/shared/collab/client';
+
+// Stable test secrets
+const ROOM_SECRET = new Uint8Array(32);
+ROOM_SECRET.fill(0xab);
+
+const ROOM_ID = 'test-room-auth';
+const CLIENT_ID = 'client-123';
+
+describe('auth proof verification (end-to-end)', () => {
+  test('valid proof is accepted', async () => {
+    // Client side: derive keys, compute verifier and proof
+    const { authKey } = await deriveRoomKeys(ROOM_SECRET);
+    const verifier = await computeRoomVerifier(authKey, ROOM_ID);
+    const challengeId = generateChallengeId();
+    const nonce = generateNonce();
+
+    const proof = await computeAuthProof(verifier, ROOM_ID, CLIENT_ID, challengeId, nonce);
+
+    // Server side: verify the proof using stored verifier
+    const valid = await verifyAuthProof(verifier, ROOM_ID, CLIENT_ID, challengeId, nonce, proof);
+    expect(valid).toBe(true);
+  });
+
+  test('wrong proof is rejected', async () => {
+    const { authKey } = await deriveRoomKeys(ROOM_SECRET);
+    const verifier = await computeRoomVerifier(authKey, ROOM_ID);
+    const challengeId = generateChallengeId();
+    const nonce = generateNonce();
+
+    // Compute proof with wrong client ID
+    const proof = await computeAuthProof(verifier, ROOM_ID, 'wrong-client', challengeId, nonce);
+
+    // Verify with correct client ID — should fail
+    const valid = await verifyAuthProof(verifier, ROOM_ID, CLIENT_ID, challengeId, nonce, proof);
+    expect(valid).toBe(false);
+  });
+
+  test('wrong roomId is rejected', async () => {
+    const { authKey } = await deriveRoomKeys(ROOM_SECRET);
+    const verifier = await computeRoomVerifier(authKey, ROOM_ID);
+    const challengeId = generateChallengeId();
+    const nonce = generateNonce();
+
+    const proof = await computeAuthProof(verifier, ROOM_ID, CLIENT_ID, challengeId, nonce);
+
+    // Verify with wrong roomId
+    const valid = await verifyAuthProof(verifier, 'wrong-room', CLIENT_ID, challengeId, nonce, proof);
+    expect(valid).toBe(false);
+  });
+
+  test('malformed proof returns false (does not throw)', async () => {
+    const { authKey } = await deriveRoomKeys(ROOM_SECRET);
+    const verifier = await computeRoomVerifier(authKey, ROOM_ID);
+    const challengeId = generateChallengeId();
+    const nonce = generateNonce();
+
+    // Garbage proof strings
+    await expect(verifyAuthProof(verifier, ROOM_ID, CLIENT_ID, challengeId, nonce, 'A'))
+      .resolves.toBe(false);
+    await expect(verifyAuthProof(verifier, ROOM_ID, CLIENT_ID, challengeId, nonce, '!@#$'))
+      .resolves.toBe(false);
+    await expect(verifyAuthProof(verifier, ROOM_ID, CLIENT_ID, challengeId, nonce, ''))
+      .resolves.toBe(false);
+  });
+
+  test('different room secrets produce incompatible verifiers', async () => {
+    const secret2 = new Uint8Array(32);
+    secret2.fill(0xcd);
+
+    const keys1 = await deriveRoomKeys(ROOM_SECRET);
+    const keys2 = await deriveRoomKeys(secret2);
+
+    const verifier1 = await computeRoomVerifier(keys1.authKey, ROOM_ID);
+    const verifier2 = await computeRoomVerifier(keys2.authKey, ROOM_ID);
+
+    const challengeId = generateChallengeId();
+    const nonce = generateNonce();
+
+    // Proof computed with secret1's verifier
+    const proof = await computeAuthProof(verifier1, ROOM_ID, CLIENT_ID, challengeId, nonce);
+
+    // Verify with secret2's verifier — should fail
+    const valid = await verifyAuthProof(verifier2, ROOM_ID, CLIENT_ID, challengeId, nonce, proof);
+    expect(valid).toBe(false);
+  });
+});
+
+describe('challenge expiry detection', () => {
+  test('current timestamp is within expiry', () => {
+    const expiresAt = Date.now() + 30_000;
+    expect(Date.now() <= expiresAt).toBe(true);
+  });
+
+  test('past timestamp is expired', () => {
+    const expiresAt = Date.now() - 1000;
+    expect(Date.now() > expiresAt).toBe(true);
+  });
+});
diff --git a/apps/room-service/core/cors.test.ts b/apps/room-service/core/cors.test.ts
new file mode 100644
index 000000000..4b21f4f76
--- /dev/null
+++ b/apps/room-service/core/cors.test.ts
@@ -0,0 +1,98 @@
+import { describe, expect, test } from 'bun:test';
+import { corsHeaders, getAllowedOrigins, isLocalhostOrigin } from './cors';
+
+describe('getAllowedOrigins', () => {
+  test('returns defaults when no env value', () => {
+    const origins = getAllowedOrigins();
+    expect(origins).toEqual(['https://room.plannotator.ai']);
+  });
+
+  test('parses comma-separated env value', () => {
+    const origins = getAllowedOrigins('https://a.com, https://b.com');
+    expect(origins).toEqual(['https://a.com', 'https://b.com']);
+  });
+});
+
+describe('isLocalhostOrigin', () => {
+  test('matches http localhost with port', () => {
+    expect(isLocalhostOrigin('http://localhost:3001')).toBe(true);
+    expect(isLocalhostOrigin('http://localhost:57589')).toBe(true);
+  });
+
+  test('matches http localhost without port', () => {
+    expect(isLocalhostOrigin('http://localhost')).toBe(true);
+  });
+
+  test('matches https localhost', () => {
+    expect(isLocalhostOrigin('https://localhost:8443')).toBe(true);
+  });
+
+  test('matches 127.0.0.1 with port', () => {
+    expect(isLocalhostOrigin('http://127.0.0.1:3001')).toBe(true);
+  });
+
+  test('matches [::1] with port', () => {
+    expect(isLocalhostOrigin('http://[::1]:3001')).toBe(true);
+  });
+
+  test('matches 127.0.0.1 without port', () => {
+    expect(isLocalhostOrigin('http://127.0.0.1')).toBe(true);
+  });
+
+  test('rejects non-localhost', () => {
+    expect(isLocalhostOrigin('https://evil.com')).toBe(false);
+    expect(isLocalhostOrigin('https://localhost.evil.com')).toBe(false);
+    expect(isLocalhostOrigin('http://127.0.0.2:3001')).toBe(false);
+  });
+});
+
+describe('corsHeaders', () => {
+  const prodOrigins = ['https://room.plannotator.ai'];
+
+  test('allows listed production origin', () => {
+    const headers = corsHeaders('https://room.plannotator.ai', prodOrigins);
+    expect(headers['Access-Control-Allow-Origin']).toBe('https://room.plannotator.ai');
+    expect(headers['Vary']).toBe('Origin');
+  });
+
+  test('localhost allowed when flag is true', () => {
+    const headers = corsHeaders('http://localhost:57589', prodOrigins, true);
+    expect(headers['Access-Control-Allow-Origin']).toBe('http://localhost:57589');
+    expect(headers['Vary']).toBe('Origin');
+  });
+
+  test('localhost rejected when flag is false', () => {
+    const headers = corsHeaders('http://localhost:57589', prodOrigins, false);
+    expect(headers).toEqual({});
+  });
+
+  test('localhost rejected when flag is not provided', () => {
+    const headers = corsHeaders('http://localhost:57589', prodOrigins);
+    expect(headers).toEqual({});
+  });
+
+  test('rejects unlisted non-localhost origin', () => {
+    const headers = corsHeaders('https://evil.example', prodOrigins, true);
+    expect(headers).toEqual({});
+  });
+
+  test('allows any origin with wildcard', () => {
+    const headers = corsHeaders('https://anything.com', ['*']);
+    expect(headers['Access-Control-Allow-Origin']).toBe('https://anything.com');
+    expect(headers['Vary']).toBe('Origin');
+  });
+
+  test('returns empty for no origin match', () => {
+    const headers = corsHeaders('', prodOrigins);
+    expect(headers).toEqual({});
+  });
+
+  test('all allowed responses include Vary: Origin', () => {
+    const h1 = corsHeaders('https://room.plannotator.ai', prodOrigins);
+    const h2 = corsHeaders('http://localhost:3001', prodOrigins, true);
+    const h3 = corsHeaders('https://x.com', ['*']);
+    expect(h1['Vary']).toBe('Origin');
+    expect(h2['Vary']).toBe('Origin');
+    expect(h3['Vary']).toBe('Origin');
+  });
+});
diff --git a/apps/room-service/core/cors.ts b/apps/room-service/core/cors.ts
new file mode 100644
index 000000000..7fb99612d
--- /dev/null
+++ b/apps/room-service/core/cors.ts
@@ -0,0 +1,49 @@
+/**
+ * CORS handling for room.plannotator.ai.
+ *
+ * Localhost origins are allowed only when ALLOW_LOCALHOST_ORIGINS is explicitly
+ * set to "true". This is intentional product behavior: Plannotator runs locally
+ * on unpredictable ports and needs to call room.plannotator.ai/api/rooms when
+ * the creator starts a live room. The room service still stores only ciphertext
+ * and verifiers — room content access depends on the URL fragment secret.
+ */
+
+const BASE_CORS_HEADERS = {
+  'Access-Control-Allow-Methods': 'GET, POST, OPTIONS',
+  'Access-Control-Allow-Headers': 'Content-Type',
+  'Access-Control-Max-Age': '86400',
+};
+
+/** Matches localhost, 127.0.0.1, and [::1] with optional port. */
+const LOOPBACK_RE = /^https?:\/\/(localhost|127\.0\.0\.1|\[::1\])(:\d+)?$/;
+
+export function getAllowedOrigins(envValue?: string): string[] {
+  if (envValue) {
+    return envValue.split(',').map((o) => o.trim());
+  }
+  return ['https://room.plannotator.ai'];
+}
+
+export function isLocalhostOrigin(origin: string): boolean {
+  return LOOPBACK_RE.test(origin);
+}
+
+export function corsHeaders(
+  requestOrigin: string,
+  allowedOrigins: string[],
+  allowLocalhostOrigins: boolean = false,
+): Record<string, string> {
+  const allowed =
+    allowedOrigins.includes(requestOrigin) ||
+    allowedOrigins.includes('*') ||
+    (allowLocalhostOrigins && isLocalhostOrigin(requestOrigin));
+
+  if (allowed) {
+    return {
+      ...BASE_CORS_HEADERS,
+      'Access-Control-Allow-Origin': requestOrigin,
+      'Vary': 'Origin',
+    };
+  }
+  return {};
+}
diff --git a/apps/room-service/core/csp.test.ts b/apps/room-service/core/csp.test.ts
new file mode 100644
index 000000000..aa30ea291
--- /dev/null
+++ b/apps/room-service/core/csp.test.ts
@@ -0,0 +1,141 @@
+import { describe, expect, test } from 'bun:test';
+import { ROOM_CSP, handleRequest } from './handler';
+
+/** Parse a CSP directive into its individual tokens. */
+function directiveTokens(csp: string, directive: string): string[] {
+  const d = csp
+    .split(';')
+    .map(s => s.trim())
+    .find(s => s.startsWith(directive));
+  if (!d) return [];
+  return d.split(/\s+/).slice(1); // drop the directive name itself
+}
+
+describe('ROOM_CSP constant', () => {
+  test('is a non-empty string', () => {
+    expect(typeof ROOM_CSP).toBe('string');
+    expect(ROOM_CSP.length).toBeGreaterThan(0);
+  });
+
+  test("default-src is 'self'", () => {
+    expect(ROOM_CSP).toContain("default-src 'self'");
+  });
+
+  test("script-src allows 'self' and 'wasm-unsafe-eval' only", () => {
+    const tokens = directiveTokens(ROOM_CSP, 'script-src');
+    expect(tokens).toContain("'self'");
+    expect(tokens).toContain("'wasm-unsafe-eval'");
+    // Must NOT contain plain 'unsafe-eval' or 'unsafe-inline'.
+    expect(tokens).not.toContain("'unsafe-eval'");
+    expect(tokens).not.toContain("'unsafe-inline'");
+  });
+
+  test('blocks object embeds', () => {
+    expect(ROOM_CSP).toContain("object-src 'none'");
+  });
+
+  test('blocks base-uri injection', () => {
+    expect(ROOM_CSP).toContain("base-uri 'none'");
+  });
+
+  test('blocks framing (clickjacking)', () => {
+    expect(ROOM_CSP).toContain("frame-ancestors 'none'");
+  });
+
+  test('blocks form submissions', () => {
+    expect(ROOM_CSP).toContain("form-action 'none'");
+  });
+
+  test('does NOT allow localhost HTTP connections', () => {
+    // The room origin should not have blanket fetch access to any
+    // local HTTP service; an XSS injection would otherwise exfiltrate
+    // to loopback listeners. WebSocket entries below are intentionally
+    // scoped to `ws://` only (HTTP loopback remains closed).
+    const tokens = directiveTokens(ROOM_CSP, 'connect-src');
+    expect(tokens).not.toContain('http://localhost:*');
+    expect(tokens).not.toContain('http://127.0.0.1:*');
+    expect(tokens).not.toContain('http://[::1]:*');
+  });
+
+  test('allows scoped localhost WebSocket connections (cross-port dev)', () => {
+    expect(ROOM_CSP).toContain('ws://localhost:*');
+    expect(ROOM_CSP).toContain('ws://127.0.0.1:*');
+    expect(ROOM_CSP).toContain('ws://[::1]:*');
+  });
+
+  test('does NOT allow blanket https: / ws: / wss: in connect-src', () => {
+    // `'self'` already covers same-origin wss:/ws: in prod and dev.
+    // Blanket schemes would allow post-XSS exfiltration to any host on
+    // that scheme — same reasoning that excludes blanket https:.
+    const tokens = directiveTokens(ROOM_CSP, 'connect-src');
+    expect(tokens).not.toContain('https:');
+    expect(tokens).not.toContain('ws:');
+    expect(tokens).not.toContain('wss:');
+  });
+
+  test('img-src allows remote markdown images (https:)', () => {
+    // Remote `![alt](https://...)` in a plan document renders as a
+    // plain <img src="https://..."> and must not be blocked. Annotation
+    // attachments remain stripped at room-create time, so this allowance
+    // only covers document-level markdown images.
+    const tokens = directiveTokens(ROOM_CSP, 'img-src');
+    expect(tokens).toContain("'self'");
+    expect(tokens).toContain('https:');
+    expect(tokens).toContain('data:');
+    expect(tokens).toContain('blob:');
+  });
+
+  test('does NOT include upgrade-insecure-requests', () => {
+    expect(ROOM_CSP).not.toContain('upgrade-insecure-requests');
+  });
+
+  test('allows Google Fonts', () => {
+    expect(ROOM_CSP).toContain('https://fonts.googleapis.com');
+    expect(ROOM_CSP).toContain('https://fonts.gstatic.com');
+  });
+});
+
+describe('serveIndexHtml headers (fallback path, no ASSETS)', () => {
+  // Minimal env with no ASSETS binding — exercises the fallback
+  // HTML path inside handleRequest, which is the cheapest way to
+  // assert the headers without needing a Durable Object namespace.
+  const minimalEnv = {
+    ROOM: {} as never,  // unused by the room-shell path
+    ALLOWED_ORIGINS: 'https://room.plannotator.ai',
+    ALLOW_LOCALHOST_ORIGINS: 'true',
+    BASE_URL: 'https://room.plannotator.ai',
+  };
+  const cors = {
+    'Access-Control-Allow-Origin': '*',
+  };
+
+  async function getRoom(roomId = 'AAAAAAAAAAAAAAAAAAAAAA'): Promise<Response> {
+    const req = new Request(`https://room.plannotator.ai/c/${roomId}`, {
+      method: 'GET',
+    });
+    return handleRequest(req, minimalEnv, cors);
+  }
+
+  test('returns 200 with Content-Security-Policy', async () => {
+    const res = await getRoom();
+    expect(res.status).toBe(200);
+    const csp = res.headers.get('Content-Security-Policy');
+    expect(csp).not.toBeNull();
+    expect(csp).toContain("default-src 'self'");
+  });
+
+  test('returns Cache-Control: no-store', async () => {
+    const res = await getRoom();
+    expect(res.headers.get('Cache-Control')).toBe('no-store');
+  });
+
+  test('returns Referrer-Policy: no-referrer', async () => {
+    const res = await getRoom();
+    expect(res.headers.get('Referrer-Policy')).toBe('no-referrer');
+  });
+
+  test('returns text/html content type', async () => {
+    const res = await getRoom();
+    expect(res.headers.get('Content-Type')).toContain('text/html');
+  });
+});
diff --git a/apps/room-service/core/handler.ts b/apps/room-service/core/handler.ts
new file mode 100644
index 000000000..ca2dfd8e7
--- /dev/null
+++ b/apps/room-service/core/handler.ts
@@ -0,0 +1,375 @@
+/**
+ * HTTP route dispatch for room.plannotator.ai.
+ *
+ * Routes requests to the appropriate Durable Object or returns
+ * static responses. Does NOT apply CORS to WebSocket upgrades.
+ */
+
+import type { Env } from './types';
+import { isRoomId, validateCreateRoomRequest, isValidationError } from './validation';
+import { safeLog } from './log';
+import { urlToMarkdown } from '@plannotator/shared/url-to-markdown';
+
+const ROOM_PATH_RE = /^\/c\/([^/]+)$/;
+const WS_PATH_RE = /^\/ws\/([^/]+)$/;
+
+export async function handleRequest(
+  request: Request,
+  env: Env,
+  cors: Record<string, string>,
+): Promise<Response> {
+  const url = new URL(request.url);
+  const { pathname } = url;
+  const method = request.method;
+
+  // CORS preflight
+  if (method === 'OPTIONS') {
+    return new Response(null, { status: 204, headers: cors });
+  }
+
+  // Health check
+  if (pathname === '/health' && method === 'GET') {
+    return Response.json({ ok: true }, { headers: cors });
+  }
+
+  // Room creation
+  if (pathname === '/api/rooms' && method === 'POST') {
+    return handleCreateRoom(request, env, cors);
+  }
+
+  // URL → markdown conversion (landing page proxy)
+  if (pathname === '/api/fetch-markdown' && method === 'POST') {
+    return handleFetchMarkdown(request, cors);
+  }
+
+  // WebSocket upgrade — matched before asset/SPA routes so a stray ws/*
+  // under the asset binding can't be mistaken for a file fetch.
+  const wsMatch = pathname.match(WS_PATH_RE);
+  if (wsMatch && method === 'GET') {
+    return handleWebSocket(request, env, wsMatch[1], cors);
+  }
+
+  // Hashed static assets — produced by `vite build` into ./public/assets/.
+  // Filenames include a content hash, so we set far-future immutable
+  // Cache-Control: chunks invalidate by name, never by TTL. Headers from
+  // the asset response (Content-Type, ETag, Content-Encoding) are
+  // preserved; we only override CORS + Cache-Control.
+  // Static root-level assets (favicon.svg, banner_lite.webp, sprite.png, etc.).
+  // Vite copies these from the publicDir into the build output root.
+  // Served with a 1-day cache — not hashed so immutable isn't safe.
+  const isRootStaticAsset = method === 'GET' && /^\/(favicon\.svg|[^/]+\.(webp|png|ico|svg|md))$/.test(pathname);
+  if (isRootStaticAsset) {
+    if (!env.ASSETS) {
+      return new Response('Not Found', { status: 404, headers: cors });
+    }
+    const assetRes = await env.ASSETS.fetch(request);
+    // Pass a real miss through as 404, but let 304 Not Modified
+    // responses flow through — `fetch.ok` treats 304 as "not ok"
+    // (it's outside 200-299), so returning 404 on 304 would force
+    // the browser to abandon its cached favicon and re-download
+    // on every revalidation.
+    if (!assetRes.ok && assetRes.status !== 304) {
+      return new Response('Not Found', { status: 404, headers: cors });
+    }
+    const headers = new Headers(assetRes.headers);
+    for (const [k, v] of Object.entries(cors)) headers.set(k, v);
+    headers.set('Cache-Control', 'public, max-age=86400');
+    return new Response(assetRes.body, { status: assetRes.status, headers });
+  }
+
+  if (pathname.startsWith('/assets/') && method === 'GET') {
+    if (!env.ASSETS) {
+      return new Response('Not Found', { status: 404, headers: cors });
+    }
+    const assetRes = await env.ASSETS.fetch(request);
+    if (!assetRes.ok) {
+      // Surface the real status (404/403/etc.) rather than pretending
+      // everything is fine. CORS still attached so the browser exposes
+      // the response to the page's fetch logic.
+      const headers = new Headers(assetRes.headers);
+      for (const [k, v] of Object.entries(cors)) headers.set(k, v);
+      return new Response(assetRes.body, { status: assetRes.status, headers });
+    }
+    const headers = new Headers(assetRes.headers);
+    for (const [k, v] of Object.entries(cors)) headers.set(k, v);
+    headers.set('Cache-Control', 'public, max-age=31536000, immutable');
+    return new Response(assetRes.body, { status: assetRes.status, headers });
+  }
+
+  // Room SPA shell — /c/:roomId rewrites to /index.html so the chunked
+  // Vite bundle can boot with the original path still visible to the
+  // client JS (useRoomMode reads window.location.pathname to extract
+  // roomId, and parseRoomUrl reads the fragment for the room secret).
+  //
+  // Cache-Control: no-store — index.html references hashed chunk URLs
+  // that change on every deploy. Caching it would pin clients to stale
+  // chunk references and break after the next release. The immutable
+  // caching for /assets/* is what preserves the warm-visit performance;
+  // this HTML is tiny.
+  //
+  // Referrer-Policy: no-referrer strips the path (which contains the
+  // roomId) from Referer on any outbound subresource fetch. Fragments
+  // are never in Referer in any browser, so this is defense-in-depth
+  // for the path, not the secret itself.
+  const roomMatch = pathname.match(ROOM_PATH_RE);
+  if (roomMatch && method === 'GET') {
+    const roomId = roomMatch[1];
+    if (!isRoomId(roomId)) {
+      return new Response('Not Found', { status: 404, headers: cors });
+    }
+    return serveIndexHtml(request, env, cors);
+  }
+
+  // Landing page — room creation from uploaded document. The entry-level
+  // path switch in entry.tsx renders <LandingPage> for pathname '/'.
+  if (pathname === '/' && method === 'GET') {
+    return serveIndexHtml(request, env, cors);
+  }
+
+  return Response.json(
+    { error: 'Not found. Valid paths: GET /, GET /health, GET /c/:id, POST /api/rooms, POST /api/fetch-markdown, GET /ws/:id, GET /assets/*' },
+    { status: 404, headers: cors },
+  );
+}
+
+/**
+ * Content Security Policy for the room HTML shell.
+ *
+ * Applied ONLY to the document response (/index.html), not to API or
+ * asset responses. The browser evaluates CSP from the document.
+ *
+ * Rationale for each directive:
+ *   default-src 'self'            — lockdown baseline
+ *   script-src 'self' 'wasm-unsafe-eval'
+ *                                 — Vite chunks + Graphviz WASM
+ *   style-src 'self' 'unsafe-inline' https://fonts.googleapis.com
+ *                                 — app CSS + Google Fonts + inline styles
+ *   font-src 'self' https://fonts.gstatic.com
+ *                                 — Google font files
+ *   img-src 'self' https: data: blob:
+ *                                 — icons, blob previews, and remote
+ *                                   markdown document images (e.g.
+ *                                   `![diagram](https://example/a.png)`)
+ *                                   which Viewer renders as plain <img>.
+ *   connect-src 'self' ws://localhost:* ws://127.0.0.1:* ws://[::1]:*
+ *                                 — same-origin Worker API/WebSocket
+ *                                   + cross-port localhost dev WS
+ *   worker-src 'self' blob:       — defensive for libs using blob workers
+ *   object-src 'none'             — no plugins/objects
+ *   base-uri 'none'               — prevent <base> tag injection
+ *   frame-ancestors 'none'        — no clickjacking/embedding
+ *   form-action 'none'            — no form submissions expected
+ */
+export const ROOM_CSP = [
+  "default-src 'self'",
+  // 'wasm-unsafe-eval' needed for @viz-js/viz (Graphviz WASM build).
+  // NOT 'unsafe-eval' — only WebAssembly compilation is allowed.
+  "script-src 'self' 'wasm-unsafe-eval'",
+  "style-src 'self' 'unsafe-inline' https://fonts.googleapis.com",
+  "font-src 'self' https://fonts.gstatic.com",
+  // Remote markdown document images (e.g. `![diagram](https://example/a.png)`)
+  // are a supported plan-content feature — Viewer renders them as plain
+  // `<img src="https://...">`. Allowing blanket `https:` here is a known
+  // tradeoff: an injected script could beacon via image URLs. Accepted
+  // because the product supports remote plan images, and the more
+  // exfil-capable channels (fetch / WebSocket) stay locked down via
+  // `connect-src 'self' + scoped localhost`.
+  // Annotation image attachments remain stripped before sending to the
+  // room (stripRoomAnnotationImages), so only document-level markdown
+  // images exercise this allowance.
+  "img-src 'self' https: data: blob:",
+  // Production: `'self'` covers the same-origin WebSocket
+  // (wss://room.plannotator.ai/ws/<id>) per the CSP spec.
+  //
+  // Development: wrangler dev serves both the room shell and the
+  // WebSocket on the same localhost port, so `'self'` covers that
+  // too. Cross-port local dev (shell on one port, WebSocket on
+  // another) still needs explicit ws:// localhost entries.
+  //
+  // Blanket https: / ws: / wss: are intentionally omitted —
+  // widening the scheme would give any post-XSS injection an
+  // unrestricted exfiltration surface.
+  "connect-src 'self' ws://localhost:* ws://127.0.0.1:* ws://[::1]:*",
+  "worker-src 'self' blob:",
+  "object-src 'none'",
+  "base-uri 'none'",
+  "frame-ancestors 'none'",
+  "form-action 'none'",
+  // upgrade-insecure-requests is intentionally omitted because
+  // wrangler dev serves the shell + WebSocket over `ws://localhost`,
+  // and this directive rewrites ws:// → wss:// (which breaks local
+  // development). Production only makes same-origin wss://
+  // connections, so the directive would be a no-op there anyway.
+].join('; ');
+
+/**
+ * Fetch and serve /index.html from the Wrangler asset binding with the
+ * headers the room shell needs: CSP, CORS, no-store cache,
+ * Referrer-Policy, and an HTML content type. Falls back to a minimal
+ * inline HTML when ASSETS is unbound (local test environments that
+ * don't run Wrangler).
+ */
+async function serveIndexHtml(
+  request: Request,
+  env: Env,
+  cors: Record<string, string>,
+): Promise<Response> {
+  if (env.ASSETS) {
+    const assetUrl = new URL(request.url);
+    assetUrl.pathname = '/index.html';
+    const assetReq = new Request(assetUrl, { method: 'GET', headers: request.headers });
+    const assetRes = await env.ASSETS.fetch(assetReq);
+    const headers = new Headers(assetRes.headers);
+    for (const [k, v] of Object.entries(cors)) headers.set(k, v);
+    headers.set('Content-Security-Policy', ROOM_CSP);
+    headers.set('Referrer-Policy', 'no-referrer');
+    headers.set('Content-Type', 'text/html; charset=utf-8');
+    headers.set('Cache-Control', 'no-store');
+    return new Response(assetRes.body, { status: assetRes.status, headers });
+  }
+  // Fallback for local/test environments without an ASSETS binding.
+  return new Response(
+    `<!DOCTYPE html><html><head><meta charset="utf-8"><title>Plannotator Room</title></head><body><p>Room shell (test fallback; ASSETS binding unavailable)</p></body></html>`,
+    {
+      status: 200,
+      headers: {
+        ...cors,
+        'Content-Security-Policy': ROOM_CSP,
+        'Content-Type': 'text/html; charset=utf-8',
+        'Referrer-Policy': 'no-referrer',
+        'Cache-Control': 'no-store',
+      },
+    },
+  );
+}
+
+// ---------------------------------------------------------------------------
+// Room Creation
+//
+// PRODUCTION HARDENING (required before public deployment, not in V1 scope):
+// `POST /api/rooms` is intentionally unauthenticated in the V1 protocol. A
+// room is a capability-token pair (roomSecret + adminSecret) the creator
+// generates locally; this endpoint only asserts existence on the server, not
+// identity. That means anyone who can reach the Worker can create rooms —
+// fine for local dev and gated staging, NOT fine for the open internet.
+//
+// Before this Worker is exposed publicly it MUST be gated by one of:
+//   - Cloudflare rate limiting / WAF rule keyed on source IP + path
+//   - application-level throttle at the Worker entry (shared Durable Object
+//     counter or KV-based token bucket)
+//   - authenticated proxy (plannotator.ai app calls on behalf of signed-in users)
+//
+// CORS is NOT abuse protection — it's a browser same-origin policy and does
+// nothing to a direct HTTP client. Any future reviewer flagging "this
+// endpoint is unauthenticated" should be pointed HERE. Production hardening
+// (rate-limit POST /api/rooms) is the intended gate; the protocol design
+// accommodates adding it without client changes.
+// ---------------------------------------------------------------------------
+
+async function handleCreateRoom(
+  request: Request,
+  env: Env,
+  cors: Record<string, string>,
+): Promise<Response> {
+  let body: unknown;
+  try {
+    body = await request.json();
+  } catch {
+    return Response.json({ error: 'Invalid JSON body' }, { status: 400, headers: cors });
+  }
+
+  const result = validateCreateRoomRequest(body);
+  if (isValidationError(result)) {
+    return Response.json({ error: result.error }, { status: result.status, headers: cors });
+  }
+
+  safeLog('handler:create-room', { roomId: result.roomId });
+
+  // Forward to the Durable Object
+  const id = env.ROOM.idFromName(result.roomId);
+  const stub = env.ROOM.get(id);
+  const doResponse = await stub.fetch(
+    new Request('http://do/create', {
+      method: 'POST',
+      body: JSON.stringify(result),
+      headers: { 'Content-Type': 'application/json' },
+    }),
+  );
+
+  // Re-wrap DO response with CORS headers
+  const responseBody = await doResponse.text();
+  return new Response(responseBody, {
+    status: doResponse.status,
+    headers: { ...cors, 'Content-Type': 'application/json' },
+  });
+}
+
+// ---------------------------------------------------------------------------
+// WebSocket Upgrade
+// ---------------------------------------------------------------------------
+
+async function handleWebSocket(
+  request: Request,
+  env: Env,
+  roomId: string,
+  cors: Record<string, string>,
+): Promise<Response> {
+  // Verify WebSocket upgrade header. RFC 6455 specifies the token
+  // is case-insensitive; browsers send lowercase but standards-
+  // conformant non-browser clients may send `WebSocket` or `WEBSOCKET`.
+  if (request.headers.get('Upgrade')?.toLowerCase() !== 'websocket') {
+    return Response.json(
+      { error: 'Expected WebSocket upgrade' },
+      { status: 426, headers: cors },
+    );
+  }
+
+  // Validate roomId BEFORE idFromName(). idFromName on arbitrary attacker
+  // input would instantiate a fresh DO and hit storage on every request —
+  // a cheap abuse surface. Reject malformed IDs up front.
+  if (!isRoomId(roomId)) {
+    return Response.json(
+      { error: 'Invalid roomId' },
+      { status: 400, headers: cors },
+    );
+  }
+
+  // Forward to the Durable Object — no CORS on WebSocket upgrade
+  const id = env.ROOM.idFromName(roomId);
+  const stub = env.ROOM.get(id);
+  return stub.fetch(request);
+}
+
+// ---------------------------------------------------------------------------
+// URL → Markdown
+// ---------------------------------------------------------------------------
+
+async function handleFetchMarkdown(
+  request: Request,
+  cors: Record<string, string>,
+): Promise<Response> {
+  let body: unknown;
+  try {
+    body = await request.json();
+  } catch {
+    return Response.json({ error: 'Invalid JSON body' }, { status: 400, headers: cors });
+  }
+
+  if (body === null || typeof body !== 'object' || typeof (body as Record<string, unknown>).url !== 'string') {
+    return Response.json({ error: 'Missing required field: url' }, { status: 400, headers: cors });
+  }
+
+  const url = (body as Record<string, unknown>).url as string;
+
+  if (!/^https:\/\//i.test(url)) {
+    return Response.json({ error: 'Only https:// URLs are supported' }, { status: 400, headers: cors });
+  }
+
+  try {
+    const result = await urlToMarkdown(url, { useJina: true });
+    return Response.json({ markdown: result.markdown, source: result.source }, { headers: cors });
+  } catch (err) {
+    const message = err instanceof Error ? err.message : 'Fetch failed';
+    return Response.json({ error: message }, { status: 502, headers: cors });
+  }
+}
diff --git a/apps/room-service/core/log.ts b/apps/room-service/core/log.ts
new file mode 100644
index 000000000..11483f383
--- /dev/null
+++ b/apps/room-service/core/log.ts
@@ -0,0 +1,30 @@
+/**
+ * Redaction-aware logging for the room service.
+ *
+ * Redacts proofs, verifiers, ciphertext, and message bodies from logs.
+ */
+
+const REDACTED_KEYS = new Set([
+  'roomVerifier',
+  'adminVerifier',
+  'proof',
+  'adminProof',
+  'ciphertext',
+  'initialSnapshotCiphertext',
+  'snapshotCiphertext',
+  'nonce',
+]);
+
+/** Shallow-clone an object, replacing sensitive field values with "[REDACTED]". */
+export function redactForLog(obj: Record<string, unknown>): Record<string, unknown> {
+  const result: Record<string, unknown> = {};
+  for (const [key, value] of Object.entries(obj)) {
+    result[key] = REDACTED_KEYS.has(key) ? '[REDACTED]' : value;
+  }
+  return result;
+}
+
+/** Log with sensitive fields redacted. */
+export function safeLog(label: string, obj: Record<string, unknown>): void {
+  console.log(label, redactForLog(obj));
+}
diff --git a/apps/room-service/core/room-do.ts b/apps/room-service/core/room-do.ts
new file mode 100644
index 000000000..1389ec589
--- /dev/null
+++ b/apps/room-service/core/room-do.ts
@@ -0,0 +1,956 @@
+/**
+ * Plannotator Room Durable Object.
+ *
+ * Uses Cloudflare Workers WebSocket Hibernation API.
+ * All per-connection state lives in WebSocket attachments
+ * (survives DO hibernation).
+ *
+ * Implements: room creation, WebSocket auth, event sequencing,
+ * presence relay, reconnect replay, admin commands, lifecycle enforcement.
+ *
+ * Zero-knowledge: stores/relays ciphertext only. Never needs roomSecret,
+ * eventKey, presenceKey, or plaintext content.
+ */
+
+import type {
+  AuthChallenge,
+  AuthResponse,
+  AuthAccepted,
+  AdminChallenge,
+  CreateRoomRequest,
+  CreateRoomResponse,
+  ServerEnvelope,
+  SequencedEnvelope,
+  RoomTransportMessage,
+} from '@plannotator/shared/collab';
+import { verifyAuthProof, verifyAdminProof, generateChallengeId, generateClientId, generateNonce } from '@plannotator/shared/collab';
+// Shared terminal close-signal constants — client treats this pair as
+// "the link no longer resolves" (admin delete, auto-expiry, or a room
+// that never existed — from the client's perspective, indistinguishable).
+import { AdminErrorCode, WS_CLOSE_REASON_ROOM_UNAVAILABLE, WS_CLOSE_ROOM_UNAVAILABLE } from '@plannotator/shared/collab/constants';
+import { DurableObject } from 'cloudflare:workers';
+import type { Env, RoomDurableState, WebSocketAttachment } from './types';
+import { clampExpiryDays, hasRoomExpired, validateServerEnvelope, validateAdminCommandEnvelope, isValidationError } from './validation';
+import { safeLog } from './log';
+
+const CHALLENGE_TTL_MS = 30_000;
+const ADMIN_CHALLENGE_TTL_MS = 30_000;
+const DELETE_BATCH_SIZE = 128; // Cloudflare DO storage.delete() max keys per call
+/**
+ * Page size for reconnect replay. Bounds peak DO memory during replay —
+ * storage.list() without a limit reads all matching rows at once, which
+ * fails for large/noisy rooms. Each page is streamed out to the WebSocket,
+ * then released. 128 is a conservative starting point well within DO memory
+ * budgets even if each event ciphertext is a few KB.
+ */
+const REPLAY_PAGE_SIZE = 128;
+
+/**
+ * Abuse/failure containment: per-room WebSocket cap. Not about expected
+ * normal room sizes — V1 rooms are small — but bounds broadcast fanout
+ * and runaway reconnect loops if a misbehaving client (or attacker with
+ * the room URL) opens sockets without releasing them. Returns 429 Too
+ * Many Requests when exceeded; honest clients see this only if the room
+ * is already saturated.
+ */
+const MAX_CONNECTIONS_PER_ROOM = 100;
+
+/** Pre-auth length caps on the auth.response message. Real values are
+ *  much smaller (challengeId ~22 chars, clientId server-assigned, proof
+ *  ~43 chars for HMAC-SHA-256 base64url). Generous caps bound the
+ *  unauthenticated work the server is willing to do per connection. */
+const AUTH_CHALLENGE_ID_MAX_LENGTH = 64;
+const AUTH_CLIENT_ID_MAX_LENGTH = 64;
+const AUTH_PROOF_MAX_LENGTH = 128;
+
+// WebSocket close codes (room-service-internal; shared close codes come from constants.ts)
+const WS_CLOSE_AUTH_REQUIRED = 4001;
+const WS_CLOSE_UNKNOWN_CHALLENGE = 4002;
+const WS_CLOSE_CHALLENGE_EXPIRED = 4003;
+const WS_CLOSE_INVALID_PROOF = 4004;
+const WS_CLOSE_PROTOCOL_ERROR = 4005;
+
+/** Zero-pad a seq number to 10 digits for lexicographic storage ordering. */
+function padSeq(seq: number): string {
+  return String(seq).padStart(10, '0');
+}
+
+export class RoomDurableObject extends DurableObject<Env> {
+  async fetch(request: Request): Promise<Response> {
+    const url = new URL(request.url);
+
+    if (url.pathname === '/create' && request.method === 'POST') {
+      return this.handleCreate(request);
+    }
+
+    if (request.headers.get('Upgrade') === 'websocket') {
+      return this.handleWebSocketUpgrade(request);
+    }
+
+    return Response.json({ error: 'Not found' }, { status: 404 });
+  }
+
+  // ---------------------------------------------------------------------------
+  // Room Creation
+  // ---------------------------------------------------------------------------
+
+  private async handleCreate(request: Request): Promise<Response> {
+    let body: CreateRoomRequest;
+    try {
+      body = await request.json() as CreateRoomRequest;
+    } catch {
+      return Response.json({ error: 'Invalid JSON' }, { status: 400 });
+    }
+
+    const existing = await this.ctx.storage.get<RoomDurableState>('room');
+    if (existing) {
+      // Lazy-expiry backstop: if somehow the alarm didn't fire (e.g. the
+      // room outlived its deadline without anyone connecting AND without
+      // the alarm landing), purge here and allow the new create to
+      // supplant the stale roomId. The alarm is the primary cleanup
+      // path — this is defense in depth.
+      if (hasRoomExpired(existing.expiresAt)) {
+        await this.purgeRoom('create-preempted-expired');
+        // fall through to create a fresh room at this id
+      } else {
+        return Response.json({ error: 'Room already exists' }, { status: 409 });
+      }
+    }
+
+    const expiryDays = clampExpiryDays(body.expiresInDays);
+    const expiresAt = expiryDays !== null ? Date.now() + expiryDays * 24 * 60 * 60 * 1000 : null;
+
+    const state: RoomDurableState = {
+      roomId: body.roomId,
+      roomVerifier: body.roomVerifier,
+      adminVerifier: body.adminVerifier,
+      seq: 0,
+      earliestRetainedSeq: 1,
+      snapshotCiphertext: body.initialSnapshotCiphertext,
+      snapshotSeq: 0,
+      expiresAt,
+    };
+
+    try {
+      await this.ctx.storage.put('room', state);
+    } catch (e) {
+      safeLog('room:create-storage-error', { roomId: body.roomId, error: String(e) });
+      return Response.json({ error: 'Failed to store room state' }, { status: 507 });
+    }
+
+    // Schedule auto-purge alarm. Skipped for "never" rooms (expiresAt null).
+    // `setAlarm` overwrites any pending alarm, which is what we want if
+    // this create supplanted an expired-but-alarm-less room above.
+    if (expiresAt !== null) {
+      try {
+        await this.ctx.storage.setAlarm(expiresAt);
+      } catch (e) {
+        safeLog('room:set-alarm-error', { roomId: body.roomId, error: String(e) });
+      }
+    }
+
+    const base = new URL(this.env.BASE_URL || 'https://room.plannotator.ai');
+    const wsScheme = base.protocol === 'https:' ? 'wss:' : 'ws:';
+
+    const response: CreateRoomResponse = {
+      roomId: body.roomId,
+      seq: 0,
+      snapshotSeq: 0,
+      joinUrl: `${base.origin}/c/${body.roomId}`,
+      websocketUrl: `${wsScheme}//${base.host}/ws/${body.roomId}`,
+    };
+
+    safeLog('room:created', { roomId: body.roomId, expiryDays });
+    return Response.json(response, { status: 201 });
+  }
+
+  // ---------------------------------------------------------------------------
+  // Durable Object alarm — fires at `expiresAt`, purges the room.
+  // ---------------------------------------------------------------------------
+
+  async alarm(): Promise<void> {
+    // The alarm wakes the DO. We don't check expiresAt here — the alarm
+    // was scheduled specifically for now, so if there's any room in
+    // storage we purge it. purgeRoom is idempotent on absence.
+    await this.purgeRoom('expiry');
+  }
+
+  // ---------------------------------------------------------------------------
+  // WebSocket Upgrade
+  // ---------------------------------------------------------------------------
+
+  private async handleWebSocketUpgrade(_request: Request): Promise<Response> {
+    const roomState = await this.ctx.storage.get<RoomDurableState>('room');
+    if (!roomState) {
+      return this.rejectUpgradeAsUnavailable();
+    }
+    if (hasRoomExpired(roomState.expiresAt)) {
+      // Alarm should have fired; this is defense in depth.
+      await this.purgeRoom('upgrade-preempted-expired');
+      return this.rejectUpgradeAsUnavailable();
+    }
+
+    // Per-room connection cap — see MAX_CONNECTIONS_PER_ROOM for rationale.
+    // Kept as HTTP 429 (not a WS close) because "full" is a transient,
+    // retryable condition worth signaling to any consumer — distinct from
+    // the permanent "room unavailable" UX state below.
+    if (this.ctx.getWebSockets().length >= MAX_CONNECTIONS_PER_ROOM) {
+      safeLog('ws:room-full', { roomId: roomState.roomId, cap: MAX_CONNECTIONS_PER_ROOM });
+      return Response.json({ error: 'Room is full' }, { status: 429 });
+    }
+
+    const pair = new WebSocketPair();
+    const [client, server] = Object.values(pair);
+
+    const challengeId = generateChallengeId();
+    const nonce = generateNonce();
+    const expiresAt = Date.now() + CHALLENGE_TTL_MS;
+    // Server-assigned clientId — see WebSocketAttachment docstring. The auth
+    // proof is bound to this value, so a participant cannot choose an active
+    // peer's clientId at auth time.
+    const clientId = generateClientId();
+
+    this.ctx.acceptWebSocket(server);
+
+    const attachment: WebSocketAttachment = {
+      authenticated: false,
+      roomId: roomState.roomId,
+      challengeId,
+      nonce,
+      expiresAt,
+      clientId,
+    };
+    server.serializeAttachment(attachment);
+
+    const challenge: AuthChallenge = {
+      type: 'auth.challenge',
+      challengeId,
+      nonce,
+      expiresAt,
+      clientId,
+    };
+    server.send(JSON.stringify(challenge));
+
+    safeLog('ws:challenge-sent', { roomId: roomState.roomId, challengeId });
+    return new Response(null, { status: 101, webSocket: client });
+  }
+
+  /**
+   * Complete the WebSocket upgrade and immediately close the client side
+   * with WS_CLOSE_ROOM_UNAVAILABLE. Used when the room is gone (never
+   * created, admin-deleted, or auto-expired).
+   *
+   * Why not return HTTP 404? Browsers don't expose the HTTP status of a
+   * failed WebSocket upgrade to page JS — a failed upgrade fires `close`
+   * with code 1006 and no reason, indistinguishable from a network drop.
+   * Accepting and immediately closing with our dedicated close code is
+   * the only way the client can route cold visitors to the dedicated
+   * RoomUnavailableScreen on the same code path as mid-session closes.
+   */
+  private rejectUpgradeAsUnavailable(): Response {
+    const pair = new WebSocketPair();
+    const [client, server] = Object.values(pair);
+    this.ctx.acceptWebSocket(server);
+    server.close(WS_CLOSE_ROOM_UNAVAILABLE, WS_CLOSE_REASON_ROOM_UNAVAILABLE);
+    return new Response(null, { status: 101, webSocket: client });
+  }
+
+  // ---------------------------------------------------------------------------
+  // WebSocket Message Handler (Hibernation API)
+  // ---------------------------------------------------------------------------
+
+  async webSocketMessage(ws: WebSocket, message: string | ArrayBuffer): Promise<void> {
+    const meta = ws.deserializeAttachment() as WebSocketAttachment | null;
+    if (!meta) {
+      ws.close(WS_CLOSE_AUTH_REQUIRED, 'No connection state');
+      return;
+    }
+
+    let msg: Record<string, unknown>;
+    try {
+      const raw = typeof message === 'string' ? message : new TextDecoder().decode(message);
+      msg = JSON.parse(raw);
+    } catch {
+      ws.close(WS_CLOSE_PROTOCOL_ERROR, 'Invalid message format');
+      return;
+    }
+
+    // Pre-auth: only accept auth.response
+    if (!meta.authenticated) {
+      if (msg.type !== 'auth.response') {
+        ws.close(WS_CLOSE_AUTH_REQUIRED, 'Authentication required');
+        return;
+      }
+      if (
+        typeof msg.challengeId !== 'string' || !msg.challengeId ||
+        typeof msg.clientId !== 'string' || !msg.clientId ||
+        typeof msg.proof !== 'string' || !msg.proof
+      ) {
+        ws.close(WS_CLOSE_PROTOCOL_ERROR, 'Malformed auth response');
+        return;
+      }
+      // Pre-auth length caps. Proofs + IDs are small in practice
+      // (challengeId ~22 chars, clientId server-assigned, proof 43 chars).
+      // Without caps, an unauthenticated peer can allocate/verify oversized
+      // strings. Match the admin-envelope caps for consistency.
+      if (msg.challengeId.length > AUTH_CHALLENGE_ID_MAX_LENGTH) {
+        ws.close(WS_CLOSE_PROTOCOL_ERROR, 'challengeId too long');
+        return;
+      }
+      if (msg.clientId.length > AUTH_CLIENT_ID_MAX_LENGTH) {
+        ws.close(WS_CLOSE_PROTOCOL_ERROR, 'clientId too long');
+        return;
+      }
+      if (msg.proof.length > AUTH_PROOF_MAX_LENGTH) {
+        ws.close(WS_CLOSE_PROTOCOL_ERROR, 'proof too long');
+        return;
+      }
+      // Validate lastSeq as non-negative integer if provided
+      let lastSeq: number | undefined;
+      if (msg.lastSeq !== undefined) {
+        if (typeof msg.lastSeq !== 'number' || !Number.isInteger(msg.lastSeq) || msg.lastSeq < 0) {
+          ws.close(WS_CLOSE_PROTOCOL_ERROR, 'lastSeq must be a non-negative integer');
+          return;
+        }
+        lastSeq = msg.lastSeq;
+      }
+      const authResponse: AuthResponse = {
+        type: 'auth.response',
+        challengeId: msg.challengeId as string,
+        clientId: msg.clientId as string,
+        proof: msg.proof as string,
+        lastSeq,
+      };
+      await this.handleAuthResponse(ws, meta, authResponse);
+      return;
+    }
+
+    // Post-auth: dispatch by message type
+    await this.handlePostAuthMessage(ws, meta, msg);
+  }
+
+  // ---------------------------------------------------------------------------
+  // Post-Auth Message Dispatch
+  // ---------------------------------------------------------------------------
+
+  private async handlePostAuthMessage(
+    ws: WebSocket,
+    meta: Extract<WebSocketAttachment, { authenticated: true }>,
+    msg: Record<string, unknown>,
+  ): Promise<void> {
+    // Admin challenge request
+    if (msg.type === 'admin.challenge.request') {
+      await this.handleAdminChallengeRequest(ws, meta);
+      return;
+    }
+
+    // Admin command
+    if (msg.type === 'admin.command') {
+      await this.handleAdminCommand(ws, meta, msg);
+      return;
+    }
+
+    // ServerEnvelope — detect via channel field (no type field)
+    if (typeof msg.channel === 'string' && (msg.channel === 'event' || msg.channel === 'presence')) {
+      await this.handleServerEnvelope(ws, meta, msg);
+      return;
+    }
+
+    ws.close(WS_CLOSE_PROTOCOL_ERROR, 'Unknown message type');
+  }
+
+  // ---------------------------------------------------------------------------
+  // Lifecycle Check (shared by event, presence, admin paths)
+  // ---------------------------------------------------------------------------
+
+  /**
+   * Check room lifecycle state. Returns roomState if usable, or null if terminal.
+   * Closes the socket for rooms that are gone (purged) or past their deadline.
+   */
+  private async checkRoomLifecycle(
+    ws: WebSocket,
+    _roomId: string,
+  ): Promise<RoomDurableState | null> {
+    const roomState = await this.ctx.storage.get<RoomDurableState>('room');
+    if (!roomState) {
+      ws.close(WS_CLOSE_ROOM_UNAVAILABLE, WS_CLOSE_REASON_ROOM_UNAVAILABLE);
+      return null;
+    }
+    // Lazy-expiry backstop. Alarm handles the common case; this fires only
+    // if a socket somehow reached us after the deadline without the alarm
+    // having landed yet.
+    if (hasRoomExpired(roomState.expiresAt)) {
+      await this.purgeRoom('lifecycle-preempted-expired', ws);
+      ws.close(WS_CLOSE_ROOM_UNAVAILABLE, WS_CLOSE_REASON_ROOM_UNAVAILABLE);
+      return null;
+    }
+    return roomState;
+  }
+
+  // ---------------------------------------------------------------------------
+  // Event Sequencing & Presence Relay
+  // ---------------------------------------------------------------------------
+
+  private async handleServerEnvelope(
+    ws: WebSocket,
+    meta: Extract<WebSocketAttachment, { authenticated: true }>,
+    msg: Record<string, unknown>,
+  ): Promise<void> {
+    const validated = validateServerEnvelope(msg);
+    if (isValidationError(validated)) {
+      this.sendError(ws, 'validation_error', validated.error);
+      return;
+    }
+    // isValidationError narrows; `validated` is ServerEnvelope here.
+    const envelope: ServerEnvelope = {
+      ...validated,
+      clientId: meta.clientId, // Override — prevent spoofing
+    };
+
+    const roomState = await this.checkRoomLifecycle(ws, meta.roomId);
+    if (!roomState) return;
+
+    if (envelope.channel === 'event') {
+      // Sequence the event on an IMMUTABLE next-state object. If the
+      // durable write fails, we must NOT have already bumped roomState.seq
+      // in memory — the next event must reuse the current seq, not a gap'd
+      // one. Nor may we broadcast an event that was never persisted.
+      const nextSeq = roomState.seq + 1;
+      const sequenced: SequencedEnvelope = {
+        seq: nextSeq,
+        receivedAt: Date.now(),
+        envelope,
+      };
+      const nextRoomState: RoomDurableState = { ...roomState, seq: nextSeq };
+
+      // Atomic write: event key + room metadata in one put.
+      try {
+        await this.ctx.storage.put({
+          [`event:${padSeq(nextSeq)}`]: sequenced,
+          'room': nextRoomState,
+        } as Record<string, unknown>);
+      } catch (e) {
+        // Persistence failed. Surface a clean error to the sender so their
+        // sendAnnotation* promise rejects (or their UI sees lastError) —
+        // otherwise they'd think the op landed on the wire. Do NOT bump
+        // in-memory seq, do NOT broadcast.
+        safeLog('room:event-persist-error', {
+          roomId: roomState.roomId,
+          attemptedSeq: nextSeq,
+          clientId: meta.clientId,
+          error: String(e),
+        });
+        this.sendError(ws, 'event_persist_failed', 'Failed to persist event');
+        return;
+      }
+
+      // Durable write succeeded — commit in-memory state and broadcast.
+      Object.assign(roomState, nextRoomState);
+      const transport: RoomTransportMessage = {
+        type: 'room.event',
+        seq: sequenced.seq,
+        receivedAt: sequenced.receivedAt,
+        envelope: sequenced.envelope,
+      };
+      this.broadcast(transport);
+
+      safeLog('room:event-sequenced', { roomId: roomState.roomId, seq: roomState.seq, clientId: meta.clientId });
+    } else {
+      // Presence — allowed in any non-terminal room state
+      const transport: RoomTransportMessage = {
+        type: 'room.presence',
+        envelope,
+      };
+      this.broadcast(transport, ws);
+    }
+  }
+
+  // ---------------------------------------------------------------------------
+  // Auth Response + Reconnect Replay
+  // ---------------------------------------------------------------------------
+
+  private async handleAuthResponse(
+    ws: WebSocket,
+    meta: Extract<WebSocketAttachment, { authenticated: false }>,
+    authResponse: AuthResponse,
+  ): Promise<void> {
+    if (authResponse.challengeId !== meta.challengeId) {
+      safeLog('ws:auth-rejected', { reason: 'unknown-challenge', roomId: meta.roomId });
+      ws.close(WS_CLOSE_UNKNOWN_CHALLENGE, 'Unknown challenge');
+      return;
+    }
+
+    // The clientId in auth.response MUST match the server-assigned clientId
+    // from this connection's challenge. This prevents a participant from
+    // choosing another peer's clientId at auth time and overwriting their
+    // presence slot.
+    if (authResponse.clientId !== meta.clientId) {
+      safeLog('ws:auth-rejected', { reason: 'clientId-mismatch', roomId: meta.roomId });
+      ws.close(WS_CLOSE_INVALID_PROOF, 'clientId does not match challenge');
+      return;
+    }
+
+    if (Date.now() > meta.expiresAt) {
+      safeLog('ws:auth-rejected', { reason: 'expired', roomId: meta.roomId });
+      ws.close(WS_CLOSE_CHALLENGE_EXPIRED, 'Challenge expired');
+      return;
+    }
+
+    // Delegate lifecycle checks (deleted / expired / lazy-expiry) to the
+    // shared helper so this path doesn't drift from the post-auth path.
+    const roomState = await this.checkRoomLifecycle(ws, meta.roomId);
+    if (!roomState) return;
+
+    const valid = await verifyAuthProof(
+      roomState.roomVerifier,
+      meta.roomId,
+      authResponse.clientId,
+      meta.challengeId,
+      meta.nonce,
+      authResponse.proof,
+    );
+
+    if (!valid) {
+      safeLog('ws:auth-rejected', { reason: 'invalid-proof', roomId: meta.roomId });
+      ws.close(WS_CLOSE_INVALID_PROOF, 'Invalid proof');
+      return;
+    }
+
+    // Auth successful — update attachment
+    const authenticatedMeta: WebSocketAttachment = {
+      authenticated: true,
+      roomId: meta.roomId,
+      clientId: authResponse.clientId,
+      authenticatedAt: Date.now(),
+    };
+    ws.serializeAttachment(authenticatedMeta);
+
+    // Send auth.accepted
+    const accepted: AuthAccepted = {
+      type: 'auth.accepted',
+      seq: roomState.seq,
+      snapshotSeq: roomState.snapshotSeq,
+      snapshotAvailable: !!roomState.snapshotCiphertext,
+    };
+    ws.send(JSON.stringify(accepted));
+
+    // Reconnect replay
+    await this.replayEvents(ws, roomState, authResponse.lastSeq);
+
+    safeLog('ws:authenticated', { roomId: meta.roomId, clientId: authResponse.clientId, lastSeq: authResponse.lastSeq });
+  }
+
+  private async replayEvents(
+    ws: WebSocket,
+    roomState: RoomDurableState,
+    lastSeq: number | undefined,
+  ): Promise<void> {
+    // Local helper: single place that constructs and sends a room.snapshot
+    // transport message. Keeps the message shape in one place so any future
+    // field addition lands once.
+    const sendSnapshotToSocket = (): void => {
+      if (!roomState.snapshotCiphertext) return;
+      const snapshotMsg: RoomTransportMessage = {
+        type: 'room.snapshot',
+        snapshotSeq: roomState.snapshotSeq ?? 0,
+        snapshotCiphertext: roomState.snapshotCiphertext,
+      };
+      ws.send(JSON.stringify(snapshotMsg));
+    };
+
+    // Determine replay strategy
+    let sendSnapshot = false;
+    let replayFrom: number;
+
+    if (lastSeq === undefined) {
+      // Fresh join — send snapshot + all events
+      sendSnapshot = true;
+      replayFrom = (roomState.snapshotSeq ?? 0) + 1;
+    } else if (lastSeq > roomState.seq) {
+      // Future claim — anomaly, fall back to snapshot
+      sendSnapshot = true;
+      replayFrom = (roomState.snapshotSeq ?? 0) + 1;
+      safeLog('ws:replay-anomaly', { roomId: roomState.roomId, lastSeq, currentSeq: roomState.seq });
+    } else if (lastSeq === roomState.seq) {
+      // Fully caught up — still send snapshot if seq is 0 (fresh room, no events yet)
+      if (roomState.seq === 0) {
+        sendSnapshotToSocket();
+      }
+      return;
+    } else {
+      // Check if we can replay incrementally
+      const nextNeededSeq = lastSeq + 1;
+      // In V1 earliestRetainedSeq stays 1 because there is no compaction.
+      // This branch becomes active once future compaction advances it.
+      if (nextNeededSeq < roomState.earliestRetainedSeq) {
+        // Too old — need snapshot fallback
+        sendSnapshot = true;
+        replayFrom = (roomState.snapshotSeq ?? 0) + 1;
+      } else {
+        // Can replay from retained log
+        replayFrom = nextNeededSeq;
+      }
+    }
+
+    if (sendSnapshot) {
+      sendSnapshotToSocket();
+    }
+
+    // Replay events from storage (if any exist). Paginated so large rooms
+    // don't load the full event log into DO memory at reconnect time —
+    // storage.list() without a limit can blow memory in rooms with many
+    // retained events (V1 retains all events for the room lifetime).
+    if (roomState.seq > 0 && replayFrom <= roomState.seq) {
+      let cursor = `event:${padSeq(replayFrom)}`;
+      const end = `event:${padSeq(roomState.seq)}\uffff`;  // inclusive of roomState.seq
+      while (true) {
+        const page = await this.ctx.storage.list<SequencedEnvelope>({
+          prefix: 'event:',
+          start: cursor,
+          end,
+          limit: REPLAY_PAGE_SIZE,
+        });
+        if (page.size === 0) break;
+        let lastKey = cursor;
+        for (const [key, sequenced] of page) {
+          const transport: RoomTransportMessage = {
+            type: 'room.event',
+            seq: sequenced.seq,
+            receivedAt: sequenced.receivedAt,
+            envelope: sequenced.envelope,
+          };
+          ws.send(JSON.stringify(transport));
+          lastKey = key;
+        }
+        if (page.size < REPLAY_PAGE_SIZE) break;
+        // Advance cursor past the last emitted key. `storage.list({ start })`
+        // is INCLUSIVE, so passing `lastKey` would re-emit the final event.
+        // Appending U+0000 (the smallest Unicode code point) produces a string
+        // strictly greater than `lastKey` but strictly less than any valid
+        // next key — because padded numeric seq keys are ASCII digits only
+        // and never contain a null byte, no real key can fall between them.
+        // Using `\uffff` (max code point) here would be WRONG: it would skip
+        // all keys lexicographically between `lastKey` and `lastKey\uffff`,
+        // dropping legitimate events from the replay.
+        cursor = `${lastKey}\u0000`;
+      }
+    }
+  }
+
+  // ---------------------------------------------------------------------------
+  // Admin Challenge-Response
+  // ---------------------------------------------------------------------------
+
+  private async handleAdminChallengeRequest(
+    ws: WebSocket,
+    meta: Extract<WebSocketAttachment, { authenticated: true }>,
+  ): Promise<void> {
+    // Lifecycle check — reject for terminal rooms
+    const roomState = await this.checkRoomLifecycle(ws, meta.roomId);
+    if (!roomState) return;
+
+    const challengeId = generateChallengeId();
+    const nonce = generateNonce();
+    const expiresAt = Date.now() + ADMIN_CHALLENGE_TTL_MS;
+
+    // Store in attachment (survives hibernation)
+    const updatedMeta: WebSocketAttachment = {
+      ...meta,
+      pendingAdminChallenge: { challengeId, nonce, expiresAt },
+    };
+    ws.serializeAttachment(updatedMeta);
+
+    const challenge: AdminChallenge = {
+      type: 'admin.challenge',
+      challengeId,
+      nonce,
+      expiresAt,
+    };
+    ws.send(JSON.stringify(challenge));
+
+    safeLog('admin:challenge-sent', { roomId: meta.roomId, clientId: meta.clientId, challengeId });
+  }
+
+  private async handleAdminCommand(
+    ws: WebSocket,
+    meta: Extract<WebSocketAttachment, { authenticated: true }>,
+    msg: Record<string, unknown>,
+  ): Promise<void> {
+    // ADMIN ERROR-CODE CONTRACT
+    // -------------------------
+    // Every error code emitted from this method AND from helpers it calls
+    // (applyDelete, admin-scoped branches of handleAdminChallengeRequest)
+    // must be listed in the client's ADMIN_SCOPED_ERROR_CODES Set in
+    // packages/shared/collab/client-runtime/client.ts. That Set gates which
+    // room.error payloads reject a pending admin promise; a code that
+    // fires here but is missing from the Set leaves the client hanging
+    // until AdminTimeoutError. A code that fires on the event channel but
+    // is ADDED to the Set (e.g. validation_error) wrongly cancels
+    // unrelated in-flight admin commands. When adding/renaming/removing
+    // admin-path codes, update the client Set in the same change.
+    const validated = validateAdminCommandEnvelope(msg);
+    if (isValidationError(validated)) {
+      // Admin-scoped code so the client can distinguish admin-flow failures
+      // from event-channel failures (e.g. validation_error fires on the
+      // event channel while an admin command is in flight — rejecting
+      // pendingAdmin on those would be wrong).
+      this.sendAdminError(ws, AdminErrorCode.ValidationError, validated.error);
+      return;
+    }
+    // isValidationError narrows; `validated` is AdminCommandEnvelope here.
+    const cmdEnvelope = validated;
+
+    // Reject cross-connection clientId spoofing
+    if (cmdEnvelope.clientId !== meta.clientId) {
+      this.sendAdminError(ws, AdminErrorCode.ClientIdMismatch, 'clientId does not match authenticated connection');
+      return;
+    }
+
+    // Check pending admin challenge
+    if (!meta.pendingAdminChallenge) {
+      this.sendAdminError(ws, AdminErrorCode.NoAdminChallenge, 'Request an admin challenge first');
+      return;
+    }
+    if (cmdEnvelope.challengeId !== meta.pendingAdminChallenge.challengeId) {
+      this.sendAdminError(ws, AdminErrorCode.UnknownAdminChallenge, 'Challenge ID does not match');
+      return;
+    }
+
+    // Save challenge data before clearing
+    const { challengeId, nonce, expiresAt } = meta.pendingAdminChallenge;
+
+    // Clear challenge from attachment (single-use) — serialize immediately
+    const { pendingAdminChallenge: _, ...cleanMeta } = meta;
+    ws.serializeAttachment(cleanMeta);
+
+    // Check expiry
+    if (Date.now() > expiresAt) {
+      this.sendAdminError(ws, AdminErrorCode.AdminChallengeExpired, 'Admin challenge expired');
+      return;
+    }
+
+    // Lifecycle check — reject for terminal rooms
+    const roomState = await this.checkRoomLifecycle(ws, meta.roomId);
+    if (!roomState) return;
+
+    // Verify admin proof
+    const valid = await verifyAdminProof(
+      roomState.adminVerifier,
+      meta.roomId,
+      meta.clientId,
+      challengeId,
+      nonce,
+      cmdEnvelope.command,
+      cmdEnvelope.adminProof,
+    );
+
+    if (!valid) {
+      safeLog('admin:proof-rejected', { roomId: meta.roomId, clientId: meta.clientId });
+      this.sendAdminError(ws, AdminErrorCode.InvalidAdminProof, 'Admin proof verification failed');
+      return;
+    }
+
+    // Apply command
+    switch (cmdEnvelope.command.type) {
+      case 'room.delete':
+        await this.applyDelete(ws, roomState);
+        break;
+      default: {
+        // Compile-time exhaustiveness guard: if a new admin command is added
+        // to the union and a case here is missed, TypeScript fails here.
+        const _exhaustive: never = cmdEnvelope.command.type;
+        void _exhaustive;
+        break;
+      }
+    }
+  }
+
+  // ---------------------------------------------------------------------------
+  // Admin Command Execution
+  // ---------------------------------------------------------------------------
+
+  private async applyDelete(
+    ws: WebSocket,
+    roomState: RoomDurableState,
+  ): Promise<void> {
+    // checkRoomLifecycle ran at the top of handleAdminCommand, so this
+    // path is only reachable for a live room. purgeRoom wipes storage,
+    // purges event keys, cancels the expiry alarm, and closes every
+    // socket (including the admin's) with the generic unavailable
+    // reason — same terminal UX as an expired room or a never-created
+    // URL.
+    try {
+      await this.purgeRoom('admin');
+    } catch (e) {
+      // purgeRoom already handles its own storage-error logging. Signal
+      // the admin caller that the delete didn't complete so their
+      // pending promise rejects cleanly.
+      safeLog('room:delete-error', { roomId: roomState.roomId, error: String(e) });
+      this.sendAdminError(ws, AdminErrorCode.DeleteFailed, 'Failed to delete room');
+    }
+  }
+
+  // ---------------------------------------------------------------------------
+  // Storage Helpers
+  // ---------------------------------------------------------------------------
+
+  /**
+   * Delete all event keys from storage in batches. Paginated for the same
+   * reason as replay: avoid loading the full event log into DO memory.
+   * Less latency-sensitive than replay but the memory bound still matters.
+   */
+  private async purgeEventKeys(): Promise<void> {
+    while (true) {
+      const page = await this.ctx.storage.list({
+        prefix: 'event:',
+        limit: DELETE_BATCH_SIZE,
+      });
+      if (page.size === 0) break;
+      await this.ctx.storage.delete([...page.keys()]);
+      if (page.size < DELETE_BATCH_SIZE) break;
+    }
+  }
+
+  // ---------------------------------------------------------------------------
+  // Cleanup — single unified hard-delete path
+  // ---------------------------------------------------------------------------
+
+  /**
+   * Hard-delete the room. No tombstone, no lingering state — once this
+   * returns, the DO storage is empty of room data and every connected
+   * socket has been closed with the generic "room unavailable" reason.
+   *
+   * Called from four triggers:
+   *   - 'expiry'                       alarm fired at expiresAt
+   *   - 'admin'                        creator clicked Delete room
+   *   - 'create-preempted-expired'     a fresh create is supplanting a
+   *                                    room whose alarm never fired
+   *   - 'lifecycle-preempted-expired'  a socket reached us after the
+   *                                    deadline; alarm hadn't landed yet
+   *   - 'upgrade-preempted-expired'    same, on the HTTP upgrade path
+   *
+   * `reason` is logged but not surfaced to clients — from their
+   * perspective, every purge looks the same: the link stops resolving.
+   */
+  private async purgeRoom(
+    reason: 'expiry' | 'admin' | 'create-preempted-expired' | 'lifecycle-preempted-expired' | 'upgrade-preempted-expired',
+    except?: WebSocket,
+  ): Promise<void> {
+    // Hard-delete the room record FIRST. Absence is what makes the room
+    // unreachable to any new connection — a concurrent WS upgrade or
+    // lifecycle check that lands mid-purge sees nothing and rejects.
+    // Closing sockets before this would leave a window where the room
+    // key still reads as present.
+    try {
+      await this.ctx.storage.delete('room');
+    } catch (e) {
+      safeLog('room:purge-delete-error', { reason, error: String(e) });
+      throw e;
+    }
+
+    // Now close connected peers so they see the terminal close.
+    this.closeRoomSockets(WS_CLOSE_REASON_ROOM_UNAVAILABLE, except);
+
+    // Best-effort: cancel the pending alarm in case the trigger wasn't
+    // the alarm itself. Avoids a redundant alarm wake after we've
+    // already emptied the room.
+    try {
+      await this.ctx.storage.deleteAlarm();
+    } catch (e) {
+      safeLog('room:purge-delete-alarm-error', { reason, error: String(e) });
+    }
+
+    // Purge event log (per-event keys).
+    try {
+      await this.purgeEventKeys();
+    } catch (e) {
+      safeLog('room:purge-event-keys-error', { reason, error: String(e) });
+    }
+
+    safeLog('room:purged', { reason });
+  }
+
+  // ---------------------------------------------------------------------------
+  // Broadcast Helpers
+  // ---------------------------------------------------------------------------
+
+  /**
+   * Send a transport message to every authenticated socket in the room,
+   * optionally excluding one (e.g. the sender for presence relay). Send
+   * failures are intentionally ignored — the target socket may have closed.
+   */
+  private broadcast(message: RoomTransportMessage, exclude?: WebSocket): void {
+    const json = JSON.stringify(message);
+    for (const socket of this.ctx.getWebSockets()) {
+      if (socket === exclude) continue;
+      const att = socket.deserializeAttachment() as WebSocketAttachment | null;
+      if (att?.authenticated) {
+        try { socket.send(json); } catch { /* socket may have closed */ }
+      }
+    }
+  }
+
+  private sendError(ws: WebSocket, code: string, message: string): void {
+    const error: RoomTransportMessage = { type: 'room.error', code, message };
+    try { ws.send(JSON.stringify(error)); } catch { /* socket may have closed */ }
+  }
+
+  /**
+   * Admin-scoped error emitter. Every admin-command rejection path
+   * (validate, challenge, proof, state, persist) MUST go through this
+   * wrapper instead of raw `sendError` so the `AdminErrorCode` type
+   * enforces the contract the client's rejection gate relies on
+   * (see `ADMIN_ERROR_CODES` in shared/collab/constants.ts). Adding a
+   * new admin error = add a key to `AdminErrorCode`, use it here;
+   * typos and non-admin codes surface as compile errors.
+   */
+  private sendAdminError(ws: WebSocket, code: AdminErrorCode, message: string): void {
+    this.sendError(ws, code, message);
+  }
+
+  private closeRoomSockets(reason: string, except?: WebSocket): void {
+    for (const socket of this.ctx.getWebSockets()) {
+      if (socket !== except) {
+        socket.close(WS_CLOSE_ROOM_UNAVAILABLE, reason);
+      }
+    }
+  }
+
+  // ---------------------------------------------------------------------------
+  // WebSocket Lifecycle (Hibernation API)
+  // ---------------------------------------------------------------------------
+
+  async webSocketClose(ws: WebSocket, code: number, _reason: string, _wasClean: boolean): Promise<void> {
+    const meta = ws.deserializeAttachment() as WebSocketAttachment | null;
+    const roomId = meta?.roomId ?? 'unknown';
+    const clientId = meta?.authenticated ? meta.clientId : 'unauthenticated';
+    safeLog('ws:closed', { roomId, clientId, code });
+
+    // Tell the remaining peers the closed client has left so they can
+    // drop that clientId's presence (cursor + avatar) immediately.
+    // Without this, peers wait out the 30s client-side TTL sweep,
+    // which made "refresh to test" pile up one ghost cursor per
+    // refresh until the entries expired. Only broadcast for
+    // authenticated sockets — unauth'd ones were never in peers'
+    // presence maps, so nothing needs cleanup.
+    //
+    // `exclude: ws` leaves the closing socket out of the fan-out.
+    // It may already be detached, but the broadcast's send-try/catch
+    // tolerates that either way. No payload beyond clientId — the
+    // protocol is zero-knowledge; we only relay opaque encrypted
+    // presence packets, and the clientId is server-assigned in the
+    // auth challenge so it's already non-secret.
+    if (meta?.authenticated) {
+      this.broadcast(
+        { type: 'room.participant.left', clientId: meta.clientId },
+        ws,
+      );
+    }
+  }
+
+  async webSocketError(ws: WebSocket, error: unknown): Promise<void> {
+    const meta = ws.deserializeAttachment() as WebSocketAttachment | null;
+    const roomId = meta?.roomId ?? 'unknown';
+    safeLog('ws:error', { roomId, error: String(error) });
+  }
+}
diff --git a/apps/room-service/core/room-engine.test.ts b/apps/room-service/core/room-engine.test.ts
new file mode 100644
index 000000000..2af7fc763
--- /dev/null
+++ b/apps/room-service/core/room-engine.test.ts
@@ -0,0 +1,159 @@
+/**
+ * Slice 3 engine tests — validation, admin proofs, and lifecycle helpers.
+ *
+ * Tests act as external clients and import from @plannotator/shared/collab/client.
+ */
+
+import { describe, expect, test } from 'bun:test';
+import {
+  validateServerEnvelope,
+  validateAdminCommandEnvelope,
+  isValidationError,
+} from './validation';
+import type { ValidationError } from './validation';
+import {
+  deriveAdminKey,
+  computeAdminVerifier,
+  computeAdminProof,
+  verifyAdminProof,
+  generateChallengeId,
+  generateNonce,
+} from '@plannotator/shared/collab/client';
+import type { AdminCommand } from '@plannotator/shared/collab';
+
+// ---------------------------------------------------------------------------
+// validateServerEnvelope
+// ---------------------------------------------------------------------------
+
+describe('validateServerEnvelope', () => {
+  const validEvent = {
+    clientId: 'client-1',
+    opId: 'op-abc',
+    channel: 'event',
+    ciphertext: 'encrypted-data',
+  };
+
+  test('accepts valid event envelope', () => {
+    const result = validateServerEnvelope(validEvent);
+    expect(isValidationError(result)).toBe(false);
+  });
+
+  test('accepts valid presence envelope', () => {
+    const result = validateServerEnvelope({ ...validEvent, channel: 'presence' });
+    expect(isValidationError(result)).toBe(false);
+  });
+
+  test('rejects missing clientId', () => {
+    const { clientId: _, ...rest } = validEvent;
+    expect(isValidationError(validateServerEnvelope(rest))).toBe(true);
+  });
+
+  test('rejects missing opId', () => {
+    const { opId: _, ...rest } = validEvent;
+    expect(isValidationError(validateServerEnvelope(rest))).toBe(true);
+  });
+
+  test('rejects invalid channel', () => {
+    expect(isValidationError(validateServerEnvelope({ ...validEvent, channel: 'invalid' }))).toBe(true);
+  });
+
+  test('rejects missing ciphertext', () => {
+    const { ciphertext: _, ...rest } = validEvent;
+    expect(isValidationError(validateServerEnvelope(rest))).toBe(true);
+  });
+
+  test('rejects oversized event ciphertext (> 512 KB)', () => {
+    const result = validateServerEnvelope({ ...validEvent, ciphertext: 'x'.repeat(512_001) });
+    expect(isValidationError(result)).toBe(true);
+    expect((result as ValidationError).status).toBe(413);
+  });
+
+  test('rejects oversized presence ciphertext (> 8 KB)', () => {
+    const result = validateServerEnvelope({ ...validEvent, channel: 'presence', ciphertext: 'x'.repeat(8_193) });
+    expect(isValidationError(result)).toBe(true);
+    expect((result as ValidationError).status).toBe(413);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// validateAdminCommandEnvelope
+// ---------------------------------------------------------------------------
+
+describe('validateAdminCommandEnvelope', () => {
+  const validDelete = {
+    type: 'admin.command',
+    challengeId: 'ch_abc',
+    clientId: 'client-1',
+    command: { type: 'room.delete' },
+    adminProof: 'proof-data',
+  };
+
+  test('accepts valid delete command', () => {
+    const result = validateAdminCommandEnvelope(validDelete);
+    expect(isValidationError(result)).toBe(false);
+  });
+
+  test('rejects unknown command type', () => {
+    expect(isValidationError(validateAdminCommandEnvelope({ ...validDelete, command: { type: 'room.explode' } }))).toBe(true);
+  });
+
+  test('rejects missing challengeId', () => {
+    const { challengeId: _, ...rest } = validDelete;
+    expect(isValidationError(validateAdminCommandEnvelope(rest))).toBe(true);
+  });
+
+  test('rejects missing adminProof', () => {
+    const { adminProof: _, ...rest } = validDelete;
+    expect(isValidationError(validateAdminCommandEnvelope(rest))).toBe(true);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// Admin Proof Round-Trip
+// ---------------------------------------------------------------------------
+
+const ADMIN_SECRET = new Uint8Array(32);
+ADMIN_SECRET.fill(0xcd);
+const ROOM_ID = 'test-room-admin-proof';
+
+describe('admin proof verification (end-to-end)', () => {
+  test('valid admin proof is accepted', async () => {
+    const adminKey = await deriveAdminKey(ADMIN_SECRET);
+    const verifier = await computeAdminVerifier(adminKey, ROOM_ID);
+    const challengeId = generateChallengeId();
+    const nonce = generateNonce();
+    const command: AdminCommand = { type: 'room.delete' };
+
+    const proof = await computeAdminProof(verifier, ROOM_ID, 'client-1', challengeId, nonce, command);
+    const valid = await verifyAdminProof(verifier, ROOM_ID, 'client-1', challengeId, nonce, command, proof);
+    expect(valid).toBe(true);
+  });
+
+  test('wrong proof is rejected', async () => {
+    const adminKey = await deriveAdminKey(ADMIN_SECRET);
+    const verifier = await computeAdminVerifier(adminKey, ROOM_ID);
+    const challengeId = generateChallengeId();
+    const nonce = generateNonce();
+    const command: AdminCommand = { type: 'room.delete' };
+
+    const valid = await verifyAdminProof(verifier, ROOM_ID, 'client-1', challengeId, nonce, command, 'garbage-proof');
+    expect(valid).toBe(false);
+  });
+
+  test('proof cannot verify against a different command shape (binding via canonicalJson)', async () => {
+    // V1 has a single AdminCommand shape, so we exercise the binding via
+    // an unsanctioned command — the proof must not verify for anything
+    // whose canonicalJson differs from what was signed.
+    const adminKey = await deriveAdminKey(ADMIN_SECRET);
+    const verifier = await computeAdminVerifier(adminKey, ROOM_ID);
+    const challengeId = generateChallengeId();
+    const nonce = generateNonce();
+
+    const deleteCommand: AdminCommand = { type: 'room.delete' };
+    const otherCommand = { type: 'room.other' } as unknown as AdminCommand;
+
+    const proof = await computeAdminProof(verifier, ROOM_ID, 'client-1', challengeId, nonce, deleteCommand);
+    const valid = await verifyAdminProof(verifier, ROOM_ID, 'client-1', challengeId, nonce, otherCommand, proof);
+    expect(valid).toBe(false);
+  });
+});
diff --git a/apps/room-service/core/types.ts b/apps/room-service/core/types.ts
new file mode 100644
index 000000000..f3d1bb3a2
--- /dev/null
+++ b/apps/room-service/core/types.ts
@@ -0,0 +1,73 @@
+/**
+ * Server-only types for the room-service Durable Object.
+ *
+ * RoomDurableState is the persistent room record stored in DO storage.
+ * WebSocketAttachment is serialized per-connection metadata that survives
+ * DO hibernation via serializeAttachment/deserializeAttachment.
+ */
+
+// ---------------------------------------------------------------------------
+// Worker Environment
+// ---------------------------------------------------------------------------
+
+/** Cloudflare Worker environment bindings. */
+export interface Env {
+  ROOM: DurableObjectNamespace;
+  /** Wrangler-managed static asset binding. Serves `./public/index.html` (room shell) + hashed `./public/assets/*` chunks. Populated by `bun run build:shell`. */
+  ASSETS?: { fetch(request: Request): Promise<Response> };
+  ALLOWED_ORIGINS?: string;
+  ALLOW_LOCALHOST_ORIGINS?: string;
+  BASE_URL?: string;
+}
+
+/**
+ * Durable state stored in DO storage under key 'room'.
+ *
+ * The room either exists (this record is present) or it doesn't (key
+ * absent). There's no "deleted" / "expired" tombstone state — purgeRoom
+ * hard-deletes the key when the 30-day alarm fires or when an admin
+ * issues delete. Absence means "link doesn't resolve."
+ *
+ * Events are NOT stored in this record — they use separate per-event keys
+ * ('event:0000000001', etc.) to stay within DO per-value size limits.
+ */
+export interface RoomDurableState {
+  /** Stored at creation — DO can't reverse idFromName(). */
+  roomId: string;
+  roomVerifier: string;
+  adminVerifier: string;
+  seq: number;
+  /** Oldest event seq still in storage. Initialized to 1 at creation. */
+  earliestRetainedSeq: number;
+  snapshotCiphertext?: string;
+  snapshotSeq?: number;
+  expiresAt: number | null;
+}
+
+/**
+ * WebSocket attachment — survives hibernation via serializeAttachment/deserializeAttachment.
+ *
+ * Pre-auth: holds pending challenge state so the DO can verify after waking.
+ * Post-auth: holds authenticated connection metadata + optional pending admin challenge.
+ * Both variants carry roomId so webSocketMessage() can access it without a storage read.
+ */
+export type WebSocketAttachment =
+  | {
+      authenticated: false;
+      roomId: string;
+      challengeId: string;
+      nonce: string;
+      expiresAt: number;
+      /** Server-assigned ephemeral client id for this connection. Included in
+       *  the auth challenge so the client's proof binds to it; prevents a
+       *  malicious participant from choosing another user's clientId at auth
+       *  time and overwriting their presence slot after auth. */
+      clientId: string;
+    }
+  | {
+      authenticated: true;
+      roomId: string;
+      clientId: string;
+      authenticatedAt: number;
+      pendingAdminChallenge?: { challengeId: string; nonce: string; expiresAt: number };
+    };
diff --git a/apps/room-service/core/validation.test.ts b/apps/room-service/core/validation.test.ts
new file mode 100644
index 000000000..f7da2bf85
--- /dev/null
+++ b/apps/room-service/core/validation.test.ts
@@ -0,0 +1,286 @@
+import { describe, expect, test } from 'bun:test';
+import {
+  validateCreateRoomRequest,
+  isValidationError,
+  clampExpiryDays,
+  hasRoomExpired,
+  isRoomId,
+  validateServerEnvelope,
+  validateAdminCommandEnvelope,
+} from './validation';
+
+describe('validateCreateRoomRequest', () => {
+  // 22-char base64url room ID (matches generateRoomId() output: 16 random bytes)
+  const validRoomId = 'ABCDEFGHIJKLMNOPQRSTUv';
+  // 43-char base64url verifiers (matches HMAC-SHA-256 output: 32 bytes)
+  const validVerifier = 'ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopq';
+  const validAdminVerifier = 'abcdefghijklmnopqrstuvwxyz0123456789_-ABCDE';
+  const validBody = {
+    roomId: validRoomId,
+    roomVerifier: validVerifier,
+    adminVerifier: validAdminVerifier,
+    initialSnapshotCiphertext: 'encrypted-snapshot-data',
+  };
+
+  test('accepts valid request', () => {
+    const result = validateCreateRoomRequest(validBody);
+    expect(isValidationError(result)).toBe(false);
+    if (!isValidationError(result)) {
+      expect(result.roomId).toBe(validRoomId);
+      expect(result.roomVerifier).toBe(validVerifier);
+      expect(result.adminVerifier).toBe(validAdminVerifier);
+      expect(result.initialSnapshotCiphertext).toBe('encrypted-snapshot-data');
+    }
+  });
+
+  test('accepts request with expiresInDays', () => {
+    const result = validateCreateRoomRequest({ ...validBody, expiresInDays: 7 });
+    expect(isValidationError(result)).toBe(false);
+    if (!isValidationError(result)) {
+      expect(result.expiresInDays).toBe(7);
+    }
+  });
+
+  test('rejects null body', () => {
+    const result = validateCreateRoomRequest(null);
+    expect(isValidationError(result)).toBe(true);
+    if (isValidationError(result)) {
+      expect(result.status).toBe(400);
+    }
+  });
+
+  test('rejects non-object body', () => {
+    const result = validateCreateRoomRequest('not an object');
+    expect(isValidationError(result)).toBe(true);
+  });
+
+  test('rejects missing roomId', () => {
+    const { roomId: _, ...body } = validBody;
+    const result = validateCreateRoomRequest(body);
+    expect(isValidationError(result)).toBe(true);
+    if (isValidationError(result)) {
+      expect(result.error).toContain('roomId');
+    }
+  });
+
+  test('rejects empty roomId', () => {
+    const result = validateCreateRoomRequest({ ...validBody, roomId: '' });
+    expect(isValidationError(result)).toBe(true);
+  });
+
+  test('rejects missing roomVerifier', () => {
+    const { roomVerifier: _, ...body } = validBody;
+    const result = validateCreateRoomRequest(body);
+    expect(isValidationError(result)).toBe(true);
+    if (isValidationError(result)) {
+      expect(result.error).toContain('roomVerifier');
+    }
+  });
+
+  test('rejects missing adminVerifier', () => {
+    const { adminVerifier: _, ...body } = validBody;
+    const result = validateCreateRoomRequest(body);
+    expect(isValidationError(result)).toBe(true);
+    if (isValidationError(result)) {
+      expect(result.error).toContain('adminVerifier');
+    }
+  });
+
+  test('rejects malformed roomVerifier (wrong length)', () => {
+    expect(isValidationError(validateCreateRoomRequest({ ...validBody, roomVerifier: 'too-short' }))).toBe(true);
+    expect(isValidationError(validateCreateRoomRequest({ ...validBody, roomVerifier: 'a'.repeat(44) }))).toBe(true);
+  });
+
+  test('rejects malformed adminVerifier (wrong length)', () => {
+    expect(isValidationError(validateCreateRoomRequest({ ...validBody, adminVerifier: 'too-short' }))).toBe(true);
+  });
+
+  test('rejects verifier with invalid characters (exactly 43 chars, bad final char)', () => {
+    // 26 + 16 + 1 = 43 chars, only the / is invalid
+    expect(isValidationError(validateCreateRoomRequest({ ...validBody, roomVerifier: 'ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnop/' }))).toBe(true);
+  });
+
+  test('rejects missing initialSnapshotCiphertext', () => {
+    const { initialSnapshotCiphertext: _, ...body } = validBody;
+    const result = validateCreateRoomRequest(body);
+    expect(isValidationError(result)).toBe(true);
+    if (isValidationError(result)) {
+      expect(result.error).toContain('initialSnapshotCiphertext');
+    }
+  });
+
+  test('rejects oversized initialSnapshotCiphertext', () => {
+    const result = validateCreateRoomRequest({
+      ...validBody,
+      initialSnapshotCiphertext: 'x'.repeat(1_500_001),
+    });
+    expect(isValidationError(result)).toBe(true);
+    if (isValidationError(result)) {
+      expect(result.status).toBe(413);
+    }
+  });
+
+  test('rejects roomId with invalid characters (exactly 22 chars, bad final char)', () => {
+    expect(isValidationError(validateCreateRoomRequest({ ...validBody, roomId: 'ABCDEFGHIJKLMNOPQRSTU/' }))).toBe(true);
+    expect(isValidationError(validateCreateRoomRequest({ ...validBody, roomId: 'ABCDEFGHIJKLMNOPQRSTU?' }))).toBe(true);
+    expect(isValidationError(validateCreateRoomRequest({ ...validBody, roomId: 'ABCDEFGHIJKLMNOPQRSTU ' }))).toBe(true);
+  });
+
+  test('rejects roomId that is not exactly 22 chars', () => {
+    expect(isValidationError(validateCreateRoomRequest({ ...validBody, roomId: 'ABCDEFGHIJKLMNOPQRSTUvW' }))).toBe(true); // 23 chars
+    expect(isValidationError(validateCreateRoomRequest({ ...validBody, roomId: 'ABCDEFGHIJKLMNOPQRSTu' }))).toBe(true); // 21 chars
+    expect(isValidationError(validateCreateRoomRequest({ ...validBody, roomId: 'short' }))).toBe(true);
+  });
+
+  test('accepts exactly 22 base64url chars', () => {
+    expect(isValidationError(validateCreateRoomRequest({ ...validBody, roomId: 'ABCDEFGHIJKLMNOPQRSTUv' }))).toBe(false);
+    expect(isValidationError(validateCreateRoomRequest({ ...validBody, roomId: 'abcdefghijklmnopqrstuv' }))).toBe(false);
+    expect(isValidationError(validateCreateRoomRequest({ ...validBody, roomId: '0123456789_-ABCDEFGHIJ' }))).toBe(false);
+  });
+});
+
+describe('clampExpiryDays', () => {
+  test('defaults to 30', () => {
+    expect(clampExpiryDays(undefined)).toBe(30);
+  });
+
+  test('0 means never (null)', () => {
+    expect(clampExpiryDays(0)).toBe(null);
+  });
+
+  test('clamps negative to 1', () => {
+    expect(clampExpiryDays(-5)).toBe(1);
+  });
+
+  test('clamps 100 to 30', () => {
+    expect(clampExpiryDays(100)).toBe(30);
+  });
+
+  test('passes through valid value', () => {
+    expect(clampExpiryDays(7)).toBe(7);
+  });
+
+  test('floors fractional days', () => {
+    expect(clampExpiryDays(7.9)).toBe(7);
+  });
+});
+
+describe('hasRoomExpired', () => {
+  test('returns false before expiry', () => {
+    expect(hasRoomExpired(2_000, 1_999)).toBe(false);
+  });
+
+  test('returns false at exact expiry timestamp', () => {
+    expect(hasRoomExpired(2_000, 2_000)).toBe(false);
+  });
+
+  test('returns true after expiry', () => {
+    expect(hasRoomExpired(2_000, 2_001)).toBe(true);
+  });
+
+  test('returns false when expiresAt is null (never)', () => {
+    expect(hasRoomExpired(null)).toBe(false);
+  });
+});
+
+describe('isRoomId', () => {
+  test('accepts valid 22-char base64url ids', () => {
+    expect(isRoomId('ABCDEFGHIJKLMNOPQRSTUv')).toBe(true);
+    expect(isRoomId('abcdef_ghij-klmnopqrst')).toBe(true);
+  });
+  test('rejects wrong-length ids', () => {
+    expect(isRoomId('short')).toBe(false);
+    expect(isRoomId('A'.repeat(21))).toBe(false);
+    expect(isRoomId('A'.repeat(23))).toBe(false);
+  });
+  test('rejects ids containing disallowed characters', () => {
+    expect(isRoomId('A'.repeat(21) + '!')).toBe(false);
+    expect(isRoomId('A'.repeat(21) + '/')).toBe(false);
+    expect(isRoomId('A'.repeat(21) + '=')).toBe(false);
+  });
+  test('rejects non-string inputs', () => {
+    expect(isRoomId(undefined)).toBe(false);
+    expect(isRoomId(42 as unknown as string)).toBe(false);
+    expect(isRoomId(null)).toBe(false);
+  });
+});
+
+describe('validateAdminCommandEnvelope — strips extra fields (P2)', () => {
+  const validBase = {
+    type: 'admin.command',
+    challengeId: 'cid',
+    clientId: 'client',
+    adminProof: 'proof',
+  };
+  test('room.delete strips extras from command', () => {
+    const r = validateAdminCommandEnvelope({
+      ...validBase,
+      command: { type: 'room.delete', piggyback: 'value', extra: 'smuggled' },
+    });
+    expect(isValidationError(r)).toBe(false);
+    if (!isValidationError(r)) {
+      expect(r.command).toEqual({ type: 'room.delete' });
+      expect(Object.keys(r.command)).toEqual(['type']);
+    }
+  });
+  test('rejects unknown command type', () => {
+    const r = validateAdminCommandEnvelope({
+      ...validBase,
+      command: { type: 'room.explode' },
+    });
+    expect(isValidationError(r)).toBe(true);
+  });
+
+  test('rejects overlong adminProof', () => {
+    const r = validateAdminCommandEnvelope({
+      ...validBase,
+      adminProof: 'x'.repeat(129),
+      command: { type: 'room.delete' },
+    });
+    expect(isValidationError(r)).toBe(true);
+    if (isValidationError(r)) expect(r.error).toMatch(/adminProof/);
+  });
+
+  test('rejects overlong challengeId', () => {
+    const r = validateAdminCommandEnvelope({
+      ...validBase,
+      challengeId: 'x'.repeat(65),
+      command: { type: 'room.delete' },
+    });
+    expect(isValidationError(r)).toBe(true);
+    if (isValidationError(r)) expect(r.error).toMatch(/challengeId/);
+  });
+
+  test('rejects overlong clientId', () => {
+    const r = validateAdminCommandEnvelope({
+      ...validBase,
+      clientId: 'x'.repeat(65),
+      command: { type: 'room.delete' },
+    });
+    expect(isValidationError(r)).toBe(true);
+    if (isValidationError(r)) expect(r.error).toMatch(/clientId/);
+  });
+});
+
+describe('validateServerEnvelope — length caps (P3)', () => {
+  const validBase = {
+    clientId: 'c123',
+    opId: 'o123',
+    channel: 'event' as const,
+    ciphertext: 'abc',
+  };
+  test('accepts valid envelope', () => {
+    const r = validateServerEnvelope({ ...validBase });
+    expect(isValidationError(r)).toBe(false);
+  });
+  test('rejects opId over 64 chars (replay amplification surface)', () => {
+    const r = validateServerEnvelope({ ...validBase, opId: 'x'.repeat(65) });
+    expect(isValidationError(r)).toBe(true);
+    if (isValidationError(r)) expect(r.error).toMatch(/opId/);
+  });
+  test('rejects clientId over 64 chars', () => {
+    const r = validateServerEnvelope({ ...validBase, clientId: 'x'.repeat(65) });
+    expect(isValidationError(r)).toBe(true);
+    if (isValidationError(r)) expect(r.error).toMatch(/clientId/);
+  });
+});
diff --git a/apps/room-service/core/validation.ts b/apps/room-service/core/validation.ts
new file mode 100644
index 000000000..77415cd65
--- /dev/null
+++ b/apps/room-service/core/validation.ts
@@ -0,0 +1,234 @@
+/**
+ * Request body validation — pure functions, no Cloudflare APIs.
+ * Fully testable with bun:test.
+ */
+
+import type { CreateRoomRequest, ServerEnvelope, AdminCommandEnvelope } from '@plannotator/shared/collab';
+
+export interface ValidationError {
+  error: string;
+  status: number;
+}
+
+const MIN_EXPIRY_DAYS = 1;
+const MAX_EXPIRY_DAYS = 30;
+const DEFAULT_EXPIRY_DAYS = 30;
+const MAX_SNAPSHOT_CIPHERTEXT_LENGTH = 1_500_000; // ~1.5 MB
+const MAX_EVENT_CIPHERTEXT_LENGTH = 512_000; // ~512 KB per event
+const MAX_PRESENCE_CIPHERTEXT_LENGTH = 8_192; // ~8 KB per presence update
+
+/** Clamp expiry days to [1, 30], default 30. 0 means never. */
+export function clampExpiryDays(days: number | undefined): number | null {
+  if (days === undefined || days === null) return DEFAULT_EXPIRY_DAYS;
+  if (days === 0) return null;
+  return Math.max(MIN_EXPIRY_DAYS, Math.min(MAX_EXPIRY_DAYS, Math.floor(days)));
+}
+
+/** True when a room is beyond its fixed retention deadline. Never-expiring rooms return false. */
+export function hasRoomExpired(expiresAt: number | null, now: number = Date.now()): boolean {
+  if (expiresAt === null) return false;
+  return now > expiresAt;
+}
+
+function isNonEmptyString(value: unknown): value is string {
+  return typeof value === 'string' && value.length > 0;
+}
+
+/**
+ * Room IDs are generated from 16 random bytes and base64url-encoded without padding.
+ * That yields 22 URL-safe characters and 128 bits of entropy.
+ */
+const ROOM_ID_RE = /^[A-Za-z0-9_-]{22}$/;
+
+/** Runtime check for the roomId shape. Exported for use in WebSocket upgrade
+ *  paths where invalid IDs must be rejected BEFORE idFromName/DO instantiation
+ *  to avoid arbitrary DO names and storage reads on attacker-controlled input. */
+export function isRoomId(s: unknown): s is string {
+  return typeof s === 'string' && ROOM_ID_RE.test(s);
+}
+
+/**
+ * HMAC-SHA-256 output is 32 bytes, which base64url-encodes to 43 chars without padding.
+ * Verifiers must match this exact shape.
+ */
+const VERIFIER_RE = /^[A-Za-z0-9_-]{43}$/;
+
+/** Validate a POST /api/rooms request body. */
+export function validateCreateRoomRequest(
+  body: unknown,
+): CreateRoomRequest | ValidationError {
+  if (!body || typeof body !== 'object') {
+    return { error: 'Request body must be a JSON object', status: 400 };
+  }
+
+  const obj = body as Record<string, unknown>;
+
+  if (!isNonEmptyString(obj.roomId)) {
+    return { error: 'Missing or empty "roomId"', status: 400 };
+  }
+
+  if (!ROOM_ID_RE.test(obj.roomId)) {
+    return { error: '"roomId" must be exactly 22 base64url characters', status: 400 };
+  }
+
+  if (!isNonEmptyString(obj.roomVerifier) || !VERIFIER_RE.test(obj.roomVerifier)) {
+    return { error: '"roomVerifier" must be a 43-char base64url HMAC-SHA-256 verifier', status: 400 };
+  }
+
+  if (!isNonEmptyString(obj.adminVerifier) || !VERIFIER_RE.test(obj.adminVerifier)) {
+    return { error: '"adminVerifier" must be a 43-char base64url HMAC-SHA-256 verifier', status: 400 };
+  }
+
+  if (!isNonEmptyString(obj.initialSnapshotCiphertext)) {
+    return { error: 'Missing or empty "initialSnapshotCiphertext"', status: 400 };
+  }
+
+  if (obj.initialSnapshotCiphertext.length > MAX_SNAPSHOT_CIPHERTEXT_LENGTH) {
+    return { error: `"initialSnapshotCiphertext" exceeds max size (${Math.round(MAX_SNAPSHOT_CIPHERTEXT_LENGTH / 1024)} KB)`, status: 413 };
+  }
+
+  return {
+    roomId: obj.roomId,
+    roomVerifier: obj.roomVerifier,
+    adminVerifier: obj.adminVerifier,
+    initialSnapshotCiphertext: obj.initialSnapshotCiphertext,
+    expiresInDays: typeof obj.expiresInDays === 'number' ? obj.expiresInDays : undefined,
+  };
+}
+
+/** Type guard: is the result a ValidationError? Works with any validated union. */
+export function isValidationError<T>(result: T | ValidationError): result is ValidationError {
+  return typeof result === 'object' && result !== null && 'error' in result;
+}
+
+// ---------------------------------------------------------------------------
+// Post-Auth Message Validation
+// ---------------------------------------------------------------------------
+
+const VALID_CHANNELS = new Set(['event', 'presence']);
+const VALID_ADMIN_COMMANDS = new Set(['room.delete']);
+
+/**
+ * Max opId length on inbound event-channel envelopes. opId is stored DURABLY
+ * inside sequenced envelopes, so an authenticated participant could otherwise
+ * bloat replay bandwidth/storage by sending oversized opIds. generateOpId()
+ * produces 22-char base64url values (128 bits); 64 gives comfortable headroom
+ * without enabling amplification.
+ */
+const MAX_OP_ID_LENGTH = 64;
+/**
+ * Max clientId length. Server overrides envelope.clientId with the
+ * authenticated meta.clientId before persistence, but we still cap inbound
+ * values to keep validation symmetric and avoid storing oversized strings
+ * if the override is ever removed.
+ */
+const MAX_CLIENT_ID_LENGTH = 64;
+
+/**
+ * Max adminProof length. HMAC-SHA-256 base64url-encodes to 43 chars; the
+ * generous cap guards against pathological input without rejecting any
+ * legitimate client. Prevents an authenticated peer from spamming
+ * oversized proof strings to blow up verification cost / log volume.
+ */
+const MAX_ADMIN_PROOF_LENGTH = 128;
+
+/** Max challengeId length. generateChallengeId() produces 16-byte base64url
+ *  (22 chars); the cap leaves generous headroom without legitimizing abuse. */
+const MAX_CHALLENGE_ID_LENGTH = 64;
+
+/** Validate a ServerEnvelope from an authenticated WebSocket message. */
+export function validateServerEnvelope(
+  msg: Record<string, unknown>,
+): ServerEnvelope | ValidationError {
+  if (!isNonEmptyString(msg.clientId)) {
+    return { error: 'Missing or empty "clientId"', status: 400 };
+  }
+  if (msg.clientId.length > MAX_CLIENT_ID_LENGTH) {
+    return { error: `"clientId" exceeds max length ${MAX_CLIENT_ID_LENGTH}`, status: 400 };
+  }
+  if (!isNonEmptyString(msg.opId)) {
+    return { error: 'Missing or empty "opId"', status: 400 };
+  }
+  if (msg.opId.length > MAX_OP_ID_LENGTH) {
+    return { error: `"opId" exceeds max length ${MAX_OP_ID_LENGTH}`, status: 400 };
+  }
+  if (!isNonEmptyString(msg.channel) || !VALID_CHANNELS.has(msg.channel)) {
+    return { error: '"channel" must be "event" or "presence"', status: 400 };
+  }
+  if (!isNonEmptyString(msg.ciphertext)) {
+    return { error: 'Missing or empty "ciphertext"', status: 400 };
+  }
+
+  const maxSize = msg.channel === 'presence'
+    ? MAX_PRESENCE_CIPHERTEXT_LENGTH
+    : MAX_EVENT_CIPHERTEXT_LENGTH;
+  if (msg.ciphertext.length > maxSize) {
+    return { error: `Ciphertext exceeds max size for ${msg.channel} (${Math.round(maxSize / 1024)} KB)`, status: 413 };
+  }
+
+  return {
+    clientId: msg.clientId,
+    opId: msg.opId,
+    channel: msg.channel as 'event' | 'presence',
+    ciphertext: msg.ciphertext,
+  };
+}
+
+/** Validate an AdminCommandEnvelope from an authenticated WebSocket message. */
+export function validateAdminCommandEnvelope(
+  msg: Record<string, unknown>,
+): AdminCommandEnvelope | ValidationError {
+  if (!isNonEmptyString(msg.challengeId)) {
+    return { error: 'Missing or empty "challengeId"', status: 400 };
+  }
+  // Cap string inputs that flow into proof verification and command dispatch.
+  // Prevents an authenticated peer from spamming oversized identifiers that
+  // would otherwise hit canonicalJson / log volume on every admin attempt.
+  if (msg.challengeId.length > MAX_CHALLENGE_ID_LENGTH) {
+    return { error: `"challengeId" exceeds max length ${MAX_CHALLENGE_ID_LENGTH}`, status: 400 };
+  }
+  if (!isNonEmptyString(msg.clientId)) {
+    return { error: 'Missing or empty "clientId"', status: 400 };
+  }
+  if (msg.clientId.length > MAX_CLIENT_ID_LENGTH) {
+    return { error: `"clientId" exceeds max length ${MAX_CLIENT_ID_LENGTH}`, status: 400 };
+  }
+  if (!isNonEmptyString(msg.adminProof)) {
+    return { error: 'Missing or empty "adminProof"', status: 400 };
+  }
+  if (msg.adminProof.length > MAX_ADMIN_PROOF_LENGTH) {
+    return { error: `"adminProof" exceeds max length ${MAX_ADMIN_PROOF_LENGTH}`, status: 400 };
+  }
+
+  if (!msg.command || typeof msg.command !== 'object') {
+    return { error: 'Missing or invalid "command"', status: 400 };
+  }
+
+  const cmd = msg.command as Record<string, unknown>;
+  if (!isNonEmptyString(cmd.type) || !VALID_ADMIN_COMMANDS.has(cmd.type)) {
+    return { error: `Unknown command type: ${String(cmd.type)}`, status: 400 };
+  }
+
+  // Build a SANITIZED command with exactly the expected fields. Extra fields
+  // on the inbound payload are dropped. This is defense-in-depth:
+  // - The admin proof is computed over canonicalJson(command), so if a client
+  //   smuggles extra fields into the payload, their proof is bound to
+  //   `canonicalJson(dirty)` while the server's re-verification will be
+  //   computed over `canonicalJson(sanitized)` — proof verification fails.
+  //   Honest clients serialize clean commands and their proofs verify.
+  // - Downstream code (logging, storage, proof recomputation) only ever sees
+  //   the narrow shape its type says it does.
+  // The type gate above (VALID_ADMIN_COMMANDS.has(cmd.type)) already
+  // restricts cmd.type to the single valid value. If a future admin
+  // command is added, expand the Set AND split the sanitization below
+  // into per-type branches at the same time.
+  const sanitizedCommand: AdminCommandEnvelope['command'] = { type: 'room.delete' };
+
+  return {
+    type: 'admin.command',
+    challengeId: msg.challengeId,
+    clientId: msg.clientId,
+    command: sanitizedCommand,
+    adminProof: msg.adminProof,
+  };
+}
diff --git a/apps/room-service/entry.tsx b/apps/room-service/entry.tsx
new file mode 100644
index 000000000..55bc185bc
--- /dev/null
+++ b/apps/room-service/entry.tsx
@@ -0,0 +1,64 @@
+/**
+ * Browser entry for room.plannotator.ai.
+ *
+ * Two surfaces share this bundle:
+ *   - `/`           → LandingPage (upload a document, create a room)
+ *   - `/c/:roomId`  → AppRoot (room editor via useRoomMode)
+ *
+ * Both branches are lazy-loaded so neither pays for the other's code.
+ * Landing visitors (~10 KB) never download the editor bundle (~4 MB),
+ * and room visitors never download the landing page chunk.
+ *
+ * TanStack Router is intentionally deferred until room-service has 3-4+
+ * real routes with data/loading needs.
+ */
+
+import React, { lazy, Suspense } from 'react';
+import { createRoot } from 'react-dom/client';
+import { ThemeProvider } from '@plannotator/ui/components/ThemeProvider';
+// @ts-expect-error — Vite resolves CSS side-effect imports at build time;
+// there is no .d.ts for the index.css file and adding one would not match
+// the existing apps/hook pattern. TypeScript doesn't need to analyze it.
+import '@plannotator/editor/styles';
+
+const LandingPage = lazy(() =>
+  import('@plannotator/ui/components/collab/LandingPage').then(m => ({ default: m.LandingPage })),
+);
+
+const AppRoot = lazy(() =>
+  import('@plannotator/editor').then(m => ({ default: m.default })),
+);
+
+function RoomServiceEntry(): React.ReactElement {
+  const pathname = window.location.pathname;
+
+  if (pathname === '/') {
+    return (
+      <ThemeProvider defaultTheme="dark">
+        <Suspense fallback={
+          <div className="min-h-screen bg-background flex items-center justify-center">
+            <p className="text-sm text-muted-foreground">Loading...</p>
+          </div>
+        }>
+          <LandingPage />
+        </Suspense>
+      </ThemeProvider>
+    );
+  }
+
+  return (
+    <Suspense fallback={null}>
+      <AppRoot />
+    </Suspense>
+  );
+}
+
+const root = document.getElementById('root');
+if (!root) {
+  throw new Error('Plannotator entry: #root element missing from index.html');
+}
+createRoot(root).render(
+  <React.StrictMode>
+    <RoomServiceEntry />
+  </React.StrictMode>,
+);
diff --git a/apps/room-service/index.html b/apps/room-service/index.html
new file mode 100644
index 000000000..759a068d0
--- /dev/null
+++ b/apps/room-service/index.html
@@ -0,0 +1,24 @@
+<!DOCTYPE html>
+<html lang="en">
+  <head>
+    <meta charset="UTF-8" />
+    <meta name="viewport" content="width=device-width, initial-scale=1.0" />
+    <title>Plannotator</title>
+    <link rel="icon" type="image/svg+xml" href="/favicon.svg" />
+    <!--
+      No `preconnect` hints for the font origins. `preconnect` is governed
+      by `connect-src`, and the room-shell CSP intentionally does not list
+      Google font origins (widening it for a perf hint would enlarge the
+      post-XSS exfiltration surface). The stylesheet + font files still
+      load — they're covered by `style-src` and `font-src`.
+    -->
+    <link
+      href="https://fonts.googleapis.com/css2?family=Inter:wght@300;400;500;600;700&family=JetBrains+Mono:wght@400;500;600&display=swap"
+      rel="stylesheet"
+    />
+  </head>
+  <body>
+    <div id="root"></div>
+    <script type="module" src="/entry.tsx"></script>
+  </body>
+</html>
diff --git a/apps/room-service/package.json b/apps/room-service/package.json
new file mode 100644
index 000000000..e2785e820
--- /dev/null
+++ b/apps/room-service/package.json
@@ -0,0 +1,29 @@
+{
+  "name": "@plannotator/room-service",
+  "version": "0.1.0",
+  "private": true,
+  "scripts": {
+    "build:shell": "rm -rf public && vite build",
+    "dev": "bun run build:shell && wrangler dev",
+    "deploy": "bun run build:shell && wrangler deploy",
+    "test": "bun test"
+  },
+  "dependencies": {
+    "@plannotator/editor": "workspace:*",
+    "@plannotator/shared": "workspace:*",
+    "@plannotator/ui": "workspace:*",
+    "react": "^19.2.3",
+    "react-dom": "^19.2.3"
+  },
+  "devDependencies": {
+    "@cloudflare/workers-types": "^4.20241218.0",
+    "@tailwindcss/vite": "^4.1.18",
+    "@types/react": "^19.2.0",
+    "@types/react-dom": "^19.2.0",
+    "@vitejs/plugin-react": "^5.0.0",
+    "tailwindcss": "^4.1.18",
+    "typescript": "~5.8.2",
+    "vite": "^6.2.0",
+    "wrangler": "^4.80.0"
+  }
+}
diff --git a/apps/room-service/scripts/smoke.ts b/apps/room-service/scripts/smoke.ts
new file mode 100644
index 000000000..e1569a3b3
--- /dev/null
+++ b/apps/room-service/scripts/smoke.ts
@@ -0,0 +1,330 @@
+/**
+ * Smoke test for room-service against a running wrangler dev instance.
+ *
+ * Usage:
+ *   cd apps/room-service && wrangler dev    # in one terminal
+ *   bun run scripts/smoke.ts                # in another terminal
+ *
+ * This acts as an external client: it imports from @plannotator/shared/collab/client
+ * to simulate browser/agent auth flows. Server runtime code must NOT do this.
+ *
+ * Exits 0 on success, non-zero on failure.
+ */
+
+import {
+  deriveRoomKeys,
+  deriveAdminKey,
+  computeRoomVerifier,
+  computeAdminVerifier,
+  computeAuthProof,
+  computeAdminProof,
+  encryptSnapshot,
+  encryptPayload,
+  encryptPresence,
+  generateRoomId,
+  generateRoomSecret,
+  generateAdminSecret,
+  generateOpId,
+} from '@plannotator/shared/collab/client';
+
+import type {
+  CreateRoomRequest,
+  CreateRoomResponse,
+  AdminChallenge,
+  AdminCommand,
+  RoomSnapshot,
+  RoomTransportMessage,
+} from '@plannotator/shared/collab';
+
+const BASE_URL = process.env.SMOKE_BASE_URL || 'http://localhost:8787';
+const WS_BASE = BASE_URL.replace(/^http/, 'ws');
+
+let passed = 0;
+let failed = 0;
+
+function assert(condition: boolean, label: string): void {
+  if (condition) {
+    passed++;
+    console.log(`  PASS: ${label}`);
+  } else {
+    failed++;
+    console.error(`  FAIL: ${label}`);
+  }
+}
+
+// ---------------------------------------------------------------------------
+// Helpers
+// ---------------------------------------------------------------------------
+
+/** Messages received on the socket — includes transport messages and admin challenges. */
+type SmokeMessage = RoomTransportMessage | AdminChallenge;
+
+interface AuthedSocket {
+  ws: WebSocket;
+  clientId: string;
+  messages: SmokeMessage[];
+  closed: boolean;
+}
+
+/** Connect, authenticate, and return a ready socket that collects messages. */
+async function connectAndAuth(
+  roomId: string,
+  roomVerifier: string,
+  lastSeq?: number,
+): Promise<AuthedSocket> {
+  return new Promise((resolve, reject) => {
+    const ws = new WebSocket(`${WS_BASE}/ws/${roomId}`);
+    // clientId is now assigned by the server in the auth.challenge message;
+    // we adopt it here instead of self-generating (see PresenceImpersonation
+    // fix). Placeholder until challenge arrives.
+    let clientId = '';
+    const result: AuthedSocket = { ws, clientId: '', messages: [], closed: false };
+    let authed = false;
+
+    const timeout = setTimeout(() => {
+      if (!authed) { ws.close(); reject(new Error('Auth timeout')); }
+    }, 10_000);
+
+    ws.onmessage = async (event) => {
+      const msg = JSON.parse(String(event.data));
+
+      if (!authed && msg.type === 'auth.challenge') {
+        clientId = msg.clientId;
+        result.clientId = clientId;
+        const proof = await computeAuthProof(roomVerifier, roomId, clientId, msg.challengeId, msg.nonce);
+        ws.send(JSON.stringify({ type: 'auth.response', challengeId: msg.challengeId, clientId, proof, lastSeq }));
+        return;
+      }
+
+      if (!authed && msg.type === 'auth.accepted') {
+        authed = true;
+        clearTimeout(timeout);
+        // Collect subsequent messages
+        ws.onmessage = (e) => {
+          result.messages.push(JSON.parse(String(e.data)));
+        };
+        resolve(result);
+        return;
+      }
+    };
+
+    ws.onclose = () => { result.closed = true; };
+    ws.onerror = () => { if (!authed) reject(new Error('WebSocket error')); };
+  });
+}
+
+/** Wait briefly for messages to arrive. */
+function wait(ms: number): Promise<void> {
+  return new Promise(r => setTimeout(r, ms));
+}
+
+// ---------------------------------------------------------------------------
+// Main
+// ---------------------------------------------------------------------------
+
+async function run(): Promise<void> {
+  console.log(`\nSmoke testing room-service at ${BASE_URL}\n`);
+
+  // -----------------------------------------------------------------------
+  // 1. Health check
+  // -----------------------------------------------------------------------
+  console.log('1. Health check');
+  const healthRes = await fetch(`${BASE_URL}/health`);
+  assert(healthRes.ok, 'GET /health returns 200');
+
+  // -----------------------------------------------------------------------
+  // 2. Create a room
+  // -----------------------------------------------------------------------
+  console.log('\n2. Room creation');
+  const roomId = generateRoomId();
+  const roomSecret = generateRoomSecret();
+  const adminSecret = generateAdminSecret();
+
+  const { authKey, eventKey, presenceKey } = await deriveRoomKeys(roomSecret);
+  const adminKey = await deriveAdminKey(adminSecret);
+
+  const roomVerifier = await computeRoomVerifier(authKey, roomId);
+  const adminVerifier = await computeAdminVerifier(adminKey, roomId);
+
+  const snapshot: RoomSnapshot = { versionId: 'v1', planMarkdown: '# Smoke Test', annotations: [] };
+  const snapshotCiphertext = await encryptSnapshot(eventKey, snapshot);
+
+  const createBody: CreateRoomRequest = {
+    roomId,
+    roomVerifier,
+    adminVerifier,
+    initialSnapshotCiphertext: snapshotCiphertext,
+  };
+
+  const createRes = await fetch(`${BASE_URL}/api/rooms`, {
+    method: 'POST',
+    headers: { 'Content-Type': 'application/json' },
+    body: JSON.stringify(createBody),
+  });
+  assert(createRes.status === 201, 'POST /api/rooms returns 201');
+
+  const createResponseBody = await createRes.json() as CreateRoomResponse;
+  assert(!createResponseBody.joinUrl.includes('#'), 'joinUrl has no fragment');
+
+  // -----------------------------------------------------------------------
+  // 3. Duplicate room creation → 409
+  // -----------------------------------------------------------------------
+  console.log('\n3. Duplicate room creation');
+  const dupRes = await fetch(`${BASE_URL}/api/rooms`, {
+    method: 'POST',
+    headers: { 'Content-Type': 'application/json' },
+    body: JSON.stringify(createBody),
+  });
+  assert(dupRes.status === 409, 'Duplicate returns 409');
+
+  // -----------------------------------------------------------------------
+  // 4. Fresh join receives snapshot
+  // -----------------------------------------------------------------------
+  console.log('\n4. Fresh join receives snapshot');
+  const client1 = await connectAndAuth(roomId, roomVerifier);
+  await wait(200);
+  const snapshots1 = client1.messages.filter(m => m.type === 'room.snapshot');
+  assert(snapshots1.length === 1, 'Client1 received room.snapshot on join');
+
+  // -----------------------------------------------------------------------
+  // 5. Two clients — event echo + broadcast
+  // -----------------------------------------------------------------------
+  console.log('\n5. Event sequencing + echo');
+  const client2 = await connectAndAuth(roomId, roomVerifier);
+  await wait(200);
+  // Clear join messages
+  client1.messages.length = 0;
+  client2.messages.length = 0;
+
+  // Client1 sends an event. Use a real annotation — empty annotation.add is
+  // rejected by conforming clients (no-op would burn a durable seq).
+  const realAnnotation = {
+    id: 'smoke-ann-1',
+    blockId: 'block-1',
+    startOffset: 0,
+    endOffset: 5,
+    type: 'COMMENT' as const,
+    originalText: 'hello',
+    createdA: Date.now(),
+    text: 'smoke test annotation',
+  };
+  const eventCiphertext = await encryptPayload(eventKey, JSON.stringify({ type: 'annotation.add', annotations: [realAnnotation] }));
+  client1.ws.send(JSON.stringify({
+    clientId: client1.clientId,
+    opId: generateOpId(),
+    channel: 'event',
+    ciphertext: eventCiphertext,
+  }));
+  await wait(500);
+
+  const client1Events = client1.messages.filter(m => m.type === 'room.event');
+  const client2Events = client2.messages.filter(m => m.type === 'room.event');
+  assert(client1Events.length === 1, 'Sender receives echo (room.event)');
+  assert(client2Events.length === 1, 'Other client receives room.event');
+
+  // -----------------------------------------------------------------------
+  // 6. Presence relay — others only
+  // -----------------------------------------------------------------------
+  console.log('\n6. Presence relay');
+  client1.messages.length = 0;
+  client2.messages.length = 0;
+
+  // Presence MUST be encrypted with presenceKey (not eventKey) and carry a
+  // valid PresenceState shape — conforming clients reject malformed presence.
+  const validPresence = {
+    user: { id: 'smoke-u1', name: 'smoke', color: '#f00' },
+    cursor: null,
+  };
+  const presenceCiphertext = await encryptPresence(presenceKey, validPresence);
+  client1.ws.send(JSON.stringify({
+    clientId: client1.clientId,
+    opId: generateOpId(),
+    channel: 'presence',
+    ciphertext: presenceCiphertext,
+  }));
+  await wait(300);
+
+  const client1Presence = client1.messages.filter(m => m.type === 'room.presence');
+  const client2Presence = client2.messages.filter(m => m.type === 'room.presence');
+  assert(client1Presence.length === 0, 'Sender does NOT receive own presence');
+  assert(client2Presence.length === 1, 'Other client receives room.presence');
+
+  // -----------------------------------------------------------------------
+  // 7. Reconnect replay
+  // -----------------------------------------------------------------------
+  console.log('\n7. Reconnect replay');
+  client2.ws.close();
+  await wait(200);
+
+  // Client1 sends another event while client2 is disconnected
+  client1.ws.send(JSON.stringify({
+    clientId: client1.clientId,
+    opId: generateOpId(),
+    channel: 'event',
+    ciphertext: eventCiphertext,
+  }));
+  await wait(300);
+
+  // Client2 reconnects with lastSeq from the first event (seq 1)
+  const client2b = await connectAndAuth(roomId, roomVerifier, 1);
+  await wait(500);
+
+  const replayedEvents = client2b.messages.filter(m => m.type === 'room.event');
+  assert(replayedEvents.length === 1, 'Reconnect replayed 1 missed event (seq 2)');
+  if (replayedEvents.length > 0 && replayedEvents[0].type === 'room.event') {
+    assert(replayedEvents[0].seq === 2, 'Replayed event has seq 2');
+  }
+
+  // -----------------------------------------------------------------------
+  // 8. Admin delete
+  // -----------------------------------------------------------------------
+  console.log('\n8. Admin delete');
+  client1.messages.length = 0;
+
+  client1.ws.send(JSON.stringify({ type: 'admin.challenge.request' }));
+  await wait(300);
+  const deleteChallenge = client1.messages.find(m => m.type === 'admin.challenge') as AdminChallenge | undefined;
+
+  if (deleteChallenge) {
+    const deleteCmd: AdminCommand = { type: 'room.delete' };
+    const deleteProof = await computeAdminProof(
+      adminVerifier, roomId, client1.clientId,
+      deleteChallenge.challengeId, deleteChallenge.nonce, deleteCmd,
+    );
+    client1.ws.send(JSON.stringify({
+      type: 'admin.command',
+      challengeId: deleteChallenge.challengeId,
+      clientId: client1.clientId,
+      command: deleteCmd,
+      adminProof: deleteProof,
+    }));
+    await wait(500);
+
+    assert(client1.closed, 'Client1 socket closed after delete');
+    assert(client2b.closed, 'Client2 socket closed after delete');
+  }
+
+  // -----------------------------------------------------------------------
+  // 9. Deleted room rejects new joins
+  // -----------------------------------------------------------------------
+  console.log('\n9. Deleted room rejects new joins');
+  try {
+    const client3 = await connectAndAuth(roomId, roomVerifier);
+    client3.ws.close();
+    assert(false, 'Should not authenticate to deleted room');
+  } catch {
+    assert(true, 'Deleted room rejects new WebSocket join');
+  }
+
+  // -----------------------------------------------------------------------
+  // Summary
+  // -----------------------------------------------------------------------
+  console.log(`\n${'='.repeat(40)}`);
+  console.log(`Passed: ${passed}, Failed: ${failed}`);
+  process.exit(failed > 0 ? 1 : 0);
+}
+
+run().catch((err) => {
+  console.error('Smoke test failed:', err);
+  process.exit(1);
+});
diff --git a/apps/room-service/static/Octicons-mark-github.svg b/apps/room-service/static/Octicons-mark-github.svg
new file mode 100644
index 000000000..a8d117404
--- /dev/null
+++ b/apps/room-service/static/Octicons-mark-github.svg
@@ -0,0 +1,3 @@
+<svg width="1024" height="1024" viewBox="0 0 1024 1024" fill="none" xmlns="http://www.w3.org/2000/svg">
+<path fill-rule="evenodd" clip-rule="evenodd" d="M8 0C3.58 0 0 3.58 0 8C0 11.54 2.29 14.53 5.47 15.59C5.87 15.66 6.02 15.42 6.02 15.21C6.02 15.02 6.01 14.39 6.01 13.72C4 14.09 3.48 13.23 3.32 12.78C3.23 12.55 2.84 11.84 2.5 11.65C2.22 11.5 1.82 11.13 2.49 11.12C3.12 11.11 3.57 11.7 3.72 11.94C4.44 13.15 5.59 12.81 6.05 12.6C6.12 12.08 6.33 11.73 6.56 11.53C4.78 11.33 2.92 10.64 2.92 7.58C2.92 6.71 3.23 5.99 3.74 5.43C3.66 5.23 3.38 4.41 3.82 3.31C3.82 3.31 4.49 3.1 6.02 4.13C6.66 3.95 7.34 3.86 8.02 3.86C8.7 3.86 9.38 3.95 10.02 4.13C11.55 3.09 12.22 3.31 12.22 3.31C12.66 4.41 12.38 5.23 12.3 5.43C12.81 5.99 13.12 6.7 13.12 7.58C13.12 10.65 11.25 11.33 9.47 11.53C9.76 11.78 10.01 12.26 10.01 13.01C10.01 14.08 10 14.94 10 15.21C10 15.42 10.15 15.67 10.55 15.59C13.71 14.53 16 11.53 16 8C16 3.58 12.42 0 8 0Z" transform="scale(64)" fill="#1B1F23"/>
+</svg>
diff --git a/apps/room-service/static/banner_lite.webp b/apps/room-service/static/banner_lite.webp
new file mode 100644
index 000000000..507746d8f
Binary files /dev/null and b/apps/room-service/static/banner_lite.webp differ
diff --git a/apps/room-service/static/demo-aiayn.md b/apps/room-service/static/demo-aiayn.md
new file mode 100644
index 000000000..10129fd71
--- /dev/null
+++ b/apps/room-service/static/demo-aiayn.md
@@ -0,0 +1,371 @@
+Title: Attention Is All You Need
+
+URL Source: https://arxiv.org/html/1706.03762v7
+
+Published Time: Fri, 06 Mar 2026 15:00:03 GMT
+
+Markdown Content:
+Provided proper attribution is provided, Google hereby grants permission to reproduce the tables and figures in this paper solely for use in journalistic or scholarly works.
+
+Ashish Vaswani 
+
+Google Brain 
+
+avaswani@google.com 
+
+&Noam Shazeer 1 1 footnotemark: 1
+
+Google Brain 
+
+noam@google.com 
+
+&Niki Parmar 1 1 footnotemark: 1
+
+Google Research 
+
+nikip@google.com 
+
+&Jakob Uszkoreit 1 1 footnotemark: 1
+
+Google Research 
+
+usz@google.com 
+
+&Llion Jones 1 1 footnotemark: 1
+
+Google Research 
+
+llion@google.com 
+
+&Aidan N. Gomez 1 1 footnotemark: 1
+
+University of Toronto 
+
+aidan@cs.toronto.edu&Łukasz Kaiser 1 1 footnotemark: 1
+
+Google Brain 
+
+lukaszkaiser@google.com 
+
+&Illia Polosukhin 1 1 footnotemark: 1
+
+illia.polosukhin@gmail.com 
+
+Equal contribution. Listing order is random. Jakob proposed replacing RNNs with self-attention and started the effort to evaluate this idea. Ashish, with Illia, designed and implemented the first Transformer models and has been crucially involved in every aspect of this work. Noam proposed scaled dot-product attention, multi-head attention and the parameter-free position representation and became the other person involved in nearly every detail. Niki designed, implemented, tuned and evaluated countless model variants in our original codebase and tensor2tensor. Llion also experimented with novel model variants, was responsible for our initial codebase, and efficient inference and visualizations. Lukasz and Aidan spent countless long days designing various parts of and implementing tensor2tensor, replacing our earlier codebase, greatly improving results and massively accelerating our research. Work performed while at Google Brain.Work performed while at Google Research.
+
+###### Abstract
+
+The dominant sequence transduction models are based on complex recurrent or convolutional neural networks that include an encoder and a decoder. The best performing models also connect the encoder and decoder through an attention mechanism. We propose a new simple network architecture, the Transformer, based solely on attention mechanisms, dispensing with recurrence and convolutions entirely. Experiments on two machine translation tasks show these models to be superior in quality while being more parallelizable and requiring significantly less time to train. Our model achieves 28.4 BLEU on the WMT 2014 English-to-German translation task, improving over the existing best results, including ensembles, by over 2 BLEU. On the WMT 2014 English-to-French translation task, our model establishes a new single-model state-of-the-art BLEU score of 41.8 after training for 3.5 days on eight GPUs, a small fraction of the training costs of the best models from the literature. We show that the Transformer generalizes well to other tasks by applying it successfully to English constituency parsing both with large and limited training data.
+
+## 1 Introduction
+
+Recurrent neural networks, long short-term memory [[13](https://arxiv.org/html/1706.03762v7#bib.bib13)] and gated recurrent [[7](https://arxiv.org/html/1706.03762v7#bib.bib7)] neural networks in particular, have been firmly established as state of the art approaches in sequence modeling and transduction problems such as language modeling and machine translation [[35](https://arxiv.org/html/1706.03762v7#bib.bib35), [2](https://arxiv.org/html/1706.03762v7#bib.bib2), [5](https://arxiv.org/html/1706.03762v7#bib.bib5)]. Numerous efforts have since continued to push the boundaries of recurrent language models and encoder-decoder architectures [[38](https://arxiv.org/html/1706.03762v7#bib.bib38), [24](https://arxiv.org/html/1706.03762v7#bib.bib24), [15](https://arxiv.org/html/1706.03762v7#bib.bib15)].
+
+Recurrent models typically factor computation along the symbol positions of the input and output sequences. Aligning the positions to steps in computation time, they generate a sequence of hidden states h_{t}, as a function of the previous hidden state h_{t-1} and the input for position t. This inherently sequential nature precludes parallelization within training examples, which becomes critical at longer sequence lengths, as memory constraints limit batching across examples. Recent work has achieved significant improvements in computational efficiency through factorization tricks [[21](https://arxiv.org/html/1706.03762v7#bib.bib21)] and conditional computation [[32](https://arxiv.org/html/1706.03762v7#bib.bib32)], while also improving model performance in case of the latter. The fundamental constraint of sequential computation, however, remains.
+
+Attention mechanisms have become an integral part of compelling sequence modeling and transduction models in various tasks, allowing modeling of dependencies without regard to their distance in the input or output sequences [[2](https://arxiv.org/html/1706.03762v7#bib.bib2), [19](https://arxiv.org/html/1706.03762v7#bib.bib19)]. In all but a few cases [[27](https://arxiv.org/html/1706.03762v7#bib.bib27)], however, such attention mechanisms are used in conjunction with a recurrent network.
+
+In this work we propose the Transformer, a model architecture eschewing recurrence and instead relying entirely on an attention mechanism to draw global dependencies between input and output. The Transformer allows for significantly more parallelization and can reach a new state of the art in translation quality after being trained for as little as twelve hours on eight P100 GPUs.
+
+## 2 Background
+
+The goal of reducing sequential computation also forms the foundation of the Extended Neural GPU [[16](https://arxiv.org/html/1706.03762v7#bib.bib16)], ByteNet [[18](https://arxiv.org/html/1706.03762v7#bib.bib18)] and ConvS2S [[9](https://arxiv.org/html/1706.03762v7#bib.bib9)], all of which use convolutional neural networks as basic building block, computing hidden representations in parallel for all input and output positions. In these models, the number of operations required to relate signals from two arbitrary input or output positions grows in the distance between positions, linearly for ConvS2S and logarithmically for ByteNet. This makes it more difficult to learn dependencies between distant positions [[12](https://arxiv.org/html/1706.03762v7#bib.bib12)]. In the Transformer this is reduced to a constant number of operations, albeit at the cost of reduced effective resolution due to averaging attention-weighted positions, an effect we counteract with Multi-Head Attention as described in section[3.2](https://arxiv.org/html/1706.03762v7#S3.SS2 "3.2 Attention ‣ 3 Model Architecture ‣ Attention Is All You Need").
+
+Self-attention, sometimes called intra-attention is an attention mechanism relating different positions of a single sequence in order to compute a representation of the sequence. Self-attention has been used successfully in a variety of tasks including reading comprehension, abstractive summarization, textual entailment and learning task-independent sentence representations [[4](https://arxiv.org/html/1706.03762v7#bib.bib4), [27](https://arxiv.org/html/1706.03762v7#bib.bib27), [28](https://arxiv.org/html/1706.03762v7#bib.bib28), [22](https://arxiv.org/html/1706.03762v7#bib.bib22)].
+
+End-to-end memory networks are based on a recurrent attention mechanism instead of sequence-aligned recurrence and have been shown to perform well on simple-language question answering and language modeling tasks [[34](https://arxiv.org/html/1706.03762v7#bib.bib34)].
+
+To the best of our knowledge, however, the Transformer is the first transduction model relying entirely on self-attention to compute representations of its input and output without using sequence-aligned RNNs or convolution. In the following sections, we will describe the Transformer, motivate self-attention and discuss its advantages over models such as [[17](https://arxiv.org/html/1706.03762v7#bib.bib17), [18](https://arxiv.org/html/1706.03762v7#bib.bib18)] and [[9](https://arxiv.org/html/1706.03762v7#bib.bib9)].
+
+## 3 Model Architecture
+
+![Image 1: Refer to caption](https://arxiv.org/html/1706.03762v7/Figures/ModalNet-21.png)
+
+Figure 1: The Transformer - model architecture.
+
+Most competitive neural sequence transduction models have an encoder-decoder structure [[5](https://arxiv.org/html/1706.03762v7#bib.bib5), [2](https://arxiv.org/html/1706.03762v7#bib.bib2), [35](https://arxiv.org/html/1706.03762v7#bib.bib35)]. Here, the encoder maps an input sequence of symbol representations (x_{1},...,x_{n}) to a sequence of continuous representations \mathbf{z}=(z_{1},...,z_{n}). Given \mathbf{z}, the decoder then generates an output sequence (y_{1},...,y_{m}) of symbols one element at a time. At each step the model is auto-regressive [[10](https://arxiv.org/html/1706.03762v7#bib.bib10)], consuming the previously generated symbols as additional input when generating the next.
+
+The Transformer follows this overall architecture using stacked self-attention and point-wise, fully connected layers for both the encoder and decoder, shown in the left and right halves of Figure[1](https://arxiv.org/html/1706.03762v7#S3.F1 "Figure 1 ‣ 3 Model Architecture ‣ Attention Is All You Need"), respectively.
+
+### 3.1 Encoder and Decoder Stacks
+
+##### Encoder:
+
+The encoder is composed of a stack of N=6 identical layers. Each layer has two sub-layers. The first is a multi-head self-attention mechanism, and the second is a simple, position-wise fully connected feed-forward network. We employ a residual connection [[11](https://arxiv.org/html/1706.03762v7#bib.bib11)] around each of the two sub-layers, followed by layer normalization [[1](https://arxiv.org/html/1706.03762v7#bib.bib1)]. That is, the output of each sub-layer is \mathrm{LayerNorm}(x+\mathrm{Sublayer}(x)), where \mathrm{Sublayer}(x) is the function implemented by the sub-layer itself. To facilitate these residual connections, all sub-layers in the model, as well as the embedding layers, produce outputs of dimension d_{\text{model}}=512.
+
+##### Decoder:
+
+The decoder is also composed of a stack of N=6 identical layers. In addition to the two sub-layers in each encoder layer, the decoder inserts a third sub-layer, which performs multi-head attention over the output of the encoder stack. Similar to the encoder, we employ residual connections around each of the sub-layers, followed by layer normalization. We also modify the self-attention sub-layer in the decoder stack to prevent positions from attending to subsequent positions. This masking, combined with fact that the output embeddings are offset by one position, ensures that the predictions for position i can depend only on the known outputs at positions less than i.
+
+### 3.2 Attention
+
+An attention function can be described as mapping a query and a set of key-value pairs to an output, where the query, keys, values, and output are all vectors. The output is computed as a weighted sum of the values, where the weight assigned to each value is computed by a compatibility function of the query with the corresponding key.
+
+#### 3.2.1 Scaled Dot-Product Attention
+
+We call our particular attention "Scaled Dot-Product Attention" (Figure[2](https://arxiv.org/html/1706.03762v7#S3.F2 "Figure 2 ‣ 3.2.2 Multi-Head Attention ‣ 3.2 Attention ‣ 3 Model Architecture ‣ Attention Is All You Need")). The input consists of queries and keys of dimension d_{k}, and values of dimension d_{v}. We compute the dot products of the query with all keys, divide each by \sqrt{d_{k}}, and apply a softmax function to obtain the weights on the values.
+
+In practice, we compute the attention function on a set of queries simultaneously, packed together into a matrix Q. The keys and values are also packed together into matrices K and V. We compute the matrix of outputs as:
+
+\mathrm{Attention}(Q,K,V)=\mathrm{softmax}(\frac{QK^{T}}{\sqrt{d_{k}}})V(1)
+
+The two most commonly used attention functions are additive attention [[2](https://arxiv.org/html/1706.03762v7#bib.bib2)], and dot-product (multiplicative) attention. Dot-product attention is identical to our algorithm, except for the scaling factor of \frac{1}{\sqrt{d_{k}}}. Additive attention computes the compatibility function using a feed-forward network with a single hidden layer. While the two are similar in theoretical complexity, dot-product attention is much faster and more space-efficient in practice, since it can be implemented using highly optimized matrix multiplication code.
+
+While for small values of d_{k} the two mechanisms perform similarly, additive attention outperforms dot product attention without scaling for larger values of d_{k}[[3](https://arxiv.org/html/1706.03762v7#bib.bib3)]. We suspect that for large values of d_{k}, the dot products grow large in magnitude, pushing the softmax function into regions where it has extremely small gradients 1 1 1 To illustrate why the dot products get large, assume that the components of q and k are independent random variables with mean 0 and variance 1. Then their dot product, q\cdot k=\sum_{i=1}^{d_{k}}q_{i}k_{i}, has mean 0 and variance d_{k}.. To counteract this effect, we scale the dot products by \frac{1}{\sqrt{d_{k}}}.
+
+#### 3.2.2 Multi-Head Attention
+
+Scaled Dot-Product Attention
+
+![Image 2: Refer to caption](https://arxiv.org/html/1706.03762v7/Figures/ModalNet-19.png)
+
+Multi-Head Attention
+
+![Image 3: Refer to caption](https://arxiv.org/html/1706.03762v7/Figures/ModalNet-20.png)
+
+Figure 2: (left) Scaled Dot-Product Attention. (right) Multi-Head Attention consists of several attention layers running in parallel.
+
+Instead of performing a single attention function with d_{\text{model}}-dimensional keys, values and queries, we found it beneficial to linearly project the queries, keys and values h times with different, learned linear projections to d_{k}, d_{k} and d_{v} dimensions, respectively. On each of these projected versions of queries, keys and values we then perform the attention function in parallel, yielding d_{v}-dimensional output values. These are concatenated and once again projected, resulting in the final values, as depicted in Figure[2](https://arxiv.org/html/1706.03762v7#S3.F2 "Figure 2 ‣ 3.2.2 Multi-Head Attention ‣ 3.2 Attention ‣ 3 Model Architecture ‣ Attention Is All You Need").
+
+Multi-head attention allows the model to jointly attend to information from different representation subspaces at different positions. With a single attention head, averaging inhibits this.
+
+\displaystyle\mathrm{MultiHead}(Q,K,V)\displaystyle=\mathrm{Concat}(\mathrm{head_{1}},...,\mathrm{head_{h}})W^{O}
+\displaystyle\text{where}~\mathrm{head_{i}}\displaystyle=\mathrm{Attention}(QW^{Q}_{i},KW^{K}_{i},VW^{V}_{i})
+
+Where the projections are parameter matrices W^{Q}_{i}\in\mathbb{R}^{d_{\text{model}}\times d_{k}}, W^{K}_{i}\in\mathbb{R}^{d_{\text{model}}\times d_{k}}, W^{V}_{i}\in\mathbb{R}^{d_{\text{model}}\times d_{v}} and W^{O}\in\mathbb{R}^{hd_{v}\times d_{\text{model}}}.
+
+In this work we employ h=8 parallel attention layers, or heads. For each of these we use d_{k}=d_{v}=d_{\text{model}}/h=64. Due to the reduced dimension of each head, the total computational cost is similar to that of single-head attention with full dimensionality.
+
+#### 3.2.3 Applications of Attention in our Model
+
+The Transformer uses multi-head attention in three different ways:
+
+*   •
+In "encoder-decoder attention" layers, the queries come from the previous decoder layer, and the memory keys and values come from the output of the encoder. This allows every position in the decoder to attend over all positions in the input sequence. This mimics the typical encoder-decoder attention mechanisms in sequence-to-sequence models such as [[38](https://arxiv.org/html/1706.03762v7#bib.bib38), [2](https://arxiv.org/html/1706.03762v7#bib.bib2), [9](https://arxiv.org/html/1706.03762v7#bib.bib9)].
+
+*   •
+The encoder contains self-attention layers. In a self-attention layer all of the keys, values and queries come from the same place, in this case, the output of the previous layer in the encoder. Each position in the encoder can attend to all positions in the previous layer of the encoder.
+
+*   •
+Similarly, self-attention layers in the decoder allow each position in the decoder to attend to all positions in the decoder up to and including that position. We need to prevent leftward information flow in the decoder to preserve the auto-regressive property. We implement this inside of scaled dot-product attention by masking out (setting to -\infty) all values in the input of the softmax which correspond to illegal connections. See Figure[2](https://arxiv.org/html/1706.03762v7#S3.F2 "Figure 2 ‣ 3.2.2 Multi-Head Attention ‣ 3.2 Attention ‣ 3 Model Architecture ‣ Attention Is All You Need").
+
+### 3.3 Position-wise Feed-Forward Networks
+
+In addition to attention sub-layers, each of the layers in our encoder and decoder contains a fully connected feed-forward network, which is applied to each position separately and identically. This consists of two linear transformations with a ReLU activation in between.
+
+\mathrm{FFN}(x)=\max(0,xW_{1}+b_{1})W_{2}+b_{2}(2)
+
+While the linear transformations are the same across different positions, they use different parameters from layer to layer. Another way of describing this is as two convolutions with kernel size 1. The dimensionality of input and output is d_{\text{model}}=512, and the inner-layer has dimensionality d_{ff}=2048.
+
+### 3.4 Embeddings and Softmax
+
+Similarly to other sequence transduction models, we use learned embeddings to convert the input tokens and output tokens to vectors of dimension d_{\text{model}}. We also use the usual learned linear transformation and softmax function to convert the decoder output to predicted next-token probabilities. In our model, we share the same weight matrix between the two embedding layers and the pre-softmax linear transformation, similar to [[30](https://arxiv.org/html/1706.03762v7#bib.bib30)]. In the embedding layers, we multiply those weights by \sqrt{d_{\text{model}}}.
+
+### 3.5 Positional Encoding
+
+Since our model contains no recurrence and no convolution, in order for the model to make use of the order of the sequence, we must inject some information about the relative or absolute position of the tokens in the sequence. To this end, we add "positional encodings" to the input embeddings at the bottoms of the encoder and decoder stacks. The positional encodings have the same dimension d_{\text{model}} as the embeddings, so that the two can be summed. There are many choices of positional encodings, learned and fixed [[9](https://arxiv.org/html/1706.03762v7#bib.bib9)].
+
+In this work, we use sine and cosine functions of different frequencies:
+
+\displaystyle PE_{(pos,2i)}=sin(pos/10000^{2i/d_{\text{model}}})
+\displaystyle PE_{(pos,2i+1)}=cos(pos/10000^{2i/d_{\text{model}}})
+
+where pos is the position and i is the dimension. That is, each dimension of the positional encoding corresponds to a sinusoid. The wavelengths form a geometric progression from 2\pi to 10000\cdot 2\pi. We chose this function because we hypothesized it would allow the model to easily learn to attend by relative positions, since for any fixed offset k, PE_{pos+k} can be represented as a linear function of PE_{pos}.
+
+We also experimented with using learned positional embeddings [[9](https://arxiv.org/html/1706.03762v7#bib.bib9)] instead, and found that the two versions produced nearly identical results (see Table[3](https://arxiv.org/html/1706.03762v7#S6.T3 "Table 3 ‣ 6.2 Model Variations ‣ 6 Results ‣ Attention Is All You Need") row (E)). We chose the sinusoidal version because it may allow the model to extrapolate to sequence lengths longer than the ones encountered during training.
+
+## 4 Why Self-Attention
+
+In this section we compare various aspects of self-attention layers to the recurrent and convolutional layers commonly used for mapping one variable-length sequence of symbol representations (x_{1},...,x_{n}) to another sequence of equal length (z_{1},...,z_{n}), with x_{i},z_{i}\in\mathbb{R}^{d}, such as a hidden layer in a typical sequence transduction encoder or decoder. Motivating our use of self-attention we consider three desiderata.
+
+One is the total computational complexity per layer. Another is the amount of computation that can be parallelized, as measured by the minimum number of sequential operations required.
+
+The third is the path length between long-range dependencies in the network. Learning long-range dependencies is a key challenge in many sequence transduction tasks. One key factor affecting the ability to learn such dependencies is the length of the paths forward and backward signals have to traverse in the network. The shorter these paths between any combination of positions in the input and output sequences, the easier it is to learn long-range dependencies [[12](https://arxiv.org/html/1706.03762v7#bib.bib12)]. Hence we also compare the maximum path length between any two input and output positions in networks composed of the different layer types.
+
+Table 1:  Maximum path lengths, per-layer complexity and minimum number of sequential operations for different layer types. n is the sequence length, d is the representation dimension, k is the kernel size of convolutions and r the size of the neighborhood in restricted self-attention.
+
+As noted in Table [1](https://arxiv.org/html/1706.03762v7#S4.T1 "Table 1 ‣ 4 Why Self-Attention ‣ Attention Is All You Need"), a self-attention layer connects all positions with a constant number of sequentially executed operations, whereas a recurrent layer requires O(n) sequential operations. In terms of computational complexity, self-attention layers are faster than recurrent layers when the sequence length n is smaller than the representation dimensionality d, which is most often the case with sentence representations used by state-of-the-art models in machine translations, such as word-piece [[38](https://arxiv.org/html/1706.03762v7#bib.bib38)] and byte-pair [[31](https://arxiv.org/html/1706.03762v7#bib.bib31)] representations. To improve computational performance for tasks involving very long sequences, self-attention could be restricted to considering only a neighborhood of size r in the input sequence centered around the respective output position. This would increase the maximum path length to O(n/r). We plan to investigate this approach further in future work.
+
+A single convolutional layer with kernel width k<n does not connect all pairs of input and output positions. Doing so requires a stack of O(n/k) convolutional layers in the case of contiguous kernels, or O(log_{k}(n)) in the case of dilated convolutions [[18](https://arxiv.org/html/1706.03762v7#bib.bib18)], increasing the length of the longest paths between any two positions in the network. Convolutional layers are generally more expensive than recurrent layers, by a factor of k. Separable convolutions [[6](https://arxiv.org/html/1706.03762v7#bib.bib6)], however, decrease the complexity considerably, to O(k\cdot n\cdot d+n\cdot d^{2}). Even with k=n, however, the complexity of a separable convolution is equal to the combination of a self-attention layer and a point-wise feed-forward layer, the approach we take in our model.
+
+As side benefit, self-attention could yield more interpretable models. We inspect attention distributions from our models and present and discuss examples in the appendix. Not only do individual attention heads clearly learn to perform different tasks, many appear to exhibit behavior related to the syntactic and semantic structure of the sentences.
+
+## 5 Training
+
+This section describes the training regime for our models.
+
+### 5.1 Training Data and Batching
+
+We trained on the standard WMT 2014 English-German dataset consisting of about 4.5 million sentence pairs. Sentences were encoded using byte-pair encoding [[3](https://arxiv.org/html/1706.03762v7#bib.bib3)], which has a shared source-target vocabulary of about 37000 tokens. For English-French, we used the significantly larger WMT 2014 English-French dataset consisting of 36M sentences and split tokens into a 32000 word-piece vocabulary [[38](https://arxiv.org/html/1706.03762v7#bib.bib38)]. Sentence pairs were batched together by approximate sequence length. Each training batch contained a set of sentence pairs containing approximately 25000 source tokens and 25000 target tokens.
+
+### 5.2 Hardware and Schedule
+
+We trained our models on one machine with 8 NVIDIA P100 GPUs. For our base models using the hyperparameters described throughout the paper, each training step took about 0.4 seconds. We trained the base models for a total of 100,000 steps or 12 hours. For our big models,(described on the bottom line of table [3](https://arxiv.org/html/1706.03762v7#S6.T3 "Table 3 ‣ 6.2 Model Variations ‣ 6 Results ‣ Attention Is All You Need")), step time was 1.0 seconds. The big models were trained for 300,000 steps (3.5 days).
+
+### 5.3 Optimizer
+
+We used the Adam optimizer[[20](https://arxiv.org/html/1706.03762v7#bib.bib20)] with \beta_{1}=0.9, \beta_{2}=0.98 and \epsilon=10^{-9}. We varied the learning rate over the course of training, according to the formula:
+
+lrate=d_{\text{model}}^{-0.5}\cdot\min({step\_num}^{-0.5},{step\_num}\cdot{warmup\_steps}^{-1.5})(3)
+
+This corresponds to increasing the learning rate linearly for the first warmup\_steps training steps, and decreasing it thereafter proportionally to the inverse square root of the step number. We used warmup\_steps=4000.
+
+### 5.4 Regularization
+
+We employ three types of regularization during training:
+
+##### Residual Dropout
+
+We apply dropout [[33](https://arxiv.org/html/1706.03762v7#bib.bib33)] to the output of each sub-layer, before it is added to the sub-layer input and normalized. In addition, we apply dropout to the sums of the embeddings and the positional encodings in both the encoder and decoder stacks. For the base model, we use a rate of P_{drop}=0.1.
+
+##### Label Smoothing
+
+During training, we employed label smoothing of value \epsilon_{ls}=0.1[[36](https://arxiv.org/html/1706.03762v7#bib.bib36)]. This hurts perplexity, as the model learns to be more unsure, but improves accuracy and BLEU score.
+
+## 6 Results
+
+### 6.1 Machine Translation
+
+Table 2: The Transformer achieves better BLEU scores than previous state-of-the-art models on the English-to-German and English-to-French newstest2014 tests at a fraction of the training cost. 
+
+On the WMT 2014 English-to-German translation task, the big transformer model (Transformer (big) in Table[2](https://arxiv.org/html/1706.03762v7#S6.T2 "Table 2 ‣ 6.1 Machine Translation ‣ 6 Results ‣ Attention Is All You Need")) outperforms the best previously reported models (including ensembles) by more than 2.0 BLEU, establishing a new state-of-the-art BLEU score of 28.4. The configuration of this model is listed in the bottom line of Table[3](https://arxiv.org/html/1706.03762v7#S6.T3 "Table 3 ‣ 6.2 Model Variations ‣ 6 Results ‣ Attention Is All You Need"). Training took 3.5 days on 8 P100 GPUs. Even our base model surpasses all previously published models and ensembles, at a fraction of the training cost of any of the competitive models.
+
+On the WMT 2014 English-to-French translation task, our big model achieves a BLEU score of 41.0, outperforming all of the previously published single models, at less than 1/4 the training cost of the previous state-of-the-art model. The Transformer (big) model trained for English-to-French used dropout rate P_{drop}=0.1, instead of 0.3.
+
+For the base models, we used a single model obtained by averaging the last 5 checkpoints, which were written at 10-minute intervals. For the big models, we averaged the last 20 checkpoints. We used beam search with a beam size of 4 and length penalty \alpha=0.6[[38](https://arxiv.org/html/1706.03762v7#bib.bib38)]. These hyperparameters were chosen after experimentation on the development set. We set the maximum output length during inference to input length + 50, but terminate early when possible [[38](https://arxiv.org/html/1706.03762v7#bib.bib38)].
+
+Table [2](https://arxiv.org/html/1706.03762v7#S6.T2 "Table 2 ‣ 6.1 Machine Translation ‣ 6 Results ‣ Attention Is All You Need") summarizes our results and compares our translation quality and training costs to other model architectures from the literature. We estimate the number of floating point operations used to train a model by multiplying the training time, the number of GPUs used, and an estimate of the sustained single-precision floating-point capacity of each GPU 2 2 2 We used values of 2.8, 3.7, 6.0 and 9.5 TFLOPS for K80, K40, M40 and P100, respectively..
+
+### 6.2 Model Variations
+
+Table 3: Variations on the Transformer architecture. Unlisted values are identical to those of the base model. All metrics are on the English-to-German translation development set, newstest2013. Listed perplexities are per-wordpiece, according to our byte-pair encoding, and should not be compared to per-word perplexities.
+
+N d_{\text{model}}d_{\text{ff}}h d_{k}d_{v}P_{drop}\epsilon_{ls}train PPL BLEU params
+steps(dev)(dev)\times 10^{6}
+base 6 512 2048 8 64 64 0.1 0.1 100K 4.92 25.8 65
+(A)1 512 512 5.29 24.9
+4 128 128 5.00 25.5
+16 32 32 4.91 25.8
+32 16 16 5.01 25.4
+(B)16 5.16 25.1 58
+32 5.01 25.4 60
+(C)2 6.11 23.7 36
+4 5.19 25.3 50
+8 4.88 25.5 80
+256 32 32 5.75 24.5 28
+1024 128 128 4.66 26.0 168
+1024 5.12 25.4 53
+4096 4.75 26.2 90
+(D)0.0 5.77 24.6
+0.2 4.95 25.5
+0.0 4.67 25.3
+0.2 5.47 25.7
+(E)positional embedding instead of sinusoids 4.92 25.7
+big 6 1024 4096 16 0.3 300K 4.33 26.4 213
+
+To evaluate the importance of different components of the Transformer, we varied our base model in different ways, measuring the change in performance on English-to-German translation on the development set, newstest2013. We used beam search as described in the previous section, but no checkpoint averaging. We present these results in Table[3](https://arxiv.org/html/1706.03762v7#S6.T3 "Table 3 ‣ 6.2 Model Variations ‣ 6 Results ‣ Attention Is All You Need").
+
+In Table[3](https://arxiv.org/html/1706.03762v7#S6.T3 "Table 3 ‣ 6.2 Model Variations ‣ 6 Results ‣ Attention Is All You Need") rows (A), we vary the number of attention heads and the attention key and value dimensions, keeping the amount of computation constant, as described in Section [3.2.2](https://arxiv.org/html/1706.03762v7#S3.SS2.SSS2 "3.2.2 Multi-Head Attention ‣ 3.2 Attention ‣ 3 Model Architecture ‣ Attention Is All You Need"). While single-head attention is 0.9 BLEU worse than the best setting, quality also drops off with too many heads.
+
+In Table[3](https://arxiv.org/html/1706.03762v7#S6.T3 "Table 3 ‣ 6.2 Model Variations ‣ 6 Results ‣ Attention Is All You Need") rows (B), we observe that reducing the attention key size d_{k} hurts model quality. This suggests that determining compatibility is not easy and that a more sophisticated compatibility function than dot product may be beneficial. We further observe in rows (C) and (D) that, as expected, bigger models are better, and dropout is very helpful in avoiding over-fitting. In row (E) we replace our sinusoidal positional encoding with learned positional embeddings [[9](https://arxiv.org/html/1706.03762v7#bib.bib9)], and observe nearly identical results to the base model.
+
+### 6.3 English Constituency Parsing
+
+Table 4: The Transformer generalizes well to English constituency parsing (Results are on Section 23 of WSJ)
+
+Parser Training WSJ 23 F1
+Vinyals & Kaiser el al. (2014) [[37](https://arxiv.org/html/1706.03762v7#bib.bib37)]WSJ only, discriminative 88.3
+Petrov et al. (2006) [[29](https://arxiv.org/html/1706.03762v7#bib.bib29)]WSJ only, discriminative 90.4
+Zhu et al. (2013) [[40](https://arxiv.org/html/1706.03762v7#bib.bib40)]WSJ only, discriminative 90.4
+Dyer et al. (2016) [[8](https://arxiv.org/html/1706.03762v7#bib.bib8)]WSJ only, discriminative 91.7
+Transformer (4 layers)WSJ only, discriminative 91.3
+Zhu et al. (2013) [[40](https://arxiv.org/html/1706.03762v7#bib.bib40)]semi-supervised 91.3
+Huang & Harper (2009) [[14](https://arxiv.org/html/1706.03762v7#bib.bib14)]semi-supervised 91.3
+McClosky et al. (2006) [[26](https://arxiv.org/html/1706.03762v7#bib.bib26)]semi-supervised 92.1
+Vinyals & Kaiser el al. (2014) [[37](https://arxiv.org/html/1706.03762v7#bib.bib37)]semi-supervised 92.1
+Transformer (4 layers)semi-supervised 92.7
+Luong et al. (2015) [[23](https://arxiv.org/html/1706.03762v7#bib.bib23)]multi-task 93.0
+Dyer et al. (2016) [[8](https://arxiv.org/html/1706.03762v7#bib.bib8)]generative 93.3
+
+To evaluate if the Transformer can generalize to other tasks we performed experiments on English constituency parsing. This task presents specific challenges: the output is subject to strong structural constraints and is significantly longer than the input. Furthermore, RNN sequence-to-sequence models have not been able to attain state-of-the-art results in small-data regimes [[37](https://arxiv.org/html/1706.03762v7#bib.bib37)].
+
+We trained a 4-layer transformer with d_{model}=1024 on the Wall Street Journal (WSJ) portion of the Penn Treebank [[25](https://arxiv.org/html/1706.03762v7#bib.bib25)], about 40K training sentences. We also trained it in a semi-supervised setting, using the larger high-confidence and BerkleyParser corpora from with approximately 17M sentences [[37](https://arxiv.org/html/1706.03762v7#bib.bib37)]. We used a vocabulary of 16K tokens for the WSJ only setting and a vocabulary of 32K tokens for the semi-supervised setting.
+
+We performed only a small number of experiments to select the dropout, both attention and residual (section[5.4](https://arxiv.org/html/1706.03762v7#S5.SS4 "5.4 Regularization ‣ 5 Training ‣ Attention Is All You Need")), learning rates and beam size on the Section 22 development set, all other parameters remained unchanged from the English-to-German base translation model. During inference, we increased the maximum output length to input length + 300. We used a beam size of 21 and \alpha=0.3 for both WSJ only and the semi-supervised setting.
+
+Our results in Table[4](https://arxiv.org/html/1706.03762v7#S6.T4 "Table 4 ‣ 6.3 English Constituency Parsing ‣ 6 Results ‣ Attention Is All You Need") show that despite the lack of task-specific tuning our model performs surprisingly well, yielding better results than all previously reported models with the exception of the Recurrent Neural Network Grammar [[8](https://arxiv.org/html/1706.03762v7#bib.bib8)].
+
+In contrast to RNN sequence-to-sequence models [[37](https://arxiv.org/html/1706.03762v7#bib.bib37)], the Transformer outperforms the BerkeleyParser [[29](https://arxiv.org/html/1706.03762v7#bib.bib29)] even when training only on the WSJ training set of 40K sentences.
+
+## 7 Conclusion
+
+In this work, we presented the Transformer, the first sequence transduction model based entirely on attention, replacing the recurrent layers most commonly used in encoder-decoder architectures with multi-headed self-attention.
+
+For translation tasks, the Transformer can be trained significantly faster than architectures based on recurrent or convolutional layers. On both WMT 2014 English-to-German and WMT 2014 English-to-French translation tasks, we achieve a new state of the art. In the former task our best model outperforms even all previously reported ensembles.
+
+We are excited about the future of attention-based models and plan to apply them to other tasks. We plan to extend the Transformer to problems involving input and output modalities other than text and to investigate local, restricted attention mechanisms to efficiently handle large inputs and outputs such as images, audio and video. Making generation less sequential is another research goals of ours.
+
+##### Acknowledgements
+
+We are grateful to Nal Kalchbrenner and Stephan Gouws for their fruitful comments, corrections and inspiration.
+
+## References
+
+*   [1] Jimmy Lei Ba, Jamie Ryan Kiros, and Geoffrey E Hinton. Layer normalization. arXiv preprint arXiv:1607.06450, 2016. 
+*   [2] Dzmitry Bahdanau, Kyunghyun Cho, and Yoshua Bengio. Neural machine translation by jointly learning to align and translate. CoRR, abs/1409.0473, 2014. 
+*   [3] Denny Britz, Anna Goldie, Minh-Thang Luong, and Quoc V. Le. Massive exploration of neural machine translation architectures. CoRR, abs/1703.03906, 2017. 
+*   [4] Jianpeng Cheng, Li Dong, and Mirella Lapata. Long short-term memory-networks for machine reading. arXiv preprint arXiv:1601.06733, 2016. 
+*   [5] Kyunghyun Cho, Bart van Merrienboer, Caglar Gulcehre, Fethi Bougares, Holger Schwenk, and Yoshua Bengio. Learning phrase representations using rnn encoder-decoder for statistical machine translation. CoRR, abs/1406.1078, 2014. 
+*   [6] Francois Chollet. Xception: Deep learning with depthwise separable convolutions. arXiv preprint arXiv:1610.02357, 2016. 
+*   [7] Junyoung Chung, Çaglar Gülçehre, Kyunghyun Cho, and Yoshua Bengio. Empirical evaluation of gated recurrent neural networks on sequence modeling. CoRR, abs/1412.3555, 2014. 
+*   [8] Chris Dyer, Adhiguna Kuncoro, Miguel Ballesteros, and Noah A. Smith. Recurrent neural network grammars. In Proc. of NAACL, 2016. 
+*   [9] Jonas Gehring, Michael Auli, David Grangier, Denis Yarats, and Yann N. Dauphin. Convolutional sequence to sequence learning. arXiv preprint arXiv:1705.03122v2, 2017. 
+*   [10] Alex Graves. Generating sequences with recurrent neural networks. arXiv preprint arXiv:1308.0850, 2013. 
+*   [11] Kaiming He, Xiangyu Zhang, Shaoqing Ren, and Jian Sun. Deep residual learning for image recognition. In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pages 770–778, 2016. 
+*   [12] Sepp Hochreiter, Yoshua Bengio, Paolo Frasconi, and Jürgen Schmidhuber. Gradient flow in recurrent nets: the difficulty of learning long-term dependencies, 2001. 
+*   [13] Sepp Hochreiter and Jürgen Schmidhuber. Long short-term memory. Neural computation, 9(8):1735–1780, 1997. 
+*   [14] Zhongqiang Huang and Mary Harper. Self-training PCFG grammars with latent annotations across languages. In Proceedings of the 2009 Conference on Empirical Methods in Natural Language Processing, pages 832–841. ACL, August 2009. 
+*   [15] Rafal Jozefowicz, Oriol Vinyals, Mike Schuster, Noam Shazeer, and Yonghui Wu. Exploring the limits of language modeling. arXiv preprint arXiv:1602.02410, 2016. 
+*   [16] Łukasz Kaiser and Samy Bengio. Can active memory replace attention? In Advances in Neural Information Processing Systems, (NIPS), 2016. 
+*   [17] Łukasz Kaiser and Ilya Sutskever. Neural GPUs learn algorithms. In International Conference on Learning Representations (ICLR), 2016. 
+*   [18] Nal Kalchbrenner, Lasse Espeholt, Karen Simonyan, Aaron van den Oord, Alex Graves, and Koray Kavukcuoglu. Neural machine translation in linear time. arXiv preprint arXiv:1610.10099v2, 2017. 
+*   [19] Yoon Kim, Carl Denton, Luong Hoang, and Alexander M. Rush. Structured attention networks. In International Conference on Learning Representations, 2017. 
+*   [20] Diederik Kingma and Jimmy Ba. Adam: A method for stochastic optimization. In ICLR, 2015. 
+*   [21] Oleksii Kuchaiev and Boris Ginsburg. Factorization tricks for LSTM networks. arXiv preprint arXiv:1703.10722, 2017. 
+*   [22] Zhouhan Lin, Minwei Feng, Cicero Nogueira dos Santos, Mo Yu, Bing Xiang, Bowen Zhou, and Yoshua Bengio. A structured self-attentive sentence embedding. arXiv preprint arXiv:1703.03130, 2017. 
+*   [23] Minh-Thang Luong, Quoc V. Le, Ilya Sutskever, Oriol Vinyals, and Lukasz Kaiser. Multi-task sequence to sequence learning. arXiv preprint arXiv:1511.06114, 2015. 
+*   [24] Minh-Thang Luong, Hieu Pham, and Christopher D Manning. Effective approaches to attention-based neural machine translation. arXiv preprint arXiv:1508.04025, 2015. 
+*   [25] Mitchell P Marcus, Mary Ann Marcinkiewicz, and Beatrice Santorini. Building a large annotated corpus of english: The penn treebank. Computational linguistics, 19(2):313–330, 1993. 
+*   [26] David McClosky, Eugene Charniak, and Mark Johnson. Effective self-training for parsing. In Proceedings of the Human Language Technology Conference of the NAACL, Main Conference, pages 152–159. ACL, June 2006. 
+*   [27] Ankur Parikh, Oscar Täckström, Dipanjan Das, and Jakob Uszkoreit. A decomposable attention model. In Empirical Methods in Natural Language Processing, 2016. 
+*   [28] Romain Paulus, Caiming Xiong, and Richard Socher. A deep reinforced model for abstractive summarization. arXiv preprint arXiv:1705.04304, 2017. 
+*   [29] Slav Petrov, Leon Barrett, Romain Thibaux, and Dan Klein. Learning accurate, compact, and interpretable tree annotation. In Proceedings of the 21st International Conference on Computational Linguistics and 44th Annual Meeting of the ACL, pages 433–440. ACL, July 2006. 
+*   [30] Ofir Press and Lior Wolf. Using the output embedding to improve language models. arXiv preprint arXiv:1608.05859, 2016. 
+*   [31] Rico Sennrich, Barry Haddow, and Alexandra Birch. Neural machine translation of rare words with subword units. arXiv preprint arXiv:1508.07909, 2015. 
+*   [32] Noam Shazeer, Azalia Mirhoseini, Krzysztof Maziarz, Andy Davis, Quoc Le, Geoffrey Hinton, and Jeff Dean. Outrageously large neural networks: The sparsely-gated mixture-of-experts layer. arXiv preprint arXiv:1701.06538, 2017. 
+*   [33] Nitish Srivastava, Geoffrey E Hinton, Alex Krizhevsky, Ilya Sutskever, and Ruslan Salakhutdinov. Dropout: a simple way to prevent neural networks from overfitting. Journal of Machine Learning Research, 15(1):1929–1958, 2014. 
+*   [34] Sainbayar Sukhbaatar, Arthur Szlam, Jason Weston, and Rob Fergus. End-to-end memory networks. In C.Cortes, N.D. Lawrence, D.D. Lee, M.Sugiyama, and R.Garnett, editors, Advances in Neural Information Processing Systems 28, pages 2440–2448. Curran Associates, Inc., 2015. 
+*   [35] Ilya Sutskever, Oriol Vinyals, and Quoc VV Le. Sequence to sequence learning with neural networks. In Advances in Neural Information Processing Systems, pages 3104–3112, 2014. 
+*   [36] Christian Szegedy, Vincent Vanhoucke, Sergey Ioffe, Jonathon Shlens, and Zbigniew Wojna. Rethinking the inception architecture for computer vision. CoRR, abs/1512.00567, 2015. 
+*   [37] Vinyals & Kaiser, Koo, Petrov, Sutskever, and Hinton. Grammar as a foreign language. In Advances in Neural Information Processing Systems, 2015. 
+*   [38] Yonghui Wu, Mike Schuster, Zhifeng Chen, Quoc V Le, Mohammad Norouzi, Wolfgang Macherey, Maxim Krikun, Yuan Cao, Qin Gao, Klaus Macherey, et al. Google’s neural machine translation system: Bridging the gap between human and machine translation. arXiv preprint arXiv:1609.08144, 2016. 
+*   [39] Jie Zhou, Ying Cao, Xuguang Wang, Peng Li, and Wei Xu. Deep recurrent models with fast-forward connections for neural machine translation. CoRR, abs/1606.04199, 2016. 
+*   [40] Muhua Zhu, Yue Zhang, Wenliang Chen, Min Zhang, and Jingbo Zhu. Fast and accurate shift-reduce constituent parsing. In Proceedings of the 51st Annual Meeting of the ACL (Volume 1: Long Papers), pages 434–443. ACL, August 2013. 
+
+## Attention Visualizations
+
+![Image 4: Refer to caption](https://arxiv.org/html/1706.03762v7/x1.png)
+
+Figure 3: An example of the attention mechanism following long-distance dependencies in the encoder self-attention in layer 5 of 6. Many of the attention heads attend to a distant dependency of the verb ‘making’, completing the phrase ‘making…more difficult’. Attentions here shown only for the word ‘making’. Different colors represent different heads. Best viewed in color.
+
+![Image 5: Refer to caption](https://arxiv.org/html/1706.03762v7/x2.png)
+
+![Image 6: Refer to caption](https://arxiv.org/html/1706.03762v7/x3.png)
+
+Figure 4: Two attention heads, also in layer 5 of 6, apparently involved in anaphora resolution. Top: Full attentions for head 5. Bottom: Isolated attentions from just the word ‘its’ for attention heads 5 and 6. Note that the attentions are very sharp for this word.
+
+![Image 7: Refer to caption](https://arxiv.org/html/1706.03762v7/x4.png)
+
+![Image 8: Refer to caption](https://arxiv.org/html/1706.03762v7/x5.png)
+
+Figure 5: Many of the attention heads exhibit behaviour that seems related to the structure of the sentence. We give two such examples above, from two different heads from the encoder self-attention at layer 5 of 6. The heads clearly learned to perform different tasks.
diff --git a/apps/room-service/static/demo-kimi.md b/apps/room-service/static/demo-kimi.md
new file mode 100644
index 000000000..26bace096
--- /dev/null
+++ b/apps/room-service/static/demo-kimi.md
@@ -0,0 +1,1476 @@
+Title: Kimi K2.5: Visual Agentic Intelligence
+
+URL Source: https://arxiv.org/html/2602.02276v1
+
+Published Time: Tue, 03 Feb 2026 03:12:20 GMT
+
+Markdown Content:
+###### Abstract
+
+We introduce Kimi K2.5, an open-source multimodal agentic model designed to advance general agentic intelligence. K2.5 emphasizes the joint optimization of text and vision so that two modalities enhance each other. This includes a series of techniques such as joint text-vision pre-training, zero-vision SFT, and joint text-vision reinforcement learning. Building on this multimodal foundation, K2.5 introduces Agent Swarm, a self-directed parallel agent orchestration framework that dynamically decomposes complex tasks into heterogeneous sub-problems and executes them concurrently. Extensive evaluations show that Kimi K2.5 achieves state-of-the-art results across various domains including coding, vision, reasoning, and agentic tasks. Agent Swarm also reduces latency by up to 4.5\times over single-agent baselines. We release the post-trained Kimi K2.5 model checkpoint 1 1 1[https://huggingface.co/moonshotai/Kimi-K2.5](https://huggingface.co/moonshotai/Kimi-K2.5) to facilitate future research and real-world applications of agentic intelligence.
+
+![Image 1: Refer to caption](https://arxiv.org/html/2602.02276v1/figures/k25-main-result.png)
+
+Figure 1: Kimi K2.5 main results.
+
+## 1 Introduction
+
+Large Language Models (LLMs) are rapidly evolving toward agentic intelligence. Recent advances, such as GPT-5.2[[41](https://arxiv.org/html/2602.02276v1#bib.bib227 "Introducing gpt 5.2")], Claude Opus 4.5[[4](https://arxiv.org/html/2602.02276v1#bib.bib226 "Claude opus 4.5 system card")], Gemini 3 Pro[[19](https://arxiv.org/html/2602.02276v1#bib.bib228 "Gemini 3 pro")], and Kimi K2-Thinking[[1](https://arxiv.org/html/2602.02276v1#bib.bib222 "Introducing kimi k2 thinking")], demonstrate substantial progress in agentic capabilities, particularly in tool calling and reasoning. These models increasingly exhibit the ability to decompose complex problems into multi-step plans and to execute long sequences of interleaved reasoning and actions.
+
+In this report, we introduce the training methods and evaluation results of Kimi K2.5. Concretely, we improve the training of K2.5 over previous models in the following two key aspects.
+
+Joint Optimization of Text and Vision. A key insight from the practice of K2.5 is that joint optimization of text and vision enhances both modalities and avoids the conflict. Specifically, we devise a set of techniques for this purpose. During pre-training, in contrast to conventional approaches that add visual tokens to a text backbone at a late stage[[7](https://arxiv.org/html/2602.02276v1#bib.bib17 "Qwen3-vl technical report"), [20](https://arxiv.org/html/2602.02276v1#bib.bib18 "Seed1.5-vl technical report")], we find early vision fusion with lower ratios tends to yield better results given the fixed total vision-text tokens. Therefore, K2.5 mixes text and vision tokens with a constant ratio throughout the entire training process.
+
+Architecturally, Kimi K2.5 employs MoonViT-3D, a native-resolution vision encoder incorporating the NaViT packing strategy[[14](https://arxiv.org/html/2602.02276v1#bib.bib22 "Patch n’ pack: navit, a vision transformer for any aspect ratio and resolution")], enabling variable-resolution image inputs. For video understanding, we introduce a lightweight 3D ViT compression mechanism: consecutive frames are grouped in fours, processed through the shared MoonViT encoder, and temporally averaged at the patch level. This design allows Kimi K2.5 to process videos up to 4 \times longer within the same context window while maintaining complete weight sharing between image and video encoders.
+
+During post-training, we introduce zero-vision SFT—text-only SFT alone activates visual reasoning and tool use. We find that adding human-designed visual trajectories at this stage hurts generalization. In contrast, text-only SFT performs better—likely because joint pretraining already establishes strong vision-text alignment, enabling capabilities to generalize naturally across modalities. We then apply joint RL on both text and vision tasks. Crucially, we find visual RL enhances textual performance rather than degrading it, with improvements on MMLU-Pro and GPQA-Diamond. This bidirectional enhancement—text bootstraps vision, vision refines text—represents superior cross-modal alignment in joint training.
+
+Agent Swarm: Parallel Agent Orchestration. Most existing agentic models rely on sequential execution of tool calls. Even systems capable of hundreds of reasoning steps, such as Kimi K2-Thinking[[1](https://arxiv.org/html/2602.02276v1#bib.bib222 "Introducing kimi k2 thinking")], suffer from linear scaling of inference time, leading to unacceptable latency and limiting task complexity. As agentic workloads grow in scope and heterogeneity—e.g., building a complex project that involves massive-scale research, design, and development—the sequential paradigm becomes increasingly inefficient.
+
+To overcome the latency and scalability limits of sequential agent execution, Kimi K2.5 introduces Agent Swarm, a dynamic framework for parallel agent orchestration. We propose a Parallel-Agent Reinforcement Learning (PARL) paradigm that departs from traditional agentic RL[[2](https://arxiv.org/html/2602.02276v1#bib.bib224 "Kimi-researcher end-to-end rl training for emerging agentic capabilities")]. In addition to optimizing tool execution via verifiable rewards, the model is equipped with interfaces for sub-agent creation and task delegation. During training, sub-agents are frozen and their execution trajectories are excluded from the optimization objective; only the orchestrator is updated via reinforcement learning. This decoupling circumvents two challenges of end-to-end co-optimization: credit assignment ambiguity and training instability. Agent Swarm enables complex tasks to be decomposed into heterogeneous sub-problems executed concurrently by domain-specialized agents, transforming task complexity from linear scaling to parallel processing. In wide-search scenarios, Agent Swarm reduces inference latency by up to 4.5\times while improving item-level F1 from 72.8% to 79.0% compared to single-agent baselines.
+
+Kimi K2.5 represents a unified architecture for general-purpose agentic intelligence, integrating vision and language, thinking and instant modes, chats and agents. It achieves strong performance across a broad range of agentic and frontier benchmarks, including state-of-the-art results in visual-to-code generation (image/video-to-code) and real-world software engineering in our internal evaluations, while scaling both the diversity of specialized agents and the degree of parallelism. To accelerate community progress toward General Agentic Intelligence, we open-source our post-trained checkpoints of Kimi K2.5, enabling researchers and developers to explore, refine, and deploy scalable agentic intelligence.
+
+## 2 Joint Optimization of Text and Vision
+
+Kimi K2.5 is a native multimodal model built upon Kimi K2 through large-scale joint pre-training on approximately 15 trillion mixed visual and text tokens. Unlike vision-adapted models that compromise either linguistic or visual capabilities, our joint pre-training paradigm enhances both modalities simultaneously. This section describes the multimodal joint optimization methodology that extends Kimi K2 to Kimi K2.5.
+
+### 2.1 Native Multimodal Pre-Training
+
+Table 1: Performance comparison across different vision-text joint-training strategies. Early fusion with a lower vision ratio yields better results given a fixed total vision-text token budget.
+
+Vision Injection Timing Vision-Text Ratio Vision Knowledge Vision Reasoning OCR Text Knowledge Text Reasoning Code
+Early 0%10%:90%25.8 43.8 65.7 45.5 58.5 24.8
+Mid 50%20%:80%25.0 40.7 64.1 43.9 58.6 24.0
+Late 80%50%:50%24.2 39.0 61.5 43.1 57.8 24.0
+
+A key design question for multimodal pre-training is: Given a fixed vision-text token budget, what is the optimal vision-text joint-training strategy. Conventional wisdom[[7](https://arxiv.org/html/2602.02276v1#bib.bib17 "Qwen3-vl technical report"), [20](https://arxiv.org/html/2602.02276v1#bib.bib18 "Seed1.5-vl technical report")] suggests introducing vision tokens predominantly in the later stages of LLM training at high ratios (e.g., 50% or higher) should accelerate multimodal capability acquisition, treating multimodal capability as a post-hoc add-on to linguistic competence.
+
+However, our experiments (as shown in Table[1](https://arxiv.org/html/2602.02276v1#S2.T1 "Table 1 ‣ 2.1 Native Multimodal Pre-Training ‣ 2 Joint Optimization of Text and Vision ‣ Kimi K2.5: Visual Agentic Intelligence") Figure[9](https://arxiv.org/html/2602.02276v1#A2.F9 "Figure 9 ‣ Appendix B Pre-training ‣ Kimi K2.5: Visual Agentic Intelligence")) reveal a different story. We conducted ablation studies varying the vision ratio and vision injection timing while keeping the total vision and text token budgets fixed. To strictly meet the targets for different ratios, we pre-trained the model with text-only tokens for a specifically calculated number of tokens before introducing vision data. Surprisingly, we found that the vision ratio has minimal impact on final multimodal performance. In fact, early fusion with a lower vision ratio yields better results given a fixed total vision-text token budget. This motivates our native multimodal pre-training strategy: rather than aggressive vision-heavy training concentrated at the end, we adopt a moderate vision ratio integrated early in the training process, allowing the model to naturally develop balanced multimodal representations while benefiting from extended co-optimization of both modalities.
+
+### 2.2 Zero-Vision SFT
+
+Pretrained VLMs do not naturally perform vision-based tool-calling, which poses a cold-start problem for multimodal RL. Conventional approaches address this issue through manually annotated or prompt-engineered chain-of-thought (CoT) data[[7](https://arxiv.org/html/2602.02276v1#bib.bib17 "Qwen3-vl technical report")], but such methods are limited in diversity, often restricting visual reasoning to simple diagrams and primitive tool manipulations (crop, rotate, flip).
+
+An observation is that high-quality text SFT data are relatively abundant and diverse. We propose a novel approach, zero-vision SFT, that uses only text SFT data to activate the visual, agentic capabilities during post-training. In this approach, all image manipulations are proxied through programmatic operations in IPython, effectively serving as a generalization of traditional vision tool-use. This "zero-vision" activation enables diverse reasoning behaviors, including pixel-level operations such as object size estimation via binarization and counting, and generalizes to visually grounded tasks such as object localization, counting, and OCR.
+
+Figure[2](https://arxiv.org/html/2602.02276v1#S2.F2 "Figure 2 ‣ 2.3 Joint Multimodal Reinforcement Learning (RL) ‣ 2 Joint Optimization of Text and Vision ‣ Kimi K2.5: Visual Agentic Intelligence") illustrates the RL training curves, where the starting points are obtained from zero-vision SFT. The results show that zero-vision SFT is sufficient for activating vision capabilities while ensuring generalization across modalities. This phenomenon is likely due to the joint pretraining of text and vision data as described in Section[2.1](https://arxiv.org/html/2602.02276v1#S2.SS1 "2.1 Native Multimodal Pre-Training ‣ 2 Joint Optimization of Text and Vision ‣ Kimi K2.5: Visual Agentic Intelligence"). Compared to zero-vision SFT, our preliminary experiments show that text-vision SFT yields much worse performance on visual, agentic tasks, possibly because of the lack of high-quality vision data.
+
+### 2.3 Joint Multimodal Reinforcement Learning (RL)
+
+In this section, we describe the methodology implemented in K2.5 that enables effective multimodal RL, from outcome-based visual RL to emergent cross-modal transfer that enhances textual performance.
+
+![Image 2: Refer to caption](https://arxiv.org/html/2602.02276v1/x2.png)
+
+Figure 2: Vision RL training curves on vision benchmarks starting from minimal zero-vision SFT. By scaling vision RL FLOPs, the performance continues to improve, demonstrating that zero-vision activation paired with long-running RL is sufficient for acquiring robust visual capabilities.
+
+##### Outcome-Based Visual RL
+
+Following the zero-vision SFT, the model requires further refinement to reliably incorporate visual inputs into reasoning. Text-initiated activation alone exhibits notable failure modes: visual inputs are sometimes ignored, and images may not be attended to when necessary. We employ outcome-based RL on tasks that explicitly require visual comprehension for correct solutions. We categorize these tasks into three domains:
+
+*   •Visual grounding and counting: Accurate localization and enumeration of objects within images; 
+*   •Chart and document understanding: Interpretation of structured visual information and text extraction; 
+*   •Vision-critical STEM problems: Mathematical and scientific questions filtered to require visual inputs. 
+
+Outcome-based RL on these tasks improves both basic visual capabilities and more complex agentic behaviors. Extracting these trajectories for rejection-sampling fine-tuning (RFT) enables a self-improving data pipeline, allowing subsequent joint RL stages to leverage richer multimodal reasoning traces.
+
+##### Visual RL Improves Text Performance
+
+Table 2: Cross-Modal Transfer: Vision RL Improves Textual Knowledge
+
+Benchmark Before Vision-RL After Vision-RL Improvement
+MMLU-Pro 84.7 86.4+1.7
+GPQA-Diamond 84.3 86.4+2.1
+LongBench v2 56.7 58.9+2.2
+
+To investigate potential trade-offs between visual and textual performance, we evaluated text-only benchmarks before and after visual RL. Surprisingly, outcome-based visual RL produced measurable improvements in textual tasks, including MMLU-Pro (84.7% \rightarrow 86.4%), GPQA-Diamond (84.3% \rightarrow 86.4%), and LongBench v2 (56.7% \rightarrow 58.9%) (Table[2](https://arxiv.org/html/2602.02276v1#S2.T2 "Table 2 ‣ Visual RL Improves Text Performance ‣ 2.3 Joint Multimodal Reinforcement Learning (RL) ‣ 2 Joint Optimization of Text and Vision ‣ Kimi K2.5: Visual Agentic Intelligence")). Analysis suggests that visual RL enhances calibration in areas requiring structured information extraction, reducing uncertainty on queries that resemble visually grounded reasoning (e.g., counting, OCR). These findings indicate that visual RL can contribute to cross-modal generalization, improving textual reasoning without observable degradation of language capabilities.
+
+Joint Multimodal RL Motivated by the finding that robust visual capabilities can emerge from zero-vision SFT paired with vision RL—which further enhances general text abilities—we adopt a joint multimodal RL paradigm during Kimi K2.5’s post-training. Departing from conventional modality-specific expert divisions, we organize RL domains not by input modality but by abilities—knowledge, reasoning, coding, agentic, etc. These domain experts jointly learn from both pure-text and multimodal queries, while the Generative Reward Model (GRM) similarly optimizes across heterogeneous traces without modality barriers. This pardaigm ensures that capability improvements acquired through either textual or visual inputs inherently generalize to enhance related abilities across the alternate modality, thereby maximizing cross-modal capability transfer.
+
+## 3 Agent Swarm
+
+The primary challenge of existing agent-based systems lies in their reliance on sequential execution of reasoning and tool-calling steps. While this structure may be effective for simpler, short-horizon tasks, it becomes inadequate as the complexity of the task increases and the accumulated context grows. As tasks evolve to contain broad information gathering and intricate, multi-branch reasoning, sequential systems often encounter significant bottlenecks [[6](https://arxiv.org/html/2602.02276v1#bib.bib223 "Building multi-agent systems: when and how to use them"), [4](https://arxiv.org/html/2602.02276v1#bib.bib226 "Claude opus 4.5 system card"), [5](https://arxiv.org/html/2602.02276v1#bib.bib225 "How we built our multi-agent research system")]. The limited capacity of a single agent working through each step one by one can lead to the exhaustion of practical reasoning depth and tool-call budgets, ultimately hindering the system’s ability to handle more complex scenarios.
+
+To address this, we introduce Agent Swarm and Parallel Agent Reinforcement Learning (PARL). Instead of executing a task as a reasoning chain or relying on pre-specified parallelization heuristics, K2.5 initiates an Agent Swarm through dynamic task decomposition, subagent instantiation, and parallel subtask scheduling. Importantly, parallelism is not presumed to be inherently advantageous; decisions regarding whether, when, and how to parallelize are explicitly learned through environmental feedback and RL-driven exploration. As shown in Figure[4](https://arxiv.org/html/2602.02276v1#S3.F4 "Figure 4 ‣ Prompt Construction for Parallel-agent Capability Induction ‣ 3 Agent Swarm ‣ Kimi K2.5: Visual Agentic Intelligence"), the progression of performance demonstrates this adaptive capability, with the cumulative reward increasing smoothly as the orchestrator optimizes its parallelization strategy throughout training.
+
+![Image 3: Refer to caption](https://arxiv.org/html/2602.02276v1/figures/multi-agent-rl-system.png)
+
+Figure 3: An agent swarm has a trainable orchestrator that dynamically creates specialized frozen subagents and decomposes complex tasks into parallelizable subtasks for efficient distributed execution.
+
+##### Architecture and Learning Setup
+
+The PARL framework adopts a decoupled architecture comprising a trainable orchestrator and frozen subagents instantiated from fixed intermediate policy checkpoints. This design deliberately avoids end-to-end co-optimization to circumvent two fundamental challenges: credit assignment ambiguity and training instability. In this multi-agent setting, outcome-based rewards are inherently sparse and noisy; a correct final answer does not guarantee flawless subagent execution, just as a failure does not imply universal subagent error. By freezing the subagents and treating their outputs as environmental observations rather than differentiable decision points, we disentangle high-level coordination logic from low-level execution proficiency, leading to more robust convergence. To improve efficiency, we first train the orchestrator using small-size subagents before transitioning to larger models. Our RL framework also supports dynamically adjusting the inference instance ratios between subagents and the orchestrator, thereby maximizing the resource usage across the cluster.
+
+##### PARL Reward
+
+Training a reliable parallel orchestrator is challenging due to the delayed, sparse, and non-stationary feedback inherent in independent subagent execution. To address this, we define the PARL reward as:
+
+\displaystyle r_{\mathrm{PARL}}(x,y)=\lambda_{1}\cdot\mspace{-26.0mu}\underbrace{r_{\text{parallel}}}_{\text{instantiation reward}}\mspace{-9.0mu}+\mspace{18.0mu}\lambda_{2}\cdot\mspace{-32.0mu}\underbrace{r_{\text{finish}}}_{\text{sub-agent finish rate}}+\underbrace{r_{\text{perf}}(x,y)}_{\text{task-level outcome}}\,.
+
+The performance reward r_{\text{perf}} evaluates the overall success and quality of the solution y for a given task x. This is augmented by two auxiliary rewards, each addressing a distinct challenge in learning parallel orchestration. The reward r_{\text{parallel}} is introduced to mitigate _serial collapse_—a local optimum where the orchestrator defaults to single-agent execution. By incentivizing subagent instantiation, this term encourages the exploration of concurrent scheduling spaces. The r_{\text{finish}} reward focuses on the successful completion of assigned subtasks. It is used to prevent _spurious parallelism_, a reward-hacking behavior in which the orchestrator increases parallel metrics dramatically by spawning many subagents without meaningful task decomposition. By rewarding completed subtasks, r_{\text{finish}} enforces feasibility and guides the policy toward valid and effective decompositions.
+
+To ensure the final policy optimizes for the primary objective, the hyperparameters \lambda_{1} and \lambda_{2} are annealed to zero over the course of training.
+
+##### Critical Steps as Resource Constraint
+
+To measure computational time cost in a parallel-agent setting, we define _critical steps_ by analogy to the _critical path_ in a computation graph. We model an episode as a sequence of execution stages indexed by t=1,\dots,T. In each stage, the main agent executes an action, which corresponds to either direct tool invocation or the instantiation of a group of subagents running in parallel. Let S_{\mathrm{main}}^{(t)} denote the number of steps taken by the main agent in stage t (typically S_{\mathrm{main}}^{(t)}=1), and S_{\mathrm{sub},i}^{(t)} denote the number of steps taken by the i-th subagent in that parallel group. The duration of stage t is governed by the longest-running subagent within that cohort. Consequently, the total critical steps for an episode are defined as
+
+\displaystyle\text{CriticalSteps}=\sum_{t=1}^{T}\left(S_{\mathrm{main}}^{(t)}+\max_{i}S_{\mathrm{sub},i}^{(t)}\right).
+
+By constraining training and evaluation using critical steps rather than total steps, the framework explicitly incentivizes effective parallelization. Excessive subtask creation that does not reduce the maximum execution time of parallel groups yields little benefit under this metric, while well-balanced task decomposition that shortens the longest parallel branch directly reduces critical steps. As a result, the orchestrator is encouraged to allocate work across subagents in a way that minimizes end-to-end latency, rather than merely maximizing concurrency or total work performed.
+
+##### Prompt Construction for Parallel-agent Capability Induction
+
+To incentivize the orchestrator to leverage the advantages of parallelization, we construct a suite of synthetic prompts designed to stress the limits of sequential agentic execution. These prompts emphasize either _wide search_, requiring simultaneous exploration of many independent information sources, or _deep search_, requiring multiple reasoning branches with delayed aggregation. We additionally include tasks inspired by real-world workloads, such as long-context document analysis and large-scale file downloading. When executed sequentially, these tasks are difficult to complete within fixed reasoning-step and tool-call budgets. By construction, they encourage the orchestrator to allocate subtasks in parallel, enabling completion within fewer critical steps than would be feasible for a single sequential agent. Importantly, the prompts do not explicitly instruct the model to parallelize. Instead, they shape the task distribution such that parallel decomposition and scheduling strategies are naturally favored.
+
+![Image 4: Refer to caption](https://arxiv.org/html/2602.02276v1/x3.png)
+
+Figure 4: In our parallel-agent reinforcement learning environment, the training accuracy increases smoothly as training progresses. At the same time, the level of parallelism during training also gradually increases.
+
+## 4 Method Overview
+
+### 4.1 Foundation: Kimi K2 Base Model
+
+The foundation of Kimi K2.5 is Kimi K2[[53](https://arxiv.org/html/2602.02276v1#bib.bib108 "Kimi k2: open agentic intelligence")], a trillion-parameter mixture-of-experts (MoE) transformer[[59](https://arxiv.org/html/2602.02276v1#bib.bib67 "Attention is all you need")] model pre-trained on 15 trillion high-quality text tokens. Kimi K2 employs the token-efficient MuonClip optimizer[[29](https://arxiv.org/html/2602.02276v1#bib.bib180 "Muon: an optimizer for hidden layers in neural networks"), [33](https://arxiv.org/html/2602.02276v1#bib.bib179 "Muon is scalable for llm training")] with QK-Clip for training stability. The model comprises 1.04 trillion total parameters with 32 billion activated parameters, utilizing 384 experts with 8 activated per token (sparsity of 48). For detailed descriptions of MuonClip, architecture design, and training infrastructure, we refer to the Kimi K2 technical report[[53](https://arxiv.org/html/2602.02276v1#bib.bib108 "Kimi k2: open agentic intelligence")].
+
+### 4.2 Model Architecture
+
+The multimodal architecture of Kimi K2.5 consists of three components: a three-dimensional native-resolution vision encoder (MoonViT-3D), an MLP projector, and the Kimi K2 MoE language model, following the design principles established in Kimi-VL[[54](https://arxiv.org/html/2602.02276v1#bib.bib13 "Kimi-vl technical report")].
+
+##### MoonViT-3D: Shared Embedding Space for Images and Videos
+
+In Kimi-VL, we employ MoonViT to natively process images at their original resolutions, eliminating the need for complex sub-image splitting and splicing operations. Initialized from SigLIP-SO-400M[[77](https://arxiv.org/html/2602.02276v1#bib.bib23 "Sigmoid loss for language image pre-training")], MoonViT incorporates the patch packing strategy from NaViT[[14](https://arxiv.org/html/2602.02276v1#bib.bib22 "Patch n’ pack: navit, a vision transformer for any aspect ratio and resolution")], where single images are divided into patches, flattened, and sequentially concatenated into 1D sequences, thereby enabling efficient simultaneous training on images at varying resolutions.
+
+To maximize the transfer of image understanding capabilities to video, we introduce MoonViT-3D with a unified architecture, fully shared parameters, and a consistent embedding space. By generalizing the “patch n’ pack“ philosophy to the temporal dimension, up to four consecutive frames are treated as a spatiotemporal volume: 2D patches from these frames are jointly flattened and packed into a single 1D sequence, allowing the identical attention mechanism to operate seamlessly across both space and time. While the extra temporal attention improves understanding on high-speed motions and visual effects, the sharing maximizes knowledge generalization from static images to dynamic videos, achieving strong video understanding performance (see in Tab.[4](https://arxiv.org/html/2602.02276v1#S5.T4 "Table 4 ‣ Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence")) without requiring specialized video modules or architectural bifurcation. Prior to the MLP projector, lightweight temporal pooling aggregates patches within each temporal chunk, yielding 4\times temporal compression to significantly extend feasible video length. The result is a unified pipeline where knowledge and ability obtained from image pretraining transfers holistically to videos through one shared parameter space and feature representation.
+
+### 4.3 Pre-training Pipeline
+
+As illustrated in Table[3](https://arxiv.org/html/2602.02276v1#S4.T3 "Table 3 ‣ 4.3 Pre-training Pipeline ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"), Kimi K2.5’s pre-training builds upon the Kimi K2 language model checkpoint and processes approximately 15T tokens across three stages: first, standalone ViT training to establish a robust native-resolution visual encoder; second, joint pre-training to simultaneously enhance language and multimodal capabilities; and third, mid-training on high-quality data and long-context activation to refine capabilities and extend context windows.
+
+Table 3: Overview of training stages: data composition, token volumes, sequence lengths, and trainable components.
+
+Stages ViT Training Joint Pre-training Joint Long-context Mid-training
+Data Alt text Synthesis Caption Grounding, OCR, Video+Text, Knowledge Interleaving Video, OS Screenshot+High-quality Text & Multimodal Long Text, Long Video Reasoning, Long-CoT
+Sequence length 4096 4096 32768\rightarrow 262144
+Tokens 1T 15T 500B\rightarrow 200B
+Training ViT ViT & LLM ViT & LLM
+
+##### ViT Training Stage
+
+The MoonViT-3D is continual pre-trained from SigLIP[[77](https://arxiv.org/html/2602.02276v1#bib.bib23 "Sigmoid loss for language image pre-training")] on image-text and video-text pairs, where the text components consist of a variety of targets: image alt texts, synthetic captions of images and videos, grounding bboxes, and OCR texts. Unlike the implementation in Kimi-VL[[54](https://arxiv.org/html/2602.02276v1#bib.bib13 "Kimi-vl technical report")], this continual pre-training does not include a contrastive loss, but incorporates solely cross-entropy loss {L}_{caption} for caption generation conditioned on input images and videos. We adopt a two-stage alignment strategy. In the first stage, we update the MoonViT-3D to align it with Moonlight-16B-A3B[[33](https://arxiv.org/html/2602.02276v1#bib.bib179 "Muon is scalable for llm training")] via the caption loss, consuming about 1T tokens with very few training FLOPs. This stage allows MoonViT-3D to primarily understand high-resolution images and videos. A very short second stage follows, updating only the MLP projector to bridge the ViT with the 1T LLM for smoother joint pre-training.
+
+##### Joint Training Stages
+
+The joint pre-training stage continues from a near-end Kimi K2 checkpoint over additional 15T vision-text tokens at 4K sequence length. The data recipe extends Kimi K2’s pre-training distribution by introducing unique tokens, adjusting data proportions with increased weight on coding-related content, and controlling maximum epochs per data source. The third stage performs long-context activation with integrated higher-quality mid-training data, sequentially extending context length via YaRN[[44](https://arxiv.org/html/2602.02276v1#bib.bib45 "Yarn: efficient context window extension of large language models")] interpolation. This yields significant generalization improvements in long-context text understanding and long video comprehension.
+
+### 4.4 Post-Training
+
+#### 4.4.1 Supervised Fine-Tuning
+
+Following the SFT pipeline established by Kimi K2 [[53](https://arxiv.org/html/2602.02276v1#bib.bib108 "Kimi k2: open agentic intelligence")], we developed K2.5 by synthesizing high-quality candidate responses from K2, K2 Thinking and a suite of proprietary in-house expert models. Our data generation strategy employs specialized pipelines tailored to specific domains, integrating human annotation with advanced prompt engineering and multi-stage verification. This methodology produced a large-scale instruction-tuning dataset featuring diverse prompts and intricate reasoning trajectories, ultimately training the model to prioritize interactive reasoning and precise tool-calling for complex, real-world applications.
+
+#### 4.4.2 Reinforcement Learning
+
+Reinforcement learning constitutes a crucial phase of our post-training. To facilitate joint optimization across text and vision modalities, as well as to enable PARL for agent swarm, we develop a Unified Agentic Reinforcement Learning Environment (Appendix[D](https://arxiv.org/html/2602.02276v1#A4 "Appendix D Unified Agentic Reinforcement Learning Environment ‣ Kimi K2.5: Visual Agentic Intelligence")) and optimize the RL algorithms. Both text-vision joint RL and PARL are built upon the algorithms described in this section.
+
+##### Policy Optimization
+
+For each problem x sampled from a dataset \mathcal{D}, K responses \{y_{1},\dots,y_{K}\} are generated using the previous policy \pi_{\mathrm{old}}. We optimize the model \pi_{\theta} with respect to the following objective:
+
+\displaystyle L_{\mathrm{RL}}(\theta)=\mathbb{E}_{x\sim\mathcal{D}}\left[\frac{1}{N}\sum_{j=1}^{K}\sum_{i=1}^{|y_{j}|}\mathrm{Clip}\left(\frac{\pi_{\theta}(y_{j}^{i}|x,y_{j}^{0:i})}{\pi_{\mathrm{old}}(y_{j}^{i}|x,y_{j}^{0:i})},\alpha,\beta\right)({r}(x,y_{j})-\bar{r}(x))-\tau\left(\log\frac{\pi_{\theta}(y_{j}^{i}|x,y_{j}^{0:i})}{\pi_{\mathrm{old}}(y_{j}^{i}|x,y_{j}^{0:i})}\right)^{2}\right]\,.(1)
+
+Here \alpha,\beta,\tau>0 are hyperparameters, y^{j}_{0:i} is the prefix up to the i-th token of the j-th response, N=\sum_{i=1}^{K}|y_{i}| is the total number of generated tokens in a batch, \bar{r}(x)=\frac{1}{K}\sum_{j=1}^{K}r(x,y_{j}) is the mean reward of all generated responses.
+
+This loss function departs from the policy optimization algorithm used in K1.5[[30](https://arxiv.org/html/2602.02276v1#bib.bib107 "Kimi k1. 5: scaling reinforcement learning with llms")] by introducing a token-level clipping mechanism designed to mitigate the off-policy divergence amplified by discrepancies between training and inference frameworks. The mechanism functions as a simple gradient masking scheme: policy gradients are computed normally for tokens with log-ratios within the interval [\alpha,\beta], while gradients for tokens falling outside this range are zeroed out. Notably, a key distinction from standard PPO clipping [[50](https://arxiv.org/html/2602.02276v1#bib.bib203 "Proximal policy optimization algorithms")] is that our method relies strictly on the log-ratio to explicitly bound off-policy drift, regardless of the sign of the advantages. This approach aligns with recent strategies proposed to stabilize large-scale RL training [[74](https://arxiv.org/html/2602.02276v1#bib.bib201 "Your efficient rl framework secretly brings you off-policy rl training"), [78](https://arxiv.org/html/2602.02276v1#bib.bib202 "Small leak can sink a great ship–boost rl training on moe with icepop!")]. Empirically, we find this mechanism essential for maintaining training stability in complex domains requiring long-horizon, multi-step tool-use reasoning. We employ the MuonClip optimizer[[29](https://arxiv.org/html/2602.02276v1#bib.bib180 "Muon: an optimizer for hidden layers in neural networks"), [33](https://arxiv.org/html/2602.02276v1#bib.bib179 "Muon is scalable for llm training")] to minimize this objective.
+
+##### Reward Function
+
+We apply a rule-based outcome reward for tasks with verifiable solutions, such as reasoning and agentic tasks. To optimize resource consumption, we also incorporate a budget-control reward aimed at enhancing token efficiency. For general-purpose tasks, we employ Generative Reward Models (GRMs) that provide granular evaluations aligned with Kimi’s internal value criteria. In addition, for visual tasks, we design task-specific reward functions to provide fine-grained supervision. For visual grounding and point localization tasks, we employ an F1-based reward with soft matching: grounding tasks derive soft matches from Intersection over Union (IoU) and point tasks derive soft matches from Gaussian-weighted distances under optimal matching. For polygon segmentation tasks, we rasterize the predicted polygon into a binary mask and compute the segmentation IoU against the ground-truth mask to assign the reward. For OCR tasks, we adopt normalized edit distance to quantify character-level alignment between predictions and ground-truth. For counting tasks, rewards are assigned based on the absolute difference between predictions and ground-truth. Furthermore, we synthesize complex visual puzzle problems and utilize an LLM verifier (Kimi K2) to provide feedback.
+
+##### Generative Reward Models
+
+Kimi K2 leverages a self-critique rubric reward for open-ended generation [[53](https://arxiv.org/html/2602.02276v1#bib.bib108 "Kimi k2: open agentic intelligence")], and K2.5 extends this line of work by systematically deploying _Generative Reward Models (GRMs)_ across a broad range of agentic behaviors and multimodal trajectories. Rather than limiting reward modeling to conversational outputs, we apply GRMs on top of verified reward signals in diverse environments, including chat assistants, coding agents, search agents, and artifact-generating agents. Notably, GRMs function not as binary adjudicators, but as fine-grained evaluators aligned with Kimi’s values that are critical to user experiences, such as helpfulness, response readiness, contextual relevance, appropriate level of detail, aesthetic quality of generated artifacts, and strict instruction following. This design allows the reward signal to capture nuanced preference gradients that are difficult to encode with purely rule-based or task-specific verifiers. To mitigate reward hacking and overfitting to a single preference signal, we employ multiple alternative GRM rubrics tailored to different task contexts.
+
+##### Token Efficient Reinforcement Learning
+
+Token efficiency is central to LLMs with test-time scaling. While test-time scaling inherently trades computation for reasoning quality, practical gains require algorithmic innovations that actively navigate this trade-off. Our previous findings indicate that imposing a problem-dependent budget effectively constrains inference-time compute, incentivizing the model to generate more concise chain of thought reasoning patterns without unnecessary token expansion [[30](https://arxiv.org/html/2602.02276v1#bib.bib107 "Kimi k1. 5: scaling reinforcement learning with llms"), [53](https://arxiv.org/html/2602.02276v1#bib.bib108 "Kimi k2: open agentic intelligence")]. However, we also observe a _length-overfitting phenomenon_: models trained under rigid budget constraints often fail to generalize to higher compute scales. Consequently, they cannot effectively leverage additional inference-time tokens to solve complex problems, instead defaulting to truncated reasoning patterns.
+
+To this end, we propose _Toggle_, a training heuristic that alternates between inference-time scaling and budget-constrained optimization: for learning iteration t, the reward function is defined by
+
+\displaystyle\tilde{r}(x,y)=\begin{cases}r(x,y)\cdot\mathbb{I}\left\{\frac{1}{K}\sum_{i=1}^{K}r(x,y_{i})<\lambda\ \mathrm{or}\ |y_{i}|\leq\mathrm{budget(x)}\right\}&\text{if }\lfloor t/m\rfloor\pmod{2}=0\ (\mathrm{{Phase0}})\\
+r(x,y)&\text{if }\lfloor t/m\rfloor\pmod{2}=1\ (\mathrm{{Phase1}})\end{cases}\,.
+
+where \lambda and m are hyper-parameters of the algorithm and K is the number of rollouts per problem. Specifically, the algorithm alternates between two optimization phases every m iterations:
+
+*   •Phase0 (_budget limited phase_): The model is trained to solve the problem within a task-dependent token budget. To prevent a premature sacrifice of quality for efficiency, this constraint is conditionally applied: it is only enforced when the model’s mean accuracy for a given problem exceeds the threshold \lambda. 
+*   •Phase1 (_standard scaling phase_): The model generates responses up to the maximum token limit, encouraging the model to leverage computation for better inference-time scaling. 
+
+The problem-dependent budget is estimated from the \rho-th percentile of token lengths among the subset of correct responses:
+
+\mathrm{budget}(x)=\text{Percentile}\left(\{|y_{j}|\mid r(x,y_{i})=1,i=1,\dots,K\},\rho\right)\,.(2)
+
+This budget is estimated once at the beginning of training and remains fixed thereafter. Notably, Toggle functions as a stochastic alternating optimization for a bi-objective problem. It is specifically designed to reconcile reasoning capabilities with computational efficiency.
+
+![Image 5: Refer to caption](https://arxiv.org/html/2602.02276v1/figures/te-k2-thinking-radar.png)
+
+Figure 5: Comparison of model performance and token usage for Kimi K2 Thinking following token-efficient RL.
+
+We evaluate the effectiveness of Toggle on K2 Thinking[[1](https://arxiv.org/html/2602.02276v1#bib.bib222 "Introducing kimi k2 thinking")]. As shown in Figure[5](https://arxiv.org/html/2602.02276v1#S4.F5 "Figure 5 ‣ Token Efficient Reinforcement Learning ‣ 4.4.2 Reinforcement Learning ‣ 4.4 Post-Training ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"), we observe a consistent reduction in output length across nearly all benchmarks. On average, Toggle decreases output tokens by 25\sim 30% with a negligible impact on performance. We also observe that redundant patterns in the chain-of-thought, such as repeated verifications and mechanical calculations, decrease substantially. Furthermore, Toggle shows strong domain generalization. For example, when trained exclusively on mathematics and programming tasks, the model still achieves consistent token reductions on GPQA and MMLU-Pro with only marginal degradation in performance (Figure [5](https://arxiv.org/html/2602.02276v1#S4.F5 "Figure 5 ‣ Token Efficient Reinforcement Learning ‣ 4.4.2 Reinforcement Learning ‣ 4.4 Post-Training ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence")).
+
+### 4.5 Training Infrastructure
+
+Kimi K2.5 inherits the training infrastructure from Kimi K2[[53](https://arxiv.org/html/2602.02276v1#bib.bib108 "Kimi k2: open agentic intelligence")] with minimal modifications. For multimodal training, we propose Decoupled Encoder Process, where the vision encoder is incorporated into the existing pipeline with negligible additional overhead.
+
+#### 4.5.1 Decoupled Encoder Process (DEP)
+
+In a typical multimodal training paradigm utilizing Pipeline Parallelism (PP), the vision encoder and text embedding are co-located in the first stage of the pipeline (Stage-0). However, due to the inherent variations of multimodal input size (e.g., image counts and resolutions), Stage-0 suffers from drastic fluctuations in both computational load and memory usage. This forces existing solutions to adopt custom PP configurations for vision-language models — for instance, [[54](https://arxiv.org/html/2602.02276v1#bib.bib13 "Kimi-vl technical report")] manually adjusts the number of text decoder layers in Stage-0 to reserve memory. While this compromise alleviates memory pressure, it does not fundamentally resolve the load imbalance caused by multimodal input sizes. More critically, it precludes the direct reuse of parallel strategies that have been highly optimized for text-only training.
+
+Leveraging the unique topological position of the visual encoder within the computation graph — specifically, its role as the start of the forward pass and the end of the backward pass — our training uses Decoupled Encoder Process (DEP), which is composed of three stages in each training step:
+
+*   •Balanced Vision Forward: We first execute the forward pass for all visual data in the global batch. Because the vision encoder is small, we replicate it on all GPUs regardless of other parallelism strategies. During this phase, the forward computational workload is evenly distributed across all GPUs based on load metrics (e.g., image or patch counts). This eliminates load-imbalance caused by PP and visual token counts. To minimize peak memory usage, we discard all intermediate activations, retaining only the final output activations. The results are gathered back to PP Stage-0; 
+*   •Backbone Training: This phase performs the forward and backward passes for the main transformer backbone. By discarding intermediate activations in the preceding phase, we can now fully leverage any efficient parallel strategies validated in pure text training. After this phase, gradients are accumulated at the visual encoder output; 
+*   •Vision Recomputation & Backward: We re-compute the vision encoder forward pass, followed by a backward pass to compute gradients for parameters in the vision encoder; 
+
+DEP not only achieves load-balance, but also decouples the optimization strategy of the vision encoder and the main backbone. K2.5 seamlessly inherits the parallel strategy of K2, achieving a multimodal training efficiency of 90% relative to text-only training. We note a concurrent work, LongCat-Flash-Omni[[55](https://arxiv.org/html/2602.02276v1#bib.bib204 "Longcat-flash-omni technical report")], shares a similar design philosophy.
+
+## 5 Evaluations
+
+### 5.1 Main Results
+
+#### 5.1.1 Evaluation Settings
+
+##### Benchmarks
+
+We evaluate Kimi K2.5 on a comprehensive benchmark suite spanning text-based reasoning, competitive and agentic coding, multimodal understanding (image and video), autonomous agentic execution, and computer use. Our benchmark taxonomy is organized along the following capability axes:
+
+*   •Reasoning & General: Humanity’s Last Exam (HLE)[[46](https://arxiv.org/html/2602.02276v1#bib.bib187 "Humanity’s last exam")], AIME 2025[[40](https://arxiv.org/html/2602.02276v1#bib.bib243 "2025 american invitational mathematics examination i")], HMMT 2025 (Feb)[[58](https://arxiv.org/html/2602.02276v1#bib.bib244 "Harvard-mit mathematics tournament, february 2025")], IMO-AnswerBench[[36](https://arxiv.org/html/2602.02276v1#bib.bib236 "Towards robust mathematical reasoning")], GPQA-Diamond[[47](https://arxiv.org/html/2602.02276v1#bib.bib131 "Gpqa: a graduate-level google-proof q&a benchmark")], MMLU-Pro[[64](https://arxiv.org/html/2602.02276v1#bib.bib110 "MMLU-pro: a more robust and challenging multi-task language understanding benchmark")], SimpleQA Verified[[21](https://arxiv.org/html/2602.02276v1#bib.bib245 "SimpleQA verified: a reliable factuality benchmark to measure parametric knowledge")], AdvancedIF[[22](https://arxiv.org/html/2602.02276v1#bib.bib246 "AdvancedIF: rubric-based benchmarking and reinforcement learning for advancing llm instruction following")], and LongBench v2[[8](https://arxiv.org/html/2602.02276v1#bib.bib34 "LongBench v2: towards deeper understanding and reasoning on realistic long-context multitasks")]. 
+*   •Coding: SWE-Bench Verified[[28](https://arxiv.org/html/2602.02276v1#bib.bib238 "Swe-bench: can language models resolve real-world github issues?")], SWE-Bench Pro (public)[[15](https://arxiv.org/html/2602.02276v1#bib.bib239 "SWE-bench pro: can ai agents solve long-horizon software engineering tasks?")], SWE-Bench Multilingual[[28](https://arxiv.org/html/2602.02276v1#bib.bib238 "Swe-bench: can language models resolve real-world github issues?")], Terminal Bench 2.0[[38](https://arxiv.org/html/2602.02276v1#bib.bib240 "Terminal-bench: benchmarking agents on hard, realistic tasks in command line interfaces")], PaperBench (CodeDev)[[52](https://arxiv.org/html/2602.02276v1#bib.bib193 "PaperBench: evaluating ai’s ability to replicate ai research")], CyberGym[[66](https://arxiv.org/html/2602.02276v1#bib.bib237 "CyberGym: evaluating ai agents’ cybersecurity capabilities with real-world vulnerabilities at scale")], SciCode[[56](https://arxiv.org/html/2602.02276v1#bib.bib242 "Scicode: a research coding benchmark curated by scientists")], OJBench (cpp)[[65](https://arxiv.org/html/2602.02276v1#bib.bib241 "OJBench: a competition level code benchmark for large language models")], and LiveCodeBench (v6)[[27](https://arxiv.org/html/2602.02276v1#bib.bib121 "Livecodebench: holistic and contamination free evaluation of large language models for code")]. 
+*   •Agentic Capabilities: BrowseComp[[68](https://arxiv.org/html/2602.02276v1#bib.bib230 "BrowseComp: a simple yet challenging benchmark for browsing agents")], WideSearch[[69](https://arxiv.org/html/2602.02276v1#bib.bib231 "WideSearch: benchmarking agentic broad info-seeking")],DeepSearchQA[[60](https://arxiv.org/html/2602.02276v1#bib.bib232 "DeepSearchQA: bridging the comprehensiveness gap for deep research agents")], FinSearchComp (T2&T3)[[25](https://arxiv.org/html/2602.02276v1#bib.bib233 "FinSearchComp: towards a realistic, expert-level evaluation of financial search and reasoning")], Seal-0[[45](https://arxiv.org/html/2602.02276v1#bib.bib234 "SealQA: raising the bar for reasoning in search-augmented language models")], GDPVal[[43](https://arxiv.org/html/2602.02276v1#bib.bib235 "GDPval: evaluating AI model performance on real-world economically valuable tasks")]. 
+*   •Image Understanding: (math & reasoning) MMMU-Pro[[76](https://arxiv.org/html/2602.02276v1#bib.bib205 "MMMU-pro: a more robust multi-discipline multimodal understanding benchmark")], MMMU (val)[[75](https://arxiv.org/html/2602.02276v1#bib.bib1 "MMMU: a massive multi-discipline multimodal understanding and reasoning benchmark for expert agi")], CharXiv (RQ)[[67](https://arxiv.org/html/2602.02276v1#bib.bib214 "CharXiv: charting gaps in realistic chart understanding in multimodal llms")], MathVision[[61](https://arxiv.org/html/2602.02276v1#bib.bib206 "Measuring multimodal mathematical reasoning with math-vision dataset")] and MathVista (mini)[[35](https://arxiv.org/html/2602.02276v1#bib.bib213 "MathVista: evaluating mathematical reasoning of foundation models in visual contexts")]; (vision knowledge) SimpleVQA[[12](https://arxiv.org/html/2602.02276v1#bib.bib217 "SimpleVQA: multimodal factuality evaluation for multimodal large language models")] and WorldVQA 2 2 2 https://github.com/MoonshotAI/WorldVQA; (perception) ZeroBench (w/ and w/o tools)[[48](https://arxiv.org/html/2602.02276v1#bib.bib220 "ZeroBench: an impossible visual benchmark for contemporary large multimodal models")], BabyVision[[11](https://arxiv.org/html/2602.02276v1#bib.bib207 "BabyVision: visual reasoning beyond language")], BLINK[[17](https://arxiv.org/html/2602.02276v1#bib.bib2 "BLINK: multimodal large language models can see but not perceive")] and MMVP[[57](https://arxiv.org/html/2602.02276v1#bib.bib3 "Eyes wide shut? exploring the visual shortcomings of multimodal llms")]; (OCR & document) OCRBench[[34](https://arxiv.org/html/2602.02276v1#bib.bib219 "OCRBench: on the hidden mystery of ocr in large multimodal models")], OmniDocBench 1.5[[42](https://arxiv.org/html/2602.02276v1#bib.bib210 "OmniDocBench: benchmarking diverse pdf document parsing with comprehensive annotations")] and InfoVQA[[37](https://arxiv.org/html/2602.02276v1#bib.bib218 "InfographicVQA")]. 
+*   •Video Understanding: VideoMMMU[[24](https://arxiv.org/html/2602.02276v1#bib.bib211 "Video-mmmu: evaluating knowledge acquisition from multi-discipline professional videos")], MMVU[[79](https://arxiv.org/html/2602.02276v1#bib.bib209 "MMVU: measuring expert-level multi-discipline video understanding")], MotionBench[[23](https://arxiv.org/html/2602.02276v1#bib.bib208 "MotionBench: benchmarking and improving fine-grained video motion understanding for vision language models")], Video-MME[[16](https://arxiv.org/html/2602.02276v1#bib.bib212 "Video-mme: the first-ever comprehensive evaluation benchmark of multi-modal llms in video analysis")] (with subtitles), LongVideoBench[[70](https://arxiv.org/html/2602.02276v1#bib.bib215 "LongVideoBench: a benchmark for long-context interleaved video-language understanding")], and LVBench[[62](https://arxiv.org/html/2602.02276v1#bib.bib216 "LVBench: an extreme long video understanding benchmark")]. 
+*   •Computer Use: OSWorld-Verified[[72](https://arxiv.org/html/2602.02276v1#bib.bib5 "Introducing osworld-verified"), [73](https://arxiv.org/html/2602.02276v1#bib.bib4 "OSWorld: benchmarking multimodal agents for open-ended tasks in real computer environments")], and WebArena [[80](https://arxiv.org/html/2602.02276v1#bib.bib250 "WebArena: a realistic web environment for building autonomous agents")]. 
+
+Table 4: Performance comparison of Kimi K2.5 against open-source and proprietary models. Bold denotes the global SOTA; Data points marked with * are taken from our internal evaluations. † refers to their scores of text-only subset.
+
+Proprietary Open Source
+Benchmark Kimi K2.5 Claude Opus 4.5 GPT-5.2 (xhigh)Gemini 3 Pro DeepSeek-V3.2 Qwen3-VL-235B-A22B
+Reasoning & General
+HLE-Full 30.1 30.8 34.5 37.5 25.1†-
+HLE-Full w/ tools 50.2 43.2 45.5 45.8 40.8†-
+AIME 2025 96.1 92.8 100 95.0 93.1-
+HMMT 2025 (Feb)95.4 92.9*99.4 97.3*92.5-
+IMO-AnswerBench 81.8 78.5*86.3 83.1*78.3-
+GPQA-Diamond 87.6 87.0 92.4 91.9 82.4-
+MMLU-Pro 87.1 89.3*86.7*90.1 85.0-
+SimpleQA Verified 36.9 44.1 38.9 72.1 27.5-
+AdvancedIF 75.6 63.1 81.1 74.7 58.8-
+LongBench v2 61.0 64.4*54.5*68.2*59.8*-
+Coding
+SWE-Bench Verified 76.8 80.9 80.0 76.2 73.1-
+SWE-Bench Pro (public)50.7 55.4*55.6---
+SWE-Bench Multilingual 73.0 77.5 72.0 65.0 70.2-
+Terminal Bench 2.0 50.8 59.3 54.0 54.2 46.4-
+PaperBench (CodeDev)63.5 72.9*63.7*-47.1-
+CyberGym 41.3 50.6-39.9*17.3*-
+SciCode 48.7 49.5 52.1 56.1 38.9-
+OJBench (cpp)57.4 54.6*-68.5*54.7*-
+LiveCodeBench (v6)85.0 82.2*-87.4*83.3-
+Agentic
+BrowseComp 60.6 37.0 65.8 37.8 51.4-
+BrowseComp(w/ ctx manage)74.9 57.8 59.2 67.6-
+BrowseComp(Agent Swarm)78.4-----
+WideSearch 72.7 76.2*-57.0 32.5*-
+WideSearch(Agent Swarm)79.0-----
+DeepSearchQA 77.1 76.1*71.3*63.2*60.9*-
+FinSearchCompT2&T3 67.8 66.2*-49.9 59.1*-
+Seal-0 57.4 47.7*45.0 45.5*49.5*-
+GDPVal-AA 41.0 45.0 48.0 35.0 34.0-
+Image
+MMMU-Pro 78.5 74.0 79.5*81.0-69.3
+MMMU (val)84.3 80.7 86.7*87.5*-80.6
+CharXiv (RQ)77.5 67.2*82.1 81.4-66.1
+MathVision 84.2 77.1*83.0 86.1*-74.6
+MathVista (mini)90.1 80.2*82.8*89.8*-85.8
+SimpleVQA 71.2 69.7*55.8*69.7*-56.8*
+WorldVQA 46.3 36.8 28.0 47.4-23.5
+ZeroBench 9 3*9*8*-4*
+ZeroBench w/ tools 11 9*7*12*-3*
+BabyVision 36.5 14.2 34.4 49.7-22.2
+BLINK 78.9 68.8*-78.7*-68.9
+MMVP 87.0 80.0*83.0*90.0*-84.3
+OmniDocBench 1.5 88.8 87.7*85.7 88.5-82.0*
+OCRBench 92.3 86.5*80.7*90.3*-87.5
+InfoVQA (test)92.6 76.9*84*57.2*-89.5
+Video
+VideoMMMU 86.6 84.4*85.9 87.6-80.0
+MMVU 80.4 77.3*80.8*77.5*-71.1
+MotionBench 70.4 60.3*64.8*70.3--
+Video-MME 87.4 77.6*86.0*88.4*-79.0
+LongVideoBench 79.8 67.2*76.5*77.7*-65.6*
+LVBench 75.9 57.3-73.5*-63.6
+Computer Use
+OSWorld-Verified 63.3 66.3 8.6*20.7*-38.1
+WebArena 58.9 63.4*---26.4*
+
+Table 5: Performance and token efficiency of some reasoning models. Average output token counts (in thousands) are shown in parentheses.
+
+Benchmark Kimi K2.5 Kimi K2 Gemini-3.0 DeepSeek-V3.2
+Thinking Pro Thinking
+AIME 2025 96.1 (25k)94.5 (30k)95.0 (15k)93.1 (16k)
+HMMT Feb 2025 95.4 (27k)89.4 (35k)97.3 (16k)92.5 (19k)
+HMMT Nov 2025 91.1 (24k)89.2 (32k)94.5 (15k)90.2 (18k)
+IMO-AnswerBench 81.8 (36k)78.6 (37k)83.1 (18k)78.3 (27k)
+LiveCodeBench 85.0 (18k)82.6 (25k)87.4 (13k)83.3 (16k)
+GPQA Diamond 87.6 (14k)84.5 (13k)91.9 (8k)82.4 (7k)
+HLE-Text 31.5 (24k)23.9 (29k)38.4 (13k)25.1 (21k)
+
+##### Baselines
+
+We benchmark against state-of-the-art proprietary and open-source models. For proprietary models, we compare against Claude Opus 4.5 (with extended thinking) [[4](https://arxiv.org/html/2602.02276v1#bib.bib226 "Claude opus 4.5 system card")], GPT-5.2 (with xhigh reasoning effort) [[41](https://arxiv.org/html/2602.02276v1#bib.bib227 "Introducing gpt 5.2")], and Gemini 3 Pro (with high reasoning-level) [[19](https://arxiv.org/html/2602.02276v1#bib.bib228 "Gemini 3 pro")]. For open-source models, we include DeepSeek-V3.2 (with thinking mode enabled)[[13](https://arxiv.org/html/2602.02276v1#bib.bib247 "DeepSeek-v3.2: pushing the frontier of open large language models")] for text benchmarks, while vision benchmarks report Qwen3-VL-235B-A22B-Thinking[[7](https://arxiv.org/html/2602.02276v1#bib.bib17 "Qwen3-vl technical report")] instead.
+
+##### Evaluation Configurations
+
+Unless otherwise specified, all Kimi K2.5 evaluations use temperature = 1.0, top-p = 0.95, and a context length of 256k tokens. Benchmarks without publicly available scores were re-evaluated under identical conditions and marked with an asterisk (*). The full evaluation settings can be found in appendix[E](https://arxiv.org/html/2602.02276v1#A5 "Appendix E Evaluation Settings ‣ Kimi K2.5: Visual Agentic Intelligence").
+
+#### 5.1.2 Evaluation Results
+
+Comprehensive results comparing Kimi K2.5 against proprietary and open-source baselines are presented in Table[4](https://arxiv.org/html/2602.02276v1#S5.T4 "Table 4 ‣ Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). We highlight key observations across core capability domains:
+
+##### Reasoning and General
+
+Kimi K2.5 achieves competitive performance with top-tier proprietary models on rigorous STEM benchmarks. On Math tasks, AIME 2025, K2.5 scores 96.1%, approaching GPT-5.2’s perfect score while outperforming Claude Opus 4.5 (92.8%) and Gemini 3 Pro (95.0%). This high-level performance extends to the HMMT 2025 (95.4%) and IMO-AnswerBench (81.8%), demonstrating K2.5’s superior reasoning depth. Kimi K2.5 also exhibits remarkable knowledge and scientific reasoning capabilities, scoring 36.9% on SimpleQA Verified, 87.1% on MMLU-Pro and 87.6% on GPQA. Notably, on HLE without the use of tools, K2.5 achieves an HLE-Full score of 30.1%, with component-wise scores of 31.5% on text subset and 21.3% on image subset. When tool-use is enabled, K2.5’s HLE-Full score rises to 50.2%, with 51.8% (text) and 39.8% (image), significantly outperforming Gemini 3 Pro (45.8%) and GPT-5.2 (45.5%). In addition to reasoning and knowledge, K2.5 shows strong instruction-following performance (75.6% on AdvancedIF) and competitive long-context abilities, achieving 61.0% on LongBench v2 compared to both proprietary and open-source models.
+
+##### Complex Coding and Software Engineering
+
+Kimi K2.5 exhibits strong software engineering capabilities, especially on realistic coding and maintenance tasks. It achieves 76.8% on SWE-Bench Verified and 73.0% on SWE-Bench Multilingual, outperforming Gemini 3 Pro while remaining competitive with Claude Opus 4.5 and GPT‑5.2. On LiveCodeBench v6, Kimi K2.5 reaches 85.0%, surpassing DeepSeek‑V3.2 (83.3%) and Claude Opus 4.5 (82.2%), highlighting its robustness on live, continuously updated coding challenges. On TerminalBench 2.0, PaperBench, and SciCode, it scores 50.8%, 63.5%, and 48.7% respectively, demonstrating stable competition‑level performance in automated software engineering and problem solving across diverse domains. In addition, K2.5 attains a score of 41.3 on CyberGym, on the task of finding previously discovered vulnerabilities in real open‑source software projects given only a high‑level description of the weakness, further underscoring its effectiveness in security‑oriented software analysis.
+
+##### Agentic Capabilities
+
+Kimi K2.5 establishes new state-of-the-art performance on complex agentic search and browsing tasks. On BrowseComp, K2.5 achieves 60.6% without context management techniques, 74.9% with Discard-all context management [[13](https://arxiv.org/html/2602.02276v1#bib.bib247 "DeepSeek-v3.2: pushing the frontier of open large language models")] — substantially outperforming GPT-5.2’s reported 65.8%, Claude Opus 4.5 (37.0%) and Gemini 3 Pro (37.8%). Similarly, WideSearch reaches 72.7% on item-f1. On DeepSearchQA (77.1%), FinSearchCompT2&T3 (67.8%) and Seal-0 (57.4%), K2.5 leads all evaluated models, demonstrating superior capacity for agentic deep research, information synthesis, and multi-step tool orchestration.
+
+##### Vision Reasoning, Knowledge and Perception
+
+Kimi K2.5 demonstrates strong visual reasoning and world knowledge capabilities. It scores 78.5% on MMMU-Pro, spanning multi-disciplinary multimodal tasks. For world knowledge question answering, K2.5 achieves 71.2% on SimpleVQA and 46.3% on WorldVQA. For visual reasoning, it achieves 84.2% on MathVision, 90.1% on MathVista (mini), and 36.5% on BabyVision. For OCR and document understanding, K2.5 delivers outstanding results with 77.5% on CharXiv (RQ), 92.3% on OCRBench, 88.8% on OmniDocBench 1.5, and 92.6% on InfoVQA (test). On the challenging ZeroBench, Kimi K2.5 achieves 9% and 11% with tool augmentation, substantially ahead of competing models. On basic visual perception benchmarks BLINK (78.9%) and MMVP (87.0%), we also observe competitive performance of Kimi K2.5, demonstrating its robust real-world visual perceptions.
+
+##### Video Understanding
+
+Kimi K2.5 achieves state-of-the-art performance across diverse video understanding tasks. It attains 86.6% on VideoMMMU and 80.4% on MMVU, rivaling frontier leaderships. With the context-compression and dense temporal understanding abilities of MoonViT-3D, Kimi K2.5 also establishes new global SOTA records in long-video comprehension with 75.9% on LVBench and 79.8% on LongVideoBench by feeding over 2,000 frames, while demonstrating robust dense-motion understanding at 70.4% on the highly-dimensional MotionBench.
+
+##### Computer-Use Capability
+
+Kimi K2.5 demonstrates state-of-the-art computer-use capability on real-world tasks. On the computer-use benchmark OSWorld-Verified[[72](https://arxiv.org/html/2602.02276v1#bib.bib5 "Introducing osworld-verified"), [73](https://arxiv.org/html/2602.02276v1#bib.bib4 "OSWorld: benchmarking multimodal agents for open-ended tasks in real computer environments")], it achieves a 63.3% success rate relying solely on GUI actions without external tools. This substantially outperforms open-source models such as Qwen3-VL-235B-A22B (38.1%) and OpenAI’s computer-use agent framework Operator (o3-based) (42.9%), while remaining competitive with the current leading CUA model, Claude Opus 4.5 (66.3%). On WebArena[[80](https://arxiv.org/html/2602.02276v1#bib.bib250 "WebArena: a realistic web environment for building autonomous agents")], an established benchmark for GUI-based web browsing, Kimi K2.5 achieves a 58.9% success rate, surpassing OpenAI’s Operator (58.1%) and approaching the performance of Claude Opus 4.5 (63.4%).
+
+### 5.2 Agent Swarm Results
+
+##### Benchmarks
+
+To rigorously evaluate the effectiveness of the agent swarm framework, we select three representative benchmarks that collectively cover deep reasoning, large-scale retrieval, and real-world complexity:
+
+*   •BrowseComp: A challenging deep-research benchmark that requires multi-step reasoning and complex information synthesis. 
+*   •WideSearch: A benchmark designed to evaluate the ability to perform broad, multi-step information seeking and reasoning across diverse sources. 
+*   •In-house Swarm Bench: An internally developed Swarm benchmark, designed to evaluate the agent swarm performance under real-world, high-complexity conditions. It covers four domains: WildSearch (unconstrained, real-world information retrieval over the open web), Batch Download (large-scale acquisition of diverse resources), WideRead (large-scale document comprehension involving more than 100 input documents), and Long-Form Writing (coherent generation of extensive content exceeding 100k words). This benchmark incorporates extreme-scale scenarios that stress-test the orchestration, scalability, and coordination capabilities of agent-based systems. 
+
+Table 6: Performance comparison of Kimi K2.5 Agent Swarm against single-agent and proprietary baselines on agentic search benchmarks. Bold denotes the best result per benchmark.
+
+Benchmark K2.5 Agent Swarm Kimi K2.5 Claude Opus 4.5 GPT-5.2 GPT-5.2 Pro
+BrowseComp 78.4 60.6 37.0 65.8 77.9
+WideSearch 79.0 72.7 76.2--
+In-house Swarm Bench 58.3 41.6 45.8--
+
+##### Performance
+
+Table[6](https://arxiv.org/html/2602.02276v1#S5.T6 "Table 6 ‣ Benchmarks ‣ 5.2 Agent Swarm Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence") presents the performance of Kimi K2.5 Agent Swarm against single-agent configurations and proprietary baselines. The results demonstrate substantial performance improvements from multi-agent orchestration. On BrowseComp, Agent Swarm achieves 78.4%, representing a 17.8% absolute gain over the single-agent K2.5 (60.6%) and surpassing even GPT-5.2 Pro (77.9%). Similarly, WideSearch sees a 6.3% improvement (72.7% \to 79.0%) on Item-F1, enabling K2.5 Agent Swarm to outperform Claude Opus 4.5 (76.2%) and establish a new state-of-the-art. The gains are most pronounced on In-house Swarm bench (16.7%), where tasks are explicitly designed to reward parallel decomposition. These consistent improvements across benchmarks validate that Agent Swarm effectively converts computational parallelism into qualitative capability gains, particularly for problems requiring broad exploration, multi-source verification, or simultaneous handling of independent sub-tasks.
+
+![Image 6: Refer to caption](https://arxiv.org/html/2602.02276v1/x4.png)
+
+Figure 6: The word cloud visualizes heterogeneous K2.5-based sub-agents dynamically instantiated by the Orchestrator across tests.
+
+![Image 7: Refer to caption](https://arxiv.org/html/2602.02276v1/x5.png)
+
+Figure 7: Comparison of Kimi K2.5 performance under Agent Swarm and Discard-all context management in BrowseComp.
+
+![Image 8: Refer to caption](https://arxiv.org/html/2602.02276v1/x6.png)
+
+Figure 8: Agent Swarm achieves 3\times–4.5\times faster execution time compared to single-agent baselines as target Item-F1 increases from 30% to 70% in WideSearch testing.
+
+##### Execution Time Savings via Parallelism
+
+Beyond improved task performance, Agent Swarm achieves substantial wall-clock time reductions through parallel subagent execution. On the WideSearch benchmark, it reduces the execution time required to reach target performance by 3\times\sim 4.5\times compared to a single-agent baseline. As shown in Figure[8](https://arxiv.org/html/2602.02276v1#S5.F8 "Figure 8 ‣ Performance ‣ 5.2 Agent Swarm Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"), this efficiency gain scales with task complexity: as the target Item-F1 increases from 30% to 70%, the single agent’s execution time grows from approximately 1.8\times to over 7.0\times the baseline, whereas Agent Swarm maintains near-constant low latency in the range of 0.6\times\sim 1.6\times. These results indicate that Agent Swarm effectively transforms sequential tool invocations into parallel operations, preventing the linear growth in completion time typically observed as task difficulty increases.
+
+##### Dynamic Subagent Creation and Scheduling
+
+Within an agent swarm, subagents are dynamically instantiated rather than pre-defined. Through PARL, the orchestrator learns adaptive policies to create and schedule self-hosted subagents in response to evolving task structures and problem states. Unlike static decomposition approaches, this learned policy enables the Orchestrator to reason about the requisite number, timing, and specialization of subagents based on query. Consequently, a heterogeneous agent group emerges organically from this adaptive allocation strategy (Figure[7](https://arxiv.org/html/2602.02276v1#S5.F7 "Figure 7 ‣ Performance ‣ 5.2 Agent Swarm Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence")).
+
+##### Agent Swarm as Proactive Context Management
+
+Beyond better performance and runtime acceleration, an agent swarm is a kind of proactive and intelligent context management enabled by multi-agent architecture [[6](https://arxiv.org/html/2602.02276v1#bib.bib223 "Building multi-agent systems: when and how to use them")]. This approach differs from test-time context truncation strategies such as Hide-Tool-Result [[2](https://arxiv.org/html/2602.02276v1#bib.bib224 "Kimi-researcher end-to-end rl training for emerging agentic capabilities")], Summary [[71](https://arxiv.org/html/2602.02276v1#bib.bib248 "ReSum: unlocking long-horizon search intelligence via context summarization")], or Discard-all [[13](https://arxiv.org/html/2602.02276v1#bib.bib247 "DeepSeek-v3.2: pushing the frontier of open large language models")], which react to context overflow by compressing or discarding accumulated histories. While effective at reducing token usage, these methods are inherently reactive and often sacrifice structural information or intermediate reasoning.
+
+In contrast, Agent Swarm enables proactive context control through explicit orchestration. Long-horizon tasks are decomposed into parallel, semantically isolated subtasks, each executed by a specialized subagent with a bounded local context. Crucially, these subagents maintain independent working memories and perform local reasoning without directly mutating or contaminating the global context of the central orchestrator. Only task-relevant outputs—rather than full interaction traces—are selectively routed back to the orchestrator. This design induces context sharding rather than context truncation, allowing the system to scale effective context length along an additional architectural dimension while preserving modularity, information locality, and reasoning integrity.
+
+As shown in Figure[7](https://arxiv.org/html/2602.02276v1#S5.F7 "Figure 7 ‣ Performance ‣ 5.2 Agent Swarm Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"), this proactive strategy outperforms Discard-all in both efficiency and accuracy on BrowseComp. By preserving task-level coherence at the orchestrator level while keeping subagent contexts tightly bounded, Agent Swarm enables parallel execution with selective context persistence, retaining only high-level coordination signals or essential intermediate results. Consequently, Agent Swarm operates as an active, structured context manager, achieving higher accuracy with substantially fewer critical steps than uniform context truncation.
+
+## 6 Conclusions
+
+Kimi K2.5 shows that scalable and general agentic intelligence can be achieved through joint optimization of text and vision together with parallel agent execution. By unifying language and vision across pre-training and reinforcement learning, the model achieves strong cross-modal alignment and visual–text reasoning. Agent Swarm enables concurrent execution of heterogeneous sub-tasks, reducing inference latency while improving performance on complex agentic workloads. Grounded in vision–text intelligence and agent swarms, Kimi K2.5 demonstrates strong performance on benchmarks and real-world tasks. By open-sourcing the post-trained checkpoints, we aim to support the open-source community in building scalable and general-purpose agentic systems and to accelerate progress toward General Agentic Intelligence.
+
+## References
+
+*   [1]M. AI (2025)Introducing kimi k2 thinking. External Links: [Link](https://moonshotai.github.io/Kimi-K2/thinking.html)Cited by: [§1](https://arxiv.org/html/2602.02276v1#S1.p1.1 "1 Introduction ‣ Kimi K2.5: Visual Agentic Intelligence"), [§1](https://arxiv.org/html/2602.02276v1#S1.p6.1 "1 Introduction ‣ Kimi K2.5: Visual Agentic Intelligence"), [§4.4.2](https://arxiv.org/html/2602.02276v1#S4.SS4.SSS2.Px4.p4.1 "Token Efficient Reinforcement Learning ‣ 4.4.2 Reinforcement Learning ‣ 4.4 Post-Training ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [2]M. AI (2025)Kimi-researcher end-to-end rl training for emerging agentic capabilities. External Links: [Link](https://moonshotai.github.io/Kimi-Researcher/)Cited by: [§1](https://arxiv.org/html/2602.02276v1#S1.p7.1 "1 Introduction ‣ Kimi K2.5: Visual Agentic Intelligence"), [§5.2](https://arxiv.org/html/2602.02276v1#S5.SS2.SSS0.Px5.p1.1 "Agent Swarm as Proactive Context Management ‣ 5.2 Agent Swarm Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [3]Amazon Web Services (2023)Amazon simple storage service (amazon s3). Note: WebAvailable at: [https://aws.amazon.com/s3/](https://aws.amazon.com/s3/)External Links: [Link](https://aws.amazon.com/s3/)Cited by: [§C.1](https://arxiv.org/html/2602.02276v1#A3.SS1.p1.1 "C.1 Data Storage and Loading ‣ Appendix C Infra ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [4]Anthropic (2025)Claude opus 4.5 system card. External Links: [Link](https://www-cdn.anthropic.com/bf10f64990cfda0ba858290be7b8cc6317685f47.pdf)Cited by: [§E.7](https://arxiv.org/html/2602.02276v1#A5.SS7.SSS0.Px1.p1.5 "Hyperparameter Settings. ‣ E.7 Computer-Use Evaluation ‣ Appendix E Evaluation Settings ‣ Kimi K2.5: Visual Agentic Intelligence"), [§1](https://arxiv.org/html/2602.02276v1#S1.p1.1 "1 Introduction ‣ Kimi K2.5: Visual Agentic Intelligence"), [§3](https://arxiv.org/html/2602.02276v1#S3.p1.1 "3 Agent Swarm ‣ Kimi K2.5: Visual Agentic Intelligence"), [§5.1.1](https://arxiv.org/html/2602.02276v1#S5.SS1.SSS1.Px2.p1.1 "Baselines ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [5]Anthropic (2025)How we built our multi-agent research system. External Links: [Link](https://www.anthropic.com/engineering/multi-agent-research-system)Cited by: [§3](https://arxiv.org/html/2602.02276v1#S3.p1.1 "3 Agent Swarm ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [6]Anthropic (2026)Building multi-agent systems: when and how to use them. External Links: [Link](https://claude.com/blog/building-multi-agent-systems-when-and-how-to-use-them)Cited by: [§3](https://arxiv.org/html/2602.02276v1#S3.p1.1 "3 Agent Swarm ‣ Kimi K2.5: Visual Agentic Intelligence"), [§5.2](https://arxiv.org/html/2602.02276v1#S5.SS2.SSS0.Px5.p1.1 "Agent Swarm as Proactive Context Management ‣ 5.2 Agent Swarm Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [7]S. Bai, Y. Cai, R. Chen, K. Chen, X. Chen, Z. Cheng, L. Deng, W. Ding, C. Gao, C. Ge, W. Ge, Z. Guo, Q. Huang, J. Huang, F. Huang, B. Hui, S. Jiang, Z. Li, M. Li, M. Li, K. Li, Z. Lin, J. Lin, X. Liu, J. Liu, C. Liu, Y. Liu, D. Liu, S. Liu, D. Lu, R. Luo, C. Lv, R. Men, L. Meng, X. Ren, X. Ren, S. Song, Y. Sun, J. Tang, J. Tu, J. Wan, P. Wang, P. Wang, Q. Wang, Y. Wang, T. Xie, Y. Xu, H. Xu, J. Xu, Z. Yang, M. Yang, J. Yang, A. Yang, B. Yu, F. Zhang, H. Zhang, X. Zhang, B. Zheng, H. Zhong, J. Zhou, F. Zhou, J. Zhou, Y. Zhu, and K. Zhu (2025)Qwen3-vl technical report. External Links: 2511.21631, [Link](https://arxiv.org/abs/2511.21631)Cited by: [§1](https://arxiv.org/html/2602.02276v1#S1.p3.1 "1 Introduction ‣ Kimi K2.5: Visual Agentic Intelligence"), [§2.1](https://arxiv.org/html/2602.02276v1#S2.SS1.p1.1 "2.1 Native Multimodal Pre-Training ‣ 2 Joint Optimization of Text and Vision ‣ Kimi K2.5: Visual Agentic Intelligence"), [§2.2](https://arxiv.org/html/2602.02276v1#S2.SS2.p1.1 "2.2 Zero-Vision SFT ‣ 2 Joint Optimization of Text and Vision ‣ Kimi K2.5: Visual Agentic Intelligence"), [§5.1.1](https://arxiv.org/html/2602.02276v1#S5.SS1.SSS1.Px2.p1.1 "Baselines ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [8]Y. Bai, S. Tu, J. Zhang, H. Peng, X. Wang, X. Lv, S. Cao, J. Xu, L. Hou, Y. Dong, J. Tang, and J. Li (2025)LongBench v2: towards deeper understanding and reasoning on realistic long-context multitasks. External Links: 2412.15204, [Link](https://arxiv.org/abs/2412.15204)Cited by: [§E.3](https://arxiv.org/html/2602.02276v1#A5.SS3.SSS0.Px2.p1.1 "LongBench v2. ‣ E.3 Text Benchmarks ‣ Appendix E Evaluation Settings ‣ Kimi K2.5: Visual Agentic Intelligence"), [1st item](https://arxiv.org/html/2602.02276v1#S5.I1.i1.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [9]G. Brockman, V. Cheung, L. Pettersson, J. Schneider, J. Schulman, J. Tang, and W. Zaremba (2016)OpenAI gym. External Links: 1606.01540, [Link](https://arxiv.org/abs/1606.01540)Cited by: [Appendix D](https://arxiv.org/html/2602.02276v1#A4.SS0.SSS0.Px1.p1.2 "Environment ‣ Appendix D Unified Agentic Reinforcement Learning Environment ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [10]T. B. Brown, B. Mann, N. Ryder, M. Subbiah, J. Kaplan, P. Dhariwal, A. Neelakantan, P. Shyam, G. Sastry, A. Askell, S. Agarwal, A. Herbert-Voss, G. Krueger, T. Henighan, R. Child, A. Ramesh, D. M. Ziegler, J. Wu, C. Winter, C. Hesse, M. Chen, E. Sigler, M. Litwin, S. Gray, B. Chess, J. Clark, C. Berner, S. McCandlish, A. Radford, I. Sutskever, and D. Amodei (2020)Language models are few-shot learners. External Links: 2005.14165, [Link](https://arxiv.org/abs/2005.14165)Cited by: [§B.3](https://arxiv.org/html/2602.02276v1#A2.SS3.p2.1 "B.3 Vision data ‣ Appendix B Pre-training ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [11]L. Chen, W. Xie, Y. Liang, H. He, H. Zhao, Z. Yang, Z. Huang, H. Wu, H. Lu, Y. charles, Y. Bao, Y. Fan, G. Li, H. Shen, X. Chen, W. Xu, S. Si, Z. Cai, W. Chai, Z. Huang, F. Liu, T. Liu, B. Chang, X. Hu, K. Chen, Y. Ren, Y. Liu, Y. Gong, and K. Li (2026)BabyVision: visual reasoning beyond language. External Links: 2601.06521, [Link](https://arxiv.org/abs/2601.06521)Cited by: [4th item](https://arxiv.org/html/2602.02276v1#S5.I1.i4.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [12]X. Cheng, W. Zhang, S. Zhang, J. Yang, X. Guan, X. Wu, X. Li, G. Zhang, J. Liu, Y. Mai, Y. Zeng, Z. Wen, K. Jin, B. Wang, W. Zhou, Y. Lu, T. Li, W. Huang, and Z. Li (2025)SimpleVQA: multimodal factuality evaluation for multimodal large language models. External Links: 2502.13059, [Link](https://arxiv.org/abs/2502.13059)Cited by: [4th item](https://arxiv.org/html/2602.02276v1#S5.I1.i4.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [13]DeepSeek-AI, A. Liu, A. Mei, B. Lin, B. Xue, B. Wang, B. Xu, B. Wu, B. Zhang, C. Lin, C. Dong, C. Lu, C. Zhao, C. Deng, C. Xu, C. Ruan, D. Dai, D. Guo, D. Yang, D. Chen, E. Li, F. Zhou, F. Lin, F. Dai, G. Hao, G. Chen, G. Li, H. Zhang, H. Xu, H. Li, H. Liang, H. Wei, H. Zhang, H. Luo, H. Ji, H. Ding, H. Tang, H. Cao, H. Gao, H. Qu, H. Zeng, J. Huang, J. Li, J. Xu, J. Hu, J. Chen, J. Xiang, J. Yuan, J. Cheng, J. Zhu, J. Ran, J. Jiang, J. Qiu, J. Li, J. Song, K. Dong, K. Gao, K. Guan, K. Huang, K. Zhou, K. Huang, K. Yu, L. Wang, L. Zhang, L. Wang, L. Zhao, L. Yin, L. Guo, L. Luo, L. Ma, L. Wang, L. Zhang, M. S. Di, M. Y. Xu, M. Zhang, M. Zhang, M. Tang, M. Zhou, P. Huang, P. Cong, P. Wang, Q. Wang, Q. Zhu, Q. Li, Q. Chen, Q. Du, R. Xu, R. Ge, R. Zhang, R. Pan, R. Wang, R. Yin, R. Xu, R. Shen, R. Zhang, S. H. Liu, S. Lu, S. Zhou, S. Chen, S. Cai, S. Chen, S. Hu, S. Liu, S. Hu, S. Ma, S. Wang, S. Yu, S. Zhou, S. Pan, S. Zhou, T. Ni, T. Yun, T. Pei, T. Ye, T. Yue, W. Zeng, W. Liu, W. Liang, W. Pang, W. Luo, W. Gao, W. Zhang, X. Gao, X. Wang, X. Bi, X. Liu, X. Wang, X. Chen, X. Zhang, X. Nie, X. Cheng, X. Liu, X. Xie, X. Liu, X. Yu, X. Li, X. Yang, X. Li, X. Chen, X. Su, X. Pan, X. Lin, X. Fu, Y. Q. Wang, Y. Zhang, Y. Xu, Y. Ma, Y. Li, Y. Li, Y. Zhao, Y. Sun, Y. Wang, Y. Qian, Y. Yu, Y. Zhang, Y. Ding, Y. Shi, Y. Xiong, Y. He, Y. Zhou, Y. Zhong, Y. Piao, Y. Wang, Y. Chen, Y. Tan, Y. Wei, Y. Ma, Y. Liu, Y. Yang, Y. Guo, Y. Wu, Y. Wu, Y. Cheng, Y. Ou, Y. Xu, Y. Wang, Y. Gong, Y. Wu, Y. Zou, Y. Li, Y. Xiong, Y. Luo, Y. You, Y. Liu, Y. Zhou, Z. F. Wu, Z. Z. Ren, Z. Zhao, Z. Ren, Z. Sha, Z. Fu, Z. Xu, Z. Xie, Z. Zhang, Z. Hao, Z. Gou, Z. Ma, Z. Yan, Z. Shao, Z. Huang, Z. Wu, Z. Li, Z. Zhang, Z. Xu, Z. Wang, Z. Gu, Z. Zhu, Z. Li, Z. Zhang, Z. Xie, Z. Gao, Z. Pan, Z. Yao, B. Feng, H. Li, J. L. Cai, J. Ni, L. Xu, M. Li, N. Tian, R. J. Chen, R. L. Jin, S. S. Li, S. Zhou, T. Sun, X. Q. Li, X. Jin, X. Shen, X. Chen, X. Song, X. Zhou, Y. X. Zhu, Y. Huang, Y. Li, Y. Zheng, Y. Zhu, Y. Ma, Z. Huang, Z. Xu, Z. Zhang, D. Ji, J. Liang, J. Guo, J. Chen, L. Xia, M. Wang, M. Li, P. Zhang, R. Chen, S. Sun, S. Wu, S. Ye, T. Wang, W. L. Xiao, W. An, X. Wang, X. Sun, X. Wang, Y. Tang, Y. Zha, Z. Zhang, Z. Ju, Z. Zhang, and Z. Qu (2025)DeepSeek-v3.2: pushing the frontier of open large language models. External Links: 2512.02556, [Link](https://arxiv.org/abs/2512.02556)Cited by: [§5.1.1](https://arxiv.org/html/2602.02276v1#S5.SS1.SSS1.Px2.p1.1 "Baselines ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"), [§5.1.2](https://arxiv.org/html/2602.02276v1#S5.SS1.SSS2.Px3.p1.1 "Agentic Capabilities ‣ 5.1.2 Evaluation Results ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"), [§5.2](https://arxiv.org/html/2602.02276v1#S5.SS2.SSS0.Px5.p1.1 "Agent Swarm as Proactive Context Management ‣ 5.2 Agent Swarm Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [14]M. Dehghani, B. Mustafa, J. Djolonga, J. Heek, M. Minderer, M. Caron, A. Steiner, J. Puigcerver, R. Geirhos, I. Alabdulmohsin, A. Oliver, P. Padlewski, A. Gritsenko, M. Lučić, and N. Houlsby (2023)Patch n’ pack: navit, a vision transformer for any aspect ratio and resolution. External Links: 2307.06304, [Link](https://arxiv.org/abs/2307.06304)Cited by: [§1](https://arxiv.org/html/2602.02276v1#S1.p4.1 "1 Introduction ‣ Kimi K2.5: Visual Agentic Intelligence"), [§4.2](https://arxiv.org/html/2602.02276v1#S4.SS2.SSS0.Px1.p1.1 "MoonViT-3D: Shared Embedding Space for Images and Videos ‣ 4.2 Model Architecture ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [15]X. Deng, J. Da, E. Pan, Y. Y. He, C. Ide, K. Garg, N. Lauffer, A. Park, N. Pasari, C. Rane, et al. (2025)SWE-bench pro: can ai agents solve long-horizon software engineering tasks?. arXiv preprint arXiv:2509.16941. Cited by: [2nd item](https://arxiv.org/html/2602.02276v1#S5.I1.i2.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [16]C. Fu, Y. Dai, Y. Luo, L. Li, S. Ren, R. Zhang, Z. Wang, C. Zhou, Y. Shen, M. Zhang, P. Chen, Y. Li, S. Lin, S. Zhao, K. Li, T. Xu, X. Zheng, E. Chen, C. Shan, R. He, and X. Sun (2025)Video-mme: the first-ever comprehensive evaluation benchmark of multi-modal llms in video analysis. External Links: 2405.21075, [Link](https://arxiv.org/abs/2405.21075)Cited by: [5th item](https://arxiv.org/html/2602.02276v1#S5.I1.i5.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [17]X. Fu, Y. Hu, B. Li, Y. Feng, H. Wang, X. Lin, D. Roth, N. A. Smith, W. Ma, and R. Krishna (2024)BLINK: multimodal large language models can see but not perceive. External Links: 2404.12390, [Link](https://arxiv.org/abs/2404.12390)Cited by: [4th item](https://arxiv.org/html/2602.02276v1#S5.I1.i4.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [18]S. Y. Gadre, G. Ilharco, A. Fang, J. Hayase, G. Smyrnis, T. Nguyen, R. Marten, M. Wortsman, D. Ghosh, J. Zhang, et al. (2024)Datacomp: in search of the next generation of multimodal datasets. Advances in Neural Information Processing Systems 36. Cited by: [§B.3](https://arxiv.org/html/2602.02276v1#A2.SS3.p1.1 "B.3 Vision data ‣ Appendix B Pre-training ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [19]Google (2025)Gemini 3 pro. External Links: [Link](https://deepmind.google/models/gemini/pro/)Cited by: [§1](https://arxiv.org/html/2602.02276v1#S1.p1.1 "1 Introduction ‣ Kimi K2.5: Visual Agentic Intelligence"), [§5.1.1](https://arxiv.org/html/2602.02276v1#S5.SS1.SSS1.Px2.p1.1 "Baselines ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [20]D. Guo, F. Wu, F. Zhu, F. Leng, G. Shi, H. Chen, H. Fan, J. Wang, J. Jiang, J. Wang, J. Chen, J. Huang, K. Lei, L. Yuan, L. Luo, P. Liu, Q. Ye, R. Qian, S. Yan, S. Zhao, S. Peng, S. Li, S. Yuan, S. Wu, T. Cheng, W. Liu, W. Wang, X. Zeng, X. Liu, X. Qin, X. Ding, X. Xiao, X. Zhang, X. Zhang, X. Xiong, Y. Peng, Y. Chen, Y. Li, Y. Hu, Y. Lin, Y. Hu, Y. Zhang, Y. Wu, Y. Li, Y. Liu, Y. Ling, Y. Qin, Z. Wang, Z. He, A. Zhang, B. Yi, B. Liao, C. Huang, C. Zhang, C. Deng, C. Deng, C. Lin, C. Yuan, C. Li, C. Gou, C. Lou, C. Wei, C. Liu, C. Li, D. Zhu, D. Zhong, F. Li, F. Zhang, G. Wu, G. Li, G. Xiao, H. Lin, H. Yang, H. Wang, H. Ji, H. Hao, H. Shen, H. Li, J. Li, J. Wu, J. Zhu, J. Jiao, J. Feng, J. Chen, J. Duan, J. Liu, J. Zeng, J. Tang, J. Sun, J. Chen, J. Long, J. Feng, J. Zhan, J. Fang, J. Lu, K. Hua, K. Liu, K. Shen, K. Zhang, K. Shen, K. Wang, K. Pan, K. Zhang, K. Li, L. Li, L. Li, L. Shi, L. Han, L. Xiang, L. Chen, L. Chen, L. Li, L. Yan, L. Chi, L. Liu, M. Du, M. Wang, N. Pan, P. Chen, P. Chen, P. Wu, Q. Yuan, Q. Shuai, Q. Tao, R. Zheng, R. Zhang, R. Zhang, R. Wang, R. Yang, R. Zhao, S. Xu, S. Liang, S. Yan, S. Zhong, S. Cao, S. Wu, S. Liu, S. Chang, S. Cai, T. Ao, T. Yang, T. Zhang, W. Zhong, W. Jia, W. Weng, W. Yu, W. Huang, W. Zhu, W. Yang, W. Wang, X. Long, X. Yin, X. Li, X. Zhu, X. Jia, X. Zhang, X. Liu, X. Zhang, X. Yang, X. Luo, X. Chen, X. Zhong, X. Xiao, X. Li, Y. Wu, Y. Wen, Y. Du, Y. Zhang, Y. Ye, Y. Wu, Y. Liu, Y. Yue, Y. Zhou, Y. Yuan, Y. Xu, Y. Yang, Y. Zhang, Y. Fang, Y. Li, Y. Ren, Y. Xiong, Z. Hong, Z. Wang, Z. Sun, Z. Wang, Z. Cai, Z. Zha, Z. An, Z. Zhao, Z. Xu, Z. Chen, Z. Wu, Z. Zheng, Z. Wang, Z. Huang, Z. Zhu, and Z. Song (2025)Seed1.5-vl technical report. External Links: 2505.07062, [Link](https://arxiv.org/abs/2505.07062)Cited by: [§1](https://arxiv.org/html/2602.02276v1#S1.p3.1 "1 Introduction ‣ Kimi K2.5: Visual Agentic Intelligence"), [§2.1](https://arxiv.org/html/2602.02276v1#S2.SS1.p1.1 "2.1 Native Multimodal Pre-Training ‣ 2 Joint Optimization of Text and Vision ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [21]L. Haas, G. Yona, G. D’Antonio, S. Goldshtein, and D. Das (2025)SimpleQA verified: a reliable factuality benchmark to measure parametric knowledge. External Links: 2509.07968, [Link](https://arxiv.org/abs/2509.07968)Cited by: [1st item](https://arxiv.org/html/2602.02276v1#S5.I1.i1.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [22]Y. He, W. Li, H. Zhang, S. Li, K. Mandyam, S. Khosla, Y. Xiong, N. Wang, X. Peng, B. Li, S. Bi, S. G. Patil, Q. Qi, S. Feng, J. Katz-Samuels, R. Y. Pang, S. Gonugondla, H. Lang, Y. Yu, Y. Qian, M. Fazel-Zarandi, L. Yu, A. Benhalloum, H. Awadalla, and M. Faruqui (2025)AdvancedIF: rubric-based benchmarking and reinforcement learning for advancing llm instruction following. External Links: 2511.10507, [Link](https://arxiv.org/abs/2511.10507)Cited by: [1st item](https://arxiv.org/html/2602.02276v1#S5.I1.i1.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [23]W. Hong, Y. Cheng, Z. Yang, W. Wang, L. Wang, X. Gu, S. Huang, Y. Dong, and J. Tang (2025)MotionBench: benchmarking and improving fine-grained video motion understanding for vision language models. External Links: 2501.02955, [Link](https://arxiv.org/abs/2501.02955)Cited by: [5th item](https://arxiv.org/html/2602.02276v1#S5.I1.i5.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [24]K. Hu, P. Wu, F. Pu, W. Xiao, Y. Zhang, X. Yue, B. Li, and Z. Liu (2025)Video-mmmu: evaluating knowledge acquisition from multi-discipline professional videos. External Links: 2501.13826, [Link](https://arxiv.org/abs/2501.13826)Cited by: [5th item](https://arxiv.org/html/2602.02276v1#S5.I1.i5.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [25]L. Hu, J. Jiao, J. Liu, Y. Ren, Z. Wen, K. Zhang, X. Zhang, X. Gao, T. He, F. Hu, Y. Liao, Z. Wang, C. Yang, Q. Yang, M. Yin, Z. Zeng, G. Zhang, X. Zhang, X. Zhao, Z. Zhu, H. Namkoong, W. Huang, and Y. Tang (2025)FinSearchComp: towards a realistic, expert-level evaluation of financial search and reasoning. External Links: 2509.13160, [Link](https://arxiv.org/abs/2509.13160)Cited by: [3rd item](https://arxiv.org/html/2602.02276v1#S5.I1.i3.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [26]Y. Huang, Y. Cheng, A. Bapna, O. Firat, M. X. Chen, D. Chen, H. Lee, J. Ngiam, Q. V. Le, Y. Wu, and Z. Chen (2019)GPipe: efficient training of giant neural networks using pipeline parallelism. External Links: 1811.06965, [Link](https://arxiv.org/abs/1811.06965)Cited by: [Appendix C](https://arxiv.org/html/2602.02276v1#A3.p1.1 "Appendix C Infra ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [27]N. Jain, K. Han, A. Gu, W. Li, F. Yan, T. Zhang, S. Wang, A. Solar-Lezama, K. Sen, and I. Stoica (2024)Livecodebench: holistic and contamination free evaluation of large language models for code. arXiv preprint arXiv:2403.07974. Cited by: [2nd item](https://arxiv.org/html/2602.02276v1#S5.I1.i2.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [28]C. E. Jimenez, J. Yang, A. Wettig, S. Yao, K. Pei, O. Press, and K. Narasimhan (2023)Swe-bench: can language models resolve real-world github issues?. arXiv preprint arXiv:2310.06770. Cited by: [2nd item](https://arxiv.org/html/2602.02276v1#S5.I1.i2.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [29]K. Jordan, Y. Jin, V. Boza, J. You, F. Cesista, L. Newhouse, and J. Bernstein (2024)Muon: an optimizer for hidden layers in neural networks. External Links: [Link](https://kellerjordan.github.io/posts/muon/)Cited by: [§4.1](https://arxiv.org/html/2602.02276v1#S4.SS1.p1.1 "4.1 Foundation: Kimi K2 Base Model ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"), [§4.4.2](https://arxiv.org/html/2602.02276v1#S4.SS4.SSS2.Px1.p2.1 "Policy Optimization ‣ 4.4.2 Reinforcement Learning ‣ 4.4 Post-Training ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [30]Kimi Team (2025)Kimi k1. 5: scaling reinforcement learning with llms. arXiv preprint arXiv:2501.12599. Cited by: [Appendix D](https://arxiv.org/html/2602.02276v1#A4.SS0.SSS0.Px1.p2.1 "Environment ‣ Appendix D Unified Agentic Reinforcement Learning Environment ‣ Kimi K2.5: Visual Agentic Intelligence"), [§4.4.2](https://arxiv.org/html/2602.02276v1#S4.SS4.SSS2.Px1.p2.1 "Policy Optimization ‣ 4.4.2 Reinforcement Learning ‣ 4.4 Post-Training ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"), [§4.4.2](https://arxiv.org/html/2602.02276v1#S4.SS4.SSS2.Px4.p1.1 "Token Efficient Reinforcement Learning ‣ 4.4.2 Reinforcement Learning ‣ 4.4 Post-Training ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [31]H. Laurençon, L. Saulnier, L. Tronchon, S. Bekman, A. Singh, A. Lozhkov, T. Wang, S. Karamcheti, A. Rush, D. Kiela, et al. (2024)Obelics: an open web-scale filtered dataset of interleaved image-text documents. Advances in Neural Information Processing Systems 36. Cited by: [§B.3](https://arxiv.org/html/2602.02276v1#A2.SS3.p1.1 "B.3 Vision data ‣ Appendix B Pre-training ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [32]D. Lepikhin, H. Lee, Y. Xu, D. Chen, O. Firat, Y. Huang, M. Krikun, N. Shazeer, and Z. Chen (2020)Gshard: scaling giant models with conditional computation and automatic sharding. arXiv preprint arXiv:2006.16668. Cited by: [Appendix C](https://arxiv.org/html/2602.02276v1#A3.p1.1 "Appendix C Infra ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [33]J. Liu, J. Su, X. Yao, Z. Jiang, G. Lai, Y. Du, Y. Qin, W. Xu, E. Lu, J. Yan, et al. (2025)Muon is scalable for llm training. arXiv preprint arXiv:2502.16982. Cited by: [§4.1](https://arxiv.org/html/2602.02276v1#S4.SS1.p1.1 "4.1 Foundation: Kimi K2 Base Model ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"), [§4.3](https://arxiv.org/html/2602.02276v1#S4.SS3.SSS0.Px1.p1.1 "ViT Training Stage ‣ 4.3 Pre-training Pipeline ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"), [§4.4.2](https://arxiv.org/html/2602.02276v1#S4.SS4.SSS2.Px1.p2.1 "Policy Optimization ‣ 4.4.2 Reinforcement Learning ‣ 4.4 Post-Training ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [34]Y. Liu, Z. Li, M. Huang, B. Yang, W. Yu, C. Li, X. Yin, C. Liu, L. Jin, and X. Bai (2024-12)OCRBench: on the hidden mystery of ocr in large multimodal models. Science China Information Sciences 67 (12). External Links: ISSN 1869-1919, [Link](http://dx.doi.org/10.1007/s11432-024-4235-6), [Document](https://dx.doi.org/10.1007/s11432-024-4235-6)Cited by: [4th item](https://arxiv.org/html/2602.02276v1#S5.I1.i4.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [35]P. Lu, H. Bansal, T. Xia, J. Liu, C. Li, H. Hajishirzi, H. Cheng, K. Chang, M. Galley, and J. Gao (2024)MathVista: evaluating mathematical reasoning of foundation models in visual contexts. External Links: 2310.02255, [Link](https://arxiv.org/abs/2310.02255)Cited by: [4th item](https://arxiv.org/html/2602.02276v1#S5.I1.i4.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [36]T. Luong, D. Hwang, H. H. Nguyen, G. Ghiasi, Y. Chervonyi, I. Seo, J. Kim, G. Bingham, J. Lee, S. Mishra, A. Zhai, H. Hu, H. Michalewski, J. Kim, J. Ahn, J. Bae, X. Song, T. H. Trinh, Q. V. Le, and J. Jung (2025-11)Towards robust mathematical reasoning. In Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing, C. Christodoulopoulos, T. Chakraborty, C. Rose, and V. Peng (Eds.), Suzhou, China,  pp.35418–35442. External Links: [Link](https://aclanthology.org/2025.emnlp-main.1794/), [Document](https://dx.doi.org/10.18653/v1/2025.emnlp-main.1794), ISBN 979-8-89176-332-6 Cited by: [1st item](https://arxiv.org/html/2602.02276v1#S5.I1.i1.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [37]M. Mathew, V. Bagal, R. P. Tito, D. Karatzas, E. Valveny, and C. V. Jawahar (2021)InfographicVQA. External Links: 2104.12756, [Link](https://arxiv.org/abs/2104.12756)Cited by: [4th item](https://arxiv.org/html/2602.02276v1#S5.I1.i4.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [38]M. A. Merrill, A. G. Shaw, N. Carlini, B. Li, H. Raj, I. Bercovich, L. Shi, J. Y. Shin, T. Walshe, E. K. Buchanan, et al. (2026)Terminal-bench: benchmarking agents on hard, realistic tasks in command line interfaces. arXiv preprint arXiv:2601.11868. Cited by: [2nd item](https://arxiv.org/html/2602.02276v1#S5.I1.i2.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [39]D. Narayanan, M. Shoeybi, J. Casper, P. LeGresley, M. Patwary, V. A. Korthikanti, D. Vainbrand, P. Kashinkunti, J. Bernauer, B. Catanzaro, A. Phanishayee, and M. Zaharia (2021)Efficient large-scale language model training on gpu clusters using megatron-lm. External Links: 2104.04473, [Link](https://arxiv.org/abs/2104.04473)Cited by: [Appendix C](https://arxiv.org/html/2602.02276v1#A3.p1.1 "Appendix C Infra ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [40]M. A. of America (2025)2025 american invitational mathematics examination i. Note: Held on February 6, 2025 External Links: [Link](https://artofproblemsolving.com/wiki/index.php/2025_AIME_I)Cited by: [1st item](https://arxiv.org/html/2602.02276v1#S5.I1.i1.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [41]OpenAI (2025)Introducing gpt 5.2. External Links: [Link](https://openai.com/index/introducing-gpt-5-2/)Cited by: [§1](https://arxiv.org/html/2602.02276v1#S1.p1.1 "1 Introduction ‣ Kimi K2.5: Visual Agentic Intelligence"), [§5.1.1](https://arxiv.org/html/2602.02276v1#S5.SS1.SSS1.Px2.p1.1 "Baselines ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [42]L. Ouyang, Y. Qu, H. Zhou, J. Zhu, R. Zhang, Q. Lin, B. Wang, Z. Zhao, M. Jiang, X. Zhao, J. Shi, F. Wu, P. Chu, M. Liu, Z. Li, C. Xu, B. Zhang, B. Shi, Z. Tu, and C. He (2025)OmniDocBench: benchmarking diverse pdf document parsing with comprehensive annotations. External Links: 2412.07626, [Link](https://arxiv.org/abs/2412.07626)Cited by: [4th item](https://arxiv.org/html/2602.02276v1#S5.I1.i4.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [43]T. Patwardhan, R. Dias, E. Proehl, G. Kim, M. Wang, O. Watkins, S. P. Fishman, M. Aljubeh, P. Thacker, L. Fauconnet, N. S. Kim, P. Chao, S. Miserendino, G. Chabot, D. Li, M. Sharman, A. Barr, A. Glaese, and J. Tworek (2025)GDPval: evaluating AI model performance on real-world economically valuable tasks. External Links: 2510.04374, [Link](https://arxiv.org/abs/2510.04374)Cited by: [3rd item](https://arxiv.org/html/2602.02276v1#S5.I1.i3.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [44]B. Peng, J. Quesnelle, H. Fan, and E. Shippole (2023)Yarn: efficient context window extension of large language models. arXiv preprint arXiv:2309.00071. Cited by: [§4.3](https://arxiv.org/html/2602.02276v1#S4.SS3.SSS0.Px2.p1.1 "Joint Training Stages ‣ 4.3 Pre-training Pipeline ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [45]T. Pham, N. Nguyen, P. Zunjare, W. Chen, Y. Tseng, and T. Vu (2025)SealQA: raising the bar for reasoning in search-augmented language models. Note: Seal-0 is the main subset of this benchmark External Links: 2506.01062, [Link](https://arxiv.org/abs/2506.01062)Cited by: [3rd item](https://arxiv.org/html/2602.02276v1#S5.I1.i3.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [46]L. Phan, A. Gatti, Z. Han, N. Li, J. Hu, H. Zhang, C. B. C. Zhang, M. Shaaban, J. Ling, S. Shi, M. Choi, A. Agrawal, A. Chopra, A. Khoja, R. Kim, R. Ren, J. Hausenloy, O. Zhang, M. Mazeika, D. Dodonov, T. Nguyen, J. Lee, D. Anderson, M. Doroshenko, A. C. Stokes, M. Mahmood, O. Pokutnyi, O. Iskra, J. P. Wang, J. Levin, M. Kazakov, F. Feng, S. Y. Feng, H. Zhao, M. Yu, V. Gangal, C. Zou, Z. Wang, S. Popov, R. Gerbicz, G. Galgon, J. Schmitt, W. Yeadon, Y. Lee, S. Sauers, A. Sanchez, F. Giska, M. Roth, S. Riis, S. Utpala, N. Burns, G. M. Goshu, M. M. Naiya, C. Agu, Z. Giboney, A. Cheatom, F. Fournier-Facio, S. Crowson, L. Finke, Z. Cheng, J. Zampese, R. G. Hoerr, M. Nandor, H. Park, T. Gehrunger, J. Cai, B. McCarty, A. C. Garretson, E. Taylor, D. Sileo, Q. Ren, U. Qazi, L. Li, J. Nam, J. B. Wydallis, P. Arkhipov, J. W. L. Shi, A. Bacho, C. G. Willcocks, H. Cao, S. Motwani, E. de Oliveira Santos, J. Veith, E. Vendrow, D. Cojoc, K. Zenitani, J. Robinson, L. Tang, Y. Li, J. Vendrow, N. W. Fraga, V. Kuchkin, A. P. Maksimov, P. Marion, D. Efremov, J. Lynch, K. Liang, A. Mikov, A. Gritsevskiy, J. Guillod, G. Demir, D. Martinez, B. Pageler, K. Zhou, S. Soori, O. Press, H. Tang, P. Rissone, S. R. Green, L. Brüssel, M. Twayana, A. Dieuleveut, J. M. Imperial, A. Prabhu, J. Yang, N. Crispino, A. Rao, D. Zvonkine, G. Loiseau, M. Kalinin, M. Lukas, C. Manolescu, N. Stambaugh, S. Mishra, T. Hogg, C. Bosio, B. P. Coppola, J. Salazar, J. Jin, R. Sayous, S. Ivanov, P. Schwaller, S. Senthilkuma, A. M. Bran, A. Algaba, K. V. den Houte, L. V. D. Sypt, B. Verbeken, D. Noever, A. Kopylov, B. Myklebust, B. Li, L. Schut, E. Zheltonozhskii, Q. Yuan, D. Lim, R. Stanley, T. Yang, J. Maar, J. Wykowski, M. Oller, A. Sahu, C. G. Ardito, Y. Hu, A. G. K. Kamdoum, A. Jin, T. G. Vilchis, Y. Zu, M. Lackner, J. Koppel, G. Sun, D. S. Antonenko, S. Chern, B. Zhao, P. Arsene, J. M. Cavanagh, D. Li, J. Shen, D. Crisostomi, W. Zhang, A. Dehghan, S. Ivanov, D. Perrella, N. Kaparov, A. Zang, I. Sucholutsky, A. Kharlamova, D. Orel, V. Poritski, S. Ben-David, Z. Berger, P. Whitfill, M. Foster, D. Munro, L. Ho, S. Sivarajan, D. B. Hava, A. Kuchkin, D. Holmes, A. Rodriguez-Romero, F. Sommerhage, A. Zhang, R. Moat, K. Schneider, Z. Kazibwe, D. Clarke, D. H. Kim, F. M. Dias, S. Fish, V. Elser, T. Kreiman, V. E. G. Vilchis, I. Klose, U. Anantheswaran, A. Zweiger, K. Rawal, J. Li, J. Nguyen, N. Daans, H. Heidinger, M. Radionov, V. Rozhoň, V. Ginis, C. Stump, N. Cohen, R. Poświata, J. Tkadlec, A. Goldfarb, C. Wang, P. Padlewski, S. Barzowski, K. Montgomery, R. Stendall, J. Tucker-Foltz, J. Stade, T. R. Rogers, T. Goertzen, D. Grabb, A. Shukla, A. Givré, J. A. Ambay, A. Sen, M. F. Aziz, M. H. Inlow, H. He, L. Zhang, Y. Kaddar, I. Ängquist, Y. Chen, H. K. Wang, K. Ramakrishnan, E. Thornley, A. Terpin, H. Schoelkopf, E. Zheng, A. Carmi, E. D. L. Brown, K. Zhu, M. Bartolo, R. Wheeler, M. Stehberger, P. Bradshaw, J. Heimonen, K. Sridhar, I. Akov, J. Sandlin, Y. Makarychev, J. Tam, H. Hoang, D. M. Cunningham, V. Goryachev, D. Patramanis, M. Krause, A. Redenti, D. Aldous, J. Lai, S. Coleman, J. Xu, S. Lee, I. Magoulas, S. Zhao, N. Tang, M. K. Cohen, O. Paradise, J. H. Kirchner, M. Ovchynnikov, J. O. Matos, A. Shenoy, M. Wang, Y. Nie, A. Sztyber-Betley, P. Faraboschi, R. Riblet, J. Crozier, S. Halasyamani, S. Verma, P. Joshi, E. Meril, Z. Ma, J. Andréoletti, R. Singhal, J. Platnick, V. Nevirkovets, L. Basler, A. Ivanov, S. Khoury, N. Gustafsson, M. Piccardo, H. Mostaghimi, Q. Chen, V. Singh, T. Q. Khánh, P. Rosu, H. Szlyk, Z. Brown, H. Narayan, A. Menezes, J. Roberts, W. Alley, K. Sun, A. Patel, M. Lamparth, A. Reuel, L. Xin, H. Xu, J. Loader, F. Martin, Z. Wang, A. Achilleos, T. Preu, T. Korbak, I. Bosio, F. Kazemi, Z. Chen, B. Bálint, E. J. Y. Lo, J. Wang, M. I. S. Nunes, J. Milbauer, M. S. Bari, Z. Wang, B. Ansarinejad, Y. Sun, S. Durand, H. Elgnainy, G. Douville, D. Tordera, G. Balabanian, H. Wolff, L. Kvistad, H. Milliron, A. Sakor, M. Eron, A. F. D. O., S. Shah, X. Zhou, F. Kamalov, S. Abdoli, T. Santens, S. Barkan, A. Tee, R. Zhang, A. Tomasiello, G. B. D. Luca, S. Looi, V. Le, N. Kolt, J. Pan, E. Rodman, J. Drori, C. J. Fossum, N. Muennighoff, M. Jagota, R. Pradeep, H. Fan, J. Eicher, M. Chen, K. Thaman, W. Merrill, M. Firsching, C. Harris, S. Ciobâcă, J. Gross, R. Pandey, I. Gusev, A. Jones, S. Agnihotri, P. Zhelnov, M. Mofayezi, A. Piperski, D. K. Zhang, K. Dobarskyi, R. Leventov, I. Soroko, J. Duersch, V. Taamazyan, A. Ho, W. Ma, W. Held, R. Xian, A. R. Zebaze, M. Mohamed, J. N. Leser, M. X. Yuan, L. Yacar, J. Lengler, K. Olszewska, C. D. Fratta, E. Oliveira, J. W. Jackson, A. Zou, M. Chidambaram, T. Manik, H. Haffenden, D. Stander, A. Dasouqi, A. Shen, B. Golshani, D. Stap, E. Kretov, M. Uzhou, A. B. Zhidkovskaya, N. Winter, M. O. Rodriguez, R. Lauff, D. Wehr, C. Tang, Z. Hossain, S. Phillips, F. Samuele, F. Ekström, A. Hammon, O. Patel, F. Farhidi, G. Medley, F. Mohammadzadeh, M. Peñaflor, H. Kassahun, A. Friedrich, R. H. Perez, D. Pyda, T. Sakal, O. Dhamane, A. K. Mirabadi, E. Hallman, K. Okutsu, M. Battaglia, M. Maghsoudimehrabani, A. Amit, D. Hulbert, R. Pereira, S. Weber, Handoko, A. Peristyy, S. Malina, M. Mehkary, R. Aly, F. Reidegeld, A. Dick, C. Friday, M. Singh, H. Shapourian, W. Kim, M. Costa, H. Gurdogan, H. Kumar, C. Ceconello, C. Zhuang, H. Park, M. Carroll, A. R. Tawfeek, S. Steinerberger, D. Aggarwal, M. Kirchhof, L. Dai, E. Kim, J. Ferret, J. Shah, Y. Wang, M. Yan, K. Burdzy, L. Zhang, A. Franca, D. T. Pham, K. Y. Loh, J. Robinson, A. Jackson, P. Giordano, P. Petersen, A. Cosma, J. Colino, C. White, J. Votava, V. Vinnikov, E. Delaney, P. Spelda, V. Stritecky, S. M. Shahid, J. Mourrat, L. Vetoshkin, K. Sponselee, R. Bacho, Z. Yong, F. de la Rosa, N. Cho, X. Li, G. Malod, O. Weller, G. Albani, L. Lang, J. Laurendeau, D. Kazakov, F. Adesanya, J. Portier, L. Hollom, V. Souza, Y. A. Zhou, J. Degorre, Y. Yalın, G. D. Obikoya, Rai, F. Bigi, M. C. Boscá, O. Shumar, K. Bacho, G. Recchia, M. Popescu, N. Shulga, N. M. Tanwie, T. C. H. Lux, B. Rank, C. Ni, M. Brooks, A. Yakimchyk, Huanxu, Liu, S. Cavalleri, O. Häggström, E. Verkama, J. Newbould, H. Gundlach, L. Brito-Santana, B. Amaro, V. Vajipey, R. Grover, T. Wang, Y. Kratish, W. Li, S. Gopi, A. Caciolai, C. S. de Witt, P. Hernández-Cámara, E. Rodolà, J. Robins, D. Williamson, V. Cheng, B. Raynor, H. Qi, B. Segev, J. Fan, S. Martinson, E. Y. Wang, K. Hausknecht, M. P. Brenner, M. Mao, C. Demian, P. Kassani, X. Zhang, D. Avagian, E. J. Scipio, A. Ragoler, J. Tan, B. Sims, R. Plecnik, A. Kirtland, O. F. Bodur, D. P. Shinde, Y. C. L. Labrador, Z. Adoul, M. Zekry, A. Karakoc, T. C. B. Santos, S. Shamseldeen, L. Karim, A. Liakhovitskaia, N. Resman, N. Farina, J. C. Gonzalez, G. Maayan, E. Anderson, R. D. O. Pena, E. Kelley, H. Mariji, R. Pouriamanesh, W. Wu, R. Finocchio, I. Alarab, J. Cole, D. Ferreira, B. Johnson, M. Safdari, L. Dai, S. Arthornthurasuk, I. C. McAlister, A. J. Moyano, A. Pronin, J. Fan, A. Ramirez-Trinidad, Y. Malysheva, D. Pottmaier, O. Taheri, S. Stepanic, S. Perry, L. Askew, R. A. H. Rodríguez, A. M. R. Minissi, R. Lorena, K. Iyer, A. A. Fasiludeen, R. Clark, J. Ducey, M. Piza, M. Somrak, E. Vergo, J. Qin, B. Borbás, E. Chu, J. Lindsey, A. Jallon, I. M. J. McInnis, E. Chen, A. Semler, L. Gloor, T. Shah, M. Carauleanu, P. Lauer, T. Đ. Huy, H. Shahrtash, E. Duc, L. Lewark, A. Brown, S. Albanie, B. Weber, W. S. Vaz, P. Clavier, Y. Fan, G. P. R. e Silva, Long, Lian, M. Abramovitch, X. Jiang, S. Mendoza, M. Islam, J. Gonzalez, V. Mavroudis, J. Xu, P. Kumar, L. P. Goswami, D. Bugas, N. Heydari, F. Jeanplong, T. Jansen, A. Pinto, A. Apronti, A. Galal, N. Ze-An, A. Singh, T. Jiang, J. of Arc Xavier, K. P. Agarwal, M. Berkani, G. Zhang, Z. Du, B. A. de Oliveira Junior, D. Malishev, N. Remy, T. D. Hartman, T. Tarver, S. Mensah, G. A. Loume, W. Morak, F. Habibi, S. Hoback, W. Cai, J. Gimenez, R. G. Montecillo, J. Łucki, R. Campbell, A. Sharma, K. Meer, S. Gul, D. E. Gonzalez, X. Alapont, A. Hoover, G. Chhablani, F. Vargus, A. Agarwal, Y. Jiang, D. Patil, D. Outevsky, K. J. Scaria, R. Maheshwari, A. Dendane, P. Shukla, A. Cartwright, S. Bogdanov, N. Mündler, S. Möller, L. Arnaboldi, K. Thaman, M. R. Siddiqi, P. Saxena, H. Gupta, T. Fruhauff, G. Sherman, M. Vincze, S. Usawasutsakorn, D. Ler, A. Radhakrishnan, I. Enyekwe, S. M. Salauddin, J. Muzhen, A. Maksapetyan, V. Rossbach, C. Harjadi, M. Bahaloohoreh, C. Sparrow, J. Sidhu, S. Ali, S. Bian, J. Lai, E. Singer, J. L. Uro, G. Bateman, M. Sayed, A. Menshawy, D. Duclosel, D. Bezzi, Y. Jain, A. Aaron, M. Tiryakioglu, S. Siddh, K. Krenek, I. A. Shah, J. Jin, S. Creighton, D. Peskoff, Z. EL-Wasif, R. P. V, M. Richmond, J. McGowan, T. Patwardhan, H. Sun, T. Sun, N. Zubić, S. Sala, S. Ebert, J. Kaddour, M. Schottdorf, D. Wang, G. Petruzella, A. Meiburg, T. Medved, A. ElSheikh, S. A. Hebbar, L. Vaquero, X. Yang, J. Poulos, V. Zouhar, S. Bogdanik, M. Zhang, J. Sanz-Ros, D. Anugraha, Y. Dai, A. N. Nhu, X. Wang, A. A. Demircali, Z. Jia, Y. Zhou, J. Wu, M. He, N. Chandok, A. Sinha, G. Luo, L. Le, M. Noyé, M. Perełkiewicz, I. Pantidis, T. Qi, S. S. Purohit, L. Parcalabescu, T. Nguyen, G. I. Winata, E. M. Ponti, H. Li, K. Dhole, J. Park, D. Abbondanza, Y. Wang, A. Nayak, D. M. Caetano, A. A. W. L. Wong, M. del Rio-Chanona, D. Kondor, P. Francois, E. Chalstrey, J. Zsambok, D. Hoyer, J. Reddish, J. Hauser, F. Rodrigo-Ginés, S. Datta, M. Shepherd, T. Kamphuis, Q. Zhang, H. Kim, R. Sun, J. Yao, F. Dernoncourt, S. Krishna, S. Rismanchian, B. Pu, F. Pinto, Y. Wang, K. Shridhar, K. J. Overholt, G. Briia, H. Nguyen, David, S. Bartomeu, T. C. Pang, A. Wecker, Y. Xiong, F. Li, L. S. Huber, J. Jaeger, R. D. Maddalena, X. H. Lù, Y. Zhang, C. Beger, P. T. J. Kon, S. Li, V. Sanker, M. Yin, Y. Liang, X. Zhang, A. Agrawal, L. S. Yifei, Z. Zhang, M. Cai, Y. Sonmez, C. Cozianu, C. Li, A. Slen, S. Yu, H. K. Park, G. Sarti, M. Briański, A. Stolfo, T. A. Nguyen, M. Zhang, Y. Perlitz, J. Hernandez-Orallo, R. Li, A. Shabani, F. Juefei-Xu, S. Dhingra, O. Zohar, M. C. Nguyen, A. Pondaven, A. Yilmaz, X. Zhao, C. Jin, M. Jiang, S. Todoran, X. Han, J. Kreuer, B. Rabern, A. Plassart, M. Maggetti, L. Yap, R. Geirhos, J. Kean, D. Wang, S. Mollaei, C. Sun, Y. Yin, S. Wang, R. Li, Y. Chang, A. Wei, A. Bizeul, X. Wang, A. O. Arrais, K. Mukherjee, J. Chamorro-Padial, J. Liu, X. Qu, J. Guan, A. Bouyamourn, S. Wu, M. Plomecka, J. Chen, M. Tang, J. Deng, S. Subramanian, H. Xi, H. Chen, W. Zhang, Y. Ren, H. Tu, S. Kim, Y. Chen, S. V. Marjanović, J. Ha, G. Luczyna, J. J. Ma, Z. Shen, D. Song, C. E. Zhang, Z. Wang, G. Gendron, Y. Xiao, L. Smucker, E. Weng, K. H. Lee, Z. Ye, S. Ermon, I. D. Lopez-Miguel, T. Knights, A. Gitter, N. Park, B. Wei, H. Chen, K. Pai, A. Elkhanany, H. Lin, P. D. Siedler, J. Fang, R. Mishra, K. Zsolnai-Fehér, X. Jiang, S. Khan, J. Yuan, R. K. Jain, X. Lin, M. Peterson, Z. Wang, A. Malusare, M. Tang, I. Gupta, I. Fosin, T. Kang, B. Dworakowska, K. Matsumoto, G. Zheng, G. Sewuster, J. P. Villanueva, I. Rannev, I. Chernyavsky, J. Chen, D. Banik, B. Racz, W. Dong, J. Wang, L. Bashmal, D. V. Gonçalves, W. Hu, K. Bar, O. Bohdal, A. S. Patlan, S. Dhuliawala, C. Geirhos, J. Wist, Y. Kansal, B. Chen, K. Tire, A. T. Yücel, B. Christof, V. Singla, Z. Song, S. Chen, J. Ge, K. Ponkshe, I. Park, T. Shi, M. Q. Ma, J. Mak, S. Lai, A. Moulin, Z. Cheng, Z. Zhu, Z. Zhang, V. Patil, K. Jha, Q. Men, J. Wu, T. Zhang, B. H. Vieira, A. F. Aji, J. Chung, M. Mahfoud, H. T. Hoang, M. Sperzel, W. Hao, K. Meding, S. Xu, V. Kostakos, D. Manini, Y. Liu, C. Toukmaji, J. Paek, E. Yu, A. E. Demircali, Z. Sun, I. Dewerpe, H. Qin, R. Pflugfelder, J. Bailey, J. Morris, V. Heilala, S. Rosset, Z. Yu, P. E. Chen, W. Yeo, E. Jain, R. Yang, S. Chigurupati, J. Chernyavsky, S. P. Reddy, S. Venugopalan, H. Batra, C. F. Park, H. Tran, G. Maximiano, G. Zhang, Y. Liang, H. Shiyu, R. Xu, R. Pan, S. Suresh, Z. Liu, S. Gulati, S. Zhang, P. Turchin, C. W. Bartlett, C. R. Scotese, P. M. Cao, A. Nattanmai, G. McKellips, A. Cheraku, A. Suhail, E. Luo, M. Deng, J. Luo, A. Zhang, K. Jindel, J. Paek, K. Halevy, A. Baranov, M. Liu, A. Avadhanam, D. Zhang, V. Cheng, B. Ma, E. Fu, L. Do, J. Lass, H. Yang, S. Sunkari, V. Bharath, V. Ai, J. Leung, R. Agrawal, A. Zhou, K. Chen, T. Kalpathi, Z. Xu, G. Wang, T. Xiao, E. Maung, S. Lee, R. Yang, R. Yue, B. Zhao, J. Yoon, S. Sun, A. Singh, E. Luo, C. Peng, T. Osbey, T. Wang, D. Echeazu, H. Yang, T. Wu, S. Patel, V. Kulkarni, V. Sundarapandiyan, A. Zhang, A. Le, Z. Nasim, S. Yalam, R. Kasamsetty, S. Samal, H. Yang, D. Sun, N. Shah, A. Saha, A. Zhang, L. Nguyen, L. Nagumalli, K. Wang, A. Zhou, A. Wu, J. Luo, A. Telluri, S. Yue, A. Wang, and D. Hendrycks (2025)Humanity’s last exam. External Links: 2501.14249, [Link](https://arxiv.org/abs/2501.14249)Cited by: [1st item](https://arxiv.org/html/2602.02276v1#S5.I1.i1.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [47]D. Rein, B. L. Hou, A. C. Stickland, J. Petty, R. Y. Pang, J. Dirani, J. Michael, and S. R. Bowman (2024)Gpqa: a graduate-level google-proof q&a benchmark. In First Conference on Language Modeling, Cited by: [1st item](https://arxiv.org/html/2602.02276v1#S5.I1.i1.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [48]J. Roberts, M. R. Taesiri, A. Sharma, A. Gupta, S. Roberts, I. Croitoru, S. Bogolin, J. Tang, F. Langer, V. Raina, V. Raina, H. Xiong, V. Udandarao, J. Lu, S. Chen, S. Purkis, T. Yan, W. Lin, G. Shin, Q. Yang, A. T. Nguyen, D. I. Atkinson, A. Baranwal, A. Coca, M. Dang, S. Dziadzio, J. D. Kunz, K. Liang, A. Lo, B. Pulfer, S. Walton, C. Yang, K. Han, and S. Albanie (2025)ZeroBench: an impossible visual benchmark for contemporary large multimodal models. External Links: 2502.09696, [Link](https://arxiv.org/abs/2502.09696)Cited by: [4th item](https://arxiv.org/html/2602.02276v1#S5.I1.i4.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [49]C. Schuhmann, R. Beaumont, R. Vencu, C. Gordon, R. Wightman, M. Cherti, T. Coombes, A. Katta, C. Mullis, M. Wortsman, et al. (2022)Laion-5b: an open large-scale dataset for training next generation image-text models. Advances in Neural Information Processing Systems 35,  pp.25278–25294. Cited by: [§B.3](https://arxiv.org/html/2602.02276v1#A2.SS3.p1.1 "B.3 Vision data ‣ Appendix B Pre-training ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [50]J. Schulman, F. Wolski, P. Dhariwal, A. Radford, and O. Klimov (2017)Proximal policy optimization algorithms. arXiv preprint arXiv:1707.06347. External Links: [Link](https://arxiv.org/abs/1707.06347)Cited by: [§4.4.2](https://arxiv.org/html/2602.02276v1#S4.SS4.SSS2.Px1.p2.1 "Policy Optimization ‣ 4.4.2 Reinforcement Learning ‣ 4.4 Post-Training ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [51]T. Song, H. Lu, H. Yang, L. Sui, H. Wu, Z. Zhou, Z. Huang, Y. Bao, Y. Charles, X. Zhou, and L. Wang (2026)Towards pixel-level vlm perception via simple points prediction. External Links: 2601.19228, [Link](https://arxiv.org/abs/2601.19228)Cited by: [§B.3](https://arxiv.org/html/2602.02276v1#A2.SS3.p3.1 "B.3 Vision data ‣ Appendix B Pre-training ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [52]G. Starace, O. Jaffe, D. Sherburn, J. Aung, J. S. Chan, L. Maksin, R. Dias, E. Mays, B. Kinsella, W. Thompson, et al. (2025)PaperBench: evaluating ai’s ability to replicate ai research. arXiv preprint arXiv:2504.01848. Cited by: [2nd item](https://arxiv.org/html/2602.02276v1#S5.I1.i2.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [53]K. Team, Y. Bai, Y. Bao, G. Chen, J. Chen, N. Chen, R. Chen, Y. Chen, Y. Chen, Y. Chen, et al. (2025)Kimi k2: open agentic intelligence. arXiv preprint arXiv:2507.20534. Cited by: [§B.2](https://arxiv.org/html/2602.02276v1#A2.SS2.p1.1 "B.2 Text data ‣ Appendix B Pre-training ‣ Kimi K2.5: Visual Agentic Intelligence"), [§4.1](https://arxiv.org/html/2602.02276v1#S4.SS1.p1.1 "4.1 Foundation: Kimi K2 Base Model ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"), [§4.4.1](https://arxiv.org/html/2602.02276v1#S4.SS4.SSS1.p1.1 "4.4.1 Supervised Fine-Tuning ‣ 4.4 Post-Training ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"), [§4.4.2](https://arxiv.org/html/2602.02276v1#S4.SS4.SSS2.Px3.p1.1 "Generative Reward Models ‣ 4.4.2 Reinforcement Learning ‣ 4.4 Post-Training ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"), [§4.4.2](https://arxiv.org/html/2602.02276v1#S4.SS4.SSS2.Px4.p1.1 "Token Efficient Reinforcement Learning ‣ 4.4.2 Reinforcement Learning ‣ 4.4 Post-Training ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"), [§4.5](https://arxiv.org/html/2602.02276v1#S4.SS5.p1.1 "4.5 Training Infrastructure ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [54]K. Team, A. Du, B. Yin, B. Xing, B. Qu, B. Wang, C. Chen, C. Zhang, C. Du, C. Wei, et al. (2025)Kimi-vl technical report. arXiv preprint arXiv:2504.07491. Cited by: [§4.2](https://arxiv.org/html/2602.02276v1#S4.SS2.p1.1 "4.2 Model Architecture ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"), [§4.3](https://arxiv.org/html/2602.02276v1#S4.SS3.SSS0.Px1.p1.1 "ViT Training Stage ‣ 4.3 Pre-training Pipeline ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"), [§4.5.1](https://arxiv.org/html/2602.02276v1#S4.SS5.SSS1.p1.1 "4.5.1 Decoupled Encoder Process (DEP) ‣ 4.5 Training Infrastructure ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [55]M. L. Team, B. Wang, B. Xiao, B. Zhang, B. Rong, B. Chen, C. Wan, C. Zhang, C. Huang, C. Chen, et al. (2025)Longcat-flash-omni technical report. arXiv preprint arXiv:2511.00279. Cited by: [§4.5.1](https://arxiv.org/html/2602.02276v1#S4.SS5.SSS1.p4.1 "4.5.1 Decoupled Encoder Process (DEP) ‣ 4.5 Training Infrastructure ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [56]M. Tian, L. Gao, S. Zhang, X. Chen, C. Fan, X. Guo, R. Haas, P. Ji, K. Krongchon, Y. Li, et al. (2024)Scicode: a research coding benchmark curated by scientists. Advances in Neural Information Processing Systems 37,  pp.30624–30650. Cited by: [2nd item](https://arxiv.org/html/2602.02276v1#S5.I1.i2.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [57]S. Tong, Z. Liu, Y. Zhai, Y. Ma, Y. LeCun, and S. Xie (2024)Eyes wide shut? exploring the visual shortcomings of multimodal llms. External Links: 2401.06209, [Link](https://arxiv.org/abs/2401.06209)Cited by: [4th item](https://arxiv.org/html/2602.02276v1#S5.I1.i4.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [58]H. M. Tournament (2025)Harvard-mit mathematics tournament, february 2025. Note: Held on February 15, 2025 External Links: [Link](https://www.hmmt.org/www/archive/282)Cited by: [1st item](https://arxiv.org/html/2602.02276v1#S5.I1.i1.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [59]A. Vaswani, N. Shazeer, N. Parmar, J. Uszkoreit, L. Jones, A. N. Gomez, Ł. Kaiser, and I. Polosukhin (2017)Attention is all you need. In Advances in Neural Information Processing Systems, I. Guyon, U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vishwanathan, and R. Garnett (Eds.), Vol. 30,  pp.. External Links: [Link](https://proceedings.neurips.cc/paper_files/paper/2017/file/3f5ee243547dee91fbd053c1c4a845aa-Paper.pdf)Cited by: [§4.1](https://arxiv.org/html/2602.02276v1#S4.SS1.p1.1 "4.1 Foundation: Kimi K2 Base Model ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [60]N. Vedula, M. Collins, E. Agichtein, and O. Rokhlenko (2025)DeepSearchQA: bridging the comprehensiveness gap for deep research agents. Google DeepMind, Google Search, Kaggle, and Google Research. External Links: [Link](https://storage.googleapis.com/deepmind-media/DeepSearchQA/DeepSearchQA_benchmark_paper.pdf)Cited by: [3rd item](https://arxiv.org/html/2602.02276v1#S5.I1.i3.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [61]K. Wang, J. Pan, W. Shi, Z. Lu, M. Zhan, and H. Li (2024)Measuring multimodal mathematical reasoning with math-vision dataset. External Links: 2402.14804, [Link](https://arxiv.org/abs/2402.14804)Cited by: [4th item](https://arxiv.org/html/2602.02276v1#S5.I1.i4.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [62]W. Wang, Z. He, W. Hong, Y. Cheng, X. Zhang, J. Qi, X. Gu, S. Huang, B. Xu, Y. Dong, M. Ding, and J. Tang (2025)LVBench: an extreme long video understanding benchmark. External Links: 2406.08035, [Link](https://arxiv.org/abs/2406.08035)Cited by: [5th item](https://arxiv.org/html/2602.02276v1#S5.I1.i5.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [63]X. Wang, B. Wang, D. Lu, J. Yang, T. Xie, J. Wang, J. Deng, X. Guo, Y. Xu, C. H. Wu, Z. Shen, Z. Li, R. Li, X. Li, J. Chen, B. Zheng, P. Li, F. Lei, R. Cao, Y. Fu, D. Shin, M. Shin, J. Hu, Y. Wang, J. Chen, Y. Ye, D. Zhang, D. Du, H. Hu, H. Chen, Z. Zhou, H. Yao, Z. Chen, Q. Gu, Y. Wang, H. Wang, D. Yang, V. Zhong, F. Sung, Y. Charles, Z. Yang, and T. Yu (2025)OpenCUA: open foundations for computer-use agents. External Links: 2508.09123, [Link](https://arxiv.org/abs/2508.09123)Cited by: [§E.7](https://arxiv.org/html/2602.02276v1#A5.SS7.SSS0.Px1.p1.5 "Hyperparameter Settings. ‣ E.7 Computer-Use Evaluation ‣ Appendix E Evaluation Settings ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [64]Y. Wang, X. Ma, G. Zhang, Y. Ni, A. Chandra, S. Guo, W. Ren, A. Arulraj, X. He, Z. Jiang, T. Li, M. Ku, K. Wang, A. Zhuang, R. Fan, X. Yue, and W. Chen (2024)MMLU-pro: a more robust and challenging multi-task language understanding benchmark. External Links: 2406.01574, [Link](https://arxiv.org/abs/2406.01574)Cited by: [1st item](https://arxiv.org/html/2602.02276v1#S5.I1.i1.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [65]Z. Wang, Y. Liu, Y. Wang, W. He, B. Gao, M. Diao, Y. Chen, K. Fu, F. Sung, Z. Yang, et al. (2025)OJBench: a competition level code benchmark for large language models. arXiv preprint arXiv:2506.16395. Cited by: [2nd item](https://arxiv.org/html/2602.02276v1#S5.I1.i2.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [66]Z. Wang, T. Shi, J. He, M. Cai, J. Zhang, and D. Song (2025)CyberGym: evaluating ai agents’ cybersecurity capabilities with real-world vulnerabilities at scale. arXiv preprint arXiv:2506.02548. Cited by: [2nd item](https://arxiv.org/html/2602.02276v1#S5.I1.i2.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [67]Z. Wang, M. Xia, L. He, H. Chen, Y. Liu, R. Zhu, K. Liang, X. Wu, H. Liu, S. Malladi, A. Chevalier, S. Arora, and D. Chen (2024)CharXiv: charting gaps in realistic chart understanding in multimodal llms. External Links: 2406.18521, [Link](https://arxiv.org/abs/2406.18521)Cited by: [4th item](https://arxiv.org/html/2602.02276v1#S5.I1.i4.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [68]J. Wei, Z. Sun, S. Papay, S. McKinney, J. Han, I. Fulford, H. W. Chung, A. T. Passos, W. Fedus, and A. Glaese (2025)BrowseComp: a simple yet challenging benchmark for browsing agents. External Links: 2504.12516, [Link](https://arxiv.org/abs/2504.12516)Cited by: [3rd item](https://arxiv.org/html/2602.02276v1#S5.I1.i3.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [69]R. Wong, J. Wang, J. Zhao, L. Chen, Y. Gao, L. Zhang, X. Zhou, Z. Wang, K. Xiang, G. Zhang, W. Huang, Y. Wang, and K. Wang (2025)WideSearch: benchmarking agentic broad info-seeking. External Links: 2508.07999, [Link](https://arxiv.org/abs/2508.07999)Cited by: [3rd item](https://arxiv.org/html/2602.02276v1#S5.I1.i3.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [70]H. Wu, D. Li, B. Chen, and J. Li (2024)LongVideoBench: a benchmark for long-context interleaved video-language understanding. External Links: 2407.15754, [Link](https://arxiv.org/abs/2407.15754)Cited by: [5th item](https://arxiv.org/html/2602.02276v1#S5.I1.i5.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [71]X. Wu, K. Li, Y. Zhao, L. Zhang, L. Ou, H. Yin, Z. Zhang, X. Yu, D. Zhang, Y. Jiang, P. Xie, F. Huang, M. Cheng, S. Wang, H. Cheng, and J. Zhou (2025)ReSum: unlocking long-horizon search intelligence via context summarization. External Links: 2509.13313, [Link](https://arxiv.org/abs/2509.13313)Cited by: [§5.2](https://arxiv.org/html/2602.02276v1#S5.SS2.SSS0.Px5.p1.1 "Agent Swarm as Proactive Context Management ‣ 5.2 Agent Swarm Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [72]T. Xie, M. Yuan, D. Zhang, X. Xiong, Z. Shen, Z. Zhou, X. Wang, Y. Chen, J. Deng, J. Chen, B. Wang, H. Wu, J. Chen, J. Wang, D. Lu, H. Hu, and T. Yu (2025-07)Introducing osworld-verified. xlang.ai. External Links: [Link](https://xlang.ai/blog/osworld-verified)Cited by: [6th item](https://arxiv.org/html/2602.02276v1#S5.I1.i6.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"), [§5.1.2](https://arxiv.org/html/2602.02276v1#S5.SS1.SSS2.Px6.p1.1 "Computer-Use Capability ‣ 5.1.2 Evaluation Results ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [73]T. Xie, D. Zhang, J. Chen, X. Li, S. Zhao, R. Cao, T. J. Hua, Z. Cheng, D. Shin, F. Lei, Y. Liu, Y. Xu, S. Zhou, S. Savarese, C. Xiong, V. Zhong, and T. Yu (2024)OSWorld: benchmarking multimodal agents for open-ended tasks in real computer environments. External Links: 2404.07972 Cited by: [6th item](https://arxiv.org/html/2602.02276v1#S5.I1.i6.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"), [§5.1.2](https://arxiv.org/html/2602.02276v1#S5.SS1.SSS2.Px6.p1.1 "Computer-Use Capability ‣ 5.1.2 Evaluation Results ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [74]F. Yao, L. Liu, D. Zhang, C. Dong, J. Shang, and J. Gao (2025-08)Your efficient rl framework secretly brings you off-policy rl training. External Links: [Link](https://fengyao.notion.site/off-policy-rl)Cited by: [§4.4.2](https://arxiv.org/html/2602.02276v1#S4.SS4.SSS2.Px1.p2.1 "Policy Optimization ‣ 4.4.2 Reinforcement Learning ‣ 4.4 Post-Training ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [75]X. Yue, Y. Ni, K. Zhang, T. Zheng, R. Liu, G. Zhang, S. Stevens, D. Jiang, W. Ren, Y. Sun, C. Wei, B. Yu, R. Yuan, R. Sun, M. Yin, B. Zheng, Z. Yang, Y. Liu, W. Huang, H. Sun, Y. Su, and W. Chen (2024)MMMU: a massive multi-discipline multimodal understanding and reasoning benchmark for expert agi. In Proceedings of CVPR, Cited by: [4th item](https://arxiv.org/html/2602.02276v1#S5.I1.i4.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [76]X. Yue, T. Zheng, Y. Ni, Y. Wang, K. Zhang, S. Tong, Y. Sun, B. Yu, G. Zhang, H. Sun, Y. Su, W. Chen, and G. Neubig (2025)MMMU-pro: a more robust multi-discipline multimodal understanding benchmark. External Links: 2409.02813, [Link](https://arxiv.org/abs/2409.02813)Cited by: [4th item](https://arxiv.org/html/2602.02276v1#S5.I1.i4.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [77]X. Zhai, B. Mustafa, A. Kolesnikov, and L. Beyer (2023)Sigmoid loss for language image pre-training. External Links: 2303.15343, [Link](https://arxiv.org/abs/2303.15343)Cited by: [§4.2](https://arxiv.org/html/2602.02276v1#S4.SS2.SSS0.Px1.p1.1 "MoonViT-3D: Shared Embedding Space for Images and Videos ‣ 4.2 Model Architecture ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"), [§4.3](https://arxiv.org/html/2602.02276v1#S4.SS3.SSS0.Px1.p1.1 "ViT Training Stage ‣ 4.3 Pre-training Pipeline ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [78]X. Zhao, Y. Liu, K. Xu, J. Guo, Z. Wang, Y. Sun, X. Kong, Q. Cao, L. Jiang, Z. Wen, Z. Zhang, and J. Zhou (2025-09)Small leak can sink a great ship–boost rl training on moe with icepop!. External Links: [Link](https://ringtech.notion.site/icepop)Cited by: [§4.4.2](https://arxiv.org/html/2602.02276v1#S4.SS4.SSS2.Px1.p2.1 "Policy Optimization ‣ 4.4.2 Reinforcement Learning ‣ 4.4 Post-Training ‣ 4 Method Overview ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [79]Y. Zhao, L. Xie, H. Zhang, G. Gan, Y. Long, Z. Hu, T. Hu, W. Chen, C. Li, J. Song, Z. Xu, C. Wang, W. Pan, Z. Shangguan, X. Tang, Z. Liang, Y. Liu, C. Zhao, and A. Cohan (2025)MMVU: measuring expert-level multi-discipline video understanding. External Links: 2501.12380, [Link](https://arxiv.org/abs/2501.12380)Cited by: [5th item](https://arxiv.org/html/2602.02276v1#S5.I1.i5.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [80]S. Zhou, F. F. Xu, H. Zhu, X. Zhou, R. Lo, A. Sridhar, X. Cheng, T. Ou, Y. Bisk, D. Fried, U. Alon, and G. Neubig (2023)WebArena: a realistic web environment for building autonomous agents. arXiv preprint arXiv:2307.13854. External Links: [Link](https://webarena.dev/)Cited by: [6th item](https://arxiv.org/html/2602.02276v1#S5.I1.i6.p1.1 "In Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"), [§5.1.2](https://arxiv.org/html/2602.02276v1#S5.SS1.SSS2.Px6.p1.1 "Computer-Use Capability ‣ 5.1.2 Evaluation Results ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+*   [81]W. Zhu, J. Hessel, A. Awadalla, S. Y. Gadre, J. Dodge, A. Fang, Y. Yu, L. Schmidt, W. Y. Wang, and Y. Choi (2024)Multimodal c4: an open, billion-scale corpus of images interleaved with text. Advances in Neural Information Processing Systems 36. Cited by: [§B.3](https://arxiv.org/html/2602.02276v1#A2.SS3.p1.1 "B.3 Vision data ‣ Appendix B Pre-training ‣ Kimi K2.5: Visual Agentic Intelligence"). 
+
+## Appendix A Contributors
+
+Tongtong Bai 
+
+Yifan Bai 
+
+Yiping Bao 
+
+S.H. Cai 
+
+Yuan Cao 
+
+Y. Charles 
+
+H.S. Che 
+
+Cheng Chen 
+
+Guanduo Chen 
+
+Huarong Chen 
+
+Jia Chen 
+
+Jiahao Chen 
+
+Jianlong Chen 
+
+Jun Chen 
+
+Kefan Chen 
+
+Liang Chen 
+
+Ruijue Chen 
+
+Xinhao Chen 
+
+Yanru Chen 
+
+Yanxu Chen 
+
+Yicun Chen 
+
+Yimin Chen 
+
+Yingjiang Chen 
+
+Yuankun Chen 
+
+Yujie Chen 
+
+Yutian Chen 
+
+Zhirong Chen 
+
+Ziwei Chen 
+
+Dazhi Cheng 
+
+Minghan Chu 
+
+Jialei Cui 
+
+Jiaqi Deng 
+
+Muxi Diao 
+
+Hao Ding 
+
+Mengfan Dong 
+
+Mengnan Dong 
+
+Yuxin Dong 
+
+Yuhao Dong 
+
+Ang’ang Du 
+
+Chenzhuang Du 
+
+Dikang Du 
+
+Lingxiao Du 
+
+Yulun Du 
+
+Yu Fan 
+
+Shengjun Fang 
+
+Qiulin Feng 
+
+Yichen Feng 
+
+Garimugai Fu 
+
+Kelin Fu 
+
+Hongcheng Gao 
+
+Tong Gao 
+
+Yuyao Ge 
+
+Shangyi Geng 
+
+Chengyang Gong 
+
+Xiaochen Gong 
+
+Zhuoma Gongque 
+
+Qizheng Gu 
+
+Xinran Gu 
+
+Yicheng Gu 
+
+Longyu Guan 
+
+Yuanying Guo 
+
+Xiaoru Hao 
+
+Weiran He 
+
+Wenyang He 
+
+Yunjia He 
+
+Chao Hong 
+
+Hao Hu 
+
+Jiaxi Hu 
+
+Yangyang Hu 
+
+Zhenxing Hu 
+
+Ke Huang 
+
+Ruiyuan Huang 
+
+Weixiao Huang 
+
+Zhiqi Huang 
+
+Tao Jiang 
+
+Zhejun Jiang 
+
+Xinyi Jin 
+
+Yu Jing 
+
+Guokun Lai 
+
+Aidi Li 
+
+C. Li 
+
+Cheng Li 
+
+Fang Li 
+
+Guanghe Li 
+
+Guanyu Li 
+
+Haitao Li 
+
+Haoyang Li 
+
+Jia Li 
+
+Jingwei Li 
+
+Junxiong Li 
+
+Lincan Li 
+
+Mo Li 
+
+Weihong Li 
+
+Wentao Li 
+
+Xinhang Li 
+
+Xinhao Li 
+
+Yang Li 
+
+Yanhao Li 
+
+Yiwei Li 
+
+Yuxiao Li 
+
+Zhaowei Li 
+
+Zheming Li 
+
+Weilong Liao 
+
+Jiawei Lin 
+
+Xiaohan Lin 
+
+Zhishan Lin 
+
+Zichao Lin 
+
+Cheng Liu 
+
+Chenyu Liu 
+
+Hongzhang Liu 
+
+Liang Liu 
+
+Shaowei Liu 
+
+Shudong Liu 
+
+Shuran Liu 
+
+Tianwei Liu 
+
+Tianyu Liu 
+
+Weizhou Liu 
+
+Xiangyan Liu 
+
+Yangyang Liu 
+
+Yanming Liu 
+
+Yibo Liu 
+
+Yuanxin Liu 
+
+Yue Liu 
+
+Zhengying Liu 
+
+Zhongnuo Liu 
+
+Enzhe Lu 
+
+Haoyu Lu 
+
+Zhiyuan Lu 
+
+Junyu Luo 
+
+Tongxu Luo 
+
+Yashuo Luo 
+
+Long Ma 
+
+Yingwei Ma 
+
+Shaoguang Mao 
+
+Yuan Mei 
+
+Xin Men 
+
+Fanqing Meng 
+
+Zhiyong Meng 
+
+Yibo Miao 
+
+Minqing Ni 
+
+Kun Ouyang 
+
+Siyuan Pan 
+
+Bo Pang 
+
+Yuchao Qian 
+
+Ruoyu Qin 
+
+Zeyu Qin 
+
+Jiezhong Qiu 
+
+Bowen Qu 
+
+Zeyu Shang 
+
+Youbo Shao 
+
+Tianxiao Shen 
+
+Zhennan Shen 
+
+Juanfeng Shi 
+
+Lidong Shi 
+
+Shengyuan Shi 
+
+Feifan Song 
+
+Pengwei Song 
+
+Tianhui Song 
+
+Xiaoxi Song 
+
+Hongjin Su 
+
+Jianlin Su 
+
+Zhaochen Su 
+
+Lin Sui 
+
+Jinsong Sun 
+
+Junyao Sun 
+
+Tongyu Sun 
+
+Flood Sung 
+
+Yunpeng Tai 
+
+Chuning Tang 
+
+Heyi Tang 
+
+Xiaojuan Tang 
+
+Zhengyang Tang 
+
+Jiawen Tao 
+
+Shiyuan Teng 
+
+Chaoran Tian 
+
+Pengfei Tian 
+
+Ao Wang 
+
+Bowen Wang 
+
+Chensi Wang 
+
+Chuang Wang 
+
+Congcong Wang 
+
+Dingkun Wang 
+
+Dinglu Wang 
+
+Dongliang Wang 
+
+Feng Wang 
+
+Hailong Wang 
+
+Haiming Wang 
+
+Hengzhi Wang 
+
+Huaqing Wang 
+
+Hui Wang 
+
+Jiahao Wang 
+
+Jinhong Wang 
+
+Jiuzheng Wang 
+
+Kaixin Wang 
+
+Linian Wang 
+
+Qibin Wang 
+
+Shengjie Wang 
+
+Shuyi Wang 
+
+Si Wang 
+
+Wei Wang 
+
+Xiaochen Wang 
+
+Xinyuan Wang 
+
+Yao Wang 
+
+Yejie Wang 
+
+Yipu Wang 
+
+Yiqin Wang 
+
+Yucheng Wang 
+
+Yuzhi Wang 
+
+Zhaoji Wang 
+
+Zhaowei Wang 
+
+Zhengtao Wang 
+
+Zhexu Wang 
+
+Zihan Wang 
+
+Zizhe Wang 
+
+Chu Wei 
+
+Ming Wei 
+
+Chuan Wen 
+
+Zichen Wen 
+
+Chengjie Wu 
+
+Haoning Wu 
+
+Junyan Wu 
+
+Rucong Wu 
+
+Wenhao Wu 
+
+Yuefeng Wu 
+
+Yuhao Wu 
+
+Yuxin Wu 
+
+Zijian Wu 
+
+Chenjun Xiao 
+
+Jin Xie 
+
+Xiaotong Xie 
+
+Yuchong Xie 
+
+Yifei Xin 
+
+Bowei Xing 
+
+Boyu Xu 
+
+Jianfan Xu 
+
+Jing Xu 
+
+Jinjing Xu 
+
+L.H. Xu 
+
+Lin Xu 
+
+Suting Xu 
+
+Weixin Xu 
+
+Xinbo Xu 
+
+Xinran Xu 
+
+Yangchuan Xu 
+
+Yichang Xu 
+
+Yuemeng Xu 
+
+Zelai Xu 
+
+Ziyao Xu 
+
+Junjie Yan 
+
+Yuzi Yan 
+
+Guangyao Yang 
+
+Hao Yang 
+
+Junwei Yang 
+
+Kai Yang 
+
+Ningyuan Yang 
+
+Ruihan Yang 
+
+Xiaofei Yang 
+
+Xinlong Yang 
+
+Ying Yang 
+
+Yi(弋) Yang 
+
+Yi(翌) Yang 
+
+Zhen Yang 
+
+Zhilin Yang 
+
+Zonghan Yang 
+
+Haotian Yao 
+
+Dan Ye 
+
+Wenjie Ye 
+
+Zhuorui Ye 
+
+Bohong Yin 
+
+Chengzhen Yu 
+
+Longhui Yu 
+
+Tao Yu†
+
+Tianxiang Yu 
+
+Enming Yuan 
+
+Mengjie Yuan 
+
+Xiaokun Yuan 
+
+Yang Yue 
+
+Weihao Zeng 
+
+Dunyuan Zha 
+
+Haobing Zhan 
+
+Dehao Zhang 
+
+Hao Zhang 
+
+Jin Zhang 
+
+Puqi Zhang 
+
+Qiao Zhang 
+
+Rui Zhang 
+
+Xiaobin Zhang 
+
+Y. Zhang 
+
+Yadong Zhang 
+
+Yangkun Zhang 
+
+Yichi Zhang 
+
+Yizhi Zhang 
+
+Yongting Zhang 
+
+Yu Zhang 
+
+Yushun Zhang 
+
+Yutao Zhang 
+
+Yutong Zhang 
+
+Zheng Zhang 
+
+Chenguang Zhao 
+
+Feifan Zhao 
+
+Jinxiang Zhao 
+
+Shuai Zhao 
+
+Xiangyu Zhao 
+
+Yikai Zhao 
+
+Zijia Zhao 
+
+Huabin Zheng 
+
+Ruihan Zheng 
+
+Shaojie Zheng 
+
+Tengyang Zheng 
+
+Junfeng Zhong 
+
+Longguang Zhong 
+
+Weiming Zhong 
+
+M. Zhou 
+
+Runjie Zhou 
+
+Xinyu Zhou 
+
+Zaida Zhou 
+
+Jinguo Zhu 
+
+Liya Zhu 
+
+Xinhao Zhu 
+
+Yuxuan Zhu 
+
+Zhen Zhu 
+
+Jingze Zhuang 
+
+Weiyu Zhuang 
+
+Ying Zou 
+
+Xinxing Zu 
+
+ Kimi K2 
+
+Kimi K2.5
+
+2 2 footnotetext: The listing of authors is in alphabetical order based on their last names. 2 2 footnotetext: †The University of Hong Kong
+
+## Appendix B Pre-training
+
+![Image 9: Refer to caption](https://arxiv.org/html/2602.02276v1/x7.png)
+
+Figure 9: Learning curves comparing vision-to-text ratios (10:90, 20:80, 50:50) under fixed vision-text token budget across vision and language tasks. Early fusion with lower vision ratios tend to yield better results.
+
+### B.1 Joint-Training
+
+We further provide the full training curves for all configurations in Figure[9](https://arxiv.org/html/2602.02276v1#A2.F9 "Figure 9 ‣ Appendix B Pre-training ‣ Kimi K2.5: Visual Agentic Intelligence"). Notably, we observe a "dip-and-recover" pattern in text performance during mid-fusion and late-fusion stages: when vision data is first introduced, text capability initially degrades before gradually recovering. We attribute this to the modality domain shift—the sudden introduction of vision tokens disrupts the established linguistic representation space, forcing the model to temporarily sacrifice text-specific competence for cross-modal alignment.
+
+In contrast, early fusion maintains a healthier and more stable text performance curve throughout training. By co-optimizing vision and language from the outset, the model naturally evolves unified multimodal representations without the shock of late-stage domain migration. This suggests that early exposure not only prevents the representation collapse observed in late fusion but also facilitates smoother gradient landscapes for both modalities. Collectively, these findings reinforce our proposal of native multimodal pre-training: moderate vision ratios combined with early fusion yield superior convergence properties and more robust bi-modal competence under fixed token budgets.
+
+### B.2 Text data
+
+The Kimi K2.5 pre-training text corpus comprises curated, high-quality data spanning four primary domains: Web Text, Code, Mathematics, and Knowledge. Most data processing pipelines follow the methodologies outlined in Kimi K2[[53](https://arxiv.org/html/2602.02276v1#bib.bib108 "Kimi k2: open agentic intelligence")]. For each domain, we performed rigorous correctness and quality validation and designed targeted data experiments to ensure the curated dataset achieved both high diversity and effectiveness.
+
+Enhanced Code Intelligence We upweighted code-centric data, significantly expanding (1) repository-level code supporting cross-file reasoning and architectural understanding, (2) issues, code reviews and commit histories from the internet capturing real-world development patterns, and (3) code-related documents retrieved from PDF and webtext corpora. These efforts strengthen repository-level comprehension for complex coding tasks, improve performance on agentic coding subtasks such as patch generation and unit test writing, and enhance code-related knowledge capabilities.
+
+### B.3 Vision data
+
+Our multimodal pre-training corpus includes seven categories: caption, interleaving, OCR, knowledge, perception, video, and agent data. Caption data[[49](https://arxiv.org/html/2602.02276v1#bib.bib41 "Laion-5b: an open large-scale dataset for training next generation image-text models"), [18](https://arxiv.org/html/2602.02276v1#bib.bib42 "Datacomp: in search of the next generation of multimodal datasets")] provides fundamental modality alignment, with strict limits on synthetic captions to mitigate hallucination. Image-text interleaving data from books, web pages, and tutorials[[81](https://arxiv.org/html/2602.02276v1#bib.bib43 "Multimodal c4: an open, billion-scale corpus of images interleaved with text"), [31](https://arxiv.org/html/2602.02276v1#bib.bib44 "Obelics: an open web-scale filtered dataset of interleaved image-text documents")] enables multi-image comprehension and longer context learning. OCR data spans multilingual text, dense layouts, and multi-page documents. Knowledge data incorporates academic materials processed via layout parsers to develop visual reasoning capabilities.
+
+Furthermore, we curate a specialized multimodal problem-solving corpus to bolster reasoning within Science, Technology, Engineering, and Mathematics domains. This data is aggregated through targeted retrieval and web crawling; for informational content lacking explicit query formats, we employ in-context learning[[10](https://arxiv.org/html/2602.02276v1#bib.bib9 "Language models are few-shot learners")] to automatically reformulate raw materials into structured academic problems spanning K-12 to university levels. To bridge the modality gap between visual layouts and code data, we incorporate extensive image-code paired data. This includes a diverse array of code formats—such as HTML, React, and SVG, among others—paired with their corresponding rendered screenshots, enabling the model to align abstract structural logic with concrete visual geometry.
+
+For agentic and temporal understanding, we collect GUI screenshots and action trajectories across desktop, mobile, and web environments, including human-annotated demonstrations. Video data from diverse sources enables both hour-long video comprehension and fine-grained spatio-temporal perception. Additionally, we incorporate grounding data to enhance fine-grained visual localization, including perception annotations (bounding boxes), point-based references. We also introduce a new contour-level segmentation task[[51](https://arxiv.org/html/2602.02276v1#bib.bib16 "Towards pixel-level vlm perception via simple points prediction")] for pixel-level perception learning. All data undergoes rigorous filtering, deduplication, and quality control to ensure high diversity and effectiveness.
+
+## Appendix C Infra
+
+Kimi K2.5 is trained on NVIDIA H800 GPU clusters with 8\times 400 Gbps RoCE interconnects across nodes. We employ a flexible parallelism strategy combining 16-way Pipeline Parallelism (PP) with virtual stages[[26](https://arxiv.org/html/2602.02276v1#bib.bib10 "GPipe: efficient training of giant neural networks using pipeline parallelism"), [39](https://arxiv.org/html/2602.02276v1#bib.bib11 "Efficient large-scale language model training on gpu clusters using megatron-lm")], 16-way Expert Parallelism (EP)[[32](https://arxiv.org/html/2602.02276v1#bib.bib12 "Gshard: scaling giant models with conditional computation and automatic sharding")], and ZeRO-1 Data Parallelism, enabling training on any number of nodes that is a multiple of 32. EP all-to-all communication is overlapped with computation under interleaved 1F1B scheduling. To fit activations within GPU memory constraints, we apply selective recomputation for LayerNorm, SwiGLU, and MLA up-projections, compress insensitive activations to FP8-E4M3, and offload remaining activations to CPU with overlapped streaming.
+
+### C.1 Data Storage and Loading
+
+We employ S3 [[3](https://arxiv.org/html/2602.02276v1#bib.bib15 "Amazon simple storage service (amazon s3)")] compatible object storage solutions from cloud providers to house our VLM datasets. To bridge the gap between data preparation and model training, we retain visual data in its native format and have engineered a highly efficient and adaptable data loading infrastructure. This infrastructure offers several critical advantages:
+
+*   •Flexibility: Facilitates dynamic data shuffling, blending, tokenization, loss masking, and sequence packing throughout the training process, enabling adjustable data ratios as requirements evolve; 
+*   •Augmentation: Allows for stochastic augmentation of both visual and textual modalities, while maintaining the integrity of 2D spatial coordinates and orientation metadata during geometric transformations; 
+*   •Determinism: Guarantees fully deterministic training through meticulous management of random seeds and worker states, ensuring that any training interruption can be resumed seamlessly — the data sequence after resumption remains identical to an uninterrupted run; 
+*   •Scalability: Achieves superior data loading throughput via tiered caching mechanisms, robustly scaling to large distributed clusters while regulating request frequency to object storage within acceptable bounds. 
+
+Furthermore, to uphold uniform dataset quality standards, we have built a unified platform overseeing data registration, visualization, statistical analysis, cross-cloud synchronization, and lifecycle governance.
+
+## Appendix D Unified Agentic Reinforcement Learning Environment
+
+![Image 10: Refer to caption](https://arxiv.org/html/2602.02276v1/x8.png)
+
+Figure 10: Overview of our agentic RL framework.
+
+##### Environment
+
+To support unified Agentic RL, our RL framework features a standardized Gym-like [[9](https://arxiv.org/html/2602.02276v1#bib.bib195 "OpenAI gym")] interface to streamline the implementation of diverse environments. Such design empowers users to implement and customize environments with minimal overhead. Our design prioritizes compositional modularity by integrating a suite of pluggable components, such as a Toolset module for supporting various tools with sandboxes, a Judge module for multi-faceted reward signals, and specialized modules for prompt diversification and instruction-following enhancement. These components can be dynamically composed with core agent loops, offering high flexibility and enhancing model generalization.
+
+At the execution level, our RL framework treats every agent task as an independent asynchronous coroutine. Each task can recursively trigger sub-task rollouts, simplifying the implementation of complex multi-agent paradigms such as Parallel-Agent RL and Agent-as-Judge. As shown in the figure [10](https://arxiv.org/html/2602.02276v1#A4.F10 "Figure 10 ‣ Appendix D Unified Agentic Reinforcement Learning Environment ‣ Kimi K2.5: Visual Agentic Intelligence"), a dedicated Rollout Manager orchestrates up to 100,000 concurrent agent tasks during the RL process, providing fine-grained control to enable features like partial rollout [[30](https://arxiv.org/html/2602.02276v1#bib.bib107 "Kimi k1. 5: scaling reinforcement learning with llms")]. Upon activation, each task acquires an environment instance from a managed pool, equipped with a sandbox and specialized tools.
+
+##### Inference Engine Co-design
+
+Our framework strictly follows a Token-in-Token-out paradigm. We also record log probabilities for all inference engine outputs to perform train-inference mismatch correction, ensuring stable RL training. A co-design of inference engine for RL requirements has allowed us to support these features by custom inference APIs for RL.
+
+Besides a comprehensive suite of built-in white-box environments, there are also black-box environments that can only run under standard LLM API protocol, missing the opportunity to use advanced features offered by our custom API protocol. To facilitate model optimization under black-box environments, we developed LLM Gateway, which is a proxy service that keeps detailed records of rollout requests and responses under our custom protocol.
+
+##### Monitoring and debugging
+
+It is a challenging task to optimize performance of a highly-parallel asynchronous execution system, while ensuring correctness. We develop a series of tools for performance monitoring, profiling, data visualization and data verification. We found these to be instrumental in debugging and ensuring both the efficiency and correctness of our Agentic RL.
+
+## Appendix E Evaluation Settings
+
+This section provides comprehensive configuration details and testing protocols for all benchmarks reported in Table[4](https://arxiv.org/html/2602.02276v1#S5.T4 "Table 4 ‣ Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence").
+
+### E.1 General Evaluation Protocol
+
+Unless explicitly stated otherwise, all experiments for Kimi-K2.5 adhere to the following hyperparameter configuration:
+
+*   •Temperature:1.0 
+*   •Top-p:0.95 
+*   •Context Length:256\text{k} tokens 
+
+### E.2 Baselines
+
+For baseline models, we report results under their respective high-performance reasoning configurations:
+
+*   •Claude Opus 4.5: Extended thinking mode 
+*   •GPT-5.2: Maximum reasoning effort (xhigh) 
+*   •Gemini 3 Pro: High thinking level 
+*   •DeepSeek-V3.2: Thinking mode enabled (for text-only benchmarks) 
+*   •Qwen3-VL-235B-A22B: Thinking mode (for vision benchmarks only) 
+
+For vision and multimodal benchmarks, GPT-5.2-xhigh exhibited an approximate 10% failure rate (i.e., no output generated despite three retry attempts) during vision evaluations. These failures were treated as incorrect predictions, meaning that the reported scores may be conservative lower bounds of the model’s true capability.
+
+In addition, because we were unable to consistently access a stable GPT-5.2 API, we skipped some benchmarks with high evaluation costs, such as WideSearch.
+
+### E.3 Text Benchmarks
+
+##### Reasoning Benchmarks.
+
+For high-complexity reasoning benchmarks, including HLE-Full, AIME 2025, HMMT 2025, GPQA-Diamond, and IMO-AnswerBench, we enforce a maximum completion budget of 96\text{k} tokens to ensure sufficient reasoning depth. To reduce variance arising from stochastic reasoning paths, results on AIME 2025 and HMMT 2025 (Feb) are averaged over 64 independent runs (Avg@64), while GPQA-Diamond is averaged over 8 runs (Avg@8).
+
+##### LongBench v2.
+
+For a fair comparison, we standardize all input contexts to approximately 128\text{k} tokens using the same truncation strategy as in[[8](https://arxiv.org/html/2602.02276v1#bib.bib34 "LongBench v2: towards deeper understanding and reasoning on realistic long-context multitasks")]. We observe that GPT5.2-xhigh frequently produces free-form question–answer style responses rather than the required multiple-choice format. Therefore, we report results using GPT5.2-high, which consistently adheres to the expected output format.
+
+### E.4 Image and Video Benchmarks
+
+All image and video understanding evaluations utilize the following configuration:
+
+*   •Maximum Tokens:64\text{k} 
+*   •Sampling: Averaged over 3 independent runs (Avg@3) 
+
+##### ZeroBench (w/ tools).
+
+Multi-step reasoning evaluations use constrained step-wise generation:
+
+*   •Max Tokens per Step:24\text{k} 
+*   •Maximum Steps:30 
+
+##### MMMU-Pro.
+
+We adhere strictly to the official evaluation protocol: input order is preserved for all modalities, with images prepended to text sequences as specified in the benchmark guidelines.
+
+##### Sampling Strategies for Video Benchmarks.
+
+For short video benchmarks (VideoMMMU, MMVU & MotionBench), we sample 128 uniform input frames with a maximum spatial resolution at 896; 2048 uniform frames are sampled for long video benchmarks (Video-MME, LongVideoBench & LVBench) with 448 spatial resolution.
+
+##### Specialized Metrics.
+
+*   •OmniDocBench 1.5: Scores are computed as (1-\text{normalized Levenshtein distance})\times 100, where higher values indicate superior OCR and document understanding accuracy. 
+*   •WorldVQA: Access available at [https://github.com/MoonshotAI/WorldVQA](https://github.com/MoonshotAI/WorldVQA). This benchmark evaluates atomic, vision-centric world knowledge requiring fine-grained visual recognition and geographic understanding. 
+
+### E.5 Coding and Software Engineering
+
+##### Terminal Bench 2.0.
+
+All scores are obtained using the default Terminus-2 agent framework with the provided JSON parser. Notably, we evaluate under non-thinking mode because our current context management implementation for thinking mode is technically incompatible with Terminus-2’s conversation state handling.
+
+##### SWE-Bench Series.
+
+We employ an internally developed evaluation framework featuring a minimal tool set: bash, create_file, insert, view, str_replace, and submit. System prompts are specifically tailored for repository-level code manipulation. Peak performance is achieved under non-thinking mode across all SWE-Bench variants (Verified, Multilingual, and Pro).
+
+##### CyberGym.
+
+Claude Opus 4.5 results for this benchmark are reported under non-thinking settings as specified in their technical documentation. We report scores in the difficulty level 1 (the primary setting).
+
+##### PaperBench.
+
+We report the scores under the CodeDev setting.
+
+##### Sampling.
+
+All coding task results are averaged over 5 independent runs (Avg@5) to ensure stability across environment initialization and non-deterministic test case ordering.
+
+### E.6 Agentic Evaluation
+
+##### Tool Setting.
+
+Kimi-K2.5 is equipped with web search tool, code interpreter (Python execution environment), and web browsing tools for all agentic evaluations, including HLE with tools and agentic search benchmarks (BrowseComp, WideSearch, DeepSearchQA, FinSearchComp T2&T3 and Seal-0).
+
+##### Context Management Strategies.
+
+To handle the extended trajectory lengths inherent in complex agentic tasks, we implement domain-specific context management protocols. Unless otherwise specified below, no context management is applied to agentic evaluations; tasks exceeding the model’s supported context window are directly counted as failures rather than truncated.
+
+*   •Humanity’s Last Exam (HLE). For the HLE tool-augmented setting, we employ a Hide-Tool-Result Context Management strategy: when the context length exceeds predefined thresholds, only the most recent round of tool messages (observations and return values) is retained, while the reasoning chain and thinking processes from all previous steps are preserved in full. 
+*   •BrowseComp. For BrowseComp evaluations, our evaluation contains both with and without context management settings. Under the context management setting, we adopt the same discard-all strategy proposed by DeepSeek, where all history is truncated once token thresholds are exceeded. 
+
+##### System Prompt.
+
+All agentic search and HLE evaluations utilize the following unified system prompt, where DATE is dynamically set to the current timestamp:
+
+You are Kimi, today’s date: DATE.
+Your task is to help the user with their questions by using various tools,
+thinking deeply, and ultimately answering the user’s questions.
+
+Please follow the following principles strictly during the deep research:
+1. Always focus on the user’s original question during the research process,
+   avoiding deviating from the topic.
+2. When facing uncertain information, use search tools to confirm.
+3. When searching, filter high-trust sources (such as authoritative websites,
+   academic databases, and professional media) and maintain a critical mindset
+   towards low-trust sources.
+4. When performing numerical calculations, prioritize using programming tools
+   to ensure accuracy.
+5. Please use the format [^index^] to cite any information you use.
+6. This is a **Very Difficult** problemdo not underestimate it. You must use
+   tools to help your reasoning and then solve the problem.
+7. Before you finally give your answer, please recall what the question is
+   asking for.
+
+##### Sampling Protocol.
+
+To account for the inherent stochasticity in search engine result rankings and dynamic web content availability, results for Seal-0 and WideSearch are averaged over 4 independent runs (Avg@4). All other agentic benchmarks are evaluated under single-run protocols unless explicitly stated otherwise.
+
+### E.7 Computer-Use Evaluation
+
+##### Hyperparameter Settings.
+
+We set \texttt{max\_steps\_per\_episode}=100 for all experiments, with \texttt{temperature}=0 for OSWorld-Verified and \texttt{temperature}=0.1 for WebArena. Due to resource constraints, all models are evaluated in a one-shot setting. Adhering to the OpenCUA configuration[[63](https://arxiv.org/html/2602.02276v1#bib.bib6 "OpenCUA: open foundations for computer-use agents")], the agent context includes the last 3 history images, the complete thought history, and the task instruction. For WebArena, we manually corrected errors in the evaluation scripts and employed GPT-4o as the judge model for the fuzzy_match function. To ensure fair comparison, Claude Opus 4.5 is evaluated solely with computer-use tools (excluding browser tools), a departure from the System Card configuration[[4](https://arxiv.org/html/2602.02276v1#bib.bib226 "Claude opus 4.5 system card")].
+
+##### System Prompt
+
+We utilize a unified system prompt for all computer use tasks:
+
+You are a GUI agent. You are given an instruction, a screenshot of the screen and your
+previous interactions with the computer. You need to perform a series of actions to
+complete the task. The password of the computer is {password}.
+
+For each step, provide your response in this format:
+{thought}
+## Action:
+{action}
+## Code:
+{code}
+
+In the code section, the code should be either pyautogui code or one of the following
+functions wrapped in the code block:
+- {"name": "computer.wait", "description": "Make the computer wait for 20 seconds
+for installation, running code, etc.", "parameters": {"type": "object", "properties":
+{}, "required": []}}
+- {"name": "computer.terminate", "description": "Terminate the current task and report
+its completion status", "parameters": {"type": "object", "properties": {"status":
+{"type": "string", "enum": ["success", "failure"], "description": "The status of the
+task"}, "answer": {"type": "string", "description": "The answer of the task"}},
+"required": ["status"]}}
+
+### E.8 Agent Swarm Configuration
+
+##### Tool Setting.
+
+In addition to the core toolset described in Appendix[E.6](https://arxiv.org/html/2602.02276v1#A5.SS6 "E.6 Agentic Evaluation ‣ Appendix E Evaluation Settings ‣ Kimi K2.5: Visual Agentic Intelligence") (web search, code interpreter, and web browsing), the orchestrator is equipped with two specialized tools for sub-agent creation and scheduling:
+
+*   •create_subagent: Instantiates a specialized sub-agent with a custom system prompt and identifier for reuse across tasks. 
+*   •assign_task: Dispatches assignments to created sub-agents. 
+
+The tool schemas are provided below:
+
+{
+ "name": "create_subagent",
+ "description": "Create a custom subagent with specific system prompt
+   and name for reuse.",
+ "parameters": {
+   "type": "object",
+   "properties": {
+     "name": {
+       "type": "string",
+       "description": "Unique name for this agent configuration"
+     },
+     "system_prompt": {
+       "type": "string",
+       "description": "System prompt defining the agent’s role,
+         capabilities, and boundaries"
+     }
+   },
+   "required": ["name", "system_prompt"]
+ }
+}
+{
+ "name": "assign_task",
+ "description": "Launch a new agent.\nUsage notes:\n
+   1. You can launch multiple agents concurrently whenever possible,
+      to maximize performance;\n
+   2. When the agent is done, it will return a single message back to you.",
+ "parameters": {
+   "type": "object",
+   "properties": {
+     "agent": {
+       "type": "string",
+       "description": "Specify which created agent to use."
+     },
+     "prompt": {
+       "type": "string",
+       "description": "The task for the agent to perform"
+     }
+   },
+   "required": ["agent", "prompt"]
+ }
+}
+
+##### Step Limits.
+
+When operating in Agent Swarm mode, we set computational budgets for the orchestrator and sub-agents. Step limits apply to the aggregate count of tool invocations and environment interactions.
+
+*   •BrowseComp: The orchestrator is constrained to a maximum of 15 steps. Each spawned sub-agent operates under a limit of 100 steps (i.e., up to 100 tool calls per sub-agent). 
+*   •WideSearch: Both the orchestrator and each sub-agent are allocated a maximum budget of 100 steps. 
+*   •In-house Bench: The orchestrator is constrained to a maximum of 100 steps. Each spawned sub-agent operates under a limit of 50 steps . 
+
+##### System Prompt.
+
+You are Kimi, a professional and meticulous expert in information collection and organization.
+You fully understand user needs, skillfully use various tools, and complete tasks with the
+highest efficiency.
+# Task Description
+After receiving users’ questions, you need to fully understand their needs and think
+about and plan how to complete the tasks efficiently and quickly.
+# Available Tools
+To help you complete tasks better and faster, I have provided you with the following tools:
+1. Search tool: You can use the search engine to retrieve information, supporting multiple
+queries in parallel.
+2. Browser tools: You can visit web links (web pages, PDFs, etc.), get page content, and
+perform interactions such as clicking, inputting, finding, and scrolling.
+3. Sub Agent tools:
+   - ‘create_subagent‘: Create a new sub-agent with a unique name and clear, specific
+   system prompt.
+   - ‘assign_task‘: Delegate tasks to created sub-agents. Sub-agents can also use search
+   and browser tools.
+4. Other tools: Including code execution (IPython, Shell).
+
+### E.9 GDPVal
+
+We cite the GDPVal-AA evaluation by Artificial Analysis, and the scores reported in Table[4](https://arxiv.org/html/2602.02276v1#S5.T4 "Table 4 ‣ Benchmarks ‣ 5.1.1 Evaluation Settings ‣ 5.1 Main Results ‣ 5 Evaluations ‣ Kimi K2.5: Visual Agentic Intelligence") reflect the official leaderboard metrics as of January 28, 2026.
+
+![Image 11: Refer to caption](https://arxiv.org/html/2602.02276v1/x9.png)
+
+Figure 11: Qualitative example of Kimi K2.5 analyzing a complete playthrough of Black Myth: Wukong (24 hours of continuous gameplay across 32 videos at 1080p) using parallel visual agents. See [generated webpage](https://statics.moonshot.cn/k25-vibe-cases/blackmyth-wukong/index.html) and [source videos](https://www.bilibili.com/video/BV1dbyaBZE8n/) (all rights reserved by source authors).
+
+![Image 12: Refer to caption](https://arxiv.org/html/2602.02276v1/x10.png)
+
+Figure 12: Qualitative examples of Kimi K2.5 solving visual reasoning tasks via tool use.
+
+## Appendix F Visualization
+
+Figure[11](https://arxiv.org/html/2602.02276v1#A5.F11 "Figure 11 ‣ E.9 GDPVal ‣ Appendix E Evaluation Settings ‣ Kimi K2.5: Visual Agentic Intelligence") demonstrates our Agent Swarm tackling a challenging long-form video understanding task: analyzing a complete playthrough of Black Myth: Wukong (24 hours of continuous gameplay across 32 videos, totaling 40GB). The system employs a hierarchical multi-agent architecture where a Main Agent orchestrates parallel Sub Agents to process individual video segments independently. Each sub agent performs frame extraction, temporal event analysis, and key moment identification (e.g., boss fights, level-ups). The Main Agent subsequently aggregates these distributed analyses to synthesize a comprehensive HTML showcase featuring chronological timelines, embedded video clips, and interactive visualizations. This example demonstrates the system’s ability to handle massive-scale multimodal content through parallelization while maintaining coherent long-context understanding.
+
+Figure[12](https://arxiv.org/html/2602.02276v1#A5.F12 "Figure 12 ‣ E.9 GDPVal ‣ Appendix E Evaluation Settings ‣ Kimi K2.5: Visual Agentic Intelligence") presents qualitative examples of Kimi K2.5 solving diverse visual reasoning tasks via tool-augmented reasoning. The model demonstrates: (1) Maze Solving—processing binary image segmentation and implementing pathfinding algorithms (BFS) to navigate complex mazes; (2) Pie Chart Analysis—performing pixel-level color segmentation and geometric calculations to determine precise area proportions; and (3) Spot-the-Difference—employing computer vision techniques to detect pixel-level discrepancies between image pairs. These examples highlight the model’s capability to decompose complex visual problems into executable code, iteratively refine strategies based on intermediate results, and synthesize precise answers through quantitative visual analysis.
diff --git a/apps/room-service/static/favicon.svg b/apps/room-service/static/favicon.svg
new file mode 100644
index 000000000..070e83e2e
--- /dev/null
+++ b/apps/room-service/static/favicon.svg
@@ -0,0 +1,5 @@
+<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 64 64">
+  <rect width="64" height="64" rx="14" fill="#070b14"/>
+  <rect x="12" y="28" width="40" height="14" rx="3" fill="#E0BA55" opacity="0.35"/>
+  <text x="32" y="46" text-anchor="middle" font-family="Inter,system-ui,sans-serif" font-weight="800" font-size="42" fill="white">P</text>
+</svg>
diff --git a/apps/room-service/static/sprite.png b/apps/room-service/static/sprite.png
new file mode 100644
index 000000000..2030b5679
Binary files /dev/null and b/apps/room-service/static/sprite.png differ
diff --git a/apps/room-service/targets/cloudflare.ts b/apps/room-service/targets/cloudflare.ts
new file mode 100644
index 000000000..2d01efeb5
--- /dev/null
+++ b/apps/room-service/targets/cloudflare.ts
@@ -0,0 +1,22 @@
+/**
+ * Cloudflare Worker entrypoint for room.plannotator.ai.
+ *
+ * Routes HTTP requests and WebSocket upgrades to the handler.
+ * Re-exports the Durable Object class for wrangler discovery.
+ */
+
+import { handleRequest } from '../core/handler';
+import { corsHeaders, getAllowedOrigins } from '../core/cors';
+import type { Env } from '../core/types';
+
+export default {
+  async fetch(request: Request, env: Env): Promise<Response> {
+    const origin = request.headers.get('Origin') ?? '';
+    const allowed = getAllowedOrigins(env.ALLOWED_ORIGINS);
+    const allowLocalhost = env.ALLOW_LOCALHOST_ORIGINS === 'true';
+    const cors = corsHeaders(origin, allowed, allowLocalhost);
+    return handleRequest(request, env, cors);
+  },
+};
+
+export { RoomDurableObject } from '../core/room-do';
diff --git a/apps/room-service/tsconfig.browser.json b/apps/room-service/tsconfig.browser.json
new file mode 100644
index 000000000..722f5e0fd
--- /dev/null
+++ b/apps/room-service/tsconfig.browser.json
@@ -0,0 +1,23 @@
+{
+  "//": "Aspirational typecheck for the browser entry. NOT currently a green CI gate — TypeScript follows the AppRoot import into packages/editor + packages/ui, which surface pre-existing implicit-any, missing @types/react, CSS module, and __APP_VERSION__ errors from the broader codebase. Those are shared-package tech-debt items, not room-service issues. Run via: bunx tsc --noEmit -p apps/room-service/tsconfig.browser.json. Entry.tsx itself is clean; the transitive errors are inherited. Once the shared packages carry their own tsconfig with strict: false or the missing declarations are added, this config becomes a usable gate.",
+  "compilerOptions": {
+    "target": "ES2022",
+    "module": "ESNext",
+    "lib": ["ES2022", "DOM", "DOM.Iterable"],
+    "moduleResolution": "bundler",
+    "jsx": "react-jsx",
+    "strict": true,
+    "skipLibCheck": true,
+    "noEmit": true,
+    "allowImportingTsExtensions": true,
+    "isolatedModules": true,
+    "paths": {
+      "@plannotator/ui/*": ["../../packages/ui/*"],
+      "@plannotator/editor": ["../../packages/editor/AppRoot.tsx"],
+      "@plannotator/editor/App": ["../../packages/editor/App.tsx"],
+      "@plannotator/editor/*": ["../../packages/editor/*"],
+      "@plannotator/editor/styles": ["../../packages/editor/index.css"]
+    }
+  },
+  "include": ["entry.tsx", "vite.config.ts"]
+}
diff --git a/apps/room-service/tsconfig.json b/apps/room-service/tsconfig.json
new file mode 100644
index 000000000..28fc62cc9
--- /dev/null
+++ b/apps/room-service/tsconfig.json
@@ -0,0 +1,15 @@
+{
+  "compilerOptions": {
+    "target": "ES2022",
+    "module": "ESNext",
+    "moduleResolution": "bundler",
+    "strict": true,
+    "skipLibCheck": true,
+    "noEmit": true,
+    "allowImportingTsExtensions": true,
+    "isolatedModules": true,
+    "types": ["@cloudflare/workers-types"]
+  },
+  "//exclude": "entry.tsx and vite.config.ts are browser-only and typechecked separately via tsconfig.browser.json (with DOM + React libs). This Worker config stays Cloudflare-scoped.",
+  "exclude": ["**/*.test.ts", "scripts/**", "entry.tsx", "vite.config.ts"]
+}
diff --git a/apps/room-service/vite.config.ts b/apps/room-service/vite.config.ts
new file mode 100644
index 000000000..4ec81fe32
--- /dev/null
+++ b/apps/room-service/vite.config.ts
@@ -0,0 +1,67 @@
+/**
+ * Vite config for the Cloudflare-served live-room editor.
+ *
+ * Opposite constraints from apps/hook:
+ *   - apps/hook: single-file HTML, embedded into a Bun binary that
+ *     streams it over a one-shot localhost HTTP server. Uses
+ *     vite-plugin-singlefile, inlineDynamicImports, and
+ *     assetsInlineLimit=∞ to produce a standalone blob.
+ *   - apps/room-service: served by Cloudflare's [assets] binding.
+ *     Emits normal chunked output (hashed assets/*.js, *.css).
+ *     Wrangler + Cloudflare edge do HTTP/2 multiplexing, Brotli,
+ *     per-chunk edge caching, and immutable Cache-Control on hashed
+ *     assets. Single-file would defeat all of that.
+ *
+ * Aliases mirror apps/hook: @plannotator/editor → AppRoot.tsx so the
+ * default import is room-mode-aware; @plannotator/editor/App remains
+ * available for callers that explicitly want the local shell.
+ */
+
+import path from 'path';
+import { defineConfig } from 'vite';
+import react from '@vitejs/plugin-react';
+import tailwindcss from '@tailwindcss/vite';
+import pkg from '../../package.json';
+
+export default defineConfig({
+  base: '/',
+  define: {
+    __APP_VERSION__: JSON.stringify(pkg.version),
+  },
+  plugins: [react(), tailwindcss()],
+  resolve: {
+    alias: {
+      '@plannotator/ui': path.resolve(__dirname, '../../packages/ui'),
+      '@plannotator/editor/styles': path.resolve(__dirname, '../../packages/editor/index.css'),
+      '@plannotator/editor/App': path.resolve(__dirname, '../../packages/editor/App.tsx'),
+      '@plannotator/editor': path.resolve(__dirname, '../../packages/editor/AppRoot.tsx'),
+    },
+  },
+  // Static assets (favicon.svg) are copied verbatim from ./static/ into
+  // the build output root. Vite's default publicDir is 'public' but our
+  // outDir is also 'public' — using a separate 'static' avoids the
+  // "publicDir and outDir overlap" warning.
+  publicDir: 'static',
+  build: {
+    outDir: 'public',
+    emptyOutDir: true,
+    target: 'esnext',
+    // No singlefile, no inlineDynamicImports, no bloated
+    // assetsInlineLimit — default Vite chunk shape is what Cloudflare
+    // wants. Hashed filenames in assets/ allow indefinite caching with
+    // the handler's immutable Cache-Control header.
+    rollupOptions: {
+      output: {
+        // Keep the Vite default naming: [name]-[hash].js under assets/,
+        // which the handler's /assets/* passthrough serves verbatim.
+      },
+    },
+  },
+  server: {
+    // Not used for deploy — just for local `vite` dev if someone wants
+    // to iterate on the room UI without Wrangler. The Worker still
+    // serves the compiled output.
+    port: 3002,
+    host: '0.0.0.0',
+  },
+});
diff --git a/apps/room-service/wrangler.toml b/apps/room-service/wrangler.toml
new file mode 100644
index 000000000..b064cbbf4
--- /dev/null
+++ b/apps/room-service/wrangler.toml
@@ -0,0 +1,33 @@
+name = "plannotator-room"
+main = "targets/cloudflare.ts"
+compatibility_date = "2024-12-01"
+compatibility_flags = ["nodejs_compat_v2"]
+
+# Chunked Vite build output lives in ./public (index.html + hashed
+# assets/*.js, *.css). Produced by `bun run build:shell` from
+# apps/room-service/vite.config.ts. The directory is gitignored —
+# always generated, never checked in. The Worker's handler rewrites
+# /c/:roomId → /index.html and /assets/* → passthrough with long-lived
+# immutable Cache-Control on hashed chunks; see core/handler.ts.
+[assets]
+directory = "./public"
+binding = "ASSETS"
+run_worker_first = true
+html_handling = "none"
+
+[[durable_objects.bindings]]
+name = "ROOM"
+class_name = "RoomDurableObject"
+
+[[migrations]]
+tag = "v1"
+new_sqlite_classes = ["RoomDurableObject"]
+
+[[routes]]
+pattern = "room.plannotator.ai"
+custom_domain = true
+
+[vars]
+ALLOWED_ORIGINS = "https://room.plannotator.ai"
+ALLOW_LOCALHOST_ORIGINS = "true"
+BASE_URL = "https://room.plannotator.ai"
diff --git a/bun.lock b/bun.lock
index 0eada16a0..383b45899 100644
--- a/bun.lock
+++ b/bun.lock
@@ -20,6 +20,19 @@
         "@types/node": "^25.5.2",
         "@types/turndown": "^5.0.6",
         "bun-types": "^1.3.11",
+        "wrangler": "^4.81.1",
+      },
+    },
+    "apps/collab-agent": {
+      "name": "@plannotator/collab-agent",
+      "version": "0.1.0",
+      "dependencies": {
+        "@plannotator/shared": "workspace:*",
+        "@plannotator/ui": "workspace:*",
+      },
+      "devDependencies": {
+        "bun-types": "^1.3.11",
+        "typescript": "~5.8.2",
       },
     },
     "apps/hook": {
@@ -143,6 +156,28 @@
         "vite-plugin-singlefile": "^2.0.3",
       },
     },
+    "apps/room-service": {
+      "name": "@plannotator/room-service",
+      "version": "0.1.0",
+      "dependencies": {
+        "@plannotator/editor": "workspace:*",
+        "@plannotator/shared": "workspace:*",
+        "@plannotator/ui": "workspace:*",
+        "react": "^19.2.3",
+        "react-dom": "^19.2.3",
+      },
+      "devDependencies": {
+        "@cloudflare/workers-types": "^4.20241218.0",
+        "@tailwindcss/vite": "^4.1.18",
+        "@types/react": "^19.2.0",
+        "@types/react-dom": "^19.2.0",
+        "@vitejs/plugin-react": "^5.0.0",
+        "tailwindcss": "^4.1.18",
+        "typescript": "~5.8.2",
+        "vite": "^6.2.0",
+        "wrangler": "^4.80.0",
+      },
+    },
     "apps/vscode-extension": {
       "name": "plannotator-webview",
       "version": "0.16.5",
@@ -169,6 +204,12 @@
         "sonner": "^2.0.7",
         "tailwindcss": "^4.1.18",
       },
+      "devDependencies": {
+        "@happy-dom/global-registrator": "^20.8.9",
+        "@testing-library/react": "^16.3.2",
+        "@types/react": "^19.2.0",
+        "@types/react-dom": "^19.2.0",
+      },
     },
     "packages/review-editor": {
       "name": "@plannotator/review-editor",
@@ -235,10 +276,13 @@
         "unique-username-generator": "^1.5.1",
       },
       "devDependencies": {
+        "@happy-dom/global-registrator": "^20.8.9",
+        "@testing-library/react": "^16.3.2",
         "@types/bun": "^1.2.0",
         "@types/dompurify": "^3.0.5",
         "@types/react": "^19.2.0",
         "@types/react-dom": "^19.2.0",
+        "happy-dom": "^20.8.9",
         "typescript": "~5.8.2",
       },
     },
@@ -418,19 +462,19 @@
 
     "@chevrotain/utils": ["@chevrotain/utils@11.0.3", "", {}, "sha512-YslZMgtJUyuMbZ+aKvfF3x1f5liK4mWNxghFRv7jqRR9C3R3fAOGTTKvxXDa2Y1s9zSbcpuO0cAxDYsc9SrXoQ=="],
 
-    "@cloudflare/kv-asset-handler": ["@cloudflare/kv-asset-handler@0.3.4", "", { "dependencies": { "mime": "^3.0.0" } }, "sha512-YLPHc8yASwjNkmcDMQMY35yiWjoKAKnhUbPRszBRS0YgH+IXtsMp61j+yTcnCE3oO2DgP0U3iejLC8FTtKDC8Q=="],
+    "@cloudflare/kv-asset-handler": ["@cloudflare/kv-asset-handler@0.5.0", "", {}, "sha512-jxQYkj8dSIzc0cD6cMMNdOc1UVjqSqu8BZdor5s8cGjW2I8BjODt/kWPVdY+u9zj3ms75Q5qaZgnxUad83+eAg=="],
 
-    "@cloudflare/unenv-preset": ["@cloudflare/unenv-preset@2.0.2", "", { "peerDependencies": { "unenv": "2.0.0-rc.14", "workerd": "^1.20250124.0" }, "optionalPeers": ["workerd"] }, "sha512-nyzYnlZjjV5xT3LizahG1Iu6mnrCaxglJ04rZLpDwlDVDZ7v46lNsfxhV3A/xtfgQuSHmLnc6SVI+KwBpc3Lwg=="],
+    "@cloudflare/unenv-preset": ["@cloudflare/unenv-preset@2.16.1", "", { "peerDependencies": { "unenv": "2.0.0-rc.24", "workerd": ">1.20260305.0 <2.0.0-0" }, "optionalPeers": ["workerd"] }, "sha512-ECxObrMfyTl5bhQf/lZCXwo5G6xX9IAUo+nDMKK4SZ8m4Jvvxp52vilxyySSWh2YTZz8+HQ07qGH/2rEom1vDw=="],
 
-    "@cloudflare/workerd-darwin-64": ["@cloudflare/workerd-darwin-64@1.20250718.0", "", { "os": "darwin", "cpu": "x64" }, "sha512-FHf4t7zbVN8yyXgQ/r/GqLPaYZSGUVzeR7RnL28Mwj2djyw2ZergvytVc7fdGcczl6PQh+VKGfZCfUqpJlbi9g=="],
+    "@cloudflare/workerd-darwin-64": ["@cloudflare/workerd-darwin-64@1.20260504.1", "", { "os": "darwin", "cpu": "x64" }, "sha512-IOMjYoftNRXabFt+QzY2Bo2mR2TNl8xsGvE0HnQ+K0S2c61VOUGUkr9gpJjnwrJ65yA9Qed4xfg0RRqXHO+nfA=="],
 
-    "@cloudflare/workerd-darwin-arm64": ["@cloudflare/workerd-darwin-arm64@1.20250718.0", "", { "os": "darwin", "cpu": "arm64" }, "sha512-fUiyUJYyqqp4NqJ0YgGtp4WJh/II/YZsUnEb6vVy5Oeas8lUOxnN+ZOJ8N/6/5LQCVAtYCChRiIrBbfhTn5Z8Q=="],
+    "@cloudflare/workerd-darwin-arm64": ["@cloudflare/workerd-darwin-arm64@1.20260504.1", "", { "os": "darwin", "cpu": "arm64" }, "sha512-7iMXxIU0N5KklZpQm2kuwTm0XtrpHXNqhejJyGquky8gSTnm31zBdutjMekH8VRr6ckbvZIl6lvqXzXdfOEojg=="],
 
-    "@cloudflare/workerd-linux-64": ["@cloudflare/workerd-linux-64@1.20250718.0", "", { "os": "linux", "cpu": "x64" }, "sha512-5+eb3rtJMiEwp08Kryqzzu8d1rUcK+gdE442auo5eniMpT170Dz0QxBrqkg2Z48SFUPYbj+6uknuA5tzdRSUSg=="],
+    "@cloudflare/workerd-linux-64": ["@cloudflare/workerd-linux-64@1.20260504.1", "", { "os": "linux", "cpu": "x64" }, "sha512-YLB0EH5FQV++oWlalFgPF3p2Bp3dn/D6RWNMw0ukEC8gKnNX6o61A+dlFUl8hRD35ja1zKRxGFUojs4U2+MoJA=="],
 
-    "@cloudflare/workerd-linux-arm64": ["@cloudflare/workerd-linux-arm64@1.20250718.0", "", { "os": "linux", "cpu": "arm64" }, "sha512-Aa2M/DVBEBQDdATMbn217zCSFKE+ud/teS+fFS+OQqKABLn0azO2qq6ANAHYOIE6Q3Sq4CxDIQr8lGdaJHwUog=="],
+    "@cloudflare/workerd-linux-arm64": ["@cloudflare/workerd-linux-arm64@1.20260504.1", "", { "os": "linux", "cpu": "arm64" }, "sha512-FAh/82jDXDArfn9xDih6f/IJfF2SHXBb4nFeQAyHyvXrn18zM6Q3yl2Vj0U7LybbNbmu7TNGghwaM2NoSQS+0A=="],
 
-    "@cloudflare/workerd-windows-64": ["@cloudflare/workerd-windows-64@1.20250718.0", "", { "os": "win32", "cpu": "x64" }, "sha512-dY16RXKffmugnc67LTbyjdDHZn5NoTF1yHEf2fN4+OaOnoGSp3N1x77QubTDwqZ9zECWxgQfDLjddcH8dWeFhg=="],
+    "@cloudflare/workerd-windows-64": ["@cloudflare/workerd-windows-64@1.20260504.1", "", { "os": "win32", "cpu": "x64" }, "sha512-QUg/B3dfrK/KHHHhiJzdkLkTg5mG7lA3t8iplbBoUa3XKCLOHOOXhbU4WSYlLqg8YnsQ6XLZ1HVA99fmZhJh7A=="],
 
     "@cloudflare/workers-types": ["@cloudflare/workers-types@4.20260301.1", "", {}, "sha512-klKnECMb5A4GtVF0P5NH6rCjtyjqIEKJaz6kEtx9YPHhfFO2HUEarO+MI4F8WPchgeZqpGlEpDhRapzrOTw51Q=="],
 
@@ -484,7 +528,7 @@
 
     "@esbuild/openbsd-x64": ["@esbuild/openbsd-x64@0.24.2", "", { "os": "openbsd", "cpu": "x64" }, "sha512-+iDS6zpNM6EnJyWv0bMGLWSWeXGN/HTaF/LXHXHwejGsVi+ooqDfMCCTerNFxEkM3wYVcExkeGXNqshc9iMaOA=="],
 
-    "@esbuild/openharmony-arm64": ["@esbuild/openharmony-arm64@0.25.12", "", { "os": "none", "cpu": "arm64" }, "sha512-rm0YWsqUSRrjncSXGA7Zv78Nbnw4XL6/dzr20cyrQf7ZmRcsovpcRBdhD43Nuk3y7XIoW2OxMVvwuRvk9XdASg=="],
+    "@esbuild/openharmony-arm64": ["@esbuild/openharmony-arm64@0.27.3", "", { "os": "none", "cpu": "arm64" }, "sha512-NinAEgr/etERPTsZJ7aEZQvvg/A6IsZG/LgZy+81wON2huV7SrK3e63dU0XhyZP4RKGyTm7aOgmQk0bGp0fy2g=="],
 
     "@esbuild/sunos-x64": ["@esbuild/sunos-x64@0.24.2", "", { "os": "sunos", "cpu": "x64" }, "sha512-hTdsW27jcktEvpwNHJU4ZwWFGkz2zRJUz8pvddmXPtXDzVKTTINmlmga3ZzwcuMpUvLw7JkLy9QLKyGpD2Yxig=="],
 
@@ -506,6 +550,8 @@
 
     "@google/genai": ["@google/genai@1.42.0", "", { "dependencies": { "google-auth-library": "^10.3.0", "p-retry": "^4.6.2", "protobufjs": "^7.5.4", "ws": "^8.18.0" }, "peerDependencies": { "@modelcontextprotocol/sdk": "^1.25.2" }, "optionalPeers": ["@modelcontextprotocol/sdk"] }, "sha512-+3nlMTcrQufbQ8IumGkOphxD5Pd5kKyJOzLcnY0/1IuE8upJk5aLmoexZ2BJhBp1zAjRJMEB4a2CJwKI9e2EYw=="],
 
+    "@happy-dom/global-registrator": ["@happy-dom/global-registrator@20.9.0", "", { "dependencies": { "@types/node": ">=20.0.0", "happy-dom": "^20.9.0" } }, "sha512-lBW6/m5BIFl3pMuWPNN0lIOYw9LMCmPfix53ExS3FBi4E+NELEljQ3xH6aAV9IYiQRfn9YIIgzzMrD0vIcD7tw=="],
+
     "@hono/node-server": ["@hono/node-server@1.19.11", "", { "peerDependencies": { "hono": "^4" } }, "sha512-dr8/3zEaB+p0D2n/IUrlPF1HZm586qgJNXK1a9fhg/PzdtkK7Ksd5l312tJX2yBuALqDYBlG20QEbayqPyxn+g=="],
 
     "@iconify/types": ["@iconify/types@2.0.0", "", {}, "sha512-+wluvCrRhXrhyOmRDJ3q8mux9JkKy5SJ/v8ol2tu4FVjyYvtEzkc/3pK15ET6RKg4b4w4BmTk1+gsCUhf21Ykg=="],
@@ -574,7 +620,7 @@
 
     "@jridgewell/sourcemap-codec": ["@jridgewell/sourcemap-codec@1.5.5", "", {}, "sha512-cYQ9310grqxueWbl+WuIUIaiUaDcj7WOq5fVhEljNVgRfOUhY9fy2zTvfoqWsnebh8Sl70VScFbICvJnLKB0Og=="],
 
-    "@jridgewell/trace-mapping": ["@jridgewell/trace-mapping@0.3.31", "", { "dependencies": { "@jridgewell/resolve-uri": "^3.1.0", "@jridgewell/sourcemap-codec": "^1.4.14" } }, "sha512-zzNR+SdQSDJzc8joaeP8QQoCQr8NuYx2dIIytl1QeBEZHJ9uW6hebsrYgbz8hJwUQao3TWCMtmfV8Nu1twOLAw=="],
+    "@jridgewell/trace-mapping": ["@jridgewell/trace-mapping@0.3.9", "", { "dependencies": { "@jridgewell/resolve-uri": "^3.0.3", "@jridgewell/sourcemap-codec": "^1.4.10" } }, "sha512-3Belt6tdc8bPgAtbcmdtNJlirVoTmEb5e2gC94PnkwEW9jI6CAHUeoG85tjWP5WquqfavoMtMwiG4P926ZKKuQ=="],
 
     "@mariozechner/clipboard": ["@mariozechner/clipboard@0.3.2", "", { "optionalDependencies": { "@mariozechner/clipboard-darwin-arm64": "0.3.2", "@mariozechner/clipboard-darwin-universal": "0.3.2", "@mariozechner/clipboard-darwin-x64": "0.3.2", "@mariozechner/clipboard-linux-arm64-gnu": "0.3.2", "@mariozechner/clipboard-linux-arm64-musl": "0.3.2", "@mariozechner/clipboard-linux-riscv64-gnu": "0.3.2", "@mariozechner/clipboard-linux-x64-gnu": "0.3.2", "@mariozechner/clipboard-linux-x64-musl": "0.3.2", "@mariozechner/clipboard-win32-arm64-msvc": "0.3.2", "@mariozechner/clipboard-win32-x64-msvc": "0.3.2" } }, "sha512-IHQpksNjo7EAtGuHFU+tbWDp5LarH3HU/8WiB9O70ZEoBPHOg0/6afwSLK0QyNMMmx4Bpi/zl6+DcBXe95nWYA=="],
 
@@ -676,6 +722,8 @@
 
     "@plannotator/ai": ["@plannotator/ai@workspace:packages/ai"],
 
+    "@plannotator/collab-agent": ["@plannotator/collab-agent@workspace:apps/collab-agent"],
+
     "@plannotator/editor": ["@plannotator/editor@workspace:packages/editor"],
 
     "@plannotator/hooks": ["@plannotator/hooks@workspace:apps/hook"],
@@ -694,6 +742,8 @@
 
     "@plannotator/review-editor": ["@plannotator/review-editor@workspace:packages/review-editor"],
 
+    "@plannotator/room-service": ["@plannotator/room-service@workspace:apps/room-service"],
+
     "@plannotator/server": ["@plannotator/server@workspace:packages/server"],
 
     "@plannotator/shared": ["@plannotator/shared@workspace:packages/shared"],
@@ -702,6 +752,12 @@
 
     "@plannotator/web-highlighter": ["@plannotator/web-highlighter@0.8.1", "", {}, "sha512-FlteNOwRj9iNSY/AhFMtqOnVS4FvsACvTw6IiOM1y8iDyhiU/WeZOgjURENvIY+wuUaiS9DDFmg0PrHMyuMR1Q=="],
 
+    "@poppinss/colors": ["@poppinss/colors@4.1.6", "", { "dependencies": { "kleur": "^4.1.5" } }, "sha512-H9xkIdFswbS8n1d6vmRd8+c10t2Qe+rZITbbDHHkQixH5+2x1FDGmi/0K+WgWiqQFKPSlIYB7jlH6Kpfn6Fleg=="],
+
+    "@poppinss/dumper": ["@poppinss/dumper@0.6.5", "", { "dependencies": { "@poppinss/colors": "^4.1.5", "@sindresorhus/is": "^7.0.2", "supports-color": "^10.0.0" } }, "sha512-NBdYIb90J7LfOI32dOewKI1r7wnkiH6m920puQ3qHUeZkxNkQiFnXVWoE6YtFSv6QOiPPf7ys6i+HWWecDz7sw=="],
+
+    "@poppinss/exception": ["@poppinss/exception@1.2.3", "", {}, "sha512-dCED+QRChTVatE9ibtoaxc+WkdzOSjYTKi/+uacHWIsfodVfpsueo3+DKpgU5Px8qXjgmXkSvhXvSCz3fnP9lw=="],
+
     "@protobufjs/aspromise": ["@protobufjs/aspromise@1.1.2", "", {}, "sha512-j+gKExEuLmKwvz3OgROXtrJ2UG2x8Ch2YZUxahh+s1F2HZ+wAceUNLkvy6zKCPVRkU++ZWQrdxsUeQXmcg4uoQ=="],
 
     "@protobufjs/base64": ["@protobufjs/base64@1.1.2", "", {}, "sha512-AZkcAA5vnN/v4PDqKyMR5lx7hZttPDgClv83E//FMNhR2TMcLUhfRUBHCmSl0oi9zMgDDqRUJkSxO3wm85+XLg=="],
@@ -882,6 +938,8 @@
 
     "@sinclair/typebox": ["@sinclair/typebox@0.34.48", "", {}, "sha512-kKJTNuK3AQOrgjjotVxMrCn1sUJwM76wMszfq1kdU4uYVJjvEWuFQ6HgvLt4Xz3fSmZlTOxJ/Ie13KnIcWQXFA=="],
 
+    "@sindresorhus/is": ["@sindresorhus/is@7.2.0", "", {}, "sha512-P1Cz1dWaFfR4IR+U13mqqiGsLFf1KbayybWwdd2vfctdV6hDpUkgCY0nKOLLTMSoRd/jJNjtbqzf13K8DCCXQw=="],
+
     "@sindresorhus/merge-streams": ["@sindresorhus/merge-streams@2.3.0", "", {}, "sha512-LtoMMhxAlorcGhmFYI+LhPgbPZCkgP6ra1YL604EeF6U98pLlQ3iWIGMdWSC+vWmPBWBNgmDBAhnAobLROJmwg=="],
 
     "@smithy/abort-controller": ["@smithy/abort-controller@4.2.8", "", { "dependencies": { "@smithy/types": "^4.12.0", "tslib": "^2.6.2" } }, "sha512-peuVfkYHAmS5ybKxWcfraK7WBBP0J+rkfUcbHJJKQ4ir3UAUNQI+Y4Vt/PqSzGqgloJ5O1dk7+WzNL8wcCSXbw=="],
@@ -974,6 +1032,8 @@
 
     "@smithy/uuid": ["@smithy/uuid@1.1.0", "", { "dependencies": { "tslib": "^2.6.2" } }, "sha512-4aUIteuyxtBUhVdiQqcDhKFitwfd9hqoSDYY2KRXiWtgoWJ9Bmise+KfEPDiVHWeJepvF8xJO9/9+WDIciMFFw=="],
 
+    "@speed-highlight/core": ["@speed-highlight/core@1.2.15", "", {}, "sha512-BMq1K3DsElxDWawkX6eLg9+CKJrTVGCBAWVuHXVUV2u0s2711qiChLSId6ikYPfxhdYocLNt3wWwSvDiTvFabw=="],
+
     "@tailwindcss/node": ["@tailwindcss/node@4.1.18", "", { "dependencies": { "@jridgewell/remapping": "^2.3.4", "enhanced-resolve": "^5.18.3", "jiti": "^2.6.1", "lightningcss": "1.30.2", "magic-string": "^0.30.21", "source-map-js": "^1.2.1", "tailwindcss": "4.1.18" } }, "sha512-DoR7U1P7iYhw16qJ49fgXUlry1t4CpXeErJHnQ44JgTSKMaZUdf17cfn5mHchfJ4KRBZRFA/Coo+MUF5+gOaCQ=="],
 
     "@tailwindcss/oxide": ["@tailwindcss/oxide@4.1.18", "", { "optionalDependencies": { "@tailwindcss/oxide-android-arm64": "4.1.18", "@tailwindcss/oxide-darwin-arm64": "4.1.18", "@tailwindcss/oxide-darwin-x64": "4.1.18", "@tailwindcss/oxide-freebsd-x64": "4.1.18", "@tailwindcss/oxide-linux-arm-gnueabihf": "4.1.18", "@tailwindcss/oxide-linux-arm64-gnu": "4.1.18", "@tailwindcss/oxide-linux-arm64-musl": "4.1.18", "@tailwindcss/oxide-linux-x64-gnu": "4.1.18", "@tailwindcss/oxide-linux-x64-musl": "4.1.18", "@tailwindcss/oxide-wasm32-wasi": "4.1.18", "@tailwindcss/oxide-win32-arm64-msvc": "4.1.18", "@tailwindcss/oxide-win32-x64-msvc": "4.1.18" } }, "sha512-EgCR5tTS5bUSKQgzeMClT6iCY3ToqE1y+ZB0AKldj809QXk1Y+3jB0upOYZrn9aGIzPtUsP7sX4QQ4XtjBB95A=="],
@@ -1008,6 +1068,10 @@
 
     "@tanstack/table-core": ["@tanstack/table-core@8.21.3", "", {}, "sha512-ldZXEhOBb8Is7xLs01fR3YEc3DERiz5silj8tnGkFZytt1abEvl/GhUmCE0PMLaMPTa3Jk4HbKmRlHmu+gCftg=="],
 
+    "@testing-library/dom": ["@testing-library/dom@10.4.1", "", { "dependencies": { "@babel/code-frame": "^7.10.4", "@babel/runtime": "^7.12.5", "@types/aria-query": "^5.0.1", "aria-query": "5.3.0", "dom-accessibility-api": "^0.5.9", "lz-string": "^1.5.0", "picocolors": "1.1.1", "pretty-format": "^27.0.2" } }, "sha512-o4PXJQidqJl82ckFaXUeoAW+XysPLauYI43Abki5hABd853iMhitooc6znOnczgbTYmEP6U6/y1ZyKAIsvMKGg=="],
+
+    "@testing-library/react": ["@testing-library/react@16.3.2", "", { "dependencies": { "@babel/runtime": "^7.12.5" }, "peerDependencies": { "@testing-library/dom": "^10.0.0", "@types/react": "^18.0.0 || ^19.0.0", "@types/react-dom": "^18.0.0 || ^19.0.0", "react": "^18.0.0 || ^19.0.0", "react-dom": "^18.0.0 || ^19.0.0" }, "optionalPeers": ["@types/react", "@types/react-dom"] }, "sha512-XU5/SytQM+ykqMnAnvB2umaJNIOsLF3PVv//1Ew4CTcpz0/BRyy/af40qqrt7SjKpDdT1saBMc42CUok5gaw+g=="],
+
     "@textlint/ast-node-types": ["@textlint/ast-node-types@15.5.2", "", {}, "sha512-fCaOxoup5LIyBEo7R1oYWE7V4bSX0KQeHh66twon9e9usaLE3ijgF8QjYsR6joCssdeCHVd0wHm7ppsEyTr6vg=="],
 
     "@textlint/linter-formatter": ["@textlint/linter-formatter@15.5.2", "", { "dependencies": { "@azu/format-text": "^1.0.2", "@azu/style-format": "^1.0.1", "@textlint/module-interop": "15.5.2", "@textlint/resolver": "15.5.2", "@textlint/types": "15.5.2", "chalk": "^4.1.2", "debug": "^4.4.3", "js-yaml": "^4.1.1", "lodash": "^4.17.23", "pluralize": "^2.0.0", "string-width": "^4.2.3", "strip-ansi": "^6.0.1", "table": "^6.9.0", "text-table": "^0.2.0" } }, "sha512-jAw7jWM8+wU9cG6Uu31jGyD1B+PAVePCvnPKC/oov+2iBPKk3ao30zc/Itmi7FvXo4oPaL9PmzPPQhyniPVgVg=="],
@@ -1024,6 +1088,8 @@
 
     "@tootallnate/quickjs-emscripten": ["@tootallnate/quickjs-emscripten@0.23.0", "", {}, "sha512-C5Mc6rdnsaJDjO3UpGW/CQTHtCKaYlScZTly4JIu97Jxo/odCiH0ITnDXSJPTOrEKk/ycSZ0AOgTmkDtkOsvIA=="],
 
+    "@types/aria-query": ["@types/aria-query@5.0.4", "", {}, "sha512-rfT93uj5s0PRL7EzccGMs3brplhcrghnDoV26NqKhCAS1hVo+WdNsPvE/yb6ilfr5hi2MEk6d5EWJTKdxg8jVw=="],
+
     "@types/babel__core": ["@types/babel__core@7.20.5", "", { "dependencies": { "@babel/parser": "^7.20.7", "@babel/types": "^7.20.7", "@types/babel__generator": "*", "@types/babel__template": "*", "@types/babel__traverse": "*" } }, "sha512-qoQprZvz5wQFJwMDqeseRXWv3rqMvhgpbXFfVyWhbx9X47POIA6i/+dXefEmZKoAgOaTdaIgNSMqMIU61yRyzA=="],
 
     "@types/babel__generator": ["@types/babel__generator@7.27.0", "", { "dependencies": { "@babel/types": "^7.0.0" } }, "sha512-ufFd2Xi92OAVPYsy+P4n7/U7e68fex0+Ee8gSG9KX7eo084CWiQ4sdxktvdl0bOPupXtVJPY19zk6EwWqUQ8lg=="],
@@ -1140,6 +1206,10 @@
 
     "@types/vscode": ["@types/vscode@1.109.0", "", {}, "sha512-0Pf95rnwEIwDbmXGC08r0B4TQhAbsHQ5UyTIgVgoieDe4cOnf92usuR5dEczb6bTKEp7ziZH4TV1TRGPPCExtw=="],
 
+    "@types/whatwg-mimetype": ["@types/whatwg-mimetype@3.0.2", "", {}, "sha512-c2AKvDT8ToxLIOUlN51gTiHXflsfIFisS4pO7pDPoKouJCESkhZnEy623gwP9laCy5lnLDAw1vAzu2vM2YLOrA=="],
+
+    "@types/ws": ["@types/ws@8.18.1", "", { "dependencies": { "@types/node": "*" } }, "sha512-ThVF6DCVhA8kUGy+aazFQ4kXQ7E1Ty7A3ypFOe0IcJV8O/M511G99AW24irKrW56Wt44yG9+ij8FaqoBGkuBXg=="],
+
     "@typespec/ts-http-runtime": ["@typespec/ts-http-runtime@0.3.3", "", { "dependencies": { "http-proxy-agent": "^7.0.0", "https-proxy-agent": "^7.0.0", "tslib": "^2.6.2" } }, "sha512-91fp6CAAJSRtH5ja95T1FHSKa8aPW9/Zw6cta81jlZTUw/+Vq8jM/AfF/14h2b71wwR84JUTW/3Y8QPhDAawFA=="],
 
     "@ungap/structured-clone": ["@ungap/structured-clone@1.3.0", "", {}, "sha512-WmoN8qaIAo7WTYWbAZuG8PYEhn5fkz7dZrqTBZ7dtt//lL2Gwms1IcnQ5yHqjDfX8Ft5j4YzDM23f87zBfDe9g=="],
@@ -1188,7 +1258,7 @@
 
     "ansi-escapes": ["ansi-escapes@7.3.0", "", { "dependencies": { "environment": "^1.0.0" } }, "sha512-BvU8nYgGQBxcmMuEeUEmNTvrMVjJNSH7RgW24vXexN4Ven6qCvy4TntnvlnwnMLTVlcRQQdbRY8NKnaIoeWDNg=="],
 
-    "ansi-regex": ["ansi-regex@6.2.2", "", {}, "sha512-Bq3SmSpyFHaWjPk8If9yc6svM8c56dB5BAtW4Qbw5jHTwwXXcTLoRMkpDJp6VL0XzlWaCHTXrkFURMYmD0sLqg=="],
+    "ansi-regex": ["ansi-regex@5.0.1", "", {}, "sha512-quJQXlTSUGL2LH9SUXo8VwsY4soanhgo6LNSm84E1LBcE8s3O0wpdiRzyR9z/ZZJMlMWv37qOOb9pdJlMUEKFQ=="],
 
     "ansi-styles": ["ansi-styles@4.3.0", "", { "dependencies": { "color-convert": "^2.0.1" } }, "sha512-zbB9rCJAT1rbjiVDb2hqKFHNYLxgtk8NURxZ3IZwD3F6NtxbXZQCnnSi1Lkx+IDohdPlFp222wVALIheZJQSEg=="],
 
@@ -1494,6 +1564,8 @@
 
     "dockview-react": ["dockview-react@5.2.0", "", { "dependencies": { "dockview": "^5.2.0" } }, "sha512-xJU5EiViiYYoP0ez5KxN8I+5CWSiPC27KVgVJBpRYRYJN6wKjMUpUqqSHwTlN1PGw5OzCu7UGQlUl1RQew74ag=="],
 
+    "dom-accessibility-api": ["dom-accessibility-api@0.5.16", "", {}, "sha512-X7BJ2yElsnOJ30pZF4uIIDfBEVgF4XEBxL9Bxhy6dnrm5hkzqmsWHGTiHqRiITNhMyFLyAiWndIJP7Z1NTteDg=="],
+
     "dom-serializer": ["dom-serializer@2.0.0", "", { "dependencies": { "domelementtype": "^2.3.0", "domhandler": "^5.0.2", "entities": "^4.2.0" } }, "sha512-wIkAryiqt/nV5EQKqQpo3SToSOV9J0DnbJqwK7Wv/Trc92zIAYZ4FlMu+JPFW1DfGFt81ZTCGgDEabffXeLyJg=="],
 
     "domelementtype": ["domelementtype@2.3.0", "", {}, "sha512-OLETBj6w0OsagBwdXnPdN0cnMfF9opN69co+7ZrbfPGrdpPVNBUj02spi6B1N7wChLQiPn4CSH/zJvXw56gmHw=="],
@@ -1528,10 +1600,12 @@
 
     "enhanced-resolve": ["enhanced-resolve@5.18.4", "", { "dependencies": { "graceful-fs": "^4.2.4", "tapable": "^2.2.0" } }, "sha512-LgQMM4WXU3QI+SYgEc2liRgznaD5ojbmY3sb8LxyguVkIg5FxdpTkvk72te2R38/TGKxH634oLxXRGY6d7AP+Q=="],
 
-    "entities": ["entities@4.5.0", "", {}, "sha512-V0hjH4dGPh9Ao5p0MoRY6BVqtwCjhz6vI5LT8AJ55H+4g9/4vbHx1I54fS0XuclLhDHArPQCiMjDxjaL8fPxhw=="],
+    "entities": ["entities@7.0.1", "", {}, "sha512-TWrgLOFUQTH994YUyl1yT4uyavY5nNB5muff+RtWaqNVCAK408b5ZnnbNAUEWLTCpum9w6arT70i1XdQ4UeOPA=="],
 
     "environment": ["environment@1.1.0", "", {}, "sha512-xUtoPkMggbz0MPyPiIWr1Kp4aeWJjDZ6SMvURhimjdZgsRuDplF5/s9hcgGhyXMhs+6vpnuoiZ2kFiu3FMnS8Q=="],
 
+    "error-stack-parser-es": ["error-stack-parser-es@1.0.5", "", {}, "sha512-5qucVt2XcuGMcEGgWI7i+yZpmpByQ8J1lHhcL7PwqCwu9FPP3VUXzT4ltHe5i2z9dePwEHcDVOAfSnHsOlCXRA=="],
+
     "es-define-property": ["es-define-property@1.0.1", "", {}, "sha512-e3nRfgfUZ4rNGL232gUgX06QNyyez04KdjFrF+LTRoOXmrOgFKDg4BCdsjW8EnT69eqdYGmRpJwiPVYNrCaW3g=="],
 
     "es-errors": ["es-errors@1.3.0", "", {}, "sha512-Zf5H2Kxt2xjTvbJvP2ZWLEICxA6j+hAmMzIlypy4xcBg1vKVnx89Wy0GbS+kf5cwCVFFzdCFh2XSCFNULS6csw=="],
@@ -1690,6 +1764,8 @@
 
     "hachure-fill": ["hachure-fill@0.5.2", "", {}, "sha512-3GKBOn+m2LX9iq+JC1064cSFprJY4jL1jCXTcpnfER5HYE2l/4EfWSGzkPa/ZDBmYI0ZOEj5VHV/eKnPGkHuOg=="],
 
+    "happy-dom": ["happy-dom@20.9.0", "", { "dependencies": { "@types/node": ">=20.0.0", "@types/whatwg-mimetype": "^3.0.2", "@types/ws": "^8.18.1", "entities": "^7.0.1", "whatwg-mimetype": "^3.0.0", "ws": "^8.18.3" } }, "sha512-GZZ9mKe8r646NUAf/zemnGbjYh4Bt8/MqASJY+pSm5ZDtc3YQox+4gsLI7yi1hba6o+eCsGxpHn5+iEVn31/FQ=="],
+
     "has-flag": ["has-flag@4.0.0", "", {}, "sha512-EykJT/Q1KjTWctppgIAgfSO0tKVuZUjhgMr17kqTumMl6Afv3EISleU7qZUzoXDFTAHTDC4NOoG/ZxU3EvlMPQ=="],
 
     "has-symbols": ["has-symbols@1.1.0", "", {}, "sha512-1cDNdwJ2Jaohmb3sg4OmKaMBwuC48sYni5HUw2DvsC8LjGTLK9h+eb1X6RyuOHe4hT0ULCW68iomhjUoKUqlPQ=="],
@@ -1900,6 +1976,8 @@
 
     "lru_map": ["lru_map@0.4.1", "", {}, "sha512-I+lBvqMMFfqaV8CJCISjI3wbjmwVu/VyOoU7+qtu9d7ioW5klMgsTTiUOUp+DJvfTTzKXoPbyC6YfgkNcyPSOg=="],
 
+    "lz-string": ["lz-string@1.5.0", "", { "bin": { "lz-string": "bin/bin.js" } }, "sha512-h5bgJWpxJNswbU7qCrV0tIKQCaS3blPDrqKWx+QxzuzL1zGUzij9XCWLrSLsJPu5t+eWA/ycetzYAO5IOMcWAQ=="],
+
     "magic-string": ["magic-string@0.30.21", "", { "dependencies": { "@jridgewell/sourcemap-codec": "^1.5.5" } }, "sha512-vd2F4YUyEXKGcLHoq+TEyCjxueSeHnFxyyjNp80yg0XV4vUhnDer/lvvlqM/arB5bXQN5K2/3oinyCRyx8T2CQ=="],
 
     "magicast": ["magicast@0.5.2", "", { "dependencies": { "@babel/parser": "^7.29.0", "@babel/types": "^7.29.0", "source-map-js": "^1.2.1" } }, "sha512-E3ZJh4J3S9KfwdjZhe2afj6R9lGIN5Pher1pF39UGrXRqq/VDaGVIGN13BjHd2u8B61hArAGOnso7nBOouW3TQ=="],
@@ -2040,7 +2118,7 @@
 
     "mimic-response": ["mimic-response@3.1.0", "", {}, "sha512-z0yWI+4FDrrweS8Zmt4Ej5HdJmky15+L2e6Wgn3+iK5fWzb6T3fhNFq2+MeTRb064c6Wr4N/wv0DzQTjNzHNGQ=="],
 
-    "miniflare": ["miniflare@3.20250718.3", "", { "dependencies": { "@cspotcode/source-map-support": "0.8.1", "acorn": "8.14.0", "acorn-walk": "8.3.2", "exit-hook": "2.2.1", "glob-to-regexp": "0.4.1", "stoppable": "1.1.0", "undici": "^5.28.5", "workerd": "1.20250718.0", "ws": "8.18.0", "youch": "3.3.4", "zod": "3.22.3" }, "bin": { "miniflare": "bootstrap.js" } }, "sha512-JuPrDJhwLrNLEJiNLWO7ZzJrv/Vv9kZuwMYCfv0LskQDM6Eonw4OvywO3CH/wCGjgHzha/qyjUh8JQ068TjDgQ=="],
+    "miniflare": ["miniflare@4.20260504.0", "", { "dependencies": { "@cspotcode/source-map-support": "0.8.1", "sharp": "^0.34.5", "undici": "7.24.8", "workerd": "1.20260504.1", "ws": "8.18.0", "youch": "4.1.0-beta.10" }, "bin": { "miniflare": "bootstrap.js" } }, "sha512-HeI/HLx+rbeo/UB4qb6NsNcFdUVD7xDzyCexZJTVtFMlfpfexUKEDmdeTRRpzeHrJseZFGua+v9JO1kfPublUw=="],
 
     "minimatch": ["minimatch@10.2.2", "", { "dependencies": { "brace-expansion": "^5.0.2" } }, "sha512-+G4CpNBxa5MprY+04MbgOw1v7So6n5JY166pFi9KfYwT78fxScCeSNQSNzp6dpPSW2rONOps6Ocam1wFhCgoVw=="],
 
@@ -2200,6 +2278,8 @@
 
     "prebuild-install": ["prebuild-install@7.1.3", "", { "dependencies": { "detect-libc": "^2.0.0", "expand-template": "^2.0.3", "github-from-package": "0.0.0", "minimist": "^1.2.3", "mkdirp-classic": "^0.5.3", "napi-build-utils": "^2.0.0", "node-abi": "^3.3.0", "pump": "^3.0.0", "rc": "^1.2.7", "simple-get": "^4.0.0", "tar-fs": "^2.0.0", "tunnel-agent": "^0.6.0" }, "bin": { "prebuild-install": "bin.js" } }, "sha512-8Mf2cbV7x1cXPUILADGI3wuhfqWvtiLA1iclTDbFRZkgRQS0NqsPZphna9V+HyTEadheuPmjaJMsbzKQFOzLug=="],
 
+    "pretty-format": ["pretty-format@27.5.1", "", { "dependencies": { "ansi-regex": "^5.0.1", "ansi-styles": "^5.0.0", "react-is": "^17.0.1" } }, "sha512-Qb1gy5OrP5+zDf2Bvnzdl3jsTf1qXVMazbvCoKhtKqVs4/YK4ozX4gKQJJVyNe+cajNPn0KoC0MC3FUmaHWEmQ=="],
+
     "printable-characters": ["printable-characters@1.0.42", "", {}, "sha512-dKp+C4iXWK4vVYZmYSd0KBH5F/h1HoZRsbJ82AVKRO3PEo8L4lBS/vLwhVtpwwuYcoIsVY+1JYKR268yn480uQ=="],
 
     "prismjs": ["prismjs@1.30.0", "", {}, "sha512-DEvV2ZF2r2/63V+tK8hQvrR2ZGn10srHbXviTlcv7Kpzw8jWiNTqbVgjO3IY8RxrrOUF8VPMQQFysYYYv0YZxw=="],
@@ -2240,6 +2320,8 @@
 
     "react-dom": ["react-dom@19.2.3", "", { "dependencies": { "scheduler": "^0.27.0" }, "peerDependencies": { "react": "^19.2.3" } }, "sha512-yELu4WmLPw5Mr/lmeEpox5rw3RETacE++JgHqQzd2dg+YbJuat3jH4ingc+WPZhxaoFzdv9y33G+F7Nl5O0GBg=="],
 
+    "react-is": ["react-is@17.0.2", "", {}, "sha512-w2GsyukL62IJnlaff/nRegPQR94C/XXamvMWmSHRJ4y7Ts/4ocGRmTHvOs8PSE6pB3dWOrD/nueuU5sduBsQ4w=="],
+
     "react-refresh": ["react-refresh@0.18.0", "", {}, "sha512-QgT5//D3jfjJb6Gsjxv0Slpj23ip+HtOpnNgnb2S5zU3CB26G/IDPGoy4RJB42wzFE46DRsstbW6tKHoKbhAxw=="],
 
     "react-remove-scroll": ["react-remove-scroll@2.7.2", "", { "dependencies": { "react-remove-scroll-bar": "^2.3.7", "react-style-singleton": "^2.2.3", "tslib": "^2.1.0", "use-callback-ref": "^1.3.3", "use-sidecar": "^1.1.3" }, "peerDependencies": { "@types/react": "*", "react": "^16.8.0 || ^17.0.0 || ^18.0.0 || ^19.0.0 || ^19.0.0-rc" }, "optionalPeers": ["@types/react"] }, "sha512-Iqb9NjCCTt6Hf+vOdNIZGdTiH1QSqr27H/Ek9sv/a97gfueI/5h1s3yRi1nngzMUaOOToin5dI1dXKdXiF+u0Q=="],
@@ -2524,7 +2606,7 @@
 
     "undici-types": ["undici-types@7.18.2", "", {}, "sha512-AsuCzffGHJybSaRrmr5eHr81mwJU3kjw6M+uprWvCXiNeN9SOGwQ3Jn8jb8m3Z6izVgknn1R0FTCEAP2QrLY/w=="],
 
-    "unenv": ["unenv@2.0.0-rc.14", "", { "dependencies": { "defu": "^6.1.4", "exsolve": "^1.0.1", "ohash": "^2.0.10", "pathe": "^2.0.3", "ufo": "^1.5.4" } }, "sha512-od496pShMen7nOy5VmVJCnq8rptd45vh6Nx/r2iPbrba6pa6p+tS2ywuIHRZ/OBvSbQZB0kWvpO9XBNVFXHD3Q=="],
+    "unenv": ["unenv@2.0.0-rc.24", "", { "dependencies": { "pathe": "^2.0.3" } }, "sha512-i7qRCmY42zmCwnYlh9H2SvLEypEFGye5iRmEMKjcGi7zk9UquigRjFtTLz0TYqr0ZGLZhaMHl/foy1bZR+Cwlw=="],
 
     "unicorn-magic": ["unicorn-magic@0.3.0", "", {}, "sha512-+QBBXBCvifc56fsbuxZQ6Sic3wqqc3WWaqxs58gvJrcOuN83HGTCwz3oS5phzU9LthRNE9VrJCFCLUgHeeFnfA=="],
 
@@ -2608,7 +2690,7 @@
 
     "whatwg-encoding": ["whatwg-encoding@3.1.1", "", { "dependencies": { "iconv-lite": "0.6.3" } }, "sha512-6qN4hJdMwfYBtE3YBTTHhoeuUrDBPZmbQaxWAqSALV/MeEnR5z1xd8UKud2RAkFoPkmB+hli1TZSnyi84xz1vQ=="],
 
-    "whatwg-mimetype": ["whatwg-mimetype@4.0.0", "", {}, "sha512-QaKxh0eNIi2mE9p2vEdzfagOKHCcj1pJ56EEHGQOVxp8r9/iszLUUV7v89x9O1p/T+NlTM5W7jW6+cz4Fq1YVg=="],
+    "whatwg-mimetype": ["whatwg-mimetype@3.0.0", "", {}, "sha512-nt+N2dzIutVRxARx1nghPKGv1xHikU7HKdfafKkLNLindmPU/ch3U31NOCGGA/dmPcmb1VlofO0vnKAcsm0o/Q=="],
 
     "which": ["which@2.0.2", "", { "dependencies": { "isexe": "^2.0.0" }, "bin": { "node-which": "./bin/node-which" } }, "sha512-BLI3Tl1TW3Pvl70l3yq3Y64i+awpwXqsGBYWkkqMtnbXgrMD+yj7rhW0kuEDxzJaYXGjEW5ogapKNMEKNMjibA=="],
 
@@ -2616,9 +2698,9 @@
 
     "widest-line": ["widest-line@5.0.0", "", { "dependencies": { "string-width": "^7.0.0" } }, "sha512-c9bZp7b5YtRj2wOe6dlj32MK+Bx/M/d+9VB2SHM1OtsUHR0aV0tdP6DWh/iMt0kWi1t5g1Iudu6hQRNd1A4PVA=="],
 
-    "workerd": ["workerd@1.20250718.0", "", { "optionalDependencies": { "@cloudflare/workerd-darwin-64": "1.20250718.0", "@cloudflare/workerd-darwin-arm64": "1.20250718.0", "@cloudflare/workerd-linux-64": "1.20250718.0", "@cloudflare/workerd-linux-arm64": "1.20250718.0", "@cloudflare/workerd-windows-64": "1.20250718.0" }, "bin": { "workerd": "bin/workerd" } }, "sha512-kqkIJP/eOfDlUyBzU7joBg+tl8aB25gEAGqDap+nFWb+WHhnooxjGHgxPBy3ipw2hnShPFNOQt5lFRxbwALirg=="],
+    "workerd": ["workerd@1.20260504.1", "", { "optionalDependencies": { "@cloudflare/workerd-darwin-64": "1.20260504.1", "@cloudflare/workerd-darwin-arm64": "1.20260504.1", "@cloudflare/workerd-linux-64": "1.20260504.1", "@cloudflare/workerd-linux-arm64": "1.20260504.1", "@cloudflare/workerd-windows-64": "1.20260504.1" }, "bin": { "workerd": "bin/workerd" } }, "sha512-AQTXSHbYNP9tLPgJNn0TmizyE4aDh2VuZZXlTAL0uu4fbCY436NAnQSJIzZbaFHM3DnAtVs9G8tkiJztSdYqDg=="],
 
-    "wrangler": ["wrangler@3.114.17", "", { "dependencies": { "@cloudflare/kv-asset-handler": "0.3.4", "@cloudflare/unenv-preset": "2.0.2", "@esbuild-plugins/node-globals-polyfill": "0.2.3", "@esbuild-plugins/node-modules-polyfill": "0.2.2", "blake3-wasm": "2.1.5", "esbuild": "0.17.19", "miniflare": "3.20250718.3", "path-to-regexp": "6.3.0", "unenv": "2.0.0-rc.14", "workerd": "1.20250718.0" }, "optionalDependencies": { "fsevents": "~2.3.2", "sharp": "^0.33.5" }, "peerDependencies": { "@cloudflare/workers-types": "^4.20250408.0" }, "optionalPeers": ["@cloudflare/workers-types"], "bin": { "wrangler": "bin/wrangler.js", "wrangler2": "bin/wrangler.js" } }, "sha512-tAvf7ly+tB+zwwrmjsCyJ2pJnnc7SZhbnNwXbH+OIdVas3zTSmjcZOjmLKcGGptssAA3RyTKhcF9BvKZzMUycA=="],
+    "wrangler": ["wrangler@4.88.0", "", { "dependencies": { "@cloudflare/kv-asset-handler": "0.5.0", "@cloudflare/unenv-preset": "2.16.1", "blake3-wasm": "2.1.5", "esbuild": "0.27.3", "miniflare": "4.20260504.0", "path-to-regexp": "6.3.0", "unenv": "2.0.0-rc.24", "workerd": "1.20260504.1" }, "optionalDependencies": { "fsevents": "~2.3.2" }, "peerDependencies": { "@cloudflare/workers-types": "^4.20260504.1" }, "optionalPeers": ["@cloudflare/workers-types"], "bin": { "wrangler": "bin/wrangler.js", "wrangler2": "bin/wrangler.js" } }, "sha512-f470QwbeT/JM1S0duq+sLtkss7UBxIFDtYHgujv9tdQUyA/dLGDq51am0rqrsuFtCi97lTM1P5sqtt8xra1AlA=="],
 
     "wrap-ansi": ["wrap-ansi@9.0.2", "", { "dependencies": { "ansi-styles": "^6.2.1", "string-width": "^7.0.0", "strip-ansi": "^7.1.0" } }, "sha512-42AtmgqjV+X1VpdOfyTGOYRi0/zsoLqtXQckTmqTeybT+BDIbM/Guxo7x3pE2vtpr1ok6xRqM9OpBe+Jyoqyww=="],
 
@@ -2626,7 +2708,7 @@
 
     "wrappy": ["wrappy@1.0.2", "", {}, "sha512-l4Sp/DRseor9wL6EvV2+TuQn63dMkPjZ/sp9XkghTEbV9KlPS1xUsZ3u7/IQO4wxtcFB4bgpQPRcR3QCvezPcQ=="],
 
-    "ws": ["ws@8.18.0", "", { "peerDependencies": { "bufferutil": "^4.0.1", "utf-8-validate": ">=5.0.2" }, "optionalPeers": ["bufferutil", "utf-8-validate"] }, "sha512-8VbfWfHLbbwu3+N6OKsOMpBdT4kXPDDB9cJk2bJ6mh9ucxdlnNvH1e+roYkKmN9Nxw2yjz7VzeO9oOz2zJ04Pw=="],
+    "ws": ["ws@8.19.0", "", { "peerDependencies": { "bufferutil": "^4.0.1", "utf-8-validate": ">=5.0.2" }, "optionalPeers": ["bufferutil", "utf-8-validate"] }, "sha512-blAT2mjOEIi0ZzruJfIhb3nps74PRWTCz1IjglWEEpQl5XS/UNama6u2/rjFkDDouqr4L67ry+1aGIALViWjDg=="],
 
     "wsl-utils": ["wsl-utils@0.1.0", "", { "dependencies": { "is-wsl": "^3.1.0" } }, "sha512-h3Fbisa2nKGPxCpm89Hk33lBLsnaGBvctQopaBSOW/uIs6FTe1ATyAnKFJrzVs9vpGdsTe73WF3V4lIsk4Gacw=="],
 
@@ -2656,7 +2738,9 @@
 
     "yoctocolors": ["yoctocolors@2.1.2", "", {}, "sha512-CzhO+pFNo8ajLM2d2IW/R93ipy99LWjtwblvC1RsoSUMZgyLbYFr221TnSNT7GjGdYui6P459mw9JH/g/zW2ug=="],
 
-    "youch": ["youch@3.3.4", "", { "dependencies": { "cookie": "^0.7.1", "mustache": "^4.2.0", "stacktracey": "^2.1.8" } }, "sha512-UeVBXie8cA35DS6+nBkls68xaBBXCye0CNznrhszZjTbRVnJKQuNsyLKBTTL4ln1o1rh2PKtv35twV7irj5SEg=="],
+    "youch": ["youch@4.1.0-beta.10", "", { "dependencies": { "@poppinss/colors": "^4.1.5", "@poppinss/dumper": "^0.6.4", "@speed-highlight/core": "^1.2.7", "cookie": "^1.0.2", "youch-core": "^0.3.3" } }, "sha512-rLfVLB4FgQneDr0dv1oddCVZmKjcJ6yX6mS4pU82Mq/Dt9a3cLZQ62pDBL4AUO+uVrCvtWz3ZFUL2HFAFJ/BXQ=="],
+
+    "youch-core": ["youch-core@0.3.3", "", { "dependencies": { "@poppinss/exception": "^1.2.2", "error-stack-parser-es": "^1.0.5" } }, "sha512-ho7XuGjLaJ2hWHoK8yFnsUGy2Y5uDpqSTq1FkHLK4/oqKtyUU1AFbOOxY4IpC9f0fTLjwYbslUz0Po5BpD1wrA=="],
 
     "zod": ["zod@4.1.8", "", {}, "sha512-5R1P+WwQqmmMIEACyzSvo4JXHY5WiAFHRMg+zBZKgKS+Q1viRa0C1hmUKtHltoIFKtIdki3pRxkmpP74jnNYHQ=="],
 
@@ -2692,6 +2776,8 @@
 
     "@babel/core/semver": ["semver@6.3.1", "", { "bin": { "semver": "bin/semver.js" } }, "sha512-BR7VvDCVHO+q2xBEWskxS6DJE1qRnb7DxzUrogb71CWoSficBxYsiAGd+Kl0mmq/MprG9yArRkyrQxTO6XjMzA=="],
 
+    "@babel/generator/@jridgewell/trace-mapping": ["@jridgewell/trace-mapping@0.3.31", "", { "dependencies": { "@jridgewell/resolve-uri": "^3.1.0", "@jridgewell/sourcemap-codec": "^1.4.14" } }, "sha512-zzNR+SdQSDJzc8joaeP8QQoCQr8NuYx2dIIytl1QeBEZHJ9uW6hebsrYgbz8hJwUQao3TWCMtmfV8Nu1twOLAw=="],
+
     "@babel/helper-compilation-targets/lru-cache": ["lru-cache@5.1.1", "", { "dependencies": { "yallist": "^3.0.2" } }, "sha512-KpNARQA3Iwv+jTA0utUVVbrh+Jlrr1Fv0e56GGzAFOXN7dk/FviaDW8LHmK52DlcH4WP2n6gI8vN1aesBFgo9w=="],
 
     "@babel/helper-compilation-targets/semver": ["semver@6.3.1", "", { "bin": { "semver": "bin/semver.js" } }, "sha512-BR7VvDCVHO+q2xBEWskxS6DJE1qRnb7DxzUrogb71CWoSficBxYsiAGd+Kl0mmq/MprG9yArRkyrQxTO6XjMzA=="],
@@ -2700,11 +2786,9 @@
 
     "@chevrotain/gast/lodash-es": ["lodash-es@4.17.21", "", {}, "sha512-mKnC+QJ9pWVzv+C4/U3rRsHapFfHvQFoFB92e52xeyGMcX6/OlIl78je1u8vePzYZSkkogMPJ2yjxxsb89cxyw=="],
 
-    "@cloudflare/kv-asset-handler/mime": ["mime@3.0.0", "", { "bin": { "mime": "cli.js" } }, "sha512-jSCU7/VB1loIWBZe14aEYHU/+1UMEHoaO7qxCOVJOw9GgH72VAWppxNcjU+x9a2k3GSIBXNKxXQFqRvvZ7vr3A=="],
+    "@jridgewell/gen-mapping/@jridgewell/trace-mapping": ["@jridgewell/trace-mapping@0.3.31", "", { "dependencies": { "@jridgewell/resolve-uri": "^3.1.0", "@jridgewell/sourcemap-codec": "^1.4.14" } }, "sha512-zzNR+SdQSDJzc8joaeP8QQoCQr8NuYx2dIIytl1QeBEZHJ9uW6hebsrYgbz8hJwUQao3TWCMtmfV8Nu1twOLAw=="],
 
-    "@cspotcode/source-map-support/@jridgewell/trace-mapping": ["@jridgewell/trace-mapping@0.3.9", "", { "dependencies": { "@jridgewell/resolve-uri": "^3.0.3", "@jridgewell/sourcemap-codec": "^1.4.10" } }, "sha512-3Belt6tdc8bPgAtbcmdtNJlirVoTmEb5e2gC94PnkwEW9jI6CAHUeoG85tjWP5WquqfavoMtMwiG4P926ZKKuQ=="],
-
-    "@google/genai/ws": ["ws@8.19.0", "", { "peerDependencies": { "bufferutil": "^4.0.1", "utf-8-validate": ">=5.0.2" }, "optionalPeers": ["bufferutil", "utf-8-validate"] }, "sha512-blAT2mjOEIi0ZzruJfIhb3nps74PRWTCz1IjglWEEpQl5XS/UNama6u2/rjFkDDouqr4L67ry+1aGIALViWjDg=="],
+    "@jridgewell/remapping/@jridgewell/trace-mapping": ["@jridgewell/trace-mapping@0.3.31", "", { "dependencies": { "@jridgewell/resolve-uri": "^3.1.0", "@jridgewell/sourcemap-codec": "^1.4.14" } }, "sha512-zzNR+SdQSDJzc8joaeP8QQoCQr8NuYx2dIIytl1QeBEZHJ9uW6hebsrYgbz8hJwUQao3TWCMtmfV8Nu1twOLAw=="],
 
     "@mariozechner/pi-ai/@anthropic-ai/sdk": ["@anthropic-ai/sdk@0.73.0", "", { "dependencies": { "json-schema-to-ts": "^3.1.1" }, "peerDependencies": { "zod": "^3.25.0 || ^4.0.0" }, "optionalPeers": ["zod"], "bin": { "anthropic-ai-sdk": "bin/cli" } }, "sha512-URURVzhxXGJDGUGFunIOtBlSl7KWvZiAAKY/ttTkZAkXT9bTPqdk2eK0b8qqSxXpikh3QKPnPYpiyX98zf5ebw=="],
 
@@ -2722,12 +2806,18 @@
 
     "@plannotator/hooks/@types/node": ["@types/node@22.19.3", "", { "dependencies": { "undici-types": "~6.21.0" } }, "sha512-1N9SBnWYOJTrNZCdh/yJE+t910Y128BoyY+zBLWhL3r0TYzlTmFdXrPwHL9DyFZmlEXNQQolTZh3KHV31QDhyA=="],
 
+    "@plannotator/paste-service/wrangler": ["wrangler@3.114.17", "", { "dependencies": { "@cloudflare/kv-asset-handler": "0.3.4", "@cloudflare/unenv-preset": "2.0.2", "@esbuild-plugins/node-globals-polyfill": "0.2.3", "@esbuild-plugins/node-modules-polyfill": "0.2.2", "blake3-wasm": "2.1.5", "esbuild": "0.17.19", "miniflare": "3.20250718.3", "path-to-regexp": "6.3.0", "unenv": "2.0.0-rc.14", "workerd": "1.20250718.0" }, "optionalDependencies": { "fsevents": "~2.3.2", "sharp": "^0.33.5" }, "peerDependencies": { "@cloudflare/workers-types": "^4.20250408.0" }, "optionalPeers": ["@cloudflare/workers-types"], "bin": { "wrangler": "bin/wrangler.js", "wrangler2": "bin/wrangler.js" } }, "sha512-tAvf7ly+tB+zwwrmjsCyJ2pJnnc7SZhbnNwXbH+OIdVas3zTSmjcZOjmLKcGGptssAA3RyTKhcF9BvKZzMUycA=="],
+
     "@plannotator/portal/@types/node": ["@types/node@22.19.3", "", { "dependencies": { "undici-types": "~6.21.0" } }, "sha512-1N9SBnWYOJTrNZCdh/yJE+t910Y128BoyY+zBLWhL3r0TYzlTmFdXrPwHL9DyFZmlEXNQQolTZh3KHV31QDhyA=="],
 
     "@plannotator/review/@pierre/diffs": ["@pierre/diffs@1.1.12", "", { "dependencies": { "@pierre/theme": "0.0.28", "@shikijs/transformers": "^3.0.0", "diff": "8.0.3", "hast-util-to-html": "9.0.5", "lru_map": "0.4.1", "shiki": "^3.0.0" }, "peerDependencies": { "react": "^18.3.1 || ^19.0.0", "react-dom": "^18.3.1 || ^19.0.0" } }, "sha512-InssHHM7f0nkazIRkuaiNCy6GkBLfwJlqc7LtTkMD/KSqsuc6bnL2V9sIQoG5PZu9jwinQiXUb/gT7itFa6U9A=="],
 
     "@plannotator/review/@types/node": ["@types/node@22.19.3", "", { "dependencies": { "undici-types": "~6.21.0" } }, "sha512-1N9SBnWYOJTrNZCdh/yJE+t910Y128BoyY+zBLWhL3r0TYzlTmFdXrPwHL9DyFZmlEXNQQolTZh3KHV31QDhyA=="],
 
+    "@poppinss/colors/kleur": ["kleur@4.1.5", "", {}, "sha512-o+NO+8WrRiQEE4/7nwRJhN1HWpVmJm511pBHUxPLtp0BUISzlBplORYSmTclCnJvQq2tKu/sgl3xVpkc7ZWuQQ=="],
+
+    "@poppinss/dumper/supports-color": ["supports-color@10.2.2", "", {}, "sha512-SS+jx45GF1QjgEXQx4NJZV9ImqmO2NPz5FNsIHrsDjh2YsHnawpan7SNQ1o8NuhrbHZy9AZhIoCUiCeaW/C80g=="],
+
     "@rollup/pluginutils/estree-walker": ["estree-walker@2.0.2", "", {}, "sha512-Rfkk/Mp/DL7JVje3u18FxFujQlTNR2q6QfMSMB7AvCBx91NGj/ba3kCfza0f6dVDbw7YlRf/nDrn7pQrCCyQ/w=="],
 
     "@tailwindcss/oxide-wasm32-wasi/@emnapi/core": ["@emnapi/core@1.7.1", "", { "dependencies": { "@emnapi/wasi-threads": "1.1.0", "tslib": "^2.4.0" }, "bundled": true }, "sha512-o1uhUASyo921r2XtHYOHy7gdkGLge8ghBEQHMWmyJFoXlpU58kIrhhN3w26lpQb6dspetweapMn2CSNwQ8I4wg=="],
@@ -2742,6 +2832,8 @@
 
     "@tailwindcss/oxide-wasm32-wasi/tslib": ["tslib@2.8.1", "", { "bundled": true }, "sha512-oJFu94HQb+KVduSUQL7wnpmqnfmLsOA/nAh6b6EH0wCEoK0/mPeXU6c3wKDV83MkOuHPRHtSXKKU99IBazS/2w=="],
 
+    "@testing-library/dom/aria-query": ["aria-query@5.3.0", "", { "dependencies": { "dequal": "^2.0.3" } }, "sha512-b0P0sZPKtyu8HkeRAfCq0IfURZK+SuwMjY1UXGBU27wpAiTwQAIlq56IbIO+ytk/JjS1fMR14ee5WBBfKi5J6A=="],
+
     "@textlint/linter-formatter/chalk": ["chalk@4.1.2", "", { "dependencies": { "ansi-styles": "^4.1.0", "supports-color": "^7.1.0" } }, "sha512-oKnbhFyRIXpUuez8iBMmyEa4nbj4IOQyuhc/wy9kY7/WVPcwIO9VA668Pu8RkO7+0G76SLROeyw9CpQ061i4mA=="],
 
     "@textlint/linter-formatter/pluralize": ["pluralize@2.0.0", "", {}, "sha512-TqNZzQCD4S42De9IfnnBvILN7HAW7riLqsCyp8lgjXeysyPlX5HhqKAcJHHHb9XskE4/a+7VGC9zzx8Ls0jOAw=="],
@@ -2776,6 +2868,8 @@
 
     "cheerio/parse5-htmlparser2-tree-adapter": ["parse5-htmlparser2-tree-adapter@7.1.0", "", { "dependencies": { "domhandler": "^5.0.3", "parse5": "^7.0.0" } }, "sha512-ruw5xyKs6lrpo9x9rCZqZZnIUntICjQAd0Wsmp396Ul9lN/h+ifgVV1x1gZHi8euej6wTfpqX8j+BFQxF0NS/g=="],
 
+    "cheerio/whatwg-mimetype": ["whatwg-mimetype@4.0.0", "", {}, "sha512-QaKxh0eNIi2mE9p2vEdzfagOKHCcj1pJ56EEHGQOVxp8r9/iszLUUV7v89x9O1p/T+NlTM5W7jW6+cz4Fq1YVg=="],
+
     "chevrotain/lodash-es": ["lodash-es@4.17.21", "", {}, "sha512-mKnC+QJ9pWVzv+C4/U3rRsHapFfHvQFoFB92e52xeyGMcX6/OlIl78je1u8vePzYZSkkogMPJ2yjxxsb89cxyw=="],
 
     "cli-highlight/chalk": ["chalk@4.1.2", "", { "dependencies": { "ansi-styles": "^4.1.0", "supports-color": "^7.1.0" } }, "sha512-oKnbhFyRIXpUuez8iBMmyEa4nbj4IOQyuhc/wy9kY7/WVPcwIO9VA668Pu8RkO7+0G76SLROeyw9CpQ061i4mA=="],
@@ -2800,6 +2894,8 @@
 
     "d3-sankey/d3-shape": ["d3-shape@1.3.7", "", { "dependencies": { "d3-path": "1" } }, "sha512-EUkvKjqPFUAZyOlhY5gzCxCeI0Aep04LwIRpsZ/mLFelJiUfnK56jo5JMDSE7yyP2kLSb6LtF+S5chMk7uqPqw=="],
 
+    "dom-serializer/entities": ["entities@4.5.0", "", {}, "sha512-V0hjH4dGPh9Ao5p0MoRY6BVqtwCjhz6vI5LT8AJ55H+4g9/4vbHx1I54fS0XuclLhDHArPQCiMjDxjaL8fPxhw=="],
+
     "encoding-sniffer/iconv-lite": ["iconv-lite@0.6.3", "", { "dependencies": { "safer-buffer": ">= 2.1.2 < 3.0.0" } }, "sha512-4fCk79wshMdzMp2rH06qWrJE4iolqLhCUH+OiuIgU++RB0+94NlDL81atO7GX55uUKueo0txHNtvEyI6D7WdMw=="],
 
     "escodegen/source-map": ["source-map@0.6.1", "", {}, "sha512-UjgapumWlbMhkBgzT7Ykc5YXUT46F0iKu8SGXq0bcwP5dz/h0Plj6enJqjz1Zbq2l5WaqYnrVbwWOWMyF3F47g=="],
@@ -2818,14 +2914,14 @@
 
     "hast-util-raw/parse5": ["parse5@7.3.0", "", { "dependencies": { "entities": "^6.0.0" } }, "sha512-IInvU7fabl34qmi9gY8XOVxhYyMyuH2xUNpb2q8/Y+7552KlejkRvqvD19nMoUW/uQGGbqNpA6Tufu5FL5BZgw=="],
 
-    "htmlparser2/entities": ["entities@7.0.1", "", {}, "sha512-TWrgLOFUQTH994YUyl1yT4uyavY5nNB5muff+RtWaqNVCAK408b5ZnnbNAUEWLTCpum9w6arT70i1XdQ4UeOPA=="],
-
     "katex/commander": ["commander@8.3.0", "", {}, "sha512-OkTL9umf+He2DZkUq8f8J9of7yL6RJKI24dVITBmNfZBmri9zYZQrKkuXiKhyfPSu8tUhnVBB1iKXevvnlR4Ww=="],
 
     "magicast/@babel/parser": ["@babel/parser@7.29.0", "", { "dependencies": { "@babel/types": "^7.29.0" }, "bin": "./bin/babel-parser.js" }, "sha512-IyDgFV5GeDUVX4YdF/3CPULtVGSXXMLh1xVIgdCgxApktqnQV0r7/8Nqthg+8YLGaAtdyIlo2qIdZrbCv4+7ww=="],
 
     "magicast/@babel/types": ["@babel/types@7.29.0", "", { "dependencies": { "@babel/helper-string-parser": "^7.27.1", "@babel/helper-validator-identifier": "^7.28.5" } }, "sha512-LwdZHpScM4Qz8Xw2iKSzS+cfglZzJGvofQICy7W7v4caru4EaAmyUuO6BGrbyQ2mYV11W0U8j5mBhd14dd3B0A=="],
 
+    "markdown-it/entities": ["entities@4.5.0", "", {}, "sha512-V0hjH4dGPh9Ao5p0MoRY6BVqtwCjhz6vI5LT8AJ55H+4g9/4vbHx1I54fS0XuclLhDHArPQCiMjDxjaL8fPxhw=="],
+
     "mdast-util-find-and-replace/escape-string-regexp": ["escape-string-regexp@5.0.0", "", {}, "sha512-/veY75JbMK4j1yjvuUxuVsiS/hr/4iHs9FTT6cgTexxdE0Ly/glccBAkloH/DofkjRbZU3bnoj38mOmhkZ0lHw=="],
 
     "mermaid/dompurify": ["dompurify@3.3.1", "", { "optionalDependencies": { "@types/trusted-types": "^2.0.7" } }, "sha512-qkdCKzLNtrgPFP1Vo+98FRzJnBRGe4ffyCea9IwHB1fyxPOeNTHpLKYGd4Uk9xvNoH0ZoOjwZxNptyMwqrId1Q=="],
@@ -2834,11 +2930,9 @@
 
     "micromatch/picomatch": ["picomatch@2.3.1", "", {}, "sha512-JU3teHTNjmE2VCGFzuY8EXzCDVwEqB2a8fsIvwaStHhAWJEeVd1o1QD80CU6+ZdEXXSLbSsuLwJjkCBWqRQUVA=="],
 
-    "miniflare/acorn": ["acorn@8.14.0", "", { "bin": { "acorn": "bin/acorn" } }, "sha512-cl669nCJTZBsL97OF4kUQm5g5hC2uihk0NxY3WENAC0TYdILVkAyHymAntgxGkl7K+t0cXIrH5siy5S4XkFycA=="],
-
-    "miniflare/undici": ["undici@5.29.0", "", { "dependencies": { "@fastify/busboy": "^2.0.0" } }, "sha512-raqeBD6NQK4SkWhQzeYKd1KmIG6dllBOTt55Rmkt4HtI9mwdWtJljnrXjAFUBLTSN67HWrOIZ3EPF4kjUw80Bg=="],
+    "miniflare/undici": ["undici@7.24.8", "", {}, "sha512-6KQ/+QxK49Z/p3HO6E5ZCZWNnCasyZLa5ExaVYyvPxUwKtbCPMKELJOqh7EqOle0t9cH/7d2TaaTRRa6Nhs4YQ=="],
 
-    "miniflare/zod": ["zod@3.22.3", "", {}, "sha512-EjIevzuJRiRPbVH4mGc8nApb/lVLKVpmUhAaR5R5doKGfAnGJ6Gr3CViAVjP+4FWSxCsybeWQdcgCtbX+7oZug=="],
+    "miniflare/ws": ["ws@8.18.0", "", { "peerDependencies": { "bufferutil": "^4.0.1", "utf-8-validate": ">=5.0.2" }, "optionalPeers": ["bufferutil", "utf-8-validate"] }, "sha512-8VbfWfHLbbwu3+N6OKsOMpBdT4kXPDDB9cJk2bJ6mh9ucxdlnNvH1e+roYkKmN9Nxw2yjz7VzeO9oOz2zJ04Pw=="],
 
     "node-fetch/data-uri-to-buffer": ["data-uri-to-buffer@4.0.1", "", {}, "sha512-0R9ikRb668HB7QDxT1vkpuUBtqc53YyAwMwGeUFKRojY/NWKvdZ+9UYtRfGmhqNbRkTSVpMbmyhXipFFv2cb/A=="],
 
@@ -2854,6 +2948,8 @@
 
     "parse5-parser-stream/parse5": ["parse5@7.3.0", "", { "dependencies": { "entities": "^6.0.0" } }, "sha512-IInvU7fabl34qmi9gY8XOVxhYyMyuH2xUNpb2q8/Y+7552KlejkRvqvD19nMoUW/uQGGbqNpA6Tufu5FL5BZgw=="],
 
+    "pretty-format/ansi-styles": ["ansi-styles@5.2.0", "", {}, "sha512-Cxwpt2SfTzTtXcfOlzGEee8O+c+MmUgGrNiBcXnuWxuFJHe6a5Hz7qwhwe5OgaSYI0IJvkLqWX1ASG+cJOkEiA=="],
+
     "protobufjs/@types/node": ["@types/node@22.19.3", "", { "dependencies": { "undici-types": "~6.21.0" } }, "sha512-1N9SBnWYOJTrNZCdh/yJE+t910Y128BoyY+zBLWhL3r0TYzlTmFdXrPwHL9DyFZmlEXNQQolTZh3KHV31QDhyA=="],
 
     "proxy-agent/lru-cache": ["lru-cache@7.18.3", "", {}, "sha512-jumlc0BIUrS3qJGgIkWZsyfAM7NCWiBcCDhnd+3NNM5KbBmLTgHVfWBcg6W+rLUsIpzpERPsvwUP7CckAQSOoA=="],
@@ -2876,7 +2972,7 @@
 
     "string-width-cjs/strip-ansi": ["strip-ansi@6.0.1", "", { "dependencies": { "ansi-regex": "^5.0.1" } }, "sha512-Y38VPSHcqkFrCpFnQ9vuSXmquuv5oXOKpGeT6aGrr3o3Gc9AlVa6JBfUSOCnbxGGZF+/0ooI7KrPuUSztUdU5A=="],
 
-    "strip-ansi-cjs/ansi-regex": ["ansi-regex@5.0.1", "", {}, "sha512-quJQXlTSUGL2LH9SUXo8VwsY4soanhgo6LNSm84E1LBcE8s3O0wpdiRzyR9z/ZZJMlMWv37qOOb9pdJlMUEKFQ=="],
+    "strip-ansi/ansi-regex": ["ansi-regex@6.2.2", "", {}, "sha512-Bq3SmSpyFHaWjPk8If9yc6svM8c56dB5BAtW4Qbw5jHTwwXXcTLoRMkpDJp6VL0XzlWaCHTXrkFURMYmD0sLqg=="],
 
     "svgo/commander": ["commander@11.1.0", "", {}, "sha512-yPVavfyCcRhmorC7rWlkHn15b4wDVgVmBA7kV4QVBsF7kv/9TKJAbAXVTxvTnwP8HHKjRCJDClKbciiYS7p0DQ=="],
 
@@ -2888,9 +2984,7 @@
 
     "whatwg-encoding/iconv-lite": ["iconv-lite@0.6.3", "", { "dependencies": { "safer-buffer": ">= 2.1.2 < 3.0.0" } }, "sha512-4fCk79wshMdzMp2rH06qWrJE4iolqLhCUH+OiuIgU++RB0+94NlDL81atO7GX55uUKueo0txHNtvEyI6D7WdMw=="],
 
-    "wrangler/esbuild": ["esbuild@0.17.19", "", { "optionalDependencies": { "@esbuild/android-arm": "0.17.19", "@esbuild/android-arm64": "0.17.19", "@esbuild/android-x64": "0.17.19", "@esbuild/darwin-arm64": "0.17.19", "@esbuild/darwin-x64": "0.17.19", "@esbuild/freebsd-arm64": "0.17.19", "@esbuild/freebsd-x64": "0.17.19", "@esbuild/linux-arm": "0.17.19", "@esbuild/linux-arm64": "0.17.19", "@esbuild/linux-ia32": "0.17.19", "@esbuild/linux-loong64": "0.17.19", "@esbuild/linux-mips64el": "0.17.19", "@esbuild/linux-ppc64": "0.17.19", "@esbuild/linux-riscv64": "0.17.19", "@esbuild/linux-s390x": "0.17.19", "@esbuild/linux-x64": "0.17.19", "@esbuild/netbsd-x64": "0.17.19", "@esbuild/openbsd-x64": "0.17.19", "@esbuild/sunos-x64": "0.17.19", "@esbuild/win32-arm64": "0.17.19", "@esbuild/win32-ia32": "0.17.19", "@esbuild/win32-x64": "0.17.19" }, "bin": { "esbuild": "bin/esbuild" } }, "sha512-XQ0jAPFkK/u3LcVRcvVHQcTIqD6E2H1fvZMA5dQPSOWb3suUbWbfbRf94pjc0bNzRYLfIrDRQXr7X+LHIm5oHw=="],
-
-    "wrangler/sharp": ["sharp@0.33.5", "", { "dependencies": { "color": "^4.2.3", "detect-libc": "^2.0.3", "semver": "^7.6.3" }, "optionalDependencies": { "@img/sharp-darwin-arm64": "0.33.5", "@img/sharp-darwin-x64": "0.33.5", "@img/sharp-libvips-darwin-arm64": "1.0.4", "@img/sharp-libvips-darwin-x64": "1.0.4", "@img/sharp-libvips-linux-arm": "1.0.5", "@img/sharp-libvips-linux-arm64": "1.0.4", "@img/sharp-libvips-linux-s390x": "1.0.4", "@img/sharp-libvips-linux-x64": "1.0.4", "@img/sharp-libvips-linuxmusl-arm64": "1.0.4", "@img/sharp-libvips-linuxmusl-x64": "1.0.4", "@img/sharp-linux-arm": "0.33.5", "@img/sharp-linux-arm64": "0.33.5", "@img/sharp-linux-s390x": "0.33.5", "@img/sharp-linux-x64": "0.33.5", "@img/sharp-linuxmusl-arm64": "0.33.5", "@img/sharp-linuxmusl-x64": "0.33.5", "@img/sharp-wasm32": "0.33.5", "@img/sharp-win32-ia32": "0.33.5", "@img/sharp-win32-x64": "0.33.5" } }, "sha512-haPVm1EkS9pgvHrQ/F3Xy+hgcuMV0Wm9vfIBSiwZ05k+xgb0PkBQpGsAA/oWdDobNaZTH5ppvHtzCFbnSEwHVw=="],
+    "wrangler/esbuild": ["esbuild@0.27.3", "", { "optionalDependencies": { "@esbuild/aix-ppc64": "0.27.3", "@esbuild/android-arm": "0.27.3", "@esbuild/android-arm64": "0.27.3", "@esbuild/android-x64": "0.27.3", "@esbuild/darwin-arm64": "0.27.3", "@esbuild/darwin-x64": "0.27.3", "@esbuild/freebsd-arm64": "0.27.3", "@esbuild/freebsd-x64": "0.27.3", "@esbuild/linux-arm": "0.27.3", "@esbuild/linux-arm64": "0.27.3", "@esbuild/linux-ia32": "0.27.3", "@esbuild/linux-loong64": "0.27.3", "@esbuild/linux-mips64el": "0.27.3", "@esbuild/linux-ppc64": "0.27.3", "@esbuild/linux-riscv64": "0.27.3", "@esbuild/linux-s390x": "0.27.3", "@esbuild/linux-x64": "0.27.3", "@esbuild/netbsd-arm64": "0.27.3", "@esbuild/netbsd-x64": "0.27.3", "@esbuild/openbsd-arm64": "0.27.3", "@esbuild/openbsd-x64": "0.27.3", "@esbuild/openharmony-arm64": "0.27.3", "@esbuild/sunos-x64": "0.27.3", "@esbuild/win32-arm64": "0.27.3", "@esbuild/win32-ia32": "0.27.3", "@esbuild/win32-x64": "0.27.3" }, "bin": { "esbuild": "bin/esbuild" } }, "sha512-8VwMnyGCONIs6cWue2IdpHxHnAjzxnw2Zr7MkVxB2vjmQ2ivqGFb4LEG3SMnv0Gb2F/G/2yA8zUaiL1gywDCCg=="],
 
     "wrap-ansi/ansi-styles": ["ansi-styles@6.2.3", "", {}, "sha512-4Dj6M28JB+oAH8kFkTLUo+a2jwOFkuqb3yucU0CANcRRUbxS0cP0nZYCGjcc3BNXwRIsUVmDGgzawme7zvJHvg=="],
 
@@ -2902,8 +2996,6 @@
 
     "yargs/yargs-parser": ["yargs-parser@20.2.9", "", {}, "sha512-y11nGElTIV+CT3Zv9t7VKl+Q3hTQoT9a1Qzezhhl6Rp21gJ/IVTW7Z3y9EWXhuUBC2Shnf+DX0antecpAwSP8w=="],
 
-    "youch/cookie": ["cookie@0.7.2", "", {}, "sha512-yki5XnKuf750l50uGTllt6kKILY4nQ1eNIQatoXEByZ5dWgnKqbnqmTrBE5B4N7lrMJKQ2ytWMiTO2o0v6Ew/w=="],
-
     "zod-to-ts/zod": ["zod@3.25.76", "", {}, "sha512-gzUt/qt81nXsFGKIFcC3YnfEAx5NkunCfnDlvuBSSFS02bcXu4Lmea0AFIUwbLWxWPx3d9p8S5QoaujKcNQxcQ=="],
 
     "@astrojs/react/@vitejs/plugin-react/@rolldown/pluginutils": ["@rolldown/pluginutils@1.0.0-beta.27", "", {}, "sha512-+d0F4MKMCbeVUJwG96uQ4SgAznZNSq93I3V+9NHA4OpvqG8mRCpGdKmK8l/dl02h2CCDHwW2FqilnTyDcAnqjA=="],
@@ -2926,6 +3018,20 @@
 
     "@plannotator/hooks/@types/node/undici-types": ["undici-types@6.21.0", "", {}, "sha512-iwDZqg0QAGrg9Rav5H4n0M64c3mkR59cJ6wQp+7C4nI0gsmExaedaYLNO44eT4AtBBwjbTiGPMlt2Md0T9H9JQ=="],
 
+    "@plannotator/paste-service/wrangler/@cloudflare/kv-asset-handler": ["@cloudflare/kv-asset-handler@0.3.4", "", { "dependencies": { "mime": "^3.0.0" } }, "sha512-YLPHc8yASwjNkmcDMQMY35yiWjoKAKnhUbPRszBRS0YgH+IXtsMp61j+yTcnCE3oO2DgP0U3iejLC8FTtKDC8Q=="],
+
+    "@plannotator/paste-service/wrangler/@cloudflare/unenv-preset": ["@cloudflare/unenv-preset@2.0.2", "", { "peerDependencies": { "unenv": "2.0.0-rc.14", "workerd": "^1.20250124.0" }, "optionalPeers": ["workerd"] }, "sha512-nyzYnlZjjV5xT3LizahG1Iu6mnrCaxglJ04rZLpDwlDVDZ7v46lNsfxhV3A/xtfgQuSHmLnc6SVI+KwBpc3Lwg=="],
+
+    "@plannotator/paste-service/wrangler/esbuild": ["esbuild@0.17.19", "", { "optionalDependencies": { "@esbuild/android-arm": "0.17.19", "@esbuild/android-arm64": "0.17.19", "@esbuild/android-x64": "0.17.19", "@esbuild/darwin-arm64": "0.17.19", "@esbuild/darwin-x64": "0.17.19", "@esbuild/freebsd-arm64": "0.17.19", "@esbuild/freebsd-x64": "0.17.19", "@esbuild/linux-arm": "0.17.19", "@esbuild/linux-arm64": "0.17.19", "@esbuild/linux-ia32": "0.17.19", "@esbuild/linux-loong64": "0.17.19", "@esbuild/linux-mips64el": "0.17.19", "@esbuild/linux-ppc64": "0.17.19", "@esbuild/linux-riscv64": "0.17.19", "@esbuild/linux-s390x": "0.17.19", "@esbuild/linux-x64": "0.17.19", "@esbuild/netbsd-x64": "0.17.19", "@esbuild/openbsd-x64": "0.17.19", "@esbuild/sunos-x64": "0.17.19", "@esbuild/win32-arm64": "0.17.19", "@esbuild/win32-ia32": "0.17.19", "@esbuild/win32-x64": "0.17.19" }, "bin": { "esbuild": "bin/esbuild" } }, "sha512-XQ0jAPFkK/u3LcVRcvVHQcTIqD6E2H1fvZMA5dQPSOWb3suUbWbfbRf94pjc0bNzRYLfIrDRQXr7X+LHIm5oHw=="],
+
+    "@plannotator/paste-service/wrangler/miniflare": ["miniflare@3.20250718.3", "", { "dependencies": { "@cspotcode/source-map-support": "0.8.1", "acorn": "8.14.0", "acorn-walk": "8.3.2", "exit-hook": "2.2.1", "glob-to-regexp": "0.4.1", "stoppable": "1.1.0", "undici": "^5.28.5", "workerd": "1.20250718.0", "ws": "8.18.0", "youch": "3.3.4", "zod": "3.22.3" }, "bin": { "miniflare": "bootstrap.js" } }, "sha512-JuPrDJhwLrNLEJiNLWO7ZzJrv/Vv9kZuwMYCfv0LskQDM6Eonw4OvywO3CH/wCGjgHzha/qyjUh8JQ068TjDgQ=="],
+
+    "@plannotator/paste-service/wrangler/sharp": ["sharp@0.33.5", "", { "dependencies": { "color": "^4.2.3", "detect-libc": "^2.0.3", "semver": "^7.6.3" }, "optionalDependencies": { "@img/sharp-darwin-arm64": "0.33.5", "@img/sharp-darwin-x64": "0.33.5", "@img/sharp-libvips-darwin-arm64": "1.0.4", "@img/sharp-libvips-darwin-x64": "1.0.4", "@img/sharp-libvips-linux-arm": "1.0.5", "@img/sharp-libvips-linux-arm64": "1.0.4", "@img/sharp-libvips-linux-s390x": "1.0.4", "@img/sharp-libvips-linux-x64": "1.0.4", "@img/sharp-libvips-linuxmusl-arm64": "1.0.4", "@img/sharp-libvips-linuxmusl-x64": "1.0.4", "@img/sharp-linux-arm": "0.33.5", "@img/sharp-linux-arm64": "0.33.5", "@img/sharp-linux-s390x": "0.33.5", "@img/sharp-linux-x64": "0.33.5", "@img/sharp-linuxmusl-arm64": "0.33.5", "@img/sharp-linuxmusl-x64": "0.33.5", "@img/sharp-wasm32": "0.33.5", "@img/sharp-win32-ia32": "0.33.5", "@img/sharp-win32-x64": "0.33.5" } }, "sha512-haPVm1EkS9pgvHrQ/F3Xy+hgcuMV0Wm9vfIBSiwZ05k+xgb0PkBQpGsAA/oWdDobNaZTH5ppvHtzCFbnSEwHVw=="],
+
+    "@plannotator/paste-service/wrangler/unenv": ["unenv@2.0.0-rc.14", "", { "dependencies": { "defu": "^6.1.4", "exsolve": "^1.0.1", "ohash": "^2.0.10", "pathe": "^2.0.3", "ufo": "^1.5.4" } }, "sha512-od496pShMen7nOy5VmVJCnq8rptd45vh6Nx/r2iPbrba6pa6p+tS2ywuIHRZ/OBvSbQZB0kWvpO9XBNVFXHD3Q=="],
+
+    "@plannotator/paste-service/wrangler/workerd": ["workerd@1.20250718.0", "", { "optionalDependencies": { "@cloudflare/workerd-darwin-64": "1.20250718.0", "@cloudflare/workerd-darwin-arm64": "1.20250718.0", "@cloudflare/workerd-linux-64": "1.20250718.0", "@cloudflare/workerd-linux-arm64": "1.20250718.0", "@cloudflare/workerd-windows-64": "1.20250718.0" }, "bin": { "workerd": "bin/workerd" } }, "sha512-kqkIJP/eOfDlUyBzU7joBg+tl8aB25gEAGqDap+nFWb+WHhnooxjGHgxPBy3ipw2hnShPFNOQt5lFRxbwALirg=="],
+
     "@plannotator/portal/@types/node/undici-types": ["undici-types@6.21.0", "", {}, "sha512-iwDZqg0QAGrg9Rav5H4n0M64c3mkR59cJ6wQp+7C4nI0gsmExaedaYLNO44eT4AtBBwjbTiGPMlt2Md0T9H9JQ=="],
 
     "@plannotator/review/@pierre/diffs/diff": ["diff@8.0.3", "", {}, "sha512-qejHi7bcSD4hQAZE0tNAawRK1ZtafHDmMTMkrrIGgSLl7hTnQHmKCeB45xAcbfTqK2zowkM3j3bHt/4b/ARbYQ=="],
@@ -2934,8 +3040,6 @@
 
     "@textlint/linter-formatter/string-width/emoji-regex": ["emoji-regex@8.0.0", "", {}, "sha512-MSjYzcWNOA0ewAHpz0MxpYFvwg6yjy1NG3xteoqz644VCo/RPgnr1/GGt+ic3iJTzQ8Eu3TdM14SawnVUmGE6A=="],
 
-    "@textlint/linter-formatter/strip-ansi/ansi-regex": ["ansi-regex@5.0.1", "", {}, "sha512-quJQXlTSUGL2LH9SUXo8VwsY4soanhgo6LNSm84E1LBcE8s3O0wpdiRzyR9z/ZZJMlMWv37qOOb9pdJlMUEKFQ=="],
-
     "@types/sax/@types/node/undici-types": ["undici-types@6.21.0", "", {}, "sha512-iwDZqg0QAGrg9Rav5H4n0M64c3mkR59cJ6wQp+7C4nI0gsmExaedaYLNO44eT4AtBBwjbTiGPMlt2Md0T9H9JQ=="],
 
     "@vscode/vsce/glob/minimatch": ["minimatch@10.2.2", "", { "dependencies": { "brace-expansion": "^5.0.2" } }, "sha512-+G4CpNBxa5MprY+04MbgOw1v7So6n5JY166pFi9KfYwT78fxScCeSNQSNzp6dpPSW2rONOps6Ocam1wFhCgoVw=="],
@@ -2990,8 +3094,6 @@
 
     "astro/esbuild/@esbuild/openbsd-x64": ["@esbuild/openbsd-x64@0.27.3", "", { "os": "openbsd", "cpu": "x64" }, "sha512-DnW2sRrBzA+YnE70LKqnM3P+z8vehfJWHXECbwBmH/CU51z6FiqTQTHFenPlHmo3a8UgpLyH3PT+87OViOh1AQ=="],
 
-    "astro/esbuild/@esbuild/openharmony-arm64": ["@esbuild/openharmony-arm64@0.27.3", "", { "os": "none", "cpu": "arm64" }, "sha512-NinAEgr/etERPTsZJ7aEZQvvg/A6IsZG/LgZy+81wON2huV7SrK3e63dU0XhyZP4RKGyTm7aOgmQk0bGp0fy2g=="],
-
     "astro/esbuild/@esbuild/sunos-x64": ["@esbuild/sunos-x64@0.27.3", "", { "os": "sunos", "cpu": "x64" }, "sha512-PanZ+nEz+eWoBJ8/f8HKxTTD172SKwdXebZ0ndd953gt1HRBbhMsaNqjTyYLGLPdoWHy4zLU7bDVJztF5f3BHA=="],
 
     "astro/esbuild/@esbuild/win32-arm64": ["@esbuild/win32-arm64@0.27.3", "", { "os": "win32", "cpu": "arm64" }, "sha512-B2t59lWWYrbRDw/tjiWOuzSsFh1Y/E95ofKz7rIVYSQkUYBjfSgf6oeYPNWHToFRr2zx52JKApIcAS/D5TUBnA=="],
@@ -3004,8 +3106,6 @@
 
     "cliui/string-width/emoji-regex": ["emoji-regex@8.0.0", "", {}, "sha512-MSjYzcWNOA0ewAHpz0MxpYFvwg6yjy1NG3xteoqz644VCo/RPgnr1/GGt+ic3iJTzQ8Eu3TdM14SawnVUmGE6A=="],
 
-    "cliui/strip-ansi/ansi-regex": ["ansi-regex@5.0.1", "", {}, "sha512-quJQXlTSUGL2LH9SUXo8VwsY4soanhgo6LNSm84E1LBcE8s3O0wpdiRzyR9z/ZZJMlMWv37qOOb9pdJlMUEKFQ=="],
-
     "csso/css-tree/mdn-data": ["mdn-data@2.0.28", "", {}, "sha512-aylIc7Z9y4yzHYAJNuESG3hfhC+0Ibp/MAMiaOZgNv4pmEdFyfZhhhny4MNiAfWdBQ1RQ2mfDWmM1x8SvGyp8g=="],
 
     "cytoscape-fcose/cose-base/layout-base": ["layout-base@2.0.1", "", {}, "sha512-dp3s92+uNI1hWIpPGH3jK2kxE2lMjdXdr+DH8ynZHpd6PUlH6x6cbuXnoMmiNumznqaNO31xu9e79F0uuZ0JFg=="],
@@ -3032,12 +3132,8 @@
 
     "rimraf/glob/path-scurry": ["path-scurry@1.11.1", "", { "dependencies": { "lru-cache": "^10.2.0", "minipass": "^5.0.0 || ^6.0.2 || ^7.0.0" } }, "sha512-Xa4Nw17FS9ApQFJ9umLiJS4orGjm7ZzwUrwamcGQuHSzDyth9boKDaycYdDcZDuqYATXw4HFXgaqWTctW/v1HA=="],
 
-    "string-width-cjs/strip-ansi/ansi-regex": ["ansi-regex@5.0.1", "", {}, "sha512-quJQXlTSUGL2LH9SUXo8VwsY4soanhgo6LNSm84E1LBcE8s3O0wpdiRzyR9z/ZZJMlMWv37qOOb9pdJlMUEKFQ=="],
-
     "table/string-width/emoji-regex": ["emoji-regex@8.0.0", "", {}, "sha512-MSjYzcWNOA0ewAHpz0MxpYFvwg6yjy1NG3xteoqz644VCo/RPgnr1/GGt+ic3iJTzQ8Eu3TdM14SawnVUmGE6A=="],
 
-    "table/strip-ansi/ansi-regex": ["ansi-regex@5.0.1", "", {}, "sha512-quJQXlTSUGL2LH9SUXo8VwsY4soanhgo6LNSm84E1LBcE8s3O0wpdiRzyR9z/ZZJMlMWv37qOOb9pdJlMUEKFQ=="],
-
     "vite/esbuild/@esbuild/aix-ppc64": ["@esbuild/aix-ppc64@0.25.12", "", { "os": "aix", "cpu": "ppc64" }, "sha512-Hhmwd6CInZ3dwpuGTF8fJG6yoWmsToE+vYgD4nytZVxcu1ulHpUQRAB1UJ8+N1Am3Mz4+xOByoQoSZf4D+CpkA=="],
 
     "vite/esbuild/@esbuild/android-arm": ["@esbuild/android-arm@0.25.12", "", { "os": "android", "cpu": "arm" }, "sha512-VJ+sKvNA/GE7Ccacc9Cha7bpS8nyzVv0jdVgwNDaR4gDMC/2TTRc33Ip8qrNYUcpkOHUT5OZ0bUcNNVZQ9RLlg=="],
@@ -3080,6 +3176,8 @@
 
     "vite/esbuild/@esbuild/openbsd-x64": ["@esbuild/openbsd-x64@0.25.12", "", { "os": "openbsd", "cpu": "x64" }, "sha512-MZyXUkZHjQxUvzK7rN8DJ3SRmrVrke8ZyRusHlP+kuwqTcfWLyqMOE3sScPPyeIXN/mDJIfGXvcMqCgYKekoQw=="],
 
+    "vite/esbuild/@esbuild/openharmony-arm64": ["@esbuild/openharmony-arm64@0.25.12", "", { "os": "none", "cpu": "arm64" }, "sha512-rm0YWsqUSRrjncSXGA7Zv78Nbnw4XL6/dzr20cyrQf7ZmRcsovpcRBdhD43Nuk3y7XIoW2OxMVvwuRvk9XdASg=="],
+
     "vite/esbuild/@esbuild/sunos-x64": ["@esbuild/sunos-x64@0.25.12", "", { "os": "sunos", "cpu": "x64" }, "sha512-3wGSCDyuTHQUzt0nV7bocDy72r2lI33QL3gkDNGkod22EsYl04sMf0qLb8luNKTOmgF/eDEDP5BFNwoBKH441w=="],
 
     "vite/esbuild/@esbuild/win32-arm64": ["@esbuild/win32-arm64@0.25.12", "", { "os": "win32", "cpu": "arm64" }, "sha512-rMmLrur64A7+DKlnSuwqUdRKyd3UE7oPJZmnljqEptesKM8wx9J8gx5u0+9Pq0fQQW8vqeKebwNXdfOyP+8Bsg=="],
@@ -3088,111 +3186,179 @@
 
     "vite/esbuild/@esbuild/win32-x64": ["@esbuild/win32-x64@0.25.12", "", { "os": "win32", "cpu": "x64" }, "sha512-alJC0uCZpTFrSL0CCDjcgleBXPnCrEAhTBILpeAp7M/OFgoqtAetfBzX0xM00MUsVVPpVjlPuMbREqnZCXaTnA=="],
 
-    "wrangler/esbuild/@esbuild/android-arm": ["@esbuild/android-arm@0.17.19", "", { "os": "android", "cpu": "arm" }, "sha512-rIKddzqhmav7MSmoFCmDIb6e2W57geRsM94gV2l38fzhXMwq7hZoClug9USI2pFRGL06f4IOPHHpFNOkWieR8A=="],
+    "wrangler/esbuild/@esbuild/aix-ppc64": ["@esbuild/aix-ppc64@0.27.3", "", { "os": "aix", "cpu": "ppc64" }, "sha512-9fJMTNFTWZMh5qwrBItuziu834eOCUcEqymSH7pY+zoMVEZg3gcPuBNxH1EvfVYe9h0x/Ptw8KBzv7qxb7l8dg=="],
 
-    "wrangler/esbuild/@esbuild/android-arm64": ["@esbuild/android-arm64@0.17.19", "", { "os": "android", "cpu": "arm64" }, "sha512-KBMWvEZooR7+kzY0BtbTQn0OAYY7CsiydT63pVEaPtVYF0hXbUaOyZog37DKxK7NF3XacBJOpYT4adIJh+avxA=="],
+    "wrangler/esbuild/@esbuild/android-arm": ["@esbuild/android-arm@0.27.3", "", { "os": "android", "cpu": "arm" }, "sha512-i5D1hPY7GIQmXlXhs2w8AWHhenb00+GxjxRncS2ZM7YNVGNfaMxgzSGuO8o8SJzRc/oZwU2bcScvVERk03QhzA=="],
 
-    "wrangler/esbuild/@esbuild/android-x64": ["@esbuild/android-x64@0.17.19", "", { "os": "android", "cpu": "x64" }, "sha512-uUTTc4xGNDT7YSArp/zbtmbhO0uEEK9/ETW29Wk1thYUJBz3IVnvgEiEwEa9IeLyvnpKrWK64Utw2bgUmDveww=="],
+    "wrangler/esbuild/@esbuild/android-arm64": ["@esbuild/android-arm64@0.27.3", "", { "os": "android", "cpu": "arm64" }, "sha512-YdghPYUmj/FX2SYKJ0OZxf+iaKgMsKHVPF1MAq/P8WirnSpCStzKJFjOjzsW0QQ7oIAiccHdcqjbHmJxRb/dmg=="],
 
-    "wrangler/esbuild/@esbuild/darwin-arm64": ["@esbuild/darwin-arm64@0.17.19", "", { "os": "darwin", "cpu": "arm64" }, "sha512-80wEoCfF/hFKM6WE1FyBHc9SfUblloAWx6FJkFWTWiCoht9Mc0ARGEM47e67W9rI09YoUxJL68WHfDRYEAvOhg=="],
+    "wrangler/esbuild/@esbuild/android-x64": ["@esbuild/android-x64@0.27.3", "", { "os": "android", "cpu": "x64" }, "sha512-IN/0BNTkHtk8lkOM8JWAYFg4ORxBkZQf9zXiEOfERX/CzxW3Vg1ewAhU7QSWQpVIzTW+b8Xy+lGzdYXV6UZObQ=="],
 
-    "wrangler/esbuild/@esbuild/darwin-x64": ["@esbuild/darwin-x64@0.17.19", "", { "os": "darwin", "cpu": "x64" }, "sha512-IJM4JJsLhRYr9xdtLytPLSH9k/oxR3boaUIYiHkAawtwNOXKE8KoU8tMvryogdcT8AU+Bflmh81Xn6Q0vTZbQw=="],
+    "wrangler/esbuild/@esbuild/darwin-arm64": ["@esbuild/darwin-arm64@0.27.3", "", { "os": "darwin", "cpu": "arm64" }, "sha512-Re491k7ByTVRy0t3EKWajdLIr0gz2kKKfzafkth4Q8A5n1xTHrkqZgLLjFEHVD+AXdUGgQMq+Godfq45mGpCKg=="],
 
-    "wrangler/esbuild/@esbuild/freebsd-arm64": ["@esbuild/freebsd-arm64@0.17.19", "", { "os": "freebsd", "cpu": "arm64" }, "sha512-pBwbc7DufluUeGdjSU5Si+P3SoMF5DQ/F/UmTSb8HXO80ZEAJmrykPyzo1IfNbAoaqw48YRpv8shwd1NoI0jcQ=="],
+    "wrangler/esbuild/@esbuild/darwin-x64": ["@esbuild/darwin-x64@0.27.3", "", { "os": "darwin", "cpu": "x64" }, "sha512-vHk/hA7/1AckjGzRqi6wbo+jaShzRowYip6rt6q7VYEDX4LEy1pZfDpdxCBnGtl+A5zq8iXDcyuxwtv3hNtHFg=="],
 
-    "wrangler/esbuild/@esbuild/freebsd-x64": ["@esbuild/freebsd-x64@0.17.19", "", { "os": "freebsd", "cpu": "x64" }, "sha512-4lu+n8Wk0XlajEhbEffdy2xy53dpR06SlzvhGByyg36qJw6Kpfk7cp45DR/62aPH9mtJRmIyrXAS5UWBrJT6TQ=="],
+    "wrangler/esbuild/@esbuild/freebsd-arm64": ["@esbuild/freebsd-arm64@0.27.3", "", { "os": "freebsd", "cpu": "arm64" }, "sha512-ipTYM2fjt3kQAYOvo6vcxJx3nBYAzPjgTCk7QEgZG8AUO3ydUhvelmhrbOheMnGOlaSFUoHXB6un+A7q4ygY9w=="],
 
-    "wrangler/esbuild/@esbuild/linux-arm": ["@esbuild/linux-arm@0.17.19", "", { "os": "linux", "cpu": "arm" }, "sha512-cdmT3KxjlOQ/gZ2cjfrQOtmhG4HJs6hhvm3mWSRDPtZ/lP5oe8FWceS10JaSJC13GBd4eH/haHnqf7hhGNLerA=="],
+    "wrangler/esbuild/@esbuild/freebsd-x64": ["@esbuild/freebsd-x64@0.27.3", "", { "os": "freebsd", "cpu": "x64" }, "sha512-dDk0X87T7mI6U3K9VjWtHOXqwAMJBNN2r7bejDsc+j03SEjtD9HrOl8gVFByeM0aJksoUuUVU9TBaZa2rgj0oA=="],
 
-    "wrangler/esbuild/@esbuild/linux-arm64": ["@esbuild/linux-arm64@0.17.19", "", { "os": "linux", "cpu": "arm64" }, "sha512-ct1Tg3WGwd3P+oZYqic+YZF4snNl2bsnMKRkb3ozHmnM0dGWuxcPTTntAF6bOP0Sp4x0PjSF+4uHQ1xvxfRKqg=="],
+    "wrangler/esbuild/@esbuild/linux-arm": ["@esbuild/linux-arm@0.27.3", "", { "os": "linux", "cpu": "arm" }, "sha512-s6nPv2QkSupJwLYyfS+gwdirm0ukyTFNl3KTgZEAiJDd+iHZcbTPPcWCcRYH+WlNbwChgH2QkE9NSlNrMT8Gfw=="],
 
-    "wrangler/esbuild/@esbuild/linux-ia32": ["@esbuild/linux-ia32@0.17.19", "", { "os": "linux", "cpu": "ia32" }, "sha512-w4IRhSy1VbsNxHRQpeGCHEmibqdTUx61Vc38APcsRbuVgK0OPEnQ0YD39Brymn96mOx48Y2laBQGqgZ0j9w6SQ=="],
+    "wrangler/esbuild/@esbuild/linux-arm64": ["@esbuild/linux-arm64@0.27.3", "", { "os": "linux", "cpu": "arm64" }, "sha512-sZOuFz/xWnZ4KH3YfFrKCf1WyPZHakVzTiqji3WDc0BCl2kBwiJLCXpzLzUBLgmp4veFZdvN5ChW4Eq/8Fc2Fg=="],
 
-    "wrangler/esbuild/@esbuild/linux-loong64": ["@esbuild/linux-loong64@0.17.19", "", { "os": "linux", "cpu": "none" }, "sha512-2iAngUbBPMq439a+z//gE+9WBldoMp1s5GWsUSgqHLzLJ9WoZLZhpwWuym0u0u/4XmZ3gpHmzV84PonE+9IIdQ=="],
+    "wrangler/esbuild/@esbuild/linux-ia32": ["@esbuild/linux-ia32@0.27.3", "", { "os": "linux", "cpu": "ia32" }, "sha512-yGlQYjdxtLdh0a3jHjuwOrxQjOZYD/C9PfdbgJJF3TIZWnm/tMd/RcNiLngiu4iwcBAOezdnSLAwQDPqTmtTYg=="],
 
-    "wrangler/esbuild/@esbuild/linux-mips64el": ["@esbuild/linux-mips64el@0.17.19", "", { "os": "linux", "cpu": "none" }, "sha512-LKJltc4LVdMKHsrFe4MGNPp0hqDFA1Wpt3jE1gEyM3nKUvOiO//9PheZZHfYRfYl6AwdTH4aTcXSqBerX0ml4A=="],
+    "wrangler/esbuild/@esbuild/linux-loong64": ["@esbuild/linux-loong64@0.27.3", "", { "os": "linux", "cpu": "none" }, "sha512-WO60Sn8ly3gtzhyjATDgieJNet/KqsDlX5nRC5Y3oTFcS1l0KWba+SEa9Ja1GfDqSF1z6hif/SkpQJbL63cgOA=="],
 
-    "wrangler/esbuild/@esbuild/linux-ppc64": ["@esbuild/linux-ppc64@0.17.19", "", { "os": "linux", "cpu": "ppc64" }, "sha512-/c/DGybs95WXNS8y3Ti/ytqETiW7EU44MEKuCAcpPto3YjQbyK3IQVKfF6nbghD7EcLUGl0NbiL5Rt5DMhn5tg=="],
+    "wrangler/esbuild/@esbuild/linux-mips64el": ["@esbuild/linux-mips64el@0.27.3", "", { "os": "linux", "cpu": "none" }, "sha512-APsymYA6sGcZ4pD6k+UxbDjOFSvPWyZhjaiPyl/f79xKxwTnrn5QUnXR5prvetuaSMsb4jgeHewIDCIWljrSxw=="],
 
-    "wrangler/esbuild/@esbuild/linux-riscv64": ["@esbuild/linux-riscv64@0.17.19", "", { "os": "linux", "cpu": "none" }, "sha512-FC3nUAWhvFoutlhAkgHf8f5HwFWUL6bYdvLc/TTuxKlvLi3+pPzdZiFKSWz/PF30TB1K19SuCxDTI5KcqASJqA=="],
+    "wrangler/esbuild/@esbuild/linux-ppc64": ["@esbuild/linux-ppc64@0.27.3", "", { "os": "linux", "cpu": "ppc64" }, "sha512-eizBnTeBefojtDb9nSh4vvVQ3V9Qf9Df01PfawPcRzJH4gFSgrObw+LveUyDoKU3kxi5+9RJTCWlj4FjYXVPEA=="],
 
-    "wrangler/esbuild/@esbuild/linux-s390x": ["@esbuild/linux-s390x@0.17.19", "", { "os": "linux", "cpu": "s390x" }, "sha512-IbFsFbxMWLuKEbH+7sTkKzL6NJmG2vRyy6K7JJo55w+8xDk7RElYn6xvXtDW8HCfoKBFK69f3pgBJSUSQPr+4Q=="],
+    "wrangler/esbuild/@esbuild/linux-riscv64": ["@esbuild/linux-riscv64@0.27.3", "", { "os": "linux", "cpu": "none" }, "sha512-3Emwh0r5wmfm3ssTWRQSyVhbOHvqegUDRd0WhmXKX2mkHJe1SFCMJhagUleMq+Uci34wLSipf8Lagt4LlpRFWQ=="],
 
-    "wrangler/esbuild/@esbuild/linux-x64": ["@esbuild/linux-x64@0.17.19", "", { "os": "linux", "cpu": "x64" }, "sha512-68ngA9lg2H6zkZcyp22tsVt38mlhWde8l3eJLWkyLrp4HwMUr3c1s/M2t7+kHIhvMjglIBrFpncX1SzMckomGw=="],
+    "wrangler/esbuild/@esbuild/linux-s390x": ["@esbuild/linux-s390x@0.27.3", "", { "os": "linux", "cpu": "s390x" }, "sha512-pBHUx9LzXWBc7MFIEEL0yD/ZVtNgLytvx60gES28GcWMqil8ElCYR4kvbV2BDqsHOvVDRrOxGySBM9Fcv744hw=="],
 
-    "wrangler/esbuild/@esbuild/netbsd-x64": ["@esbuild/netbsd-x64@0.17.19", "", { "os": "none", "cpu": "x64" }, "sha512-CwFq42rXCR8TYIjIfpXCbRX0rp1jo6cPIUPSaWwzbVI4aOfX96OXY8M6KNmtPcg7QjYeDmN+DD0Wp3LaBOLf4Q=="],
+    "wrangler/esbuild/@esbuild/linux-x64": ["@esbuild/linux-x64@0.27.3", "", { "os": "linux", "cpu": "x64" }, "sha512-Czi8yzXUWIQYAtL/2y6vogER8pvcsOsk5cpwL4Gk5nJqH5UZiVByIY8Eorm5R13gq+DQKYg0+JyQoytLQas4dA=="],
 
-    "wrangler/esbuild/@esbuild/openbsd-x64": ["@esbuild/openbsd-x64@0.17.19", "", { "os": "openbsd", "cpu": "x64" }, "sha512-cnq5brJYrSZ2CF6c35eCmviIN3k3RczmHz8eYaVlNasVqsNY+JKohZU5MKmaOI+KkllCdzOKKdPs762VCPC20g=="],
+    "wrangler/esbuild/@esbuild/netbsd-arm64": ["@esbuild/netbsd-arm64@0.27.3", "", { "os": "none", "cpu": "arm64" }, "sha512-sDpk0RgmTCR/5HguIZa9n9u+HVKf40fbEUt+iTzSnCaGvY9kFP0YKBWZtJaraonFnqef5SlJ8/TiPAxzyS+UoA=="],
 
-    "wrangler/esbuild/@esbuild/sunos-x64": ["@esbuild/sunos-x64@0.17.19", "", { "os": "sunos", "cpu": "x64" }, "sha512-vCRT7yP3zX+bKWFeP/zdS6SqdWB8OIpaRq/mbXQxTGHnIxspRtigpkUcDMlSCOejlHowLqII7K2JKevwyRP2rg=="],
+    "wrangler/esbuild/@esbuild/netbsd-x64": ["@esbuild/netbsd-x64@0.27.3", "", { "os": "none", "cpu": "x64" }, "sha512-P14lFKJl/DdaE00LItAukUdZO5iqNH7+PjoBm+fLQjtxfcfFE20Xf5CrLsmZdq5LFFZzb5JMZ9grUwvtVYzjiA=="],
 
-    "wrangler/esbuild/@esbuild/win32-arm64": ["@esbuild/win32-arm64@0.17.19", "", { "os": "win32", "cpu": "arm64" }, "sha512-yYx+8jwowUstVdorcMdNlzklLYhPxjniHWFKgRqH7IFlUEa0Umu3KuYplf1HUZZ422e3NU9F4LGb+4O0Kdcaag=="],
+    "wrangler/esbuild/@esbuild/openbsd-arm64": ["@esbuild/openbsd-arm64@0.27.3", "", { "os": "openbsd", "cpu": "arm64" }, "sha512-AIcMP77AvirGbRl/UZFTq5hjXK+2wC7qFRGoHSDrZ5v5b8DK/GYpXW3CPRL53NkvDqb9D+alBiC/dV0Fb7eJcw=="],
 
-    "wrangler/esbuild/@esbuild/win32-ia32": ["@esbuild/win32-ia32@0.17.19", "", { "os": "win32", "cpu": "ia32" }, "sha512-eggDKanJszUtCdlVs0RB+h35wNlb5v4TWEkq4vZcmVt5u/HiDZrTXe2bWFQUez3RgNHwx/x4sk5++4NSSicKkw=="],
+    "wrangler/esbuild/@esbuild/openbsd-x64": ["@esbuild/openbsd-x64@0.27.3", "", { "os": "openbsd", "cpu": "x64" }, "sha512-DnW2sRrBzA+YnE70LKqnM3P+z8vehfJWHXECbwBmH/CU51z6FiqTQTHFenPlHmo3a8UgpLyH3PT+87OViOh1AQ=="],
 
-    "wrangler/esbuild/@esbuild/win32-x64": ["@esbuild/win32-x64@0.17.19", "", { "os": "win32", "cpu": "x64" }, "sha512-lAhycmKnVOuRYNtRtatQR1LPQf2oYCkRGkSFnseDAKPl8lu5SOsK/e1sXe5a0Pc5kHIHe6P2I/ilntNv2xf3cA=="],
+    "wrangler/esbuild/@esbuild/sunos-x64": ["@esbuild/sunos-x64@0.27.3", "", { "os": "sunos", "cpu": "x64" }, "sha512-PanZ+nEz+eWoBJ8/f8HKxTTD172SKwdXebZ0ndd953gt1HRBbhMsaNqjTyYLGLPdoWHy4zLU7bDVJztF5f3BHA=="],
 
-    "wrangler/sharp/@img/sharp-darwin-arm64": ["@img/sharp-darwin-arm64@0.33.5", "", { "optionalDependencies": { "@img/sharp-libvips-darwin-arm64": "1.0.4" }, "os": "darwin", "cpu": "arm64" }, "sha512-UT4p+iz/2H4twwAoLCqfA9UH5pI6DggwKEGuaPy7nCVQ8ZsiY5PIcrRvD1DzuY3qYL07NtIQcWnBSY/heikIFQ=="],
+    "wrangler/esbuild/@esbuild/win32-arm64": ["@esbuild/win32-arm64@0.27.3", "", { "os": "win32", "cpu": "arm64" }, "sha512-B2t59lWWYrbRDw/tjiWOuzSsFh1Y/E95ofKz7rIVYSQkUYBjfSgf6oeYPNWHToFRr2zx52JKApIcAS/D5TUBnA=="],
 
-    "wrangler/sharp/@img/sharp-darwin-x64": ["@img/sharp-darwin-x64@0.33.5", "", { "optionalDependencies": { "@img/sharp-libvips-darwin-x64": "1.0.4" }, "os": "darwin", "cpu": "x64" }, "sha512-fyHac4jIc1ANYGRDxtiqelIbdWkIuQaI84Mv45KvGRRxSAa7o7d1ZKAOBaYbnepLC1WqxfpimdeWfvqqSGwR2Q=="],
+    "wrangler/esbuild/@esbuild/win32-ia32": ["@esbuild/win32-ia32@0.27.3", "", { "os": "win32", "cpu": "ia32" }, "sha512-QLKSFeXNS8+tHW7tZpMtjlNb7HKau0QDpwm49u0vUp9y1WOF+PEzkU84y9GqYaAVW8aH8f3GcBck26jh54cX4Q=="],
 
-    "wrangler/sharp/@img/sharp-libvips-darwin-arm64": ["@img/sharp-libvips-darwin-arm64@1.0.4", "", { "os": "darwin", "cpu": "arm64" }, "sha512-XblONe153h0O2zuFfTAbQYAX2JhYmDHeWikp1LM9Hul9gVPjFY427k6dFEcOL72O01QxQsWi761svJ/ev9xEDg=="],
+    "wrangler/esbuild/@esbuild/win32-x64": ["@esbuild/win32-x64@0.27.3", "", { "os": "win32", "cpu": "x64" }, "sha512-4uJGhsxuptu3OcpVAzli+/gWusVGwZZHTlS63hh++ehExkVT8SgiEf7/uC/PclrPPkLhZqGgCTjd0VWLo6xMqA=="],
 
-    "wrangler/sharp/@img/sharp-libvips-darwin-x64": ["@img/sharp-libvips-darwin-x64@1.0.4", "", { "os": "darwin", "cpu": "x64" }, "sha512-xnGR8YuZYfJGmWPvmlunFaWJsb9T/AO2ykoP3Fz/0X5XV2aoYBPkX6xqCQvUTKKiLddarLaxpzNe+b1hjeWHAQ=="],
+    "wrap-ansi-cjs/string-width/emoji-regex": ["emoji-regex@8.0.0", "", {}, "sha512-MSjYzcWNOA0ewAHpz0MxpYFvwg6yjy1NG3xteoqz644VCo/RPgnr1/GGt+ic3iJTzQ8Eu3TdM14SawnVUmGE6A=="],
 
-    "wrangler/sharp/@img/sharp-libvips-linux-arm": ["@img/sharp-libvips-linux-arm@1.0.5", "", { "os": "linux", "cpu": "arm" }, "sha512-gvcC4ACAOPRNATg/ov8/MnbxFDJqf/pDePbBnuBDcjsI8PssmjoKMAz4LtLaVi+OnSb5FK/yIOamqDwGmXW32g=="],
+    "yargs/string-width/emoji-regex": ["emoji-regex@8.0.0", "", {}, "sha512-MSjYzcWNOA0ewAHpz0MxpYFvwg6yjy1NG3xteoqz644VCo/RPgnr1/GGt+ic3iJTzQ8Eu3TdM14SawnVUmGE6A=="],
 
-    "wrangler/sharp/@img/sharp-libvips-linux-arm64": ["@img/sharp-libvips-linux-arm64@1.0.4", "", { "os": "linux", "cpu": "arm64" }, "sha512-9B+taZ8DlyyqzZQnoeIvDVR/2F4EbMepXMc/NdVbkzsJbzkUjhXv/70GQJ7tdLA4YJgNP25zukcxpX2/SueNrA=="],
+    "yargs/string-width/strip-ansi": ["strip-ansi@6.0.1", "", { "dependencies": { "ansi-regex": "^5.0.1" } }, "sha512-Y38VPSHcqkFrCpFnQ9vuSXmquuv5oXOKpGeT6aGrr3o3Gc9AlVa6JBfUSOCnbxGGZF+/0ooI7KrPuUSztUdU5A=="],
 
-    "wrangler/sharp/@img/sharp-libvips-linux-s390x": ["@img/sharp-libvips-linux-s390x@1.0.4", "", { "os": "linux", "cpu": "s390x" }, "sha512-u7Wz6ntiSSgGSGcjZ55im6uvTrOxSIS8/dgoVMoiGE9I6JAfU50yH5BoDlYA1tcuGS7g/QNtetJnxA6QEsCVTA=="],
+    "@aws-crypto/sha256-browser/@smithy/util-utf8/@smithy/util-buffer-from/@smithy/is-array-buffer": ["@smithy/is-array-buffer@2.2.0", "", { "dependencies": { "tslib": "^2.6.2" } }, "sha512-GGP3O9QFD24uGeAXYUjwSTXARoqpZykHadOmA8G5vfJPK0/DC67qa//0qvqrJzL1xc8WQWX7/yc7fwudjPHPhA=="],
 
-    "wrangler/sharp/@img/sharp-libvips-linux-x64": ["@img/sharp-libvips-linux-x64@1.0.4", "", { "os": "linux", "cpu": "x64" }, "sha512-MmWmQ3iPFZr0Iev+BAgVMb3ZyC4KeFc3jFxnNbEPas60e1cIfevbtuyf9nDGIzOaW9PdnDciJm+wFFaTlj5xYw=="],
+    "@aws-crypto/util/@smithy/util-utf8/@smithy/util-buffer-from/@smithy/is-array-buffer": ["@smithy/is-array-buffer@2.2.0", "", { "dependencies": { "tslib": "^2.6.2" } }, "sha512-GGP3O9QFD24uGeAXYUjwSTXARoqpZykHadOmA8G5vfJPK0/DC67qa//0qvqrJzL1xc8WQWX7/yc7fwudjPHPhA=="],
 
-    "wrangler/sharp/@img/sharp-libvips-linuxmusl-arm64": ["@img/sharp-libvips-linuxmusl-arm64@1.0.4", "", { "os": "linux", "cpu": "arm64" }, "sha512-9Ti+BbTYDcsbp4wfYib8Ctm1ilkugkA/uscUn6UXK1ldpC1JjiXbLfFZtRlBhjPZ5o1NCLiDbg8fhUPKStHoTA=="],
+    "@aws-sdk/credential-provider-sso/@aws-sdk/token-providers/@aws-sdk/nested-clients/@aws-sdk/util-endpoints": ["@aws-sdk/util-endpoints@3.993.0", "", { "dependencies": { "@aws-sdk/types": "^3.973.1", "@smithy/types": "^4.12.0", "@smithy/url-parser": "^4.2.8", "@smithy/util-endpoints": "^3.2.8", "tslib": "^2.6.2" } }, "sha512-j6vioBeRZ4eHX4SWGvGPpwGg/xSOcK7f1GL0VM+rdf3ZFTIsUEhCFmD78B+5r2PgztcECSzEfvHQX01k8dPQPw=="],
 
-    "wrangler/sharp/@img/sharp-libvips-linuxmusl-x64": ["@img/sharp-libvips-linuxmusl-x64@1.0.4", "", { "os": "linux", "cpu": "x64" }, "sha512-viYN1KX9m+/hGkJtvYYp+CCLgnJXwiQB39damAO7WMdKWlIhmYTfHjwSbQeUK/20vY154mwezd9HflVFM1wVSw=="],
+    "@plannotator/paste-service/wrangler/@cloudflare/kv-asset-handler/mime": ["mime@3.0.0", "", { "bin": { "mime": "cli.js" } }, "sha512-jSCU7/VB1loIWBZe14aEYHU/+1UMEHoaO7qxCOVJOw9GgH72VAWppxNcjU+x9a2k3GSIBXNKxXQFqRvvZ7vr3A=="],
 
-    "wrangler/sharp/@img/sharp-linux-arm": ["@img/sharp-linux-arm@0.33.5", "", { "optionalDependencies": { "@img/sharp-libvips-linux-arm": "1.0.5" }, "os": "linux", "cpu": "arm" }, "sha512-JTS1eldqZbJxjvKaAkxhZmBqPRGmxgu+qFKSInv8moZ2AmT5Yib3EQ1c6gp493HvrvV8QgdOXdyaIBrhvFhBMQ=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/android-arm": ["@esbuild/android-arm@0.17.19", "", { "os": "android", "cpu": "arm" }, "sha512-rIKddzqhmav7MSmoFCmDIb6e2W57geRsM94gV2l38fzhXMwq7hZoClug9USI2pFRGL06f4IOPHHpFNOkWieR8A=="],
 
-    "wrangler/sharp/@img/sharp-linux-arm64": ["@img/sharp-linux-arm64@0.33.5", "", { "optionalDependencies": { "@img/sharp-libvips-linux-arm64": "1.0.4" }, "os": "linux", "cpu": "arm64" }, "sha512-JMVv+AMRyGOHtO1RFBiJy/MBsgz0x4AWrT6QoEVVTyh1E39TrCUpTRI7mx9VksGX4awWASxqCYLCV4wBZHAYxA=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/android-arm64": ["@esbuild/android-arm64@0.17.19", "", { "os": "android", "cpu": "arm64" }, "sha512-KBMWvEZooR7+kzY0BtbTQn0OAYY7CsiydT63pVEaPtVYF0hXbUaOyZog37DKxK7NF3XacBJOpYT4adIJh+avxA=="],
 
-    "wrangler/sharp/@img/sharp-linux-s390x": ["@img/sharp-linux-s390x@0.33.5", "", { "optionalDependencies": { "@img/sharp-libvips-linux-s390x": "1.0.4" }, "os": "linux", "cpu": "s390x" }, "sha512-y/5PCd+mP4CA/sPDKl2961b+C9d+vPAveS33s6Z3zfASk2j5upL6fXVPZi7ztePZ5CuH+1kW8JtvxgbuXHRa4Q=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/android-x64": ["@esbuild/android-x64@0.17.19", "", { "os": "android", "cpu": "x64" }, "sha512-uUTTc4xGNDT7YSArp/zbtmbhO0uEEK9/ETW29Wk1thYUJBz3IVnvgEiEwEa9IeLyvnpKrWK64Utw2bgUmDveww=="],
 
-    "wrangler/sharp/@img/sharp-linux-x64": ["@img/sharp-linux-x64@0.33.5", "", { "optionalDependencies": { "@img/sharp-libvips-linux-x64": "1.0.4" }, "os": "linux", "cpu": "x64" }, "sha512-opC+Ok5pRNAzuvq1AG0ar+1owsu842/Ab+4qvU879ippJBHvyY5n2mxF1izXqkPYlGuP/M556uh53jRLJmzTWA=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/darwin-arm64": ["@esbuild/darwin-arm64@0.17.19", "", { "os": "darwin", "cpu": "arm64" }, "sha512-80wEoCfF/hFKM6WE1FyBHc9SfUblloAWx6FJkFWTWiCoht9Mc0ARGEM47e67W9rI09YoUxJL68WHfDRYEAvOhg=="],
 
-    "wrangler/sharp/@img/sharp-linuxmusl-arm64": ["@img/sharp-linuxmusl-arm64@0.33.5", "", { "optionalDependencies": { "@img/sharp-libvips-linuxmusl-arm64": "1.0.4" }, "os": "linux", "cpu": "arm64" }, "sha512-XrHMZwGQGvJg2V/oRSUfSAfjfPxO+4DkiRh6p2AFjLQztWUuY/o8Mq0eMQVIY7HJ1CDQUJlxGGZRw1a5bqmd1g=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/darwin-x64": ["@esbuild/darwin-x64@0.17.19", "", { "os": "darwin", "cpu": "x64" }, "sha512-IJM4JJsLhRYr9xdtLytPLSH9k/oxR3boaUIYiHkAawtwNOXKE8KoU8tMvryogdcT8AU+Bflmh81Xn6Q0vTZbQw=="],
 
-    "wrangler/sharp/@img/sharp-linuxmusl-x64": ["@img/sharp-linuxmusl-x64@0.33.5", "", { "optionalDependencies": { "@img/sharp-libvips-linuxmusl-x64": "1.0.4" }, "os": "linux", "cpu": "x64" }, "sha512-WT+d/cgqKkkKySYmqoZ8y3pxx7lx9vVejxW/W4DOFMYVSkErR+w7mf2u8m/y4+xHe7yY9DAXQMWQhpnMuFfScw=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/freebsd-arm64": ["@esbuild/freebsd-arm64@0.17.19", "", { "os": "freebsd", "cpu": "arm64" }, "sha512-pBwbc7DufluUeGdjSU5Si+P3SoMF5DQ/F/UmTSb8HXO80ZEAJmrykPyzo1IfNbAoaqw48YRpv8shwd1NoI0jcQ=="],
 
-    "wrangler/sharp/@img/sharp-wasm32": ["@img/sharp-wasm32@0.33.5", "", { "dependencies": { "@emnapi/runtime": "^1.2.0" }, "cpu": "none" }, "sha512-ykUW4LVGaMcU9lu9thv85CbRMAwfeadCJHRsg2GmeRa/cJxsVY9Rbd57JcMxBkKHag5U/x7TSBpScF4U8ElVzg=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/freebsd-x64": ["@esbuild/freebsd-x64@0.17.19", "", { "os": "freebsd", "cpu": "x64" }, "sha512-4lu+n8Wk0XlajEhbEffdy2xy53dpR06SlzvhGByyg36qJw6Kpfk7cp45DR/62aPH9mtJRmIyrXAS5UWBrJT6TQ=="],
 
-    "wrangler/sharp/@img/sharp-win32-ia32": ["@img/sharp-win32-ia32@0.33.5", "", { "os": "win32", "cpu": "ia32" }, "sha512-T36PblLaTwuVJ/zw/LaH0PdZkRz5rd3SmMHX8GSmR7vtNSP5Z6bQkExdSK7xGWyxLw4sUknBuugTelgw2faBbQ=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/linux-arm": ["@esbuild/linux-arm@0.17.19", "", { "os": "linux", "cpu": "arm" }, "sha512-cdmT3KxjlOQ/gZ2cjfrQOtmhG4HJs6hhvm3mWSRDPtZ/lP5oe8FWceS10JaSJC13GBd4eH/haHnqf7hhGNLerA=="],
 
-    "wrangler/sharp/@img/sharp-win32-x64": ["@img/sharp-win32-x64@0.33.5", "", { "os": "win32", "cpu": "x64" }, "sha512-MpY/o8/8kj+EcnxwvrP4aTJSWw/aZ7JIGR4aBeZkZw5B7/Jn+tY9/VNwtcoGmdT7GfggGIU4kygOMSbYnOrAbg=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/linux-arm64": ["@esbuild/linux-arm64@0.17.19", "", { "os": "linux", "cpu": "arm64" }, "sha512-ct1Tg3WGwd3P+oZYqic+YZF4snNl2bsnMKRkb3ozHmnM0dGWuxcPTTntAF6bOP0Sp4x0PjSF+4uHQ1xvxfRKqg=="],
 
-    "wrap-ansi-cjs/string-width/emoji-regex": ["emoji-regex@8.0.0", "", {}, "sha512-MSjYzcWNOA0ewAHpz0MxpYFvwg6yjy1NG3xteoqz644VCo/RPgnr1/GGt+ic3iJTzQ8Eu3TdM14SawnVUmGE6A=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/linux-ia32": ["@esbuild/linux-ia32@0.17.19", "", { "os": "linux", "cpu": "ia32" }, "sha512-w4IRhSy1VbsNxHRQpeGCHEmibqdTUx61Vc38APcsRbuVgK0OPEnQ0YD39Brymn96mOx48Y2laBQGqgZ0j9w6SQ=="],
 
-    "wrap-ansi-cjs/strip-ansi/ansi-regex": ["ansi-regex@5.0.1", "", {}, "sha512-quJQXlTSUGL2LH9SUXo8VwsY4soanhgo6LNSm84E1LBcE8s3O0wpdiRzyR9z/ZZJMlMWv37qOOb9pdJlMUEKFQ=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/linux-loong64": ["@esbuild/linux-loong64@0.17.19", "", { "os": "linux", "cpu": "none" }, "sha512-2iAngUbBPMq439a+z//gE+9WBldoMp1s5GWsUSgqHLzLJ9WoZLZhpwWuym0u0u/4XmZ3gpHmzV84PonE+9IIdQ=="],
 
-    "yargs/string-width/emoji-regex": ["emoji-regex@8.0.0", "", {}, "sha512-MSjYzcWNOA0ewAHpz0MxpYFvwg6yjy1NG3xteoqz644VCo/RPgnr1/GGt+ic3iJTzQ8Eu3TdM14SawnVUmGE6A=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/linux-mips64el": ["@esbuild/linux-mips64el@0.17.19", "", { "os": "linux", "cpu": "none" }, "sha512-LKJltc4LVdMKHsrFe4MGNPp0hqDFA1Wpt3jE1gEyM3nKUvOiO//9PheZZHfYRfYl6AwdTH4aTcXSqBerX0ml4A=="],
 
-    "yargs/string-width/strip-ansi": ["strip-ansi@6.0.1", "", { "dependencies": { "ansi-regex": "^5.0.1" } }, "sha512-Y38VPSHcqkFrCpFnQ9vuSXmquuv5oXOKpGeT6aGrr3o3Gc9AlVa6JBfUSOCnbxGGZF+/0ooI7KrPuUSztUdU5A=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/linux-ppc64": ["@esbuild/linux-ppc64@0.17.19", "", { "os": "linux", "cpu": "ppc64" }, "sha512-/c/DGybs95WXNS8y3Ti/ytqETiW7EU44MEKuCAcpPto3YjQbyK3IQVKfF6nbghD7EcLUGl0NbiL5Rt5DMhn5tg=="],
 
-    "@aws-crypto/sha256-browser/@smithy/util-utf8/@smithy/util-buffer-from/@smithy/is-array-buffer": ["@smithy/is-array-buffer@2.2.0", "", { "dependencies": { "tslib": "^2.6.2" } }, "sha512-GGP3O9QFD24uGeAXYUjwSTXARoqpZykHadOmA8G5vfJPK0/DC67qa//0qvqrJzL1xc8WQWX7/yc7fwudjPHPhA=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/linux-riscv64": ["@esbuild/linux-riscv64@0.17.19", "", { "os": "linux", "cpu": "none" }, "sha512-FC3nUAWhvFoutlhAkgHf8f5HwFWUL6bYdvLc/TTuxKlvLi3+pPzdZiFKSWz/PF30TB1K19SuCxDTI5KcqASJqA=="],
 
-    "@aws-crypto/util/@smithy/util-utf8/@smithy/util-buffer-from/@smithy/is-array-buffer": ["@smithy/is-array-buffer@2.2.0", "", { "dependencies": { "tslib": "^2.6.2" } }, "sha512-GGP3O9QFD24uGeAXYUjwSTXARoqpZykHadOmA8G5vfJPK0/DC67qa//0qvqrJzL1xc8WQWX7/yc7fwudjPHPhA=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/linux-s390x": ["@esbuild/linux-s390x@0.17.19", "", { "os": "linux", "cpu": "s390x" }, "sha512-IbFsFbxMWLuKEbH+7sTkKzL6NJmG2vRyy6K7JJo55w+8xDk7RElYn6xvXtDW8HCfoKBFK69f3pgBJSUSQPr+4Q=="],
 
-    "@aws-sdk/credential-provider-sso/@aws-sdk/token-providers/@aws-sdk/nested-clients/@aws-sdk/util-endpoints": ["@aws-sdk/util-endpoints@3.993.0", "", { "dependencies": { "@aws-sdk/types": "^3.973.1", "@smithy/types": "^4.12.0", "@smithy/url-parser": "^4.2.8", "@smithy/util-endpoints": "^3.2.8", "tslib": "^2.6.2" } }, "sha512-j6vioBeRZ4eHX4SWGvGPpwGg/xSOcK7f1GL0VM+rdf3ZFTIsUEhCFmD78B+5r2PgztcECSzEfvHQX01k8dPQPw=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/linux-x64": ["@esbuild/linux-x64@0.17.19", "", { "os": "linux", "cpu": "x64" }, "sha512-68ngA9lg2H6zkZcyp22tsVt38mlhWde8l3eJLWkyLrp4HwMUr3c1s/M2t7+kHIhvMjglIBrFpncX1SzMckomGw=="],
 
-    "@vscode/vsce/minimatch/brace-expansion/balanced-match": ["balanced-match@1.0.2", "", {}, "sha512-3oSeUO0TMV67hN1AmbXsK4yaqU7tjiHlbxRDZOpH0KW9+CeX4bRAaX0Anxt0tx2MrpRpWwQaPwIlISEJhYU5Pw=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/netbsd-x64": ["@esbuild/netbsd-x64@0.17.19", "", { "os": "none", "cpu": "x64" }, "sha512-CwFq42rXCR8TYIjIfpXCbRX0rp1jo6cPIUPSaWwzbVI4aOfX96OXY8M6KNmtPcg7QjYeDmN+DD0Wp3LaBOLf4Q=="],
+
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/openbsd-x64": ["@esbuild/openbsd-x64@0.17.19", "", { "os": "openbsd", "cpu": "x64" }, "sha512-cnq5brJYrSZ2CF6c35eCmviIN3k3RczmHz8eYaVlNasVqsNY+JKohZU5MKmaOI+KkllCdzOKKdPs762VCPC20g=="],
+
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/sunos-x64": ["@esbuild/sunos-x64@0.17.19", "", { "os": "sunos", "cpu": "x64" }, "sha512-vCRT7yP3zX+bKWFeP/zdS6SqdWB8OIpaRq/mbXQxTGHnIxspRtigpkUcDMlSCOejlHowLqII7K2JKevwyRP2rg=="],
+
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/win32-arm64": ["@esbuild/win32-arm64@0.17.19", "", { "os": "win32", "cpu": "arm64" }, "sha512-yYx+8jwowUstVdorcMdNlzklLYhPxjniHWFKgRqH7IFlUEa0Umu3KuYplf1HUZZ422e3NU9F4LGb+4O0Kdcaag=="],
 
-    "ansi-align/string-width/strip-ansi/ansi-regex": ["ansi-regex@5.0.1", "", {}, "sha512-quJQXlTSUGL2LH9SUXo8VwsY4soanhgo6LNSm84E1LBcE8s3O0wpdiRzyR9z/ZZJMlMWv37qOOb9pdJlMUEKFQ=="],
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/win32-ia32": ["@esbuild/win32-ia32@0.17.19", "", { "os": "win32", "cpu": "ia32" }, "sha512-eggDKanJszUtCdlVs0RB+h35wNlb5v4TWEkq4vZcmVt5u/HiDZrTXe2bWFQUez3RgNHwx/x4sk5++4NSSicKkw=="],
+
+    "@plannotator/paste-service/wrangler/esbuild/@esbuild/win32-x64": ["@esbuild/win32-x64@0.17.19", "", { "os": "win32", "cpu": "x64" }, "sha512-lAhycmKnVOuRYNtRtatQR1LPQf2oYCkRGkSFnseDAKPl8lu5SOsK/e1sXe5a0Pc5kHIHe6P2I/ilntNv2xf3cA=="],
+
+    "@plannotator/paste-service/wrangler/miniflare/acorn": ["acorn@8.14.0", "", { "bin": { "acorn": "bin/acorn" } }, "sha512-cl669nCJTZBsL97OF4kUQm5g5hC2uihk0NxY3WENAC0TYdILVkAyHymAntgxGkl7K+t0cXIrH5siy5S4XkFycA=="],
+
+    "@plannotator/paste-service/wrangler/miniflare/undici": ["undici@5.29.0", "", { "dependencies": { "@fastify/busboy": "^2.0.0" } }, "sha512-raqeBD6NQK4SkWhQzeYKd1KmIG6dllBOTt55Rmkt4HtI9mwdWtJljnrXjAFUBLTSN67HWrOIZ3EPF4kjUw80Bg=="],
+
+    "@plannotator/paste-service/wrangler/miniflare/ws": ["ws@8.18.0", "", { "peerDependencies": { "bufferutil": "^4.0.1", "utf-8-validate": ">=5.0.2" }, "optionalPeers": ["bufferutil", "utf-8-validate"] }, "sha512-8VbfWfHLbbwu3+N6OKsOMpBdT4kXPDDB9cJk2bJ6mh9ucxdlnNvH1e+roYkKmN9Nxw2yjz7VzeO9oOz2zJ04Pw=="],
+
+    "@plannotator/paste-service/wrangler/miniflare/youch": ["youch@3.3.4", "", { "dependencies": { "cookie": "^0.7.1", "mustache": "^4.2.0", "stacktracey": "^2.1.8" } }, "sha512-UeVBXie8cA35DS6+nBkls68xaBBXCye0CNznrhszZjTbRVnJKQuNsyLKBTTL4ln1o1rh2PKtv35twV7irj5SEg=="],
+
+    "@plannotator/paste-service/wrangler/miniflare/zod": ["zod@3.22.3", "", {}, "sha512-EjIevzuJRiRPbVH4mGc8nApb/lVLKVpmUhAaR5R5doKGfAnGJ6Gr3CViAVjP+4FWSxCsybeWQdcgCtbX+7oZug=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-darwin-arm64": ["@img/sharp-darwin-arm64@0.33.5", "", { "optionalDependencies": { "@img/sharp-libvips-darwin-arm64": "1.0.4" }, "os": "darwin", "cpu": "arm64" }, "sha512-UT4p+iz/2H4twwAoLCqfA9UH5pI6DggwKEGuaPy7nCVQ8ZsiY5PIcrRvD1DzuY3qYL07NtIQcWnBSY/heikIFQ=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-darwin-x64": ["@img/sharp-darwin-x64@0.33.5", "", { "optionalDependencies": { "@img/sharp-libvips-darwin-x64": "1.0.4" }, "os": "darwin", "cpu": "x64" }, "sha512-fyHac4jIc1ANYGRDxtiqelIbdWkIuQaI84Mv45KvGRRxSAa7o7d1ZKAOBaYbnepLC1WqxfpimdeWfvqqSGwR2Q=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-libvips-darwin-arm64": ["@img/sharp-libvips-darwin-arm64@1.0.4", "", { "os": "darwin", "cpu": "arm64" }, "sha512-XblONe153h0O2zuFfTAbQYAX2JhYmDHeWikp1LM9Hul9gVPjFY427k6dFEcOL72O01QxQsWi761svJ/ev9xEDg=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-libvips-darwin-x64": ["@img/sharp-libvips-darwin-x64@1.0.4", "", { "os": "darwin", "cpu": "x64" }, "sha512-xnGR8YuZYfJGmWPvmlunFaWJsb9T/AO2ykoP3Fz/0X5XV2aoYBPkX6xqCQvUTKKiLddarLaxpzNe+b1hjeWHAQ=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-libvips-linux-arm": ["@img/sharp-libvips-linux-arm@1.0.5", "", { "os": "linux", "cpu": "arm" }, "sha512-gvcC4ACAOPRNATg/ov8/MnbxFDJqf/pDePbBnuBDcjsI8PssmjoKMAz4LtLaVi+OnSb5FK/yIOamqDwGmXW32g=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-libvips-linux-arm64": ["@img/sharp-libvips-linux-arm64@1.0.4", "", { "os": "linux", "cpu": "arm64" }, "sha512-9B+taZ8DlyyqzZQnoeIvDVR/2F4EbMepXMc/NdVbkzsJbzkUjhXv/70GQJ7tdLA4YJgNP25zukcxpX2/SueNrA=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-libvips-linux-s390x": ["@img/sharp-libvips-linux-s390x@1.0.4", "", { "os": "linux", "cpu": "s390x" }, "sha512-u7Wz6ntiSSgGSGcjZ55im6uvTrOxSIS8/dgoVMoiGE9I6JAfU50yH5BoDlYA1tcuGS7g/QNtetJnxA6QEsCVTA=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-libvips-linux-x64": ["@img/sharp-libvips-linux-x64@1.0.4", "", { "os": "linux", "cpu": "x64" }, "sha512-MmWmQ3iPFZr0Iev+BAgVMb3ZyC4KeFc3jFxnNbEPas60e1cIfevbtuyf9nDGIzOaW9PdnDciJm+wFFaTlj5xYw=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-libvips-linuxmusl-arm64": ["@img/sharp-libvips-linuxmusl-arm64@1.0.4", "", { "os": "linux", "cpu": "arm64" }, "sha512-9Ti+BbTYDcsbp4wfYib8Ctm1ilkugkA/uscUn6UXK1ldpC1JjiXbLfFZtRlBhjPZ5o1NCLiDbg8fhUPKStHoTA=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-libvips-linuxmusl-x64": ["@img/sharp-libvips-linuxmusl-x64@1.0.4", "", { "os": "linux", "cpu": "x64" }, "sha512-viYN1KX9m+/hGkJtvYYp+CCLgnJXwiQB39damAO7WMdKWlIhmYTfHjwSbQeUK/20vY154mwezd9HflVFM1wVSw=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-linux-arm": ["@img/sharp-linux-arm@0.33.5", "", { "optionalDependencies": { "@img/sharp-libvips-linux-arm": "1.0.5" }, "os": "linux", "cpu": "arm" }, "sha512-JTS1eldqZbJxjvKaAkxhZmBqPRGmxgu+qFKSInv8moZ2AmT5Yib3EQ1c6gp493HvrvV8QgdOXdyaIBrhvFhBMQ=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-linux-arm64": ["@img/sharp-linux-arm64@0.33.5", "", { "optionalDependencies": { "@img/sharp-libvips-linux-arm64": "1.0.4" }, "os": "linux", "cpu": "arm64" }, "sha512-JMVv+AMRyGOHtO1RFBiJy/MBsgz0x4AWrT6QoEVVTyh1E39TrCUpTRI7mx9VksGX4awWASxqCYLCV4wBZHAYxA=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-linux-s390x": ["@img/sharp-linux-s390x@0.33.5", "", { "optionalDependencies": { "@img/sharp-libvips-linux-s390x": "1.0.4" }, "os": "linux", "cpu": "s390x" }, "sha512-y/5PCd+mP4CA/sPDKl2961b+C9d+vPAveS33s6Z3zfASk2j5upL6fXVPZi7ztePZ5CuH+1kW8JtvxgbuXHRa4Q=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-linux-x64": ["@img/sharp-linux-x64@0.33.5", "", { "optionalDependencies": { "@img/sharp-libvips-linux-x64": "1.0.4" }, "os": "linux", "cpu": "x64" }, "sha512-opC+Ok5pRNAzuvq1AG0ar+1owsu842/Ab+4qvU879ippJBHvyY5n2mxF1izXqkPYlGuP/M556uh53jRLJmzTWA=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-linuxmusl-arm64": ["@img/sharp-linuxmusl-arm64@0.33.5", "", { "optionalDependencies": { "@img/sharp-libvips-linuxmusl-arm64": "1.0.4" }, "os": "linux", "cpu": "arm64" }, "sha512-XrHMZwGQGvJg2V/oRSUfSAfjfPxO+4DkiRh6p2AFjLQztWUuY/o8Mq0eMQVIY7HJ1CDQUJlxGGZRw1a5bqmd1g=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-linuxmusl-x64": ["@img/sharp-linuxmusl-x64@0.33.5", "", { "optionalDependencies": { "@img/sharp-libvips-linuxmusl-x64": "1.0.4" }, "os": "linux", "cpu": "x64" }, "sha512-WT+d/cgqKkkKySYmqoZ8y3pxx7lx9vVejxW/W4DOFMYVSkErR+w7mf2u8m/y4+xHe7yY9DAXQMWQhpnMuFfScw=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-wasm32": ["@img/sharp-wasm32@0.33.5", "", { "dependencies": { "@emnapi/runtime": "^1.2.0" }, "cpu": "none" }, "sha512-ykUW4LVGaMcU9lu9thv85CbRMAwfeadCJHRsg2GmeRa/cJxsVY9Rbd57JcMxBkKHag5U/x7TSBpScF4U8ElVzg=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-win32-ia32": ["@img/sharp-win32-ia32@0.33.5", "", { "os": "win32", "cpu": "ia32" }, "sha512-T36PblLaTwuVJ/zw/LaH0PdZkRz5rd3SmMHX8GSmR7vtNSP5Z6bQkExdSK7xGWyxLw4sUknBuugTelgw2faBbQ=="],
+
+    "@plannotator/paste-service/wrangler/sharp/@img/sharp-win32-x64": ["@img/sharp-win32-x64@0.33.5", "", { "os": "win32", "cpu": "x64" }, "sha512-MpY/o8/8kj+EcnxwvrP4aTJSWw/aZ7JIGR4aBeZkZw5B7/Jn+tY9/VNwtcoGmdT7GfggGIU4kygOMSbYnOrAbg=="],
+
+    "@plannotator/paste-service/wrangler/workerd/@cloudflare/workerd-darwin-64": ["@cloudflare/workerd-darwin-64@1.20250718.0", "", { "os": "darwin", "cpu": "x64" }, "sha512-FHf4t7zbVN8yyXgQ/r/GqLPaYZSGUVzeR7RnL28Mwj2djyw2ZergvytVc7fdGcczl6PQh+VKGfZCfUqpJlbi9g=="],
+
+    "@plannotator/paste-service/wrangler/workerd/@cloudflare/workerd-darwin-arm64": ["@cloudflare/workerd-darwin-arm64@1.20250718.0", "", { "os": "darwin", "cpu": "arm64" }, "sha512-fUiyUJYyqqp4NqJ0YgGtp4WJh/II/YZsUnEb6vVy5Oeas8lUOxnN+ZOJ8N/6/5LQCVAtYCChRiIrBbfhTn5Z8Q=="],
+
+    "@plannotator/paste-service/wrangler/workerd/@cloudflare/workerd-linux-64": ["@cloudflare/workerd-linux-64@1.20250718.0", "", { "os": "linux", "cpu": "x64" }, "sha512-5+eb3rtJMiEwp08Kryqzzu8d1rUcK+gdE442auo5eniMpT170Dz0QxBrqkg2Z48SFUPYbj+6uknuA5tzdRSUSg=="],
+
+    "@plannotator/paste-service/wrangler/workerd/@cloudflare/workerd-linux-arm64": ["@cloudflare/workerd-linux-arm64@1.20250718.0", "", { "os": "linux", "cpu": "arm64" }, "sha512-Aa2M/DVBEBQDdATMbn217zCSFKE+ud/teS+fFS+OQqKABLn0azO2qq6ANAHYOIE6Q3Sq4CxDIQr8lGdaJHwUog=="],
+
+    "@plannotator/paste-service/wrangler/workerd/@cloudflare/workerd-windows-64": ["@cloudflare/workerd-windows-64@1.20250718.0", "", { "os": "win32", "cpu": "x64" }, "sha512-dY16RXKffmugnc67LTbyjdDHZn5NoTF1yHEf2fN4+OaOnoGSp3N1x77QubTDwqZ9zECWxgQfDLjddcH8dWeFhg=="],
+
+    "@vscode/vsce/minimatch/brace-expansion/balanced-match": ["balanced-match@1.0.2", "", {}, "sha512-3oSeUO0TMV67hN1AmbXsK4yaqU7tjiHlbxRDZOpH0KW9+CeX4bRAaX0Anxt0tx2MrpRpWwQaPwIlISEJhYU5Pw=="],
 
     "rimraf/glob/jackspeak/@isaacs/cliui": ["@isaacs/cliui@8.0.2", "", { "dependencies": { "string-width": "^5.1.2", "string-width-cjs": "npm:string-width@^4.2.0", "strip-ansi": "^7.0.1", "strip-ansi-cjs": "npm:strip-ansi@^6.0.1", "wrap-ansi": "^8.1.0", "wrap-ansi-cjs": "npm:wrap-ansi@^7.0.0" } }, "sha512-O8jcjabXaleOG9DQ0+ARXWZBTfnP4WNAqzuiJK7ll44AmxGKv/J2M4TPjxjY3znBCfvBXFzucm1twdyFybFqEA=="],
 
     "rimraf/glob/path-scurry/lru-cache": ["lru-cache@10.4.3", "", {}, "sha512-JNAzZcXrCt42VGLuYz0zfAzDfAvJWW6AfYlDBQyDV5DClI2m5sAmK+OIO7s59XfsRsWHp02jAJrRadPRGTt6SQ=="],
 
-    "yargs/string-width/strip-ansi/ansi-regex": ["ansi-regex@5.0.1", "", {}, "sha512-quJQXlTSUGL2LH9SUXo8VwsY4soanhgo6LNSm84E1LBcE8s3O0wpdiRzyR9z/ZZJMlMWv37qOOb9pdJlMUEKFQ=="],
+    "@plannotator/paste-service/wrangler/miniflare/youch/cookie": ["cookie@0.7.2", "", {}, "sha512-yki5XnKuf750l50uGTllt6kKILY4nQ1eNIQatoXEByZ5dWgnKqbnqmTrBE5B4N7lrMJKQ2ytWMiTO2o0v6Ew/w=="],
 
     "rimraf/glob/jackspeak/@isaacs/cliui/string-width": ["string-width@5.1.2", "", { "dependencies": { "eastasianwidth": "^0.2.0", "emoji-regex": "^9.2.2", "strip-ansi": "^7.0.1" } }, "sha512-HnLOCR3vjcY8beoNLtcjZ5/nxn2afmME6lhrDrebokqMap+XbeW8n9TXpPDOqdGK5qcI3oT0GKTW6wC7EMiVqA=="],
 
diff --git a/package.json b/package.json
index eec3548ba..a015d0b74 100644
--- a/package.json
+++ b/package.json
@@ -22,6 +22,9 @@
     "dev:portal": "bun run --cwd apps/portal dev",
     "dev:marketing": "bun run --cwd apps/marketing dev",
     "dev:review": "bun run --cwd apps/review dev",
+    "dev:room": "bun run --cwd apps/room-service dev",
+    "dev:live-room": "scripts/dev-live-room-local.sh",
+    "agent:run": "bun run apps/collab-agent/index.ts",
     "build:hook": "bun run --cwd apps/hook build",
     "build:portal": "bun run --cwd apps/portal build",
     "build:marketing": "bun run --cwd apps/marketing build",
@@ -32,8 +35,8 @@
     "dev:vscode": "bun run --cwd apps/vscode-extension watch",
     "build:vscode": "bun run --cwd apps/vscode-extension build",
     "package:vscode": "bun run --cwd apps/vscode-extension package",
-    "test": "bun test",
-    "typecheck": "bash apps/pi-extension/vendor.sh && tsc --noEmit -p packages/shared/tsconfig.json && tsc --noEmit -p packages/ai/tsconfig.json && tsc --noEmit -p packages/server/tsconfig.json && tsc --noEmit -p packages/ui/tsconfig.json && tsc --noEmit -p apps/pi-extension/tsconfig.json"
+    "test": "bun test --path-ignore-patterns 'packages/ui/**' --path-ignore-patterns 'packages/editor/**' && bun test --cwd packages/ui && bun test --cwd packages/editor",
+    "typecheck": "bash apps/pi-extension/vendor.sh && bunx tsc --noEmit -p packages/shared/tsconfig.json && bunx tsc --noEmit -p packages/ai/tsconfig.json && bunx tsc --noEmit -p packages/server/tsconfig.json && bunx tsc --noEmit -p packages/ui/tsconfig.slice5.json && bunx tsc --noEmit -p packages/editor/tsconfig.json && bunx tsc --noEmit -p apps/pi-extension/tsconfig.json"
   },
   "dependencies": {
     "@anthropic-ai/claude-agent-sdk": "^0.2.92",
@@ -50,6 +53,7 @@
     "@types/dompurify": "^3.2.0",
     "@types/node": "^25.5.2",
     "@types/turndown": "^5.0.6",
-    "bun-types": "^1.3.11"
+    "bun-types": "^1.3.11",
+    "wrangler": "^4.81.1"
   }
 }
diff --git a/packages/editor/App.tsx b/packages/editor/App.tsx
index c48b7eb2f..2bba1290b 100644
--- a/packages/editor/App.tsx
+++ b/packages/editor/App.tsx
@@ -12,6 +12,7 @@ import { Annotation, Block, EditorMode, type CodeAnnotation, type InputMethod, t
 import { ThemeProvider } from '@plannotator/ui/components/ThemeProvider';
 import { Tooltip, TooltipProvider } from '@plannotator/ui/components/Tooltip';
 import { AnnotationToolstrip } from '@plannotator/ui/components/AnnotationToolstrip';
+import { AppHeader } from './components/AppHeader';
 import { StickyHeaderLane } from '@plannotator/ui/components/StickyHeaderLane';
 import { TaterSpriteRunning } from '@plannotator/ui/components/TaterSpriteRunning';
 import { TaterSpritePullup } from '@plannotator/ui/components/TaterSpritePullup';
@@ -20,6 +21,10 @@ import { getCallbackConfig, CallbackAction, executeCallback } from '@plannotator
 import { useAgents } from '@plannotator/ui/hooks/useAgents';
 import { useActiveSection } from '@plannotator/ui/hooks/useActiveSection';
 import { storage } from '@plannotator/ui/utils/storage';
+import {
+  getIdentity,
+  getPresenceColor,
+} from '@plannotator/ui/utils/identity';
 import { configStore } from '@plannotator/ui/config';
 import { CompletionOverlay } from '@plannotator/ui/components/CompletionOverlay';
 import { UpdateBanner } from '@plannotator/ui/components/UpdateBanner';
@@ -57,7 +62,13 @@ import { useArchive } from '@plannotator/ui/hooks/useArchive';
 import { useEditorAnnotations } from '@plannotator/ui/hooks/useEditorAnnotations';
 import { useExternalAnnotations } from '@plannotator/ui/hooks/useExternalAnnotations';
 import { useExternalAnnotationHighlights } from '@plannotator/ui/hooks/useExternalAnnotationHighlights';
+import { useAnnotationHighlightReconciler } from '@plannotator/ui/hooks/useAnnotationHighlightReconciler';
+import { useRoomAdminActions } from '@plannotator/ui/hooks/collab/useRoomAdminActions';
+import { RoomHeaderControls } from '@plannotator/ui/components/collab/RoomHeaderControls';
+import { RoomAdminErrorToast } from '@plannotator/ui/components/collab/RoomAdminErrorToast';
+import { ImageStripNotice } from '@plannotator/ui/components/collab/ImageStripNotice';
 import { buildPlanAgentInstructions } from '@plannotator/ui/utils/planAgentInstructions';
+import { buildRoomAgentInstructions } from '@plannotator/ui/utils/roomAgentInstructions';
 import { useFileBrowser } from '@plannotator/ui/hooks/useFileBrowser';
 import { isVaultBrowserEnabled } from '@plannotator/ui/utils/obsidian';
 import { isFileBrowserEnabled, getFileBrowserSettings } from '@plannotator/ui/utils/fileBrowser';
@@ -81,8 +92,10 @@ const USE_DIFF_DEMO =
 const DEMO_PLAN_CONTENT = USE_DIFF_DEMO
   ? DIFF_DEMO_PLAN_CONTENT
   : DEFAULT_DEMO_PLAN_CONTENT;
-import { useCheckboxOverrides } from './hooks/useCheckboxOverrides';
-import { AppHeader } from './components/AppHeader';
+import { useCheckboxOverrides, derivePendingCheckboxBlockIds } from './hooks/useCheckboxOverrides';
+import { useAnnotationController } from '@plannotator/ui/hooks/useAnnotationController';
+import { StartRoomModal } from '@plannotator/ui/components/collab/StartRoomModal';
+import { useStartLiveRoom } from './hooks/collab/useStartLiveRoom';
 
 type NoteAutoSaveResults = {
   obsidian?: boolean;
@@ -90,10 +103,48 @@ type NoteAutoSaveResults = {
   octarine?: boolean;
 };
 
-const App: React.FC = () => {
-  const [markdown, setMarkdown] = useState(DEMO_PLAN_CONTENT);
-  const [annotations, setAnnotations] = useState<Annotation[]>([]);
+export interface AppProps {
+  roomSession?: import('@plannotator/ui/hooks/collab/useCollabRoomSession').UseCollabRoomSessionReturn;
+}
+
+const App: React.FC<AppProps> = ({ roomSession }) => {
+  const roomModeActive = !!roomSession?.room;
+  const [markdown, setMarkdown] = useState(
+    roomModeActive ? '' : DEMO_PLAN_CONTENT,
+  );
+
+  const roomAdmin = useRoomAdminActions(roomSession?.room);
+
+  const [strippedImagesCount, setStrippedImagesCount] = useState<number>(() => {
+    if (!roomModeActive || typeof window === 'undefined') return 0;
+    const w = window as { __PLANNOTATOR_STRIPPED_IMAGES__?: number };
+    return w.__PLANNOTATOR_STRIPPED_IMAGES__ ?? 0;
+  });
+  useEffect(() => {
+    if (typeof window === 'undefined') return;
+    const w = window as { __PLANNOTATOR_STRIPPED_IMAGES__?: number };
+    if (w.__PLANNOTATOR_STRIPPED_IMAGES__ !== undefined) {
+      delete w.__PLANNOTATOR_STRIPPED_IMAGES__;
+    }
+  }, []);
+
+  const annotationController = useAnnotationController({
+    initial: [],
+    room: roomSession?.room,
+  });
+  const { annotations } = annotationController;
+  const setAnnotations: React.Dispatch<React.SetStateAction<Annotation[]>> =
+    annotationController.setAll ??
+    ((_: React.SetStateAction<Annotation[]>) => {});
+
   const [codeAnnotations, setCodeAnnotations] = useState<CodeAnnotation[]>([]);
+
+  useEffect(() => {
+    if (!roomSession?.room) return;
+    const plan = roomSession.room.planMarkdown;
+    if (plan && plan !== markdown) setMarkdown(plan);
+    // eslint-disable-next-line react-hooks/exhaustive-deps
+  }, [roomSession?.room?.planMarkdown]);
   const [selectedAnnotationId, setSelectedAnnotationId] = useState<string | null>(null);
   const [selectedCodeAnnotationId, setSelectedCodeAnnotationId] = useState<string | null>(null);
   const frontmatter = useMemo(() => extractFrontmatter(markdown).frontmatter, [markdown]);
@@ -147,6 +198,15 @@ const App: React.FC = () => {
     return () => ro.disconnect();
   }, []);
   const [isApiMode, setIsApiMode] = useState(false);
+  // Approve / Deny are a LOCAL (same-origin) capability. In room mode
+  // the editor is served from room.plannotator.ai, which has no
+  // path to the blocked agent hook — so the buttons aren't offered
+  // there, even for admins. Decisions are made from the creator's
+  // localhost tab; room-side feedback flows back via the existing
+  // import paths (share hash / paste short URL / "Copy consolidated
+  // feedback" → paste). If a future change wants a room-origin
+  // approve path, it has to change THIS line.
+  const approveDenyAvailable = isApiMode;
   const [origin, setOrigin] = useState<Origin | null>(null);
   const [gitUser, setGitUser] = useState<string | undefined>();
   const [isWSL, setIsWSL] = useState(false);
@@ -164,6 +224,8 @@ const App: React.FC = () => {
   const [isSubmitting, setIsSubmitting] = useState(false);
   const [isExiting, setIsExiting] = useState(false);
   const [submitted, setSubmitted] = useState<'approved' | 'denied' | 'exited' | null>(null);
+  /** Visible error message for failed approve/deny. Cleared on next attempt. */
+  const [submitError, setSubmitError] = useState<string | null>(null);
   const [pendingPasteImage, setPendingPasteImage] = useState<{ file: File; blobUrl: string; initialName: string } | null>(null);
   const [showPermissionModeSetup, setShowPermissionModeSetup] = useState(false);
   const [permissionMode, setPermissionMode] = useState<PermissionMode>('bypassPermissions');
@@ -188,6 +250,21 @@ const App: React.FC = () => {
   const isMobile = useIsMobile();
 
   const viewerRef = useRef<ViewerHandle>(null);
+  // Monotonic generation driven by Viewer's highlight-surface lifecycle
+  // (init + `clearAllHighlights`). Reconcilers that track which annotation
+  // IDs are already materialized as DOM marks watch this value so they
+  // repaint from scratch when the underlying surface is reset out from
+  // under them (e.g. share-import wiping the DOM via clearAllHighlights).
+  //
+  // The counter is parent-owned on purpose: if the Viewer remounts (key
+  // change, conditional render) and emitted its own first-mount number
+  // again, React's setState bailout would silently drop the update and
+  // the reconciler's applied map would stay stale. The Viewer just emits
+  // "I reset" and we bump here.
+  const [highlightSurfaceGeneration, setHighlightSurfaceGeneration] = useState(0);
+  const bumpHighlightSurfaceGeneration = useCallback(() => {
+    setHighlightSurfaceGeneration(g => g + 1);
+  }, []);
   // containerRef + scrollViewport both point at the OverlayScrollbars
   // viewport element (the node that actually scrolls), not the <main>
   // host. Consumers: useActiveSection (IntersectionObserver root) and
@@ -198,6 +275,29 @@ const App: React.FC = () => {
     onViewportReady: handleViewportReady,
   } = useOverlayViewport();
 
+  // Expose the scroll viewport to sibling components outside App's
+  // React tree (LocalPresenceEmitter, RemoteCursorLayer — both live
+  // in RoomApp as React-siblings of App, so they can't consume
+  // `ScrollViewportContext`). They use content coordinates for
+  // remote cursor presence: "pointer at pixel (x, y) inside the
+  // scrolling content" is the one coordinate space that stays
+  // consistent across participants regardless of scroll / window
+  // size / zoom. Tagging the element with a data attribute lets
+  // those components `document.querySelector` for it — ugly
+  // coupling, but the alternative (hoisting presence components
+  // into App, or threading the ref back up through `renderEditor`)
+  // would be a bigger refactor for a localized win. Exactly one
+  // element carries the attribute (one App instance per page).
+  useEffect(() => {
+    if (!scrollViewport) return;
+    scrollViewport.dataset.planScrollViewport = '';
+    return () => {
+      // Clean up on unmount so a later App mount (e.g. HMR) doesn't
+      // have two elements briefly claiming the role.
+      delete scrollViewport.dataset.planScrollViewport;
+    };
+  }, [scrollViewport]);
+
   usePrintMode();
 
   // Resizable panels
@@ -248,7 +348,7 @@ const App: React.FC = () => {
     }
   }, [wideModeType, sidebar.close, sidebar.open]);
 
-  const openSidebarTab = useCallback((tab: SidebarTab) => {
+  const openSidebarTab = useCallback((tab?: SidebarTab) => {
     if (wideModeType !== null) {
       exitWideMode({ restore: false, sidebarTab: tab, panelOpen: false });
       return;
@@ -525,7 +625,7 @@ const App: React.FC = () => {
 
   // Flash highlight for annotated files in the sidebar
   const [highlightedFiles, setHighlightedFiles] = useState<Set<string> | undefined>();
-  const flashTimerRef = React.useRef<ReturnType<typeof setTimeout>>();
+  const flashTimerRef = React.useRef<ReturnType<typeof setTimeout> | undefined>(undefined);
   const handleFlashAnnotatedFiles = React.useCallback(() => {
     const filePaths = new Set(allAnnotationCounts.keys());
     if (filePaths.size === 0) return;
@@ -559,18 +659,27 @@ const App: React.FC = () => {
   // Drive DOM highlights for SSE-delivered external annotations. Disabled
   // while a linked doc overlay is open (Viewer DOM is hidden) and while the
   // plan diff view is active (diff view has its own annotation surface).
-  const { reset: resetExternalHighlights } = useExternalAnnotationHighlights({
+  useExternalAnnotationHighlights({
     viewerRef,
     externalAnnotations,
     enabled: isApiMode && !linkedDocHook.isActive && !isPlanDiffActive,
     planKey: markdown,
+    surfaceGeneration: highlightSurfaceGeneration,
   });
 
   // Merge local + SSE annotations, deduping draft-restored externals against
   // live SSE versions. Prefer the SSE version when both exist (same source,
   // type, and originalText). This avoids the timing issues of an effect-based
   // cleanup — draft-restored externals persist until SSE actually re-delivers them.
+  //
+  // Room-mode exclusion: when a live room is active, external annotations are
+  // NOT merged. An SSE-sourced annotation visible only to the creator would
+  // diverge from other participants' views and could be accidentally
+  // consolidated into approve/deny payloads. A future pass can forward
+  // the SSE stream to encrypted room ops so external annotations become
+  // shared.
   const allAnnotations = useMemo(() => {
+    if (roomSession?.room) return annotations;
     if (externalAnnotations.length === 0) return annotations;
 
     const local = annotations.filter(a => {
@@ -583,7 +692,7 @@ const App: React.FC = () => {
     });
 
     return [...local, ...externalAnnotations];
-  }, [annotations, externalAnnotations]);
+  }, [annotations, externalAnnotations, roomSession?.room]);
 
   // Plan diff state — memoize filtered annotation lists to avoid new references per render
   const diffAnnotations = useMemo(() => allAnnotations.filter(a => !!a.diffContext), [allAnnotations]);
@@ -606,7 +715,7 @@ const App: React.FC = () => {
     globalAttachments.length;
   // Code-file comments are intentionally not serialized into share URLs in v1.
   // Hide share entry points once they exist so we do not silently drop feedback.
-  const canShareCurrentSession = sharingEnabled && codeAnnotations.length === 0;
+  const canShareCurrentSession = sharingEnabled && !roomModeActive && codeAnnotations.length === 0;
 
   // URL-based sharing
   const {
@@ -637,6 +746,7 @@ const App: React.FC = () => {
     },
     shareBaseUrl,
     pasteApiUrl,
+    roomModeActive,
     rawHtml,
     setRawHtml,
     setRenderAs,
@@ -653,6 +763,7 @@ const App: React.FC = () => {
   });
 
   const handleRestoreDraft = React.useCallback(() => {
+    if (roomModeActive) return;
     const { annotations: restored, codeAnnotations: restoredCode, globalAttachments: restoredGlobal } = restoreDraft();
     if (restored.length > 0 || restoredCode.length > 0 || restoredGlobal.length > 0) {
       setAnnotations(restored);
@@ -663,7 +774,7 @@ const App: React.FC = () => {
         viewerRef.current?.applySharedAnnotations(restored.filter(a => !a.diffContext));
       }, 100);
     }
-  }, [restoreDraft]);
+  }, [restoreDraft, roomModeActive]);
 
   // Fetch available agents for OpenCode (for validation on approve)
   const { agents: availableAgents, validateAgent, getAgentWarning } = useAgents(origin);
@@ -673,17 +784,33 @@ const App: React.FC = () => {
     if (pendingSharedAnnotations && pendingSharedAnnotations.length > 0) {
       // Small delay to ensure DOM is rendered
       const timer = setTimeout(() => {
-        // Clear existing highlights first (important when loading new share URL)
+        // Clear existing highlights first (important when loading new share URL).
+        // Viewer fires `onHighlightSurfaceReset`, which bumps the parent-owned
+        // generation and cascades into both reconcilers (external SSE + room)
+        // so their applied maps invalidate and repaint on the next tick.
         viewerRef.current?.clearAllHighlights();
         viewerRef.current?.applySharedAnnotations(pendingSharedAnnotations.filter(a => !a.diffContext));
         clearPendingSharedAnnotations();
-        // `clearAllHighlights` wiped live external SSE highlights too;
-        // tell the external-highlight bookkeeper to re-apply them.
-        resetExternalHighlights();
       }, 100);
       return () => clearTimeout(timer);
     }
-  }, [pendingSharedAnnotations, clearPendingSharedAnnotations, resetExternalHighlights]);
+  }, [pendingSharedAnnotations, clearPendingSharedAnnotations]);
+
+  // Room-mode annotation → DOM mark reconciliation. Delegates to the
+  // shared `useAnnotationHighlightReconciler` (also used by external
+  // SSE). Room fingerprint includes comment `text` because peers can
+  // edit an annotation's comment without changing `originalText` —
+  // that case must trigger a remove+reapply so the mark's visible
+  // content matches the canonical annotation.
+  useAnnotationHighlightReconciler({
+    viewerRef,
+    annotations,
+    enabled: roomModeActive,
+    planKey: markdown,
+    surfaceGeneration: highlightSurfaceGeneration,
+    eligibleFilter: a => !a.diffContext && !!a.originalText,
+    fingerprint: roomAnnFingerprint,
+  });
 
   const handleTaterModeChange = useCallback((enabled: boolean) => {
     setTaterMode(enabled);
@@ -708,6 +835,7 @@ const App: React.FC = () => {
   useEffect(() => {
     if (isLoadingShared) return; // Wait for share check to complete
     if (isSharedSession) return; // Already loaded from share
+    if (roomModeActive) return; // Room mode loads plan from the encrypted snapshot
 
     fetch('/api/plan')
       .then(res => {
@@ -887,6 +1015,11 @@ const App: React.FC = () => {
   // Global paste listener for image attachments
   useEffect(() => {
     const handlePaste = (e: ClipboardEvent) => {
+      // Room mode: images are not supported. Block the paste flow so
+      // the user doesn't get an upload modal that silently fails (the
+      // room Worker has no /api/upload endpoint).
+      if (roomModeActive) return;
+
       const items = e.clipboardData?.items;
       if (!items) return;
 
@@ -907,7 +1040,7 @@ const App: React.FC = () => {
 
     document.addEventListener('paste', handlePaste);
     return () => document.removeEventListener('paste', handlePaste);
-  }, [globalAttachments]);
+  }, [globalAttachments, roomModeActive]);
 
   // Handle paste annotator accept — name comes from ImageAnnotator
   const handlePasteAnnotatorAccept = async (blob: Blob, hasDrawings: boolean, name: string) => {
@@ -943,6 +1076,7 @@ const App: React.FC = () => {
   // API mode handlers
   const handleApprove = async () => {
     setIsSubmitting(true);
+    setSubmitError(null);
     try {
       const obsidianSettings = getObsidianSettings();
       const bearSettings = getBearSettings();
@@ -1008,22 +1142,29 @@ const App: React.FC = () => {
         body.feedback = annotationsOutput;
       }
 
-      await fetch('/api/approve', {
+      const approveRes = await fetch('/api/approve', {
         method: 'POST',
         headers: { 'Content-Type': 'application/json' },
         body: JSON.stringify(body),
       });
+      if (!approveRes.ok) {
+        throw new Error(`Approve failed: ${approveRes.status}`);
+      }
+
       setSubmitted('approved');
-    } catch {
+      setSubmitError(null);
+    } catch (err) {
       setIsSubmitting(false);
+      setSubmitError(err instanceof Error ? err.message : 'Approve failed');
     }
   };
 
   const handleDeny = async () => {
     setIsSubmitting(true);
+    setSubmitError(null);
     try {
       const planSaveSettings = getPlanSaveSettings();
-      await fetch('/api/deny', {
+      const denyRes = await fetch('/api/deny', {
         method: 'POST',
         headers: { 'Content-Type': 'application/json' },
         body: JSON.stringify({
@@ -1034,12 +1175,67 @@ const App: React.FC = () => {
           },
         })
       });
+      if (!denyRes.ok) {
+        throw new Error(`Deny failed: ${denyRes.status}`);
+      }
       setSubmitted('denied');
-    } catch {
+      setSubmitError(null);
+    } catch (err) {
       setIsSubmitting(false);
+      setSubmitError(err instanceof Error ? err.message : 'Deny failed');
     }
   };
 
+  /**
+   * Stable `pendingIds` derivation for AnnotationPanel. The controller
+   * exposes pending as `Map<id, PendingOp>` but the panel only needs
+   * "is this id pending?" — we project to a Set with the controller's
+   * pending Map as the memo dependency so a new Set is built ONLY when
+   * pending actually changes.
+   */
+  const pendingAnnotationIds = useMemo<ReadonlySet<string> | undefined>(
+    () => (roomModeActive ? new Set(annotationController.pending.keys()) : undefined),
+    [roomModeActive, annotationController.pending],
+  );
+
+  // Live Rooms is a local-creator-only flow: it needs a running
+  // Plannotator hook (isApiMode) to host the creator's original tab so
+  // the blocked agent hook has an approve/deny surface after the room
+  // opens in a new tab. Hosted portals (share.plannotator.ai, the
+  // marketing demo) have no such host, and the room-service CORS policy
+  // intentionally doesn't whitelist them — offering the button there
+  // would surface an "unreachable room service" error on click. Gate
+  // the menu + export-modal affordances on this single flag so both
+  // surfaces stay consistent.
+  const canStartLiveRoom = isApiMode && !roomModeActive;
+
+  // Creator-side start-room flow. State, handlers, URL construction,
+  // placeholder-tab pop-open, and the image-strip memo all live in
+  // the hook; App.tsx consumes the return object and renders the
+  // modal below.
+  const {
+    showStartRoomModal,
+    startRoomInFlight,
+    startRoomError,
+    imageAnnotationsToStrip,
+    handleStartLiveRoom,
+    handleCancelStartRoom,
+    handleConfirmStartRoom,
+  } = useStartLiveRoom({
+    annotations,
+    markdown,
+    globalAttachments,
+    canStartLiveRoom,
+  });
+
+  // Note: the room admin action (delete) lives only in the Room
+  // menu (RoomMenu / RoomHeaderControls). The PlanHeaderMenu used to
+  // duplicate it via a `runHeaderRoomAdmin` wrapper, but that path
+  // swallowed errors without a visible surface — the Room menu owns
+  // the pending-state chrome and the error toast, so routing admin
+  // clicks through a single focal point gives the user a consistent
+  // recovery path.
+
   // Annotate mode handler — sends feedback via /api/feedback
   const handleAnnotateFeedback = async () => {
     setIsSubmitting(true);
@@ -1153,7 +1349,7 @@ const App: React.FC = () => {
   ]);
 
   const handleAddAnnotation = (ann: Annotation) => {
-    setAnnotations(prev => [...prev, ann]);
+    annotationController.add(ann);
     setSelectedAnnotationId(ann.id);
     setSelectedCodeAnnotationId(null);
     if (wideModeType === null) {
@@ -1191,9 +1387,6 @@ const App: React.FC = () => {
     }
   }, [wideModeType]);
 
-  // The code popout is full-viewport modal — the annotation panel is behind it.
-  // This handler only fires when the popout is closed (sidebar visible), so
-  // reopening the file via codeFilePopout.open() is the correct behavior.
   const handleSelectCodeAnnotation = React.useCallback((id: string) => {
     const annotation = codeAnnotations.find(a => a.id === id);
     if (!annotation) return;
@@ -1211,20 +1404,35 @@ const App: React.FC = () => {
   const handleEditCodeAnnotation = React.useCallback((id: string, updates: Partial<CodeAnnotation>) => {
     setCodeAnnotations(prev => prev.map(a => a.id === id ? { ...a, ...updates } : a));
   }, []);
-
-  // Core annotation removal — highlight cleanup + state filter + selection clear
   const removeAnnotation = (id: string) => {
-    viewerRef.current?.removeHighlight(id);
-    setAnnotations(prev => prev.filter(a => a.id !== id));
+    if (!roomModeActive) {
+      viewerRef.current?.removeHighlight(id);
+    }
+    annotationController.remove(id);
     if (selectedAnnotationId === id) setSelectedAnnotationId(null);
   };
 
+  // Room-mode only. Delegates to `derivePendingCheckboxBlockIds`
+  // (same file as `useCheckboxOverrides`) — busy-gate + revert-gate
+  // semantics documented on the helper.
+  const pendingCheckboxBlockIds = useMemo<ReadonlySet<string> | undefined>(
+    () => (roomModeActive ? derivePendingCheckboxBlockIds(annotationController) : undefined),
+    [
+      roomModeActive,
+      annotationController.pending,
+      annotationController.failed,
+      annotationController.pendingAdditions,
+      annotationController.annotations,
+    ],
+  );
+
   // Interactive checkbox toggling with annotation tracking
   const checkbox = useCheckboxOverrides({
     blocks,
     annotations,
     addAnnotation: handleAddAnnotation,
     removeAnnotation,
+    pendingBlockIds: pendingCheckboxBlockIds,
   });
 
   const handleDeleteAnnotation = (id: string) => {
@@ -1237,8 +1445,21 @@ const App: React.FC = () => {
       if (selectedAnnotationId === id) setSelectedAnnotationId(null);
       return;
     }
-    // If this is a checkbox annotation, revert the visual override
-    if (id.startsWith('ann-checkbox-')) {
+    // If this is a checkbox annotation, clear the visual override.
+    //
+    // Local mode: synchronous — there's no server to reject the remove,
+    // so revert optimistically in lockstep with the annotation removal.
+    //
+    // Room mode: DO NOT revert here. The override must stay until the
+    // canonical checkbox annotation actually disappears from the room
+    // state (echoed remove). Otherwise a remove that later fails
+    // (disconnect, server rejection) leaves the annotation canonical
+    // but the checkbox visually reverted — inconsistent.
+    // `useCheckboxOverrides` runs a reconciliation effect that clears
+    // overrides once the backing annotation is gone from BOTH canonical
+    // and pending/failed state, which is exactly when it's safe to
+    // revert in room mode.
+    if (id.startsWith('ann-checkbox-') && !roomModeActive) {
       if (ann) {
         checkbox.revertOverride(ann.blockId);
       }
@@ -1252,15 +1473,16 @@ const App: React.FC = () => {
       updateExternalAnnotation(id, updates);
       return;
     }
-    setAnnotations(prev => prev.map(a =>
-      a.id === id ? { ...a, ...updates } : a
-    ));
+    annotationController.update(id, updates);
   };
 
   const handleIdentityChange = useCallback((oldIdentity: string, newIdentity: string) => {
-    setAnnotations(prev => prev.map(ann =>
-      ann.author === oldIdentity ? { ...ann, author: newIdentity } : ann
-    ));
+    if (roomModeActive) return;
+    for (const ann of annotations) {
+      if (ann.author === oldIdentity) {
+        annotationController.update(ann.id, { author: newIdentity });
+      }
+    }
     setCodeAnnotations(prev => prev.map(ann =>
       ann.author === oldIdentity ? { ...ann, author: newIdentity } : ann
     ));
@@ -1285,7 +1507,12 @@ const App: React.FC = () => {
     const hasDocAnnotations = Array.from(docAnnotations.values()).some(
       (d) => d.annotations.length > 0 || d.globalAttachments.length > 0
     );
-    const hasPlanAnnotations = allAnnotations.length > 0 || globalAttachments.length > 0;
+    // Room mode: global attachments are local-only (rooms carry no
+    // image payloads), so they must NOT be included in consolidated
+    // feedback — approving with local-only image refs would ship paths
+    // collaborators never saw. Out-of-room keeps existing behavior.
+    const effectiveGlobalAttachments = roomModeActive ? [] : globalAttachments;
+    const hasPlanAnnotations = allAnnotations.length > 0 || effectiveGlobalAttachments.length > 0;
     const hasEditorAnnotations = editorAnnotations.length > 0;
     const hasCodeAnnotations = codeAnnotations.length > 0;
 
@@ -1303,7 +1530,7 @@ const App: React.FC = () => {
       ? exportAnnotations(
           blocks,
           allAnnotations,
-          globalAttachments,
+          effectiveGlobalAttachments,
           annotateSource === 'message' ? 'Message Feedback' : annotateSource === 'folder' ? 'Folder Feedback' : annotateSource === 'file' ? 'File Feedback' : 'Plan Feedback',
           annotateSource ?? 'plan',
           { sourceConverted: activeConverted },
@@ -1331,7 +1558,7 @@ const App: React.FC = () => {
     }
 
     return output;
-  }, [blocks, allAnnotations, globalAttachments, linkedDocHook.getDocAnnotations, editorAnnotations, codeAnnotations, sourceConverted, annotateSource, linkedDocHook.isActive, linkedDocHook.filepath]);
+  }, [blocks, allAnnotations, globalAttachments, roomModeActive, linkedDocHook.getDocAnnotations, editorAnnotations, codeAnnotations, sourceConverted, annotateSource, linkedDocHook.isActive, linkedDocHook.filepath]);
 
   // Bot callback config — read once from URL search params (?cb=&ct=)
   // TODO: bot callbacks post shareUrl which doesn't include code-file annotations.
@@ -1449,6 +1676,70 @@ const App: React.FC = () => {
     }
   };
 
+  const copyToClipboardWithToast = React.useCallback(
+    async (text: string, successMessage: string, errorMessage: string) => {
+      try {
+        await navigator.clipboard.writeText(text);
+        toast.success(successMessage);
+      } catch {
+        toast.error(errorMessage);
+      }
+    },
+    [],
+  );
+  const handleCopyParticipantUrl = React.useCallback(async () => {
+    const url = roomSession?.joinUrl;
+    if (!url) return;
+    await copyToClipboardWithToast(
+      url,
+      'Participant link copied',
+      'Failed to copy link',
+    );
+  }, [roomSession?.joinUrl, copyToClipboardWithToast]);
+  const handleCopyAdminUrl = React.useCallback(async () => {
+    const url = roomSession?.adminUrl;
+    if (!url) return;
+    await copyToClipboardWithToast(
+      url,
+      'Admin link copied',
+      'Failed to copy admin link',
+    );
+  }, [roomSession?.adminUrl, copyToClipboardWithToast]);
+  const handleCopyConsolidatedFeedback = React.useCallback(async () => {
+    // Exclude diff-context annotations from exported feedback — same
+    // filter the prior RoomPanel path used. Global attachments are
+    // empty inside a room (images are stripped at create time).
+    const text = exportAnnotations(
+      blocks,
+      allAnnotations.filter(a => !a.diffContext),
+      [],
+    );
+    await copyToClipboardWithToast(
+      text,
+      'Feedback copied',
+      'Failed to copy feedback',
+    );
+  }, [blocks, allAnnotations, copyToClipboardWithToast]);
+
+  const handleCopyRoomAgentInstructions = React.useCallback(async () => {
+    // Prefer the participant URL (joinUrl) so an agent dropped into
+    // the clipboard payload doesn't accidentally end up with admin
+    // capability. The CLI also strips `#admin=` defensively, but
+    // pairing the strip with a deliberate participant-URL copy here
+    // makes the guard layered rather than single-point.
+    const joinUrl = roomSession?.joinUrl;
+    if (!joinUrl) return;
+    const payload = buildRoomAgentInstructions({
+      joinUrl,
+      userIdentity: getIdentity(),
+    });
+    await copyToClipboardWithToast(
+      payload,
+      'Agent instructions copied',
+      'Failed to copy instructions',
+    );
+  }, [roomSession?.joinUrl, copyToClipboardWithToast]);
+
   // Cmd/Ctrl+S keyboard shortcut — save to default notes app
   useEffect(() => {
     const handleSaveShortcut = (e: KeyboardEvent) => {
@@ -1519,7 +1810,7 @@ const App: React.FC = () => {
 
   // Header handlers ref — stores latest handler references so the stable
   // callbacks below always call the current version without needing useCallback
-  // dep arrays for every handler. This lets React.memo on AppHeader work.
+  // dep arrays for every handler. Enables React.memo on AppHeader.
   const headerHandlersRef = useRef({
     handleApprove,
     handleDeny,
@@ -1608,6 +1899,14 @@ const App: React.FC = () => {
   const handleSaveToObsidian = useCallback(() => headerHandlersRef.current.handleQuickSaveToNotes('obsidian'), []);
   const handleSaveToOctarine = useCallback(() => headerHandlersRef.current.handleQuickSaveToNotes('octarine'), []);
   const handleSaveToBear = useCallback(() => headerHandlersRef.current.handleQuickSaveToNotes('bear'), []);
+  const handleHeaderStartLiveRoom = useMemo(
+    () => canStartLiveRoom ? handleStartLiveRoom : undefined,
+    [canStartLiveRoom, handleStartLiveRoom],
+  );
+  const handleHeaderRoomDelete = useCallback(() => {
+    toast.success('Room deleted');
+    void roomAdmin.run('delete');
+  }, [roomAdmin]);
 
   const planMaxWidth = useMemo(() => {
     const widths: Record<PlanWidth, number> = { compact: 832, default: 1040, wide: 1280 };
@@ -1641,6 +1940,21 @@ const App: React.FC = () => {
           taterMode={taterMode}
           mobileSettingsOpen={mobileSettingsOpen}
           gitUser={gitUser}
+          submitError={submitError ?? undefined}
+          roomControls={roomModeActive && roomSession?.room ? (
+            <RoomHeaderControls
+              connectionStatus={roomSession.room.connectionStatus}
+              remotePresence={roomSession.room.remotePresence}
+              isAdmin={roomSession.room.hasAdminCapability}
+              adminUrl={roomSession.adminUrl}
+              pendingAdminAction={roomAdmin.pending}
+              onCopyParticipantUrl={handleCopyParticipantUrl}
+              onCopyAdminUrl={handleCopyAdminUrl}
+              onCopyConsolidatedFeedback={handleCopyConsolidatedFeedback}
+              onCopyAgentInstructions={handleCopyRoomAgentInstructions}
+              onDelete={handleHeaderRoomDelete}
+            />
+          ) : undefined}
           onCallbackFeedback={handleCallbackFeedback}
           onCallbackApprove={handleCallbackApprove}
           onAnnotateExit={handleHeaderAnnotateExit}
@@ -1665,6 +1979,7 @@ const App: React.FC = () => {
           onSaveToObsidian={handleSaveToObsidian}
           onSaveToBear={handleSaveToBear}
           onSaveToOctarine={handleSaveToOctarine}
+          onStartLiveRoom={handleHeaderStartLiveRoom}
           appVersion={typeof __APP_VERSION__ !== 'undefined' ? __APP_VERSION__ : '0.0.0'}
           agentInstructionsEnabled={isApiMode && !archive.archiveMode && !annotateMode}
           obsidianConfigured={isObsidianConfigured()}
@@ -1672,6 +1987,22 @@ const App: React.FC = () => {
           octarineConfigured={isOctarineConfigured()}
         />
 
+        {/*
+          Room-mode stripped-images banner. Moved here from the old
+          floating RoomPanel so it sits directly under the header as
+          a one-line callout the first time the creator lands in a
+          room; dismissing it (or refreshing, which clears the
+          window global) removes it for the session.
+        */}
+        {roomModeActive && strippedImagesCount > 0 && (
+          <div className="px-4 pt-3 flex-shrink-0">
+            <ImageStripNotice
+              strippedCount={strippedImagesCount}
+              onDismiss={() => setStrippedImagesCount(0)}
+            />
+          </div>
+        )}
+
         {/* Linked document error banner */}
         {linkedDocHook.error && (
           <div className="bg-destructive/10 border-b border-destructive/20 px-4 py-2 flex items-center gap-2 flex-shrink-0">
@@ -1899,19 +2230,22 @@ const App: React.FC = () => {
                     mode={editorMode}
                     inputMethod={inputMethod}
                     taterMode={taterMode}
-                    globalAttachments={globalAttachments}
-                    onAddGlobalAttachment={handleAddGlobalAttachment}
-                    onRemoveGlobalAttachment={handleRemoveGlobalAttachment}
+                    authorOverride={roomSession?.user?.name}
+                    globalAttachments={roomModeActive ? [] : globalAttachments}
+                    onAddGlobalAttachment={roomModeActive ? undefined : handleAddGlobalAttachment}
+                    onRemoveGlobalAttachment={roomModeActive ? undefined : handleRemoveGlobalAttachment}
+                    attachmentsEnabled={!roomModeActive}
                     repoInfo={repoInfo}
                     stickyActions={uiPrefs.stickyActionsEnabled}
                     planDiffStats={linkedDocHook.isActive ? null : planDiff.diffStats}
                     isPlanDiffActive={isPlanDiffActive}
                     onPlanDiffToggle={() => setIsPlanDiffActive(!isPlanDiffActive)}
                     hasPreviousVersion={!linkedDocHook.isActive && planDiff.hasPreviousVersion}
-                    showDemoBadge={!isApiMode && !isLoadingShared && !isSharedSession}
+                    showDemoBadge={!isApiMode && !isLoadingShared && !isSharedSession && !roomModeActive}
                     maxWidth={annotateReaderMaxWidth}
-                    onOpenLinkedDoc={handleOpenLinkedDoc}
+                    onOpenLinkedDoc={roomModeActive ? undefined : handleOpenLinkedDoc}
                     onOpenCodeFile={codeFilePopout.open}
+                    localDocLinksEnabled={!roomModeActive}
                     linkedDocInfo={linkedDocHook.isActive ? { filepath: linkedDocHook.filepath!, onBack: handleLinkedDocBack, label: fileBrowser.dirs.find(d => d.path === fileBrowser.activeDirPath)?.isVault ? 'Vault File' : fileBrowser.activeFile ? 'File' : undefined, backLabel } : null}
                     imageBaseDir={imageBaseDir}
                     codePathBaseDir={activeDocBaseDir}
@@ -1921,6 +2255,7 @@ const App: React.FC = () => {
                     onToggleCheckbox={checkbox.toggle}
                     checkboxOverrides={checkbox.overrides}
                     actionsLabelMode={actionsLabelMode}
+                    onHighlightSurfaceReset={bumpHighlightSurfaceGeneration}
                   />
                 )}
               </div>
@@ -1954,6 +2289,28 @@ const App: React.FC = () => {
             onShare={canShareCurrentSession && (shareUrl || shortShareUrl) ? () => { setIsPanelOpen(false); setInitialExportTab('share'); setShowExport(true); } : undefined}
             otherFileAnnotations={otherFileAnnotations}
             onOtherFileAnnotationsClick={handleFlashAnnotatedFiles}
+            // Room-mode pending/failed surface. Local mode provides undefined
+            // Maps/callbacks so AnnotationPanel skips the UI.
+            pendingIds={pendingAnnotationIds}
+            failedIds={roomModeActive ? annotationController.failed : undefined}
+            pendingAdditions={roomModeActive ? annotationController.pendingAdditions : undefined}
+            onRetry={roomModeActive ? annotationController.retry : undefined}
+            onDiscard={roomModeActive ? (id: string) => {
+              // For failed adds, the selection-highlighter may have
+              // created a local <mark> before the op failed. The
+              // controller's discard clears state but not DOM.
+              // removeHighlight is safe to call on ids that don't have
+              // a mark (no-ops internally).
+              const failedOp = annotationController.failed.get(id);
+              if (failedOp?.kind === 'add') {
+                viewerRef.current?.removeHighlight(id);
+              }
+              annotationController.discard?.(id);
+            } : undefined}
+            // Room mode: "(me)" compares against the joined display
+            // name instead of the per-origin Tater cookie, matching
+            // the override Viewer uses to stamp new annotations.
+            authorOverride={roomSession?.user?.name}
           />
         </div>
         </ScrollViewportContext.Provider>
@@ -1991,6 +2348,7 @@ const App: React.FC = () => {
           markdown={markdown}
           isApiMode={isApiMode}
           initialTab={initialExportTab}
+          onStartLiveRoom={canStartLiveRoom ? handleStartLiveRoom : undefined}
         />
 
         {/* Import Modal */}
@@ -2001,6 +2359,24 @@ const App: React.FC = () => {
           shareBaseUrl={shareBaseUrl}
         />
 
+        {/* Start-live-room modal (local mode only; hidden in room mode).
+            Prefills come from the local-origin ConfigStore — the same
+            identity + color Settings reads/writes. Room creation is a
+            confirmation step, not setup, so a creator who already
+            configured their name/color sees those values preselected
+            and can confirm or tweak per room. */}
+        {showStartRoomModal && !roomModeActive && (
+          <StartRoomModal
+            initialDisplayName={getIdentity()}
+            initialColor={getPresenceColor()}
+            imageAnnotationsToStrip={imageAnnotationsToStrip}
+            inFlight={startRoomInFlight}
+            errorMessage={startRoomError || undefined}
+            onStart={handleConfirmStartRoom}
+            onCancel={handleCancelStartRoom}
+          />
+        )}
+
         {/* Feedback prompt dialog */}
         <ConfirmDialog
           isOpen={showFeedbackPrompt}
@@ -2086,6 +2462,14 @@ const App: React.FC = () => {
           variant="warning"
         />
 
+        {roomAdmin.error && (
+          <RoomAdminErrorToast
+            action={roomAdmin.error.action}
+            message={roomAdmin.error.message}
+            onDismiss={roomAdmin.dismissError}
+          />
+        )}
+
         <Toaster
           position="top-right"
           offset={64}
@@ -2134,14 +2518,20 @@ const App: React.FC = () => {
         {/* Update notification */}
         <UpdateBanner origin={origin} isWSL={isWSL} />
 
-        {/* Image Annotator for pasted images */}
-        <ImageAnnotator
-          isOpen={!!pendingPasteImage}
-          imageSrc={pendingPasteImage?.blobUrl ?? ''}
-          initialName={pendingPasteImage?.initialName}
-          onAccept={handlePasteAnnotatorAccept}
-          onClose={handlePasteAnnotatorClose}
-        />
+        {/* Image Annotator for pasted images — not rendered in room mode
+            because rooms don't support image uploads. The paste handler
+            already short-circuits, but not rendering the component at all
+            prevents any edge case where pendingPasteImage was set before
+            room mode activated. */}
+        {!roomModeActive && (
+          <ImageAnnotator
+            isOpen={!!pendingPasteImage}
+            imageSrc={pendingPasteImage?.blobUrl ?? ''}
+            initialName={pendingPasteImage?.initialName}
+            onAccept={handlePasteAnnotatorAccept}
+            onClose={handlePasteAnnotatorClose}
+          />
+        )}
 
         {/* Permission Mode Setup (Claude Code first-time) */}
         <PermissionModeSetup
@@ -2158,3 +2548,10 @@ const App: React.FC = () => {
 };
 
 export default App;
+
+/** Stable fingerprint for room annotation reconciliation. If any
+ *  display-relevant field changes, the old mark is removed and a
+ *  fresh one applied. */
+function roomAnnFingerprint(a: { id: string; type: string; originalText: string; text?: string }): string {
+  return `${a.type}\0${a.originalText}\0${a.text ?? ''}`;
+}
diff --git a/packages/editor/AppRoot.tsx b/packages/editor/AppRoot.tsx
new file mode 100644
index 000000000..88dfd27d3
--- /dev/null
+++ b/packages/editor/AppRoot.tsx
@@ -0,0 +1,164 @@
+/**
+ * AppRoot — the top-level fork that picks between local mode (<App />) and
+ * room mode (<RoomApp><App roomSession=… /></RoomApp>).
+ *
+ * This is the *only* place that knows whether the editor is in a live
+ * room. Everything below reacts to a single `roomSession` prop; the
+ * Viewer, annotation panel, toolbar, and share UI stay mode-oblivious.
+ *
+ * `@plannotator/editor` re-exports this as its default so apps/hook/,
+ * apps/portal/, and any other consumer automatically pick up room-mode
+ * support by upgrading.
+ */
+
+import React from 'react';
+import App from './App';
+import { RoomApp } from './RoomApp';
+import { useRoomMode } from '@plannotator/ui/hooks/collab/useRoomMode';
+import { ThemeProvider } from '@plannotator/ui/components/ThemeProvider';
+import { isBase64Url32ByteString } from '@plannotator/shared/collab/validation';
+import { storeAdminSecret, loadAdminSecret } from '@plannotator/ui/utils/adminSecretStorage';
+import { captureCreatorIdentityFromFragment } from './roomIdentityHandoff';
+
+/**
+ * Capture the image-strip handoff written by the creator into the
+ * fragment (`&stripped=N`) and strip the param from the visible URL so
+ * a refresh doesn't re-show the notice. The count itself is picked up
+ * by RoomApp via `window.__PLANNOTATOR_STRIPPED_IMAGES__`.
+ *
+ * Path-gated to `/c/:roomId`: non-room shells (apps/hook, apps/portal,
+ * apps/review) also mount `AppRoot`, and their URL fragments are static-
+ * share payloads — feeding those through `URLSearchParams` and rewriting
+ * with `history.replaceState` corrupts the deflated share hash. Only room
+ * URLs carry `&stripped=N`, so scope the rewrite to room paths.
+ */
+function extractStrippedImagesFromFragment(): void {
+  if (typeof window === 'undefined') return;
+  if (!/^\/c\/([^/]+)$/.test(window.location.pathname)) return;
+  const hash = window.location.hash.slice(1);
+  if (!hash.includes('stripped=')) return;
+  const params = new URLSearchParams(hash);
+  const strippedRaw = params.get('stripped');
+  if (strippedRaw) {
+    const n = parseInt(strippedRaw, 10);
+    if (Number.isFinite(n) && n > 0) {
+      (window as { __PLANNOTATOR_STRIPPED_IMAGES__?: number }).__PLANNOTATOR_STRIPPED_IMAGES__ = n;
+    }
+  }
+  params.delete('stripped');
+  const rest = params.toString();
+  const pathname = window.location.pathname;
+  window.history.replaceState(null, '', `${pathname}${rest ? `#${rest}` : ''}`);
+}
+
+/**
+ * Capture the admin secret from the URL fragment into sessionStorage at
+ * this origin so refresh recovers admin capability even if the fragment
+ * later gets stripped (e.g. by a URL cleaner, paste-and-reload, or a
+ * future `replaceState` that drops the admin param).
+ *
+ * We do NOT strip the admin fragment from the visible URL — useCollabRoom
+ * still needs it for WebSocket auth on every connection, and stripping
+ * would break refresh unless we also wired an adminSecret override into
+ * useRoomMode → RoomApp. sessionStorage is best-effort recovery; the
+ * fragment remains the canonical credential carrier.
+ */
+function captureAdminSecretFromFragment(): void {
+  if (typeof window === 'undefined') return;
+  const path = window.location.pathname;
+  const roomMatch = path.match(/^\/c\/([^/]+)$/);
+  if (!roomMatch) return;
+  const hash = window.location.hash.slice(1);
+  if (!hash.includes('admin=')) return;
+  const params = new URLSearchParams(hash);
+  const admin = params.get('admin');
+  if (!admin) return;
+  // Validate before storing: a crafted URL with a garbage admin= value
+  // would poison this room's sessionStorage entry and cause join/admin
+  // recovery failures on later visits until the entry is cleared.
+  // ADMIN_SECRET_LENGTH_BYTES is 32; base64url of 32 bytes is 43 chars.
+  // We validate length + charset rather than importing the full crypto
+  // module at boot time.
+  if (!isBase64Url32ByteString(admin)) return;
+  // No-clobber: if we already have a stored admin secret for this
+  // room, only accept a matching value. A fake-but-well-shaped
+  // `&admin=` appended to the participant URL (room key is already
+  // public via the participant link) could otherwise overwrite the
+  // creator's real stored secret, breaking refresh-based admin
+  // recovery until sessionStorage is cleared manually. Same admin
+  // secret is idempotent; a different one is silently ignored.
+  const existing = loadAdminSecret(roomMatch[1]);
+  if (existing && existing !== admin) return;
+  storeAdminSecret(roomMatch[1], admin);
+}
+
+// Module-level side effects so they run exactly once per tab load, before
+// React mounts anything. `captureCreatorIdentityFromFragment` is imported
+// from `./roomIdentityHandoff` for test isolation — running it alongside
+// the two legacy captures above keeps the visible URL and ConfigStore in
+// sync for the creator-origin → room-origin navigation.
+extractStrippedImagesFromFragment();
+captureAdminSecretFromFragment();
+captureCreatorIdentityFromFragment();
+
+/**
+ * Inner fork (mode selection). Wrapped by `<ThemeProvider>` in the
+ * exported `AppRoot` below so every branch — including the pre-join
+ * gate in room mode and the invalid-room terminal screen — renders
+ * with the theme class on `<html>` and theme-token-based Tailwind
+ * classes (`bg-background`, `bg-card`, `text-muted-foreground`…) resolve
+ * to real colors.
+ *
+ * Earlier the `ThemeProvider` lived inside `<App>` itself, which meant
+ * `<JoinRoomGate>` (rendered by `<RoomApp>` BEFORE it mounts App) had
+ * no theme class applied yet — every theme-token-driven style
+ * collapsed to the browser default and the gate looked unstyled.
+ * Hoisting up fixes that and the invalid-room screen in one shot.
+ */
+function AppRootContent(): React.ReactElement {
+  const mode = useRoomMode();
+
+  if (mode.mode === 'local') {
+    return <App />;
+  }
+
+  if (mode.mode === 'invalid-room') {
+    // A path under /c/ that failed to parse must NOT fall through to
+    // the local editor. On the public room origin this prevents
+    // visitors to room.plannotator.ai/c/<bad> from seeing a blank
+    // local Plannotator with no plan context. We render a terminal
+    // dead-end advising the user to request a fresh link. Same shape
+    // RoomApp uses for room-deleted/room-expired.
+    return (
+      <div className="fixed inset-0 flex items-center justify-center bg-background p-4">
+        <div className="text-center space-y-3 max-w-sm">
+          <h2 className="text-lg font-semibold">This room link looks broken</h2>
+          <p className="text-sm text-muted-foreground">{mode.reason}</p>
+          <p className="text-xs text-muted-foreground">
+            Ask the person who shared this link to send it again.
+          </p>
+        </div>
+      </div>
+    );
+  }
+
+  // Room mode. RoomApp owns the session and renders the editor via
+  // the renderEditor prop with roomSession threaded through.
+  return (
+    <RoomApp
+      roomId={mode.roomId}
+      url={mode.url}
+      renderEditor={({ roomSession }) => <App roomSession={roomSession} />}
+    />
+  );
+}
+
+export function AppRoot(): React.ReactElement {
+  return (
+    <ThemeProvider defaultTheme="dark">
+      <AppRootContent />
+    </ThemeProvider>
+  );
+}
+
+export default AppRoot;
diff --git a/packages/editor/RoomApp.tsx b/packages/editor/RoomApp.tsx
new file mode 100644
index 000000000..2f40898ab
--- /dev/null
+++ b/packages/editor/RoomApp.tsx
@@ -0,0 +1,558 @@
+/**
+ * RoomApp — the room-mode shell that wraps the existing <App>.
+ *
+ * Responsibilities:
+ * - Parse the room URL (already done by AppRoot; passed in as props).
+ * - Render the identity gate until the participant has picked name + color.
+ * - Mount useCollabRoomSession({ intent: 'join', ... }) after the gate.
+ * - Render the RemoteCursorLayer overlay and the LocalPresenceEmitter
+ *   around <App>.
+ * - Show a terminal "room no longer available" screen when the room is
+ *   deleted or expired.
+ *
+ * Explicitly NOT done here:
+ * - Room header UI — `RoomHeaderControls` lives in the editor header
+ *   and is owned by `App.tsx`. That's also where delete, copy links,
+ *   and copy consolidated feedback originate.
+ * - Image-stripped notice and stripped-image count handoff — moved to
+ *   `App.tsx` so the banner renders directly under the editor header
+ *   instead of as a stacked floating card.
+ * - Approve/Deny — local-only, never offered in room mode; the room
+ *   tab has no cross-origin path to the blocked agent hook.
+ */
+
+import React, { useCallback, useEffect, useMemo, useRef, useState } from 'react';
+import { useCollabRoomSession } from '@plannotator/ui/hooks/collab/useCollabRoomSession';
+import { usePresenceThrottle } from '@plannotator/ui/hooks/collab/usePresenceThrottle';
+import { RemoteCursorLayer } from '@plannotator/ui/components/collab/RemoteCursorLayer';
+import { JoinRoomGate } from '@plannotator/ui/components/collab/JoinRoomGate';
+import { RoomUnavailableScreen } from '@plannotator/ui/components/collab/RoomUnavailableScreen';
+import { loadAdminSecret } from '@plannotator/ui/utils/adminSecretStorage';
+import {
+  getIdentity,
+  setCustomIdentity,
+  getPresenceColor,
+  setPresenceColor,
+} from '@plannotator/ui/utils/identity';
+import {
+  isRoomIdentityConfirmed,
+  markRoomIdentityConfirmed,
+} from '@plannotator/ui/utils/roomIdentityConfirmed';
+import type { CollabRoomUser } from '@plannotator/shared/collab/client';
+import type { PresenceState, CursorState } from '@plannotator/shared/collab';
+
+export interface RoomAppProps {
+  roomId: string;
+  url: string;
+  /**
+  /** Children = the existing <App> component; wrapped so it becomes room-aware via props. */
+  renderEditor(args: {
+    roomSession: ReturnType<typeof useCollabRoomSession>;
+  }): React.ReactNode;
+}
+
+/**
+ * Generate a high-entropy internal id for a participant. Not rendered —
+ * cursor labels and avatars pull from `user.name` (the display name the
+ * participant typed). Used as an opaque handle inside this tab so
+ * anything that stores per-id state (future sessionStorage-backed UI)
+ * doesn't collide when two participants picked the same display name.
+ */
+function generateParticipantId(): string {
+  // `crypto.randomUUID()` is available in every browser the editor
+  // supports (Chrome 92+, Firefox 95+, Safari 15.4+).
+  return typeof crypto !== 'undefined' && typeof crypto.randomUUID === 'function'
+    ? crypto.randomUUID()
+    : `guest-${Math.random().toString(36).slice(2)}-${Date.now().toString(36)}`;
+}
+
+export function RoomApp({
+  roomId,
+  url,
+  renderEditor,
+}: RoomAppProps): React.ReactElement {
+  // Skip the join gate when we already have a confirmed identity for
+  // THIS room in this tab. The flag is set by:
+  //   - `AppRoot` on creator arrival (consumed the `&name=&color=`
+  //     fragment handoff).
+  //   - `handleJoin` below after a participant submits the gate.
+  //
+  // `useState` initializer runs synchronously on first render so the
+  // gate never flashes when the flag is already set. A different room
+  // URL in the same tab lands here with `isRoomIdentityConfirmed(...)`
+  // returning false for that new roomId, so the user re-confirms per
+  // room (the agreed UX — allows per-room color tweaks).
+  const [identity, setIdentity] = useState<CollabRoomUser | null>(() => {
+    if (typeof window === 'undefined') return null;
+    if (!isRoomIdentityConfirmed(roomId)) return null;
+    return {
+      id: generateParticipantId(),
+      name: getIdentity(),
+      color: getPresenceColor(),
+    };
+  });
+  // Local cursor state used to live here, but a ~20Hz pointermove-driven
+  // setState at RoomApp's top level rerendered the whole editor tree
+  // (renderEditor's inline arrow in AppRoot produces a fresh <App/>
+  // element on every parent render, and App isn't React.memo'd). It now
+  // lives inside `LocalPresenceEmitter` — a null-rendering sibling of
+  // the editor — so pointer moves only reconcile that tiny subtree.
+  // Latches to true the first time the client reaches `connectionStatus:
+  // 'authenticated'` and never clears. Once set, a transient socket drop
+  // (reconnecting / non-terminal disconnected) must NOT tear the editor
+  // tree down — the runtime preserves the snapshot and re-authenticates
+  // in the background. Unmounting RoomAuthenticatedView during a blip
+  // would lose local UI state (selections, scroll, panel layout) for
+  // every user every time their network flinches.
+  const [hasEverAuthenticated, setHasEverAuthenticated] = useState(false);
+
+  // The stripped-image handoff (window.__PLANNOTATOR_STRIPPED_IMAGES__)
+  // is consumed in App.tsx now — App renders the banner directly
+  // beneath the editor header so it reads as a normal notice rather
+  // than a stacked card next to the floating RoomPanel that used to
+  // live here. AppRoot writes the global; App reads it once at mount.
+
+  // If we came in on a participant-only URL but sessionStorage holds an
+  // admin secret for this roomId (previous create in this tab), recover
+  // admin capability silently. This is the refresh path for creators.
+  const storedAdminSecret = useMemo(
+    () => loadAdminSecret(roomId),
+    [roomId],
+  );
+
+  const session = useCollabRoomSession({
+    intent: 'join',
+    url,
+    user: identity ?? { id: 'anonymous', name: 'anon', color: '#888' },
+    enabled: identity !== null,
+    adminSecretOverride: storedAdminSecret ?? undefined,
+  });
+
+  // Latch hasEverAuthenticated on the first `authenticated` transition so
+  // subsequent reconnects don't unmount the editor.
+  React.useEffect(() => {
+    if (session.room?.connectionStatus === 'authenticated') {
+      setHasEverAuthenticated(true);
+    }
+  }, [session.room?.connectionStatus]);
+
+  const handleJoin = useCallback((submit: { displayName: string; color: string }) => {
+    // Persist gate edits back to room-origin ConfigStore so the same
+    // identity + color prefills on the next room the user joins from
+    // this browser. Same semantics as the StartRoomModal save-back in
+    // App.tsx: identity is a Plannotator-wide preference, not a
+    // per-visit input. Writes are no-ops when the submitted values
+    // already match.
+    if (submit.displayName && submit.displayName !== getIdentity()) {
+      setCustomIdentity(submit.displayName);
+    }
+    if (submit.color && submit.color !== getPresenceColor()) {
+      setPresenceColor(submit.color);
+    }
+    // Mark this room as "identity confirmed in this tab" so a reload
+    // goes straight back in without re-prompting. Per-room scope means
+    // opening a different room URL in this tab still surfaces the
+    // (prefilled) gate so users can adjust per room.
+    markRoomIdentityConfirmed(roomId);
+    setIdentity({
+      id: generateParticipantId(),
+      name: submit.displayName,
+      color: submit.color,
+    });
+  }, [roomId]);
+
+  // Session-level error (e.g. URL parse failure in useCollabRoomSession).
+  // Without this branch, a bad URL would leave the participant stuck in
+  // JoinRoomGate with `connectionStatus: disconnected` forever since
+  // `session.room` stays undefined.
+  if (session.phase === 'error') {
+    return (
+      <div className="fixed inset-0 flex items-center justify-center bg-background">
+        <div className="text-center space-y-3 max-w-sm">
+          <h2 className="text-lg font-semibold">This link looks broken</h2>
+          <p className="text-sm text-muted-foreground">
+            {session.error?.message ?? 'The room URL could not be parsed.'}
+          </p>
+          <p className="text-xs text-muted-foreground">
+            Ask the person who shared this link to send it again.
+          </p>
+        </div>
+      </div>
+    );
+  }
+
+  // Terminal state: the server closed our socket with the "room
+  // unavailable" signal. Same screen for admin-deleted, auto-expired,
+  // or unknown-room — the client deliberately does not distinguish.
+  if (session.room?.roomUnavailable) {
+    return <RoomUnavailableScreen />;
+  }
+
+  // Pre-connect identity gate. Prefill from Plannotator preferences so
+  // a returning user sees their saved name/color instead of blank inputs
+  // (first-time visitors to room.plannotator.ai still get a generated
+  // tater + hash-derived swatch, which is a reasonable default).
+  if (identity === null) {
+    return (
+      <JoinRoomGate
+        initialDisplayName={getIdentity()}
+        initialColor={getPresenceColor()}
+        connectionStatus="disconnected"
+        onJoin={handleJoin}
+      />
+    );
+  }
+
+  // Terminal connect/auth failures: auth rejected, connect timeout,
+  // room unavailable. These set connectionStatus='disconnected' with a
+  // non-null lastError whose scope='join'. room_unavailable routes to
+  // the shared terminal screen; auth/timeout keep their distinct copy
+  // since they're recoverable-ish user errors, not "link is dead."
+  const connectionStatus = session.room?.connectionStatus ?? 'connecting';
+  const joinError = session.room?.lastError;
+  if (connectionStatus === 'disconnected' && joinError && joinError.scope === 'join') {
+    if (joinError.code === 'room_unavailable') {
+      return <RoomUnavailableScreen />;
+    }
+    return (
+      <div className="fixed inset-0 flex items-center justify-center bg-background">
+        <div className="text-center space-y-3 max-w-sm">
+          <h2 className="text-lg font-semibold">
+            {joinError.code === 'auth_rejected' ? 'Access denied' :
+             joinError.code === 'connect_timeout' ? 'Connection timed out' :
+             'Could not join room'}
+          </h2>
+          <p className="text-sm text-muted-foreground">{joinError.message}</p>
+          <p className="text-xs text-muted-foreground">
+            Ask the person who shared this link to verify it.
+          </p>
+        </div>
+      </div>
+    );
+  }
+
+  // Pre-first-auth: keep the gate up with a status indicator. Once we've
+  // ever authenticated, non-terminal transients (reconnecting, the brief
+  // pre-terminal `disconnected` window before the auth-failure branch
+  // above fires) keep RoomAuthenticatedView mounted — the status banner
+  // inside it (RoomStatusBadge + reconnect banner) communicates the
+  // transient state without tearing down editor/panel state.
+  if (!hasEverAuthenticated && connectionStatus !== 'authenticated') {
+    return (
+      <JoinRoomGate
+        initialDisplayName={identity.name}
+        initialColor={identity.color}
+        connectionStatus={connectionStatus}
+        onJoin={handleJoin}
+      />
+    );
+  }
+
+  // Authenticated (or briefly transient after first auth): render editor
+  // + room overlays. session.room can be undefined for a microtask if
+  // useCollabRoomSession is mid-recomputation even after authentication;
+  // fall back to the gate only in that pathological case.
+  const room = session.room;
+  if (!room) {
+    return (
+      <JoinRoomGate
+        initialDisplayName={identity.name}
+        initialColor={identity.color}
+        connectionStatus={connectionStatus}
+        onJoin={handleJoin}
+      />
+    );
+  }
+  return (
+    <RoomAuthenticatedView
+      room={room}
+      session={session}
+      identity={identity}
+      renderEditor={renderEditor}
+    />
+  );
+}
+
+/**
+ * Split from RoomApp so the cursor-presence hooks (pointer listeners,
+ * presence throttle) are only mounted AFTER we've authenticated. Mounting
+ * them in RoomApp's top-level would send presence through an un-ready
+ * client during the identity-gate / connecting window.
+ */
+function RoomAuthenticatedView({
+  room,
+  session,
+  identity,
+  renderEditor,
+}: {
+  room: NonNullable<ReturnType<typeof useCollabRoomSession>['room']>;
+  session: ReturnType<typeof useCollabRoomSession>;
+  identity: CollabRoomUser;
+  renderEditor: RoomAppProps['renderEditor'];
+}): React.ReactElement {
+  // Ref on the relative container so RemoteCursorLayer's coordinate
+  // translation reads the overlay's actual viewport position. Measuring
+  // `document.documentElement` would zero out the top/left and leave
+  // cursors offset whenever the room shell is not flush against the
+  // viewport edges (e.g. future layouts with a header/padding).
+  const roomContainerRef = useRef<HTMLDivElement | null>(null);
+
+  return (
+    <div className="relative" data-testid="room-app" ref={roomContainerRef}>
+      {renderEditor({ roomSession: session })}
+
+      {/*
+        Null-rendering sibling that owns the pointermove listener and
+        throttled presence send. See the component comment for why this
+        is isolated from the editor tree.
+      */}
+      <LocalPresenceEmitter
+        identity={identity}
+        sendPresence={room.updatePresence}
+      />
+
+      <RemoteCursorLayerWithViewport
+        remotePresence={room.remotePresence}
+        containerRef={roomContainerRef}
+      />
+    </div>
+  );
+}
+
+/**
+ * Thin wrapper that tracks the overlay container rect for
+ * `RemoteCursorLayer`. The passed `containerRef` points at the
+ * `RemoteCursorLayer`'s nearest positioned ancestor — the layer itself
+ * is `absolute inset-0`, so cursor coords need to be translated by
+ * that ancestor's viewport offset. Scroll listeners are rAF-throttled
+ * and `ResizeObserver` is used when available for container resizes
+ * that don't fire a `window` resize (layout shifts, font loads).
+ */
+function RemoteCursorLayerWithViewport({
+  remotePresence,
+  containerRef,
+}: {
+  remotePresence: Record<string, import('@plannotator/shared/collab').PresenceState>;
+  containerRef: React.RefObject<HTMLDivElement | null>;
+}): React.ReactElement {
+  const [rect, setRect] = useState<DOMRect | null>(null);
+  useEffect(() => {
+    const el = containerRef.current;
+    if (!el) return;
+
+    let rafId: number | null = null;
+    const update = () => {
+      rafId = null;
+      setRect(el.getBoundingClientRect());
+    };
+    const schedule = () => {
+      if (rafId !== null) return;
+      rafId = requestAnimationFrame(update);
+    };
+
+    update();
+    // Capture-phase scroll catches any scrolling ancestor, not just window.
+    window.addEventListener('scroll', schedule, true);
+    window.addEventListener('resize', schedule);
+
+    let ro: ResizeObserver | null = null;
+    if (typeof ResizeObserver !== 'undefined') {
+      ro = new ResizeObserver(schedule);
+      ro.observe(el);
+    }
+
+    return () => {
+      window.removeEventListener('scroll', schedule, true);
+      window.removeEventListener('resize', schedule);
+      ro?.disconnect();
+      // Cancel a pending frame so `setRect` can't fire after unmount.
+      if (rafId !== null) cancelAnimationFrame(rafId);
+    };
+  }, [containerRef]);
+
+  return (
+    <RemoteCursorLayer
+      remotePresence={remotePresence}
+      containerRect={rect}
+    />
+  );
+}
+
+/**
+ * Null-rendering sibling of the editor that owns the pointermove
+ * listener and the throttled `room.updatePresence` send.
+ *
+ * Why a dedicated component:
+ *   `usePresenceThrottle` is effect-driven — it needs React state as
+ *   its input to fire, so the value can't be pure-ref'd. If that
+ *   state lived on `RoomApp` (as it originally did) every pointer
+ *   move would rerender `RoomApp` and `RoomAuthenticatedView`,
+ *   rebuild the inline `<App roomSession={...}/>` element produced
+ *   by `renderEditor`, and — because `App` isn't `React.memo`'d —
+ *   reconcile the entire editor subtree. On a long plan this is
+ *   measurable jank at ~20Hz.
+ *
+ *   Keeping the state inside a component with no children and a
+ *   `null` render confines the reconciliation cost to this component
+ *   itself. The editor tree upstairs never observes pointermoves.
+ *
+ * Coordinate model — STICKY BLOCK ANCHOR:
+ *   A document reflows. Pixel y-values in a scrolling document are
+ *   NOT shared truth: two participants with different window widths
+ *   can have the same content-y land on different paragraphs. So we
+ *   anchor cursor position to `[data-block-id]` elements (paragraph,
+ *   heading, list item, etc.) — each participant resolves the same
+ *   block by id in their own DOM, and (x, y) relative to that block
+ *   is the same semantic content location for both.
+ *
+ *   The prior non-sticky block attempt snapped at every block
+ *   boundary because the anchor flipped between blocks as the
+ *   pointer crossed whitespace. Sticky fixes that:
+ *
+ *     1. If the pointer is over a `[data-block-id]`, anchor = that
+ *        block, emit (x, y) relative to its rect. Normal case.
+ *     2. If the pointer is over whitespace / between blocks / over
+ *        a non-block element inside the scroll viewport, KEEP the
+ *        last anchor and emit coordinates relative to it — even if
+ *        (x, y) falls outside the block's rect (negative y if above,
+ *        y > block.height if below). Remote cursor smoothly traces
+ *        the whitespace without a coordinate-space flip.
+ *     3. Anchor switches only when the pointer actually lands on a
+ *        different block. The emitted position at that switch jumps
+ *        by the gap between consecutive blocks (~line-height), which
+ *        the receiver's lerp smooths over.
+ *
+ *   When the pointer is OUTSIDE the scroll container (header, room
+ *   menu, margins), we skip the emit entirely — the last anchored
+ *   position stays on the wire so "Alice paused over paragraph 5 to
+ *   use the room menu" shows her cursor frozen over paragraph 5
+ *   rather than teleporting.
+ *
+ *   Emit `cursor: null` only on genuine leave (`window.blur` /
+ *   `document.hidden`); that also resets the sticky anchor so the
+ *   next session picks a fresh one.
+ *
+ * Scroll viewport lookup: App (rendered inside this component's
+ * tree via `renderEditor`) tags the OverlayScrollbars viewport
+ * element with `data-plan-scroll-viewport`. We `querySelector` for
+ * it here. Implicit coupling flagged in App's `useOverlayViewport`
+ * effect.
+ *
+ * Send cadence: 33ms trailing throttle (~30Hz), matching
+ * Excalidraw-style collab tooling.
+ */
+function LocalPresenceEmitter({
+  identity,
+  sendPresence,
+}: {
+  identity: CollabRoomUser;
+  sendPresence: (p: PresenceState) => Promise<void>;
+}): null {
+  const [localCursor, setLocalCursor] = useState<CursorState | null>(null);
+  // Sticky block anchor. Lives in a ref so the pointermove handler
+  // can read/write it synchronously without forcing re-renders.
+  const lastAnchorBlockIdRef = useRef<string | null>(null);
+
+  useEffect(() => {
+    function findScrollViewport(): HTMLElement | null {
+      return typeof document !== 'undefined'
+        ? document.querySelector<HTMLElement>('[data-plan-scroll-viewport]')
+        : null;
+    }
+
+    function findBlockUnder(target: Element | null): HTMLElement | null {
+      return (target?.closest?.('[data-block-id]') as HTMLElement | null) ?? null;
+    }
+
+    function findBlockById(id: string, within: ParentNode): HTMLElement | null {
+      try {
+        const escaped =
+          typeof CSS !== 'undefined' && typeof CSS.escape === 'function'
+            ? CSS.escape(id)
+            : id.replace(/["\\]/g, '\\$&');
+        return within.querySelector<HTMLElement>(`[data-block-id="${escaped}"]`);
+      } catch {
+        return null;
+      }
+    }
+
+    function onPointerMove(e: PointerEvent) {
+      const vp = findScrollViewport();
+      if (!vp) return;  // App hasn't mounted its scroll area yet.
+      const rect = vp.getBoundingClientRect();
+      // Skip emits when the pointer is outside the scroll container —
+      // keeps the remote cursor anchored to its last in-content spot
+      // instead of flashing to the header or off-screen chrome.
+      if (
+        e.clientX < rect.left || e.clientX > rect.right ||
+        e.clientY < rect.top  || e.clientY > rect.bottom
+      ) {
+        return;
+      }
+
+      // Sticky anchor resolution: prefer the block directly under the
+      // pointer; fall back to the last-used anchor when the pointer
+      // is over whitespace or a non-block element. The emitted (x, y)
+      // may overflow the block's rect — the receiver just adds it to
+      // their block's rect, producing a continuous trail through the
+      // gap instead of a jump.
+      let anchor = findBlockUnder(e.target as Element | null);
+      if (!anchor && lastAnchorBlockIdRef.current) {
+        anchor = findBlockById(lastAnchorBlockIdRef.current, vp);
+      }
+      if (!anchor) {
+        // No block anywhere (e.g. empty plan, or first pointer move
+        // happened over whitespace before any block was visited).
+        // Skip until we pick up a real anchor.
+        return;
+      }
+
+      const blockId = anchor.getAttribute('data-block-id');
+      if (!blockId) return;
+      lastAnchorBlockIdRef.current = blockId;
+
+      const anchorRect = anchor.getBoundingClientRect();
+      setLocalCursor({
+        blockId,
+        x: e.clientX - anchorRect.left,
+        y: e.clientY - anchorRect.top,
+        coordinateSpace: 'block',
+      });
+    }
+
+    function clearCursor() {
+      setLocalCursor(null);
+      // Reset the sticky anchor so a fresh session picks a new one
+      // rather than re-using a stale block id from a prior session.
+      lastAnchorBlockIdRef.current = null;
+    }
+    function handleVisibilityChange() {
+      if (document.hidden) clearCursor();
+    }
+
+    window.addEventListener('pointermove', onPointerMove);
+    window.addEventListener('blur', clearCursor);
+    document.addEventListener('visibilitychange', handleVisibilityChange);
+    return () => {
+      window.removeEventListener('pointermove', onPointerMove);
+      window.removeEventListener('blur', clearCursor);
+      document.removeEventListener('visibilitychange', handleVisibilityChange);
+    };
+  }, []);
+
+  // Always a PresenceState (never null) so "pointer left content" can
+  // be transmitted as `cursor: null`. `usePresenceThrottle(null, ...)`
+  // would just cancel the pending send, leaving peers stuck with our
+  // last position until the presence TTL sweep.
+  const presenceState: PresenceState = useMemo(
+    () => ({
+      user: { id: identity.id, name: identity.name, color: identity.color },
+      cursor: localCursor,
+    }),
+    [identity.id, identity.name, identity.color, localCursor],
+  );
+
+  usePresenceThrottle(presenceState, sendPresence, 33);
+
+  return null;
+}
diff --git a/packages/editor/bunfig.toml b/packages/editor/bunfig.toml
new file mode 100644
index 000000000..49e4b8832
--- /dev/null
+++ b/packages/editor/bunfig.toml
@@ -0,0 +1,6 @@
+[test]
+# Reuses the UI package's happy-dom bootstrap so `renderHook` and friends
+# have a DOM global. Same shape as packages/ui/bunfig.toml — duplicated
+# intentionally rather than imported so `bun test --cwd packages/editor`
+# resolves the preload from this directory.
+preload = ["../ui/test-setup.ts"]
diff --git a/packages/editor/components/AppHeader.tsx b/packages/editor/components/AppHeader.tsx
index ad3ca9b74..26b5d6f25 100644
--- a/packages/editor/components/AppHeader.tsx
+++ b/packages/editor/components/AppHeader.tsx
@@ -63,12 +63,17 @@ interface AppHeaderProps {
   onSaveToBear: () => void;
   onSaveToOctarine: () => void;
 
+  // Room mode — opaque slot rendered between approve/deny and annotation toggle
+  roomControls?: React.ReactNode;
+  submitError?: string;
+
   // PlanHeaderMenu config
   appVersion: string;
   agentInstructionsEnabled: boolean;
   obsidianConfigured: boolean;
   bearConfigured: boolean;
   octarineConfigured: boolean;
+  onStartLiveRoom?: () => void;
 }
 
 export const AppHeader = React.memo<AppHeaderProps>(({
@@ -116,11 +121,14 @@ export const AppHeader = React.memo<AppHeaderProps>(({
   onSaveToObsidian,
   onSaveToBear,
   onSaveToOctarine,
+  roomControls,
+  submitError,
   appVersion,
   agentInstructionsEnabled,
   obsidianConfigured,
   bearConfigured,
   octarineConfigured,
+  onStartLiveRoom,
 }) => {
   return (
     <header data-app-header="true" className="h-12 flex items-center justify-between px-2 md:px-4 border-b border-border/50 bg-card/50 backdrop-blur-xl sticky top-0 z-[50]">
@@ -168,6 +176,12 @@ export const AppHeader = React.memo<AppHeaderProps>(({
           </>
         )}
 
+        {submitError && (
+          <div className="text-xs text-destructive max-w-[260px] truncate" title={submitError}>
+            {submitError}
+          </div>
+        )}
+
         {isApiMode && (!linkedDocIsActive || annotateMode) && !archiveMode && (
           <>
             {annotateMode ? (
@@ -229,6 +243,8 @@ export const AppHeader = React.memo<AppHeaderProps>(({
           </>
         )}
 
+        {roomControls}
+
         {/* Annotations panel toggle */}
         <button
           onClick={onAnnotationPanelToggle}
@@ -270,6 +286,7 @@ export const AppHeader = React.memo<AppHeaderProps>(({
           onSaveToObsidian={onSaveToObsidian}
           onSaveToBear={onSaveToBear}
           onSaveToOctarine={onSaveToOctarine}
+          onStartLiveRoom={onStartLiveRoom}
           sharingEnabled={canShareCurrentSession}
           isApiMode={isApiMode}
           agentInstructionsEnabled={agentInstructionsEnabled}
diff --git a/packages/editor/env.d.ts b/packages/editor/env.d.ts
new file mode 100644
index 000000000..0b58cb887
--- /dev/null
+++ b/packages/editor/env.d.ts
@@ -0,0 +1,25 @@
+/// <reference types="vite/client" />
+
+/**
+ * Vite client types for `import.meta.env` access inside the editor
+ * package. The hook (apps/hook) bundles this code through Vite and
+ * injects VITE_-prefixed env vars at build/dev time; this file is
+ * what makes TypeScript accept `import.meta.env.VITE_ROOM_BASE_URL`
+ * without a clever cast.
+ *
+ * Runtime notes:
+ *   - `VITE_ROOM_BASE_URL` — local E2E testing only. Set by
+ *     `scripts/dev-live-room-local.sh` so the editor at :3000 creates
+ *     rooms against the local wrangler dev at :8787 instead of the
+ *     production `room.plannotator.ai`. Production builds leave it
+ *     undefined and the fallback kicks in.
+ */
+
+interface ImportMetaEnv {
+  readonly VITE_ROOM_BASE_URL?: string;
+  readonly VITE_DIFF_DEMO?: string;
+}
+
+interface ImportMeta {
+  readonly env: ImportMetaEnv;
+}
diff --git a/packages/editor/hooks/collab/useStartLiveRoom.ts b/packages/editor/hooks/collab/useStartLiveRoom.ts
new file mode 100644
index 000000000..e893fc48a
--- /dev/null
+++ b/packages/editor/hooks/collab/useStartLiveRoom.ts
@@ -0,0 +1,303 @@
+/**
+ * useStartLiveRoom — creator-side "start a live room" flow.
+ *
+ * Lives under packages/editor/hooks/collab/ (not packages/ui/) because:
+ *   - The flow is editor-shell workflow, not generic reusable UI.
+ *   - It depends on `import.meta.env.VITE_ROOM_BASE_URL` whose ambient
+ *     typing lives in packages/editor/env.d.ts. Placing this hook under
+ *     packages/ui would either leak editor env typing into the UI
+ *     package or require a base-URL injection parameter from App,
+ *     both of which are worse than the straightforward editor-local
+ *     home.
+ *
+ * Invariants this hook MUST preserve (do not "clean up" away):
+ *   - Dynamic imports inside `handleConfirmStartRoom` stay dynamic.
+ *     Four `await import(...)` calls exist specifically to code-split
+ *     the collab client off the editor main bundle. A well-meaning
+ *     lint autofix that hoists them to static imports is a bundle-
+ *     size regression.
+ *   - The `window.open('', '_blank')` placeholder MUST run
+ *     synchronously in the click path, before any `await`. Browsers
+ *     only honor the popup-blocker user-activation grant for
+ *     synchronous work; placing this after an await would make every
+ *     Start click look blocked on strict browsers.
+ */
+
+import { useCallback, useMemo, useRef, useState } from 'react';
+import type { Annotation, ImageAttachment } from '@plannotator/ui/types';
+import { stripRoomAnnotationImages } from '@plannotator/shared/collab';
+import {
+  getIdentity,
+  setCustomIdentity,
+  getPresenceColor,
+  setPresenceColor,
+} from '@plannotator/ui/utils/identity';
+import type { StartRoomSubmit } from '@plannotator/ui/components/collab/StartRoomModal';
+
+/**
+ * Resolve the room-service base URL for `createRoom()`. Precedence:
+ *
+ *   1. `window.__ROOM_BASE_URL` — runtime escape hatch. Set via
+ *      DevTools console for ad-hoc redirection without restarting
+ *      the dev server.
+ *   2. `import.meta.env.VITE_ROOM_BASE_URL` — build/dev-time env
+ *      var, the standard Vite pattern. `scripts/dev-live-room-local.sh`
+ *      sets this so the editor at :3000 targets the local wrangler
+ *      dev at :8787 instead of production.
+ *   3. `https://room.plannotator.ai` — production default; what
+ *      every shipped build should resolve to when neither override
+ *      is present.
+ */
+function getRoomBaseUrl(): string {
+  if (typeof window !== 'undefined') {
+    const explicit = (window as { __ROOM_BASE_URL?: string }).__ROOM_BASE_URL;
+    if (explicit) return explicit;
+  }
+  const viteBase = import.meta.env?.VITE_ROOM_BASE_URL;
+  if (viteBase) return viteBase;
+  return 'https://room.plannotator.ai';
+}
+
+export interface UseStartLiveRoomOptions {
+  annotations: Annotation[];
+  markdown: string;
+  globalAttachments: ImageAttachment[];
+  /**
+   * True when the creator is in a shell that CAN host a live room
+   * (local isApiMode editor, not room mode already). The hook uses
+   * this as a defensive guard inside `handleStartLiveRoom`; App also
+   * gates the surfacing UI on the same value so a blocked click is
+   * theoretically unreachable.
+   */
+  canStartLiveRoom: boolean;
+}
+
+export interface UseStartLiveRoomReturn {
+  showStartRoomModal: boolean;
+  startRoomInFlight: boolean;
+  startRoomError: string;
+  imageAnnotationsToStrip: number;
+  handleStartLiveRoom: () => void;
+  handleCancelStartRoom: () => void;
+  handleConfirmStartRoom: (submit: StartRoomSubmit) => Promise<void>;
+}
+
+export function useStartLiveRoom({
+  annotations,
+  markdown,
+  globalAttachments,
+  canStartLiveRoom,
+}: UseStartLiveRoomOptions): UseStartLiveRoomReturn {
+  // Start-live-room modal state. The modal is the sole entry to the creator
+  // flow — replaces the earlier inline hardcoded path (name/color/expiry
+  // defaults). Abort during in-flight creation runs through an
+  // AbortController passed to createRoom().
+  const [showStartRoomModal, setShowStartRoomModal] = useState(false);
+  const [startRoomInFlight, setStartRoomInFlight] = useState(false);
+  const [startRoomError, setStartRoomError] = useState<string>('');
+  const startRoomAbortRef = useRef<AbortController | null>(null);
+
+  // Single source of truth for "how many local items won't travel to
+  // the room" — matches the value used at actual room-create time
+  // (stripRoomAnnotationImages inside handleConfirmStartRoom) so the
+  // modal notice and the URL `&stripped=N` handoff can never drift.
+  // stripRoomAnnotationImages is synchronous and O(annotations +
+  // globals); running it per render on a typical small annotation list
+  // is cheap.
+  const imageAnnotationsToStrip = useMemo(() => {
+    const { strippedCount } = stripRoomAnnotationImages(annotations, globalAttachments);
+    return strippedCount;
+  }, [annotations, globalAttachments]);
+
+  const handleStartLiveRoom = useCallback(() => {
+    if (!canStartLiveRoom) return;  // belt-and-braces with prop-level gating
+    setStartRoomError('');
+    setShowStartRoomModal(true);
+  }, [canStartLiveRoom]);
+
+  const handleCancelStartRoom = useCallback(() => {
+    // Abort the in-flight createRoom if any; modal closes either way.
+    startRoomAbortRef.current?.abort();
+    startRoomAbortRef.current = null;
+    setShowStartRoomModal(false);
+    setStartRoomInFlight(false);
+  }, []);
+
+  const handleConfirmStartRoom = useCallback(async (submit: StartRoomSubmit) => {
+    setStartRoomInFlight(true);
+    setStartRoomError('');
+
+    const ctrl = new AbortController();
+    startRoomAbortRef.current = ctrl;
+
+    // Persist any edits the user made in the modal. Identity is a
+    // Plannotator-wide preference — what they pick here also becomes
+    // the default for the next room and feeds Settings. Writes are
+    // no-ops when the submitted values already match ConfigStore.
+    if (submit.displayName && submit.displayName !== getIdentity()) {
+      setCustomIdentity(submit.displayName);
+    }
+    if (submit.color && submit.color !== getPresenceColor()) {
+      setPresenceColor(submit.color);
+    }
+
+    // Pre-open a placeholder tab SYNCHRONOUSLY — inside the user-
+    // activation window from the click that landed us here. Browsers
+    // only honor user activation for synchronous work (or a very short
+    // task chain); a bare window.open after the awaits below would
+    // typically be blocked. We sever `.opener` now while the new
+    // window is still a same-origin about:blank so the subsequent
+    // cross-origin `location.replace` doesn't inherit the opener
+    // reference. Do NOT pass `noopener`/`noreferrer` in the features
+    // string — those make window.open return null EVEN ON SUCCESS,
+    // which would make every opened tab look blocked.
+    const newWindow: Window | null =
+      typeof window !== 'undefined' ? window.open('', '_blank') : null;
+    if (newWindow) {
+      newWindow.opener = null;
+    }
+
+    const abortPlaceholder = () => {
+      if (newWindow) {
+        try { newWindow.close(); } catch { /* already closed */ }
+      }
+    };
+
+    try {
+      const { createRoom } = await import('@plannotator/shared/collab/client');
+      const { bytesToBase64url } = await import('@plannotator/shared/collab');
+      const { storeAdminSecret } = await import('@plannotator/ui/utils/adminSecretStorage');
+
+      // `stripRoomAnnotationImages` returns a generic `Omit<T, 'images'>[]`.
+      // RoomAnnotation is defined as Annotation-without-images in the
+      // protocol, so the shape is compatible; we narrow explicitly instead
+      // of `as never` so future protocol drift surfaces as a type error.
+      // Pass globalAttachments so the helper's strippedCount matches the
+      // memoized imageAnnotationsToStrip used for the modal notice and
+      // `&stripped=N` URL handoff (single source of truth). `clean` is
+      // still annotation-shaped — globals are dropped entirely from
+      // room snapshots.
+      const { clean } = stripRoomAnnotationImages(annotations, globalAttachments);
+      const roomAnnotations: import('@plannotator/shared/collab').RoomAnnotation[] =
+        clean as unknown as import('@plannotator/shared/collab').RoomAnnotation[];
+
+      const baseUrl = getRoomBaseUrl();
+
+      const result = await createRoom({
+        baseUrl,
+        expiresInDays: submit.expiresInDays,
+        signal: ctrl.signal,
+        initialSnapshot: {
+          versionId: 'v1',  // RoomSnapshot contract pins versionId to 'v1' in V1
+          planMarkdown: markdown,
+          annotations: roomAnnotations,
+        },
+        user: {
+          id: crypto.randomUUID(),
+          name: submit.displayName,
+          color: submit.color,
+        },
+      });
+
+      if (ctrl.signal.aborted) {
+        // User hit Cancel while the create call was in flight; the request
+        // still landed and a room was created on the server, but we must
+        // not navigate. Close the pre-opened placeholder so it doesn't
+        // linger as an empty tab the user can't explain.
+        abortPlaceholder();
+        return;
+      }
+
+      // sessionStorage is per-origin — the value we set here lives only in
+      // the creator's local editor origin and is NOT visible on
+      // room.plannotator.ai. We still write it so same-origin test/dev
+      // scenarios (everything on localhost) keep working; cross-origin
+      // cases rely on the admin fragment in the URL.
+      storeAdminSecret(result.roomId, bytesToBase64url(result.adminSecret));
+
+      // Auto-copy the PARTICIPANT URL (safe default share target).
+      try {
+        await navigator.clipboard.writeText(result.joinUrl);
+      } catch { /* ignore */ }
+
+      // Creator's destination URL: adminUrl (which already carries
+      // `#key=<roomSecret>&admin=<adminSecret>` in its fragment) plus
+      // an optional `&stripped=N` and an identity handoff. The admin
+      // fragment stays in the URL because useCollabRoom parses it on
+      // every connect; stripping it would force a separate admin-
+      // secret-override injection path.
+      //
+      // Identity handoff (name + color) bridges the cross-origin gap:
+      // localhost ConfigStore cookies are not visible on
+      // room.plannotator.ai, so the creator's confirmed identity
+      // rides along in the URL fragment and is consumed + stripped
+      // by `AppRoot` on arrival. `&admin=` stays (it's the session
+      // credential); `&name=&color=` get stripped after AppRoot
+      // writes them into the room-origin ConfigStore.
+      const appendFragmentParam = (url: string, param: string): string =>
+        `${url}${url.includes('#') ? '&' : '#'}${param}`;
+      let creatorUrl = result.adminUrl;
+      if (imageAnnotationsToStrip > 0) {
+        creatorUrl = appendFragmentParam(
+          creatorUrl,
+          `stripped=${imageAnnotationsToStrip}`,
+        );
+      }
+      if (submit.displayName) {
+        creatorUrl = appendFragmentParam(
+          creatorUrl,
+          `name=${encodeURIComponent(submit.displayName)}`,
+        );
+      }
+      if (submit.color) {
+        creatorUrl = appendFragmentParam(
+          creatorUrl,
+          `color=${encodeURIComponent(submit.color)}`,
+        );
+      }
+
+      // Navigate the pre-opened placeholder tab to the room URL. The
+      // creator's current tab stays on localhost so the blocked hook
+      // has an approval surface. `location.replace` (not `=`) so the
+      // about:blank intermediate doesn't sit in the new tab's back
+      // history. If the browser blocked the synchronous pre-open
+      // above, surface the URL as a copy-able fallback in the modal
+      // rather than silently reassigning the current tab (which would
+      // strand the local hook).
+      if (newWindow) {
+        // Success: new tab takes over the room session. Close the
+        // modal so the localhost tab returns to the editor.
+        newWindow.location.replace(creatorUrl);
+        setStartRoomInFlight(false);
+        setShowStartRoomModal(false);
+      } else {
+        // Popup blocked: KEEP the modal open so the user can copy
+        // the surfaced URL and open the room themselves.
+        setStartRoomError(
+          `Your browser blocked opening the room in a new tab. ` +
+          `Copy this URL and open it yourself: ${creatorUrl}`,
+        );
+        setStartRoomInFlight(false);
+      }
+    } catch (err) {
+      abortPlaceholder();
+      if (ctrl.signal.aborted) return;  // user cancelled; no error
+      const { redactRoomSecrets } = await import('@plannotator/shared/collab');
+      const msg = err instanceof Error ? err.message : String(err);
+      setStartRoomError(redactRoomSecrets(msg) || 'Failed to start live room');
+      setStartRoomInFlight(false);
+    } finally {
+      if (startRoomAbortRef.current === ctrl) startRoomAbortRef.current = null;
+    }
+  }, [annotations, markdown, imageAnnotationsToStrip, globalAttachments]);
+
+  return {
+    showStartRoomModal,
+    startRoomInFlight,
+    startRoomError,
+    imageAnnotationsToStrip,
+    handleStartLiveRoom,
+    handleCancelStartRoom,
+    handleConfirmStartRoom,
+  };
+}
diff --git a/packages/editor/hooks/useCheckboxOverrides.test.tsx b/packages/editor/hooks/useCheckboxOverrides.test.tsx
new file mode 100644
index 000000000..9cee6521f
--- /dev/null
+++ b/packages/editor/hooks/useCheckboxOverrides.test.tsx
@@ -0,0 +1,194 @@
+import { describe, expect, test, mock } from 'bun:test';
+import { renderHook, act } from '@testing-library/react';
+import { useCheckboxOverrides } from './useCheckboxOverrides';
+import { AnnotationType, type Annotation, type Block } from '@plannotator/ui/types';
+
+/**
+ * Coverage scope — the invariants that matter for the room-mode
+ * pending/revert race. Happy-dom is provided by packages/editor/bunfig.toml
+ * (shares packages/ui/test-setup.ts) so `renderHook` has a DOM global.
+ *
+ *   - busy gate: toggle() short-circuits when the block is pending
+ *   - revert gate: override persists while canonical OR pending/failed
+ *     covers the block
+ *   - eventual revert: both canonical + pending/failed must be empty
+ *     before the override clears
+ *   - local-mode parity: when `pendingBlockIds` is undefined (local
+ *     mode), the reconciliation effect still drops overrides whose
+ *     canonical annotation was removed externally
+ */
+
+function makeBlock(id: string, content = 'item'): Block {
+  return { id, type: 'list-item', content, order: 0, startLine: 0, checked: false };
+}
+
+function makeCheckboxAnnotation(blockId: string, id = `ann-checkbox-${blockId}-1`): Annotation {
+  return {
+    id,
+    blockId,
+    startOffset: 0,
+    endOffset: 4,
+    type: AnnotationType.COMMENT,
+    text: 'Mark as completed',
+    originalText: 'item',
+    createdA: 1,
+  };
+}
+
+describe('useCheckboxOverrides — busy gate', () => {
+  test('toggle() short-circuits when pendingBlockIds includes the block', () => {
+    const addAnnotation = mock(() => {});
+    const removeAnnotation = mock(() => {});
+    const block = makeBlock('b1');
+    const pendingBlockIds = new Set(['b1']);
+
+    const { result } = renderHook(() =>
+      useCheckboxOverrides({
+        blocks: [block],
+        annotations: [],
+        addAnnotation,
+        removeAnnotation,
+        pendingBlockIds,
+      }),
+    );
+
+    act(() => {
+      result.current.toggle('b1', true);
+    });
+
+    expect(addAnnotation).not.toHaveBeenCalled();
+    expect(removeAnnotation).not.toHaveBeenCalled();
+    // Visual override must also NOT change — busy means "drop the click
+    // entirely," not "change visuals but skip the server call."
+    expect(result.current.overrides.has('b1')).toBe(false);
+  });
+
+  test('toggle() proceeds for a block not in pendingBlockIds', () => {
+    const addAnnotation = mock(() => {});
+    const removeAnnotation = mock(() => {});
+    const block = makeBlock('b1');
+
+    const { result } = renderHook(() =>
+      useCheckboxOverrides({
+        blocks: [block],
+        annotations: [],
+        addAnnotation,
+        removeAnnotation,
+        pendingBlockIds: new Set(['b-other']),
+      }),
+    );
+
+    act(() => {
+      result.current.toggle('b1', true);
+    });
+
+    // Core busy-gate invariant: when the block is NOT pending, the
+    // toggle reaches the outbound path. Override lifecycle after the
+    // call is a reconciliation concern and is covered separately —
+    // a bare mock caller doesn't feed the optimistic-add back into
+    // `pendingBlockIds` the way App.tsx does, so asserting the
+    // override post-toggle in this harness would test test-plumbing,
+    // not the hook.
+    expect(addAnnotation).toHaveBeenCalledTimes(1);
+  });
+});
+
+describe('useCheckboxOverrides — reconciliation', () => {
+  test('override persists while pendingBlockIds covers the block (no canonical yet)', () => {
+    const block = makeBlock('b1');
+
+    const { result, rerender } = renderHook(
+      ({ annotations, pendingBlockIds }: {
+        annotations: Annotation[];
+        pendingBlockIds: ReadonlySet<string>;
+      }) =>
+        useCheckboxOverrides({
+          blocks: [block],
+          annotations,
+          addAnnotation: () => {},
+          removeAnnotation: () => {},
+          pendingBlockIds,
+        }),
+      { initialProps: { annotations: [], pendingBlockIds: new Set<string>() } },
+    );
+
+    act(() => {
+      result.current.toggle('b1', true);
+    });
+    expect(result.current.overrides.get('b1')).toBe(true);
+
+    // Optimistic add is in flight — no canonical yet, but pendingBlockIds
+    // covers the block. Reconciliation must NOT clear the override.
+    rerender({ annotations: [], pendingBlockIds: new Set(['b1']) });
+    expect(result.current.overrides.get('b1')).toBe(true);
+
+    // Pending fails — moves into `failed`. App.tsx still reports the
+    // block in `pendingBlockIds` (failed entries are included). Override
+    // must still be preserved; only Discard clears failed, and even then
+    // only if no canonical exists.
+    rerender({ annotations: [], pendingBlockIds: new Set(['b1']) });
+    expect(result.current.overrides.get('b1')).toBe(true);
+  });
+
+  test('override clears once both canonical and pending/failed coverage are gone', () => {
+    const block = makeBlock('b1');
+    const ann = makeCheckboxAnnotation('b1');
+
+    const { result, rerender } = renderHook(
+      ({ annotations, pendingBlockIds }: {
+        annotations: Annotation[];
+        pendingBlockIds: ReadonlySet<string>;
+      }) =>
+        useCheckboxOverrides({
+          blocks: [block],
+          annotations,
+          addAnnotation: () => {},
+          removeAnnotation: () => {},
+          pendingBlockIds,
+        }),
+      { initialProps: { annotations: [ann], pendingBlockIds: new Set<string>() } },
+    );
+
+    act(() => {
+      result.current.toggle('b1', true);
+    });
+    expect(result.current.overrides.get('b1')).toBe(true);
+
+    // Simulate a pending remove: canonical still present, pendingBlockIds
+    // covers. Override stays.
+    rerender({ annotations: [ann], pendingBlockIds: new Set(['b1']) });
+    expect(result.current.overrides.get('b1')).toBe(true);
+
+    // Echo arrives — canonical drops, pending clears. Both coverage sets
+    // empty → override clears.
+    rerender({ annotations: [], pendingBlockIds: new Set<string>() });
+    expect(result.current.overrides.has('b1')).toBe(false);
+  });
+
+  test('local mode (pendingBlockIds undefined) still drops overrides whose canonical went away', () => {
+    const block = makeBlock('b1');
+    const ann = makeCheckboxAnnotation('b1');
+
+    const { result, rerender } = renderHook(
+      ({ annotations }: { annotations: Annotation[] }) =>
+        useCheckboxOverrides({
+          blocks: [block],
+          annotations,
+          addAnnotation: () => {},
+          removeAnnotation: () => {},
+          // pendingBlockIds intentionally undefined for local mode
+        }),
+      { initialProps: { annotations: [ann] } },
+    );
+
+    act(() => {
+      result.current.toggle('b1', true);
+    });
+    expect(result.current.overrides.get('b1')).toBe(true);
+
+    // An external path wipes the canonical checkbox annotation (e.g.
+    // draft-restore loading a plan without it). Reconciliation clears.
+    rerender({ annotations: [] });
+    expect(result.current.overrides.has('b1')).toBe(false);
+  });
+});
diff --git a/packages/editor/hooks/useCheckboxOverrides.ts b/packages/editor/hooks/useCheckboxOverrides.ts
index 288b658ad..a20148f8d 100644
--- a/packages/editor/hooks/useCheckboxOverrides.ts
+++ b/packages/editor/hooks/useCheckboxOverrides.ts
@@ -8,12 +8,37 @@
 
 import { useState, useEffect, useCallback, useRef } from 'react';
 import { Annotation, AnnotationType, Block } from '@plannotator/ui/types';
+import type { AnnotationController } from '@plannotator/ui/types/annotationController';
 
 export interface UseCheckboxOverridesOptions {
   blocks: Block[];
   annotations: Annotation[];
   addAnnotation: (ann: Annotation) => void;
   removeAnnotation: (id: string) => void;
+  /**
+   * Room-mode only. Block IDs whose checkbox annotation has an
+   * UNRESOLVED server op — either in flight (pending add / update /
+   * remove) or waiting on user Retry/Discard after a failure. Two
+   * roles inside this hook:
+   *
+   *   1. Busy gate — `toggle()` short-circuits when the block is in
+   *      this set so rapid clicks can't stack a second op on top of
+   *      one the server hasn't settled. Without this, a user who
+   *      clicks twice quickly can end up with a confirmed checkbox
+   *      annotation for state they thought they undid, and the
+   *      room controller's one-op-per-id pending map has no way to
+   *      reconcile the second op against the first.
+   *
+   *   2. Revert gate — the reconciliation effect treats a block in
+   *      this set as still "covered" by a backing annotation, so a
+   *      deletion that's in flight or failed doesn't optimistically
+   *      clear the visual override before the remove echoes (or
+   *      before the user resolves the failure via Retry/Discard).
+   *
+   * Local mode leaves this undefined; synchronous `toggle` and
+   * `revertOverride` calls in App.tsx do the coordination instead.
+   */
+  pendingBlockIds?: ReadonlySet<string>;
 }
 
 export interface UseCheckboxOverridesReturn {
@@ -30,6 +55,7 @@ export function useCheckboxOverrides({
   annotations,
   addAnnotation,
   removeAnnotation,
+  pendingBlockIds,
 }: UseCheckboxOverridesOptions): UseCheckboxOverridesReturn {
   const [overrides, setOverrides] = useState<Map<string, boolean>>(new Map());
 
@@ -38,6 +64,11 @@ export function useCheckboxOverrides({
   blocksRef.current = blocks;
   const annotationsRef = useRef(annotations);
   annotationsRef.current = annotations;
+  // Same ref pattern for the pending-blocks set so the toggle callback's
+  // identity doesn't change on every pending update (which would churn
+  // Viewer/ListMarker re-renders for no reason).
+  const pendingBlockIdsRef = useRef(pendingBlockIds);
+  pendingBlockIdsRef.current = pendingBlockIds;
 
   // Clean up stale overrides when blocks change (e.g. markdown reloaded)
   useEffect(() => {
@@ -53,7 +84,52 @@ export function useCheckboxOverrides({
     }
   }, [blocks]);
 
+  // Reconcile overrides against backing checkbox annotations.
+  //
+  // Local mode: `toggle` clears the override synchronously alongside
+  // the annotation removal, so this effect is usually a no-op. It still
+  // provides a safety net for external paths that mutate annotations
+  // without going through `toggle` (e.g. share-import loading a plan
+  // without the matching checkbox annotations, or draft restore).
+  //
+  // Room mode: this is the primary mechanism that returns the visual
+  // state to the unchecked baseline after a deletion. The delete path
+  // in App.tsx intentionally does NOT call `revertOverride` in room
+  // mode, because a remove that later fails would strand a
+  // visually-reverted checkbox whose canonical annotation still
+  // exists. Instead we wait until the block has no checkbox annotation
+  // in canonical state AND no unresolved op in `pendingBlockIds`
+  // (pending or failed). Both must be empty before we clear — a
+  // pending op means the remove is still in flight; a failed op means
+  // the annotation still exists canonically and the user has to
+  // Retry/Discard first.
+  useEffect(() => {
+    if (overrides.size === 0) return;
+    const coveredBlocks = new Set<string>();
+    for (const a of annotations) {
+      if (a.id.startsWith('ann-checkbox-')) coveredBlocks.add(a.blockId);
+    }
+    if (pendingBlockIds) {
+      for (const id of pendingBlockIds) coveredBlocks.add(id);
+    }
+    const toClear = [...overrides.keys()].filter(id => !coveredBlocks.has(id));
+    if (toClear.length === 0) return;
+    setOverrides(prev => {
+      const next = new Map(prev);
+      toClear.forEach(id => next.delete(id));
+      return next;
+    });
+  }, [annotations, pendingBlockIds]);
+
   const toggle = useCallback((blockId: string, checked: boolean) => {
+    // Room-mode busy gate: if a checkbox add/update/remove for this
+    // block is still in flight with the server, drop the click. The
+    // first op has to echo (or fail with Retry/Discard) before we
+    // accept another toggle, so the user can't send conflicting ops
+    // that the controller can't reconcile against the one-op-per-id
+    // pending map.
+    if (pendingBlockIdsRef.current?.has(blockId)) return;
+
     const blocks = blocksRef.current;
     const annotations = annotationsRef.current;
     const block = blocks.find(b => b.id === blockId);
@@ -116,3 +192,48 @@ export function useCheckboxOverrides({
 
   return { overrides, toggle, revertOverride };
 }
+
+/**
+ * Compute the set of block IDs whose checkbox annotation has an
+ * unresolved server op — either in flight (pending add / update /
+ * remove) or waiting on user Retry/Discard after a failure.
+ *
+ * Consumers feed this into `useCheckboxOverrides`'s `pendingBlockIds`
+ * option, which uses it both as a busy gate (drops rapid-click toggles
+ * that would stack ops the controller can't reconcile) and as a
+ * revert gate (keeps the visual override alive while a deletion is
+ * un-echoed or failed). Co-located with the hook because the ID
+ * convention (`ann-checkbox-<blockId>-<ts>`) is a private protocol
+ * between these two pieces.
+ *
+ * Lookup strategy: `pending` / `failed` only carry ids; we resolve
+ * each id to a blockId via `pendingAdditions` first (optimistic row
+ * for adds the server hasn't echoed) and fall back to the canonical
+ * `controller.annotations` list (for updates/removes of echoed rows).
+ * Then we walk `pendingAdditions` again so purely-optimistic adds
+ * that haven't made it into `pending` yet are still covered — the
+ * controller enqueues them in lockstep, so this is defensive, but
+ * iteration is cheap and keeps the set consistent with its documented
+ * meaning.
+ */
+export function derivePendingCheckboxBlockIds(
+  controller: AnnotationController,
+): ReadonlySet<string> {
+  const blockIds = new Set<string>();
+  const addByIdLookup = (id: string) => {
+    if (!id.startsWith('ann-checkbox-')) return;
+    const optimistic = controller.pendingAdditions.get(id);
+    if (optimistic) {
+      blockIds.add(optimistic.blockId);
+      return;
+    }
+    const canonical = controller.annotations.find(a => a.id === id);
+    if (canonical) blockIds.add(canonical.blockId);
+  };
+  for (const id of controller.pending.keys()) addByIdLookup(id);
+  for (const id of controller.failed.keys()) addByIdLookup(id);
+  for (const [id, ann] of controller.pendingAdditions) {
+    if (id.startsWith('ann-checkbox-')) blockIds.add(ann.blockId);
+  }
+  return blockIds;
+}
diff --git a/packages/editor/package.json b/packages/editor/package.json
index 3e661eef8..a138820a9 100644
--- a/packages/editor/package.json
+++ b/packages/editor/package.json
@@ -3,7 +3,8 @@
   "version": "0.0.1",
   "type": "module",
   "exports": {
-    ".": "./App.tsx",
+    ".": "./AppRoot.tsx",
+    "./App": "./App.tsx",
     "./styles": "./index.css",
     "./shortcuts": "./shortcuts.ts"
   },
@@ -14,5 +15,11 @@
     "react-dom": "^19.2.3",
     "sonner": "^2.0.7",
     "tailwindcss": "^4.1.18"
+  },
+  "devDependencies": {
+    "@happy-dom/global-registrator": "^20.8.9",
+    "@testing-library/react": "^16.3.2",
+    "@types/react": "^19.2.0",
+    "@types/react-dom": "^19.2.0"
   }
 }
diff --git a/packages/editor/roomIdentityHandoff.test.ts b/packages/editor/roomIdentityHandoff.test.ts
new file mode 100644
index 000000000..8bbc7f164
--- /dev/null
+++ b/packages/editor/roomIdentityHandoff.test.ts
@@ -0,0 +1,124 @@
+import { afterEach, beforeEach, describe, expect, test } from 'bun:test';
+import { captureCreatorIdentityFromFragment } from './roomIdentityHandoff';
+import { getIdentity, getPresenceColor } from '@plannotator/ui/utils/identity';
+import { isRoomIdentityConfirmed } from '@plannotator/ui/utils/roomIdentityConfirmed';
+
+/**
+ * Unit coverage for the cross-origin creator identity handoff.
+ *
+ * The function owns a narrow contract: given a URL fragment with
+ * `&name=&color=`, it writes validated values into ConfigStore, marks
+ * the room "confirmed" when BOTH landed, and strips both params from
+ * the visible URL. It's path-gated to `/c/:roomId` so non-room shells
+ * that happen to mount AppRoot can't have their static-share
+ * fragments rewritten.
+ */
+
+function setLocation(pathname: string, hash: string): void {
+  // happy-dom allows overriding href; pathname/hash are derived. Go
+  // through history.replaceState to set state without triggering
+  // navigation (same API the function under test uses to strip).
+  window.history.replaceState(null, '', `${pathname}${hash ? `#${hash}` : ''}`);
+}
+
+beforeEach(() => {
+  // Fresh slate per test: sessionStorage is shared across the file in
+  // happy-dom, so we clear the flag keys the function writes to.
+  sessionStorage.clear();
+});
+
+afterEach(() => {
+  // Reset URL so a stripped-params test doesn't leak state into the next.
+  setLocation('/', '');
+});
+
+describe('captureCreatorIdentityFromFragment — happy path', () => {
+  test('both name and color present: writes ConfigStore, marks confirmed, strips params', () => {
+    setLocation('/c/abc123', 'key=k&admin=a&name=Alice&color=%23f97316');
+    captureCreatorIdentityFromFragment();
+
+    expect(getIdentity()).toBe('Alice');
+    expect(getPresenceColor()).toBe('#f97316');
+    expect(isRoomIdentityConfirmed('abc123')).toBe(true);
+
+    // `name` and `color` stripped; other fragment params preserved.
+    expect(window.location.hash).not.toContain('name=');
+    expect(window.location.hash).not.toContain('color=');
+    expect(window.location.hash).toContain('key=k');
+    expect(window.location.hash).toContain('admin=a');
+  });
+});
+
+describe('captureCreatorIdentityFromFragment — partial / invalid', () => {
+  test('only color landed: writes color, does NOT mark confirmed, still strips', () => {
+    setLocation('/c/room-only-color', 'key=k&color=%2310b981');
+    captureCreatorIdentityFromFragment();
+
+    expect(getPresenceColor()).toBe('#10b981');
+    // Confirmed flag requires BOTH name and color — bug was previously
+    // "either value wins." A truncated or tampered URL shouldn't skip
+    // the gate on stale room-origin ConfigStore values.
+    expect(isRoomIdentityConfirmed('room-only-color')).toBe(false);
+    expect(window.location.hash).not.toContain('color=');
+  });
+
+  test('only name landed: writes name, does NOT mark confirmed', () => {
+    setLocation('/c/room-only-name', 'key=k&name=Bob');
+    captureCreatorIdentityFromFragment();
+
+    expect(getIdentity()).toBe('Bob');
+    expect(isRoomIdentityConfirmed('room-only-name')).toBe(false);
+  });
+
+  test('invalid color (not #RRGGBB): dropped, name still written, NOT confirmed', () => {
+    setLocation('/c/room-bad-color', 'name=Carol&color=not-a-color');
+    const priorColor = getPresenceColor();
+    captureCreatorIdentityFromFragment();
+
+    expect(getIdentity()).toBe('Carol');
+    expect(getPresenceColor()).toBe(priorColor);  // unchanged
+    expect(isRoomIdentityConfirmed('room-bad-color')).toBe(false);
+  });
+
+  test('empty name after trim: dropped, color still written, NOT confirmed', () => {
+    setLocation('/c/room-empty-name', 'name=%20%20%20&color=%23eab308');
+    captureCreatorIdentityFromFragment();
+
+    expect(getPresenceColor()).toBe('#eab308');
+    expect(isRoomIdentityConfirmed('room-empty-name')).toBe(false);
+  });
+
+  test('over-long name (>64 chars): rejected', () => {
+    const longName = 'x'.repeat(65);
+    setLocation('/c/room-long-name', `name=${longName}&color=%232563eb`);
+    const priorName = getIdentity();
+    captureCreatorIdentityFromFragment();
+
+    expect(getIdentity()).toBe(priorName);  // unchanged
+    expect(isRoomIdentityConfirmed('room-long-name')).toBe(false);
+  });
+});
+
+describe('captureCreatorIdentityFromFragment — path gating', () => {
+  test('non-room path: ConfigStore untouched, URL untouched', () => {
+    setLocation('/', 'name=Eve&color=%23ef4444');
+    const priorName = getIdentity();
+    const priorColor = getPresenceColor();
+    captureCreatorIdentityFromFragment();
+
+    expect(getIdentity()).toBe(priorName);
+    expect(getPresenceColor()).toBe(priorColor);
+    // URL rewrite skipped on non-room paths — protects static-share
+    // fragments from being corrupted by `URLSearchParams` reformatting.
+    expect(window.location.hash).toBe('#name=Eve&color=%23ef4444');
+  });
+
+  test('no handoff params: no-op even on room path', () => {
+    setLocation('/c/roomX', 'key=k&admin=a');
+    captureCreatorIdentityFromFragment();
+
+    expect(isRoomIdentityConfirmed('roomX')).toBe(false);
+    // Fragment left alone when we never entered the params branch.
+    expect(window.location.hash).toBe('#key=k&admin=a');
+  });
+});
diff --git a/packages/editor/roomIdentityHandoff.ts b/packages/editor/roomIdentityHandoff.ts
new file mode 100644
index 000000000..c74e831e2
--- /dev/null
+++ b/packages/editor/roomIdentityHandoff.ts
@@ -0,0 +1,75 @@
+/**
+ * Consume the creator's identity handoff (`&name=&color=`) from the
+ * URL fragment written by `handleConfirmStartRoom` on the localhost
+ * origin. Cookies and ConfigStore are per-origin, so a creator who
+ * configured their displayName/color on localhost has no way to
+ * transmit those values to `room.plannotator.ai` except through the
+ * URL they navigate to.
+ *
+ * Responsibilities on success:
+ *   - Write into this origin's ConfigStore via `setCustomIdentity` /
+ *     `setPresenceColor` so the values persist for future joins too.
+ *   - Mark the room as "identity confirmed" when BOTH name and color
+ *     arrived validly, so `RoomApp` skips the join gate. Partial
+ *     handoffs (abnormal — the Start Room flow writes both) fall back
+ *     to the gate so the user can confirm explicitly.
+ *   - Strip the params from the visible URL via `replaceState` so a
+ *     later copy/paste of the address bar doesn't leak the creator's
+ *     name to anyone it was shared with.
+ *
+ * Path-gated to `/c/:roomId` — non-room shells on the same editor
+ * package must not have their static-share fragments rewritten.
+ *
+ * Extracted from `AppRoot` for testability: the module-load IIFE in
+ * `AppRoot` would otherwise run at every test import regardless of
+ * intent. Callers set up `window.location.pathname` / `window.location.hash`
+ * and invoke this function directly.
+ */
+
+import { setCustomIdentity, setPresenceColor } from '@plannotator/ui/utils/identity';
+import { isValidPresenceColor } from '@plannotator/ui/utils/presenceColor';
+import { markRoomIdentityConfirmed } from '@plannotator/ui/utils/roomIdentityConfirmed';
+
+export function captureCreatorIdentityFromFragment(): void {
+  if (typeof window === 'undefined') return;
+  const roomMatch = window.location.pathname.match(/^\/c\/([^/]+)$/);
+  if (!roomMatch) return;
+  const hash = window.location.hash.slice(1);
+  if (!hash.includes('name=') && !hash.includes('color=')) return;
+  const params = new URLSearchParams(hash);
+  const rawName = params.get('name');
+  const rawColor = params.get('color');
+  let handledName = false;
+  let handledColor = false;
+
+  if (rawName) {
+    const trimmed = rawName.trim();
+    if (trimmed && trimmed.length <= 64) {
+      setCustomIdentity(trimmed);
+      handledName = true;
+    }
+  }
+  if (rawColor && isValidPresenceColor(rawColor)) {
+    setPresenceColor(rawColor);
+    handledColor = true;
+  }
+
+  // Require BOTH name and color to have landed validly before skipping
+  // the join gate. Partial handoffs (abnormal — normal UI always writes
+  // both) fall back to the gate so the user can confirm explicitly; the
+  // value that did arrive still prefills the relevant field. Without
+  // this, a truncated URL or hand-edited fragment could skip the gate
+  // using whatever the destination origin had stored from a previous
+  // room — creator types "Alice" + picks orange in the modal but lands
+  // as "Bob" + orange because Bob was their room-origin cookie from
+  // last week.
+  if (handledName && handledColor) {
+    markRoomIdentityConfirmed(roomMatch[1]);
+  }
+
+  params.delete('name');
+  params.delete('color');
+  const rest = params.toString();
+  const pathname = window.location.pathname;
+  window.history.replaceState(null, '', `${pathname}${rest ? `#${rest}` : ''}`);
+}
diff --git a/packages/editor/tsconfig.json b/packages/editor/tsconfig.json
new file mode 100644
index 000000000..829320fd8
--- /dev/null
+++ b/packages/editor/tsconfig.json
@@ -0,0 +1,65 @@
+// Scoped typecheck for the editor package.
+//
+// Explicitly curated entry points:
+//   - AppRoot.tsx (mode fork: local | room | invalid-room)
+//   - RoomApp.tsx (room shell + identity gate + overlays + admin)
+//
+// Transitive reality: AppRoot.tsx does `import App from './App'`, so
+// TypeScript follows that edge and App.tsx IS type-checked here too
+// (including its own transitive imports into `packages/ui`). There is
+// no type-only boundary between AppRoot and App today, and adding one
+// purely to dodge typecheck would be worse than accepting the
+// coverage.
+//
+// What "scoped" actually means in this config:
+//   - The `include` list names the files we want to ACTIVELY CURATE
+//     for Live Rooms correctness — i.e. the ones a reviewer working
+//     on room code is expected to keep clean.
+//   - Errors surfacing from App.tsx (or anything further downstream)
+//     are still blocking: they break `bun run typecheck`, so changes
+//     that regress App.tsx's types will be caught. But this config
+//     does NOT promise that App.tsx stays debt-free over time; the
+//     broader package-wide typecheck is deferred because
+//     `packages/ui` and `packages/editor` have pre-existing drift
+//     unrelated to Live Rooms.
+//
+// If App.tsx grows new debt as unrelated work lands, a future pass
+// should either fix the debt or carve out a separate baseline — not
+// hide coverage behind the `include` list.
+{
+  "compilerOptions": {
+    "target": "ES2022",
+    "experimentalDecorators": true,
+    "useDefineForClassFields": false,
+    "module": "ESNext",
+    "lib": [
+      "ES2022",
+      "DOM",
+      "DOM.Iterable"
+    ],
+    "skipLibCheck": true,
+    "types": [
+      "node"
+    ],
+    "moduleResolution": "bundler",
+    "isolatedModules": true,
+    "moduleDetection": "force",
+    "allowJs": true,
+    "jsx": "react-jsx",
+    "paths": {
+      "@plannotator/editor/*": ["./*"],
+      "@plannotator/ui": ["../ui/index.ts"],
+      "@plannotator/ui/*": ["../ui/*"],
+      "@plannotator/shared": ["../shared/index.ts"],
+      "@plannotator/shared/*": ["../shared/*"]
+    },
+    "allowImportingTsExtensions": true,
+    "noEmit": true
+  },
+  "include": [
+    "../ui/components/types.d.ts",
+    "env.d.ts",
+    "AppRoot.tsx",
+    "RoomApp.tsx"
+  ]
+}
diff --git a/packages/server/annotate.ts b/packages/server/annotate.ts
index 3029a0e9f..a493daca3 100644
--- a/packages/server/annotate.ts
+++ b/packages/server/annotate.ts
@@ -186,9 +186,10 @@ export async function startAnnotateServer(
           // API: Update user config (write-back to ~/.plannotator/config.json)
           if (url.pathname === "/api/config" && req.method === "POST") {
             try {
-              const body = (await req.json()) as { displayName?: string; diffOptions?: Record<string, unknown>; conventionalComments?: boolean; conventionalLabels?: unknown[] | null };
+              const body = (await req.json()) as { displayName?: string; presenceColor?: string; diffOptions?: Record<string, unknown>; conventionalComments?: boolean; conventionalLabels?: unknown[] | null };
               const toSave: Record<string, unknown> = {};
               if (body.displayName !== undefined) toSave.displayName = body.displayName;
+              if (body.presenceColor !== undefined) toSave.presenceColor = body.presenceColor;
               if (body.diffOptions !== undefined) toSave.diffOptions = body.diffOptions;
               if (body.conventionalComments !== undefined) toSave.conventionalComments = body.conventionalComments;
               if (body.conventionalLabels !== undefined) toSave.conventionalLabels = body.conventionalLabels;
diff --git a/packages/server/index.ts b/packages/server/index.ts
index 8b1356a49..46c933c59 100644
--- a/packages/server/index.ts
+++ b/packages/server/index.ts
@@ -47,6 +47,7 @@ import { composeImproveContext } from "@plannotator/shared/pfm-reminder";
 import { handleImage, handleUpload, handleAgents, handleServerReady, handleDraftSave, handleDraftLoad, handleDraftDelete, handleFavicon, type OpencodeClient } from "./shared-handlers";
 import { contentHash, deleteDraft } from "./draft";
 import { handleDoc, handleDocExists, handleObsidianVaults, handleObsidianFiles, handleObsidianDoc, handleFileBrowserFiles } from "./reference-handlers";
+import { isValidPermissionMode } from "@plannotator/shared/collab/validation";
 import { warmFileListCache } from "@plannotator/shared/resolve-file";
 import { createEditorAnnotationHandler } from "./editor-annotations";
 import { createExternalAnnotationHandler } from "./external-annotations";
@@ -204,6 +205,34 @@ export async function startPlannotatorServer(
     decisionPromise = new Promise(() => {});
   }
 
+  // Prevent duplicate approve/deny side effects (note integrations,
+  // draft deletion, final snapshot saves). The decision promise only
+  // resolves once regardless, but integrations and saves run BEFORE
+  // resolve — without this guard, a duplicate POST would re-run them.
+  // Mirrors Pi's `decisionSettled` in apps/pi-extension/server/serverPlan.ts.
+  // Claim-then-publish pattern: claimDecision() atomically sets the
+  // flag BEFORE any side effects run, so two near-simultaneous POSTs
+  // cannot both pass the guard. publishDecision() is called after
+  // integrations/saves finish; it only resolves the promise (the flag
+  // is already set). If side effects throw after claim, duplicates are
+  // still rejected — acceptable because the decision is in progress
+  // and the promise resolves once regardless.
+  let decisionSettled = false;
+  function claimDecision(): boolean {
+    if (decisionSettled) return false;
+    decisionSettled = true;
+    return true;
+  }
+  function publishDecision(result: {
+    approved: boolean;
+    feedback?: string;
+    savedPath?: string;
+    agentSwitch?: string;
+    permissionMode?: string;
+  }): void {
+    resolveDecision(result);
+  }
+
   // Start server with retry logic
   let server: ReturnType<typeof Bun.serve> | null = null;
 
@@ -321,9 +350,10 @@ export async function startPlannotatorServer(
           // API: Update user config (write-back to ~/.plannotator/config.json)
           if (url.pathname === "/api/config" && req.method === "POST") {
             try {
-              const body = (await req.json()) as { displayName?: string; diffOptions?: Record<string, unknown>; conventionalComments?: boolean; conventionalLabels?: unknown[] | null; pfmReminder?: boolean };
+              const body = (await req.json()) as { displayName?: string; presenceColor?: string; diffOptions?: Record<string, unknown>; conventionalComments?: boolean; conventionalLabels?: unknown[] | null; pfmReminder?: boolean };
               const toSave: Record<string, unknown> = {};
               if (body.displayName !== undefined) toSave.displayName = body.displayName;
+              if (body.presenceColor !== undefined) toSave.presenceColor = body.presenceColor;
               if (body.diffOptions !== undefined) toSave.diffOptions = body.diffOptions;
               if (body.conventionalComments !== undefined) toSave.conventionalComments = body.conventionalComments;
               if (body.conventionalLabels !== undefined) toSave.conventionalLabels = body.conventionalLabels;
@@ -451,6 +481,9 @@ export async function startPlannotatorServer(
 
           // API: Approve plan
           if (url.pathname === "/api/approve" && req.method === "POST") {
+            if (!claimDecision()) {
+              return Response.json({ ok: true, duplicate: true });
+            }
             // Check for note integrations and optional feedback
             let feedback: string | undefined;
             let agentSwitch: string | undefined;
@@ -473,23 +506,21 @@ export async function startPlannotatorServer(
                 feedback = body.feedback;
               }
 
-              // Capture agent switch setting for OpenCode
-              if (body.agentSwitch) {
-                agentSwitch = body.agentSwitch;
-              }
-
-              // Capture permission mode from client request (Claude Code)
-              if (body.permissionMode) {
-                requestedPermissionMode = body.permissionMode;
-              }
-
-              // Capture plan save settings
+              if (body.agentSwitch) agentSwitch = body.agentSwitch;
               if (body.planSave !== undefined) {
                 planSaveEnabled = body.planSave.enabled;
                 planSaveCustomPath = body.planSave.customPath;
               }
 
-              // Run integrations in parallel — they're independent
+              // Capture permission mode from client request (Claude Code).
+              // Require a valid mode string — an invalid value would
+              // silently fall through to the hook and could upgrade the
+              // session to something unintended.
+              if (isValidPermissionMode(body.permissionMode)) {
+                requestedPermissionMode = body.permissionMode;
+              }
+
+              // Run integrations in parallel — they're independent.
               const integrationResults: Record<string, IntegrationResult> = {};
               const integrationPromises: Promise<void>[] = [];
               if (body.obsidian?.vaultPath && body.obsidian?.plan) {
@@ -513,27 +544,44 @@ export async function startPlannotatorServer(
               console.error(`[Integration] Error:`, err);
             }
 
-            // Save annotations and final snapshot (if enabled)
+            // Save annotations and final snapshot (if enabled). The
+            // claim-then-publish flag is already set above, so we MUST
+            // reach publishDecision() below no matter what — otherwise
+            // the awaiting hook hangs forever and retries are rejected
+            // as duplicates. Persistence is best-effort: log the error
+            // and continue.
             let savedPath: string | undefined;
             if (planSaveEnabled) {
-              const annotations = feedback || "";
-              if (annotations) {
-                saveAnnotations(slug, annotations, planSaveCustomPath);
+              try {
+                const annotations = feedback || "";
+                if (annotations) {
+                  saveAnnotations(slug, annotations, planSaveCustomPath);
+                }
+                savedPath = saveFinalSnapshot(slug, "approved", plan, annotations, planSaveCustomPath);
+              } catch (err) {
+                console.error(`[plan-save] approve persistence failed:`, err);
               }
-              savedPath = saveFinalSnapshot(slug, "approved", plan, annotations, planSaveCustomPath);
             }
 
-            // Clean up draft on successful submit
-            deleteDraft(draftKey);
+            // Clean up draft on successful submit (best-effort — draft
+            // deletion failure must not prevent decision publication).
+            try {
+              deleteDraft(draftKey);
+            } catch (err) {
+              console.error(`[draft] delete failed:`, err);
+            }
 
-            // Use permission mode from client request if provided, otherwise fall back to hook input
+            // Resolution order: client request body > server startup value.
             const effectivePermissionMode = requestedPermissionMode || permissionMode;
-            resolveDecision({ approved: true, feedback, savedPath, agentSwitch, permissionMode: effectivePermissionMode });
+            publishDecision({ approved: true, feedback, savedPath, agentSwitch, permissionMode: effectivePermissionMode });
             return Response.json({ ok: true, savedPath });
           }
 
           // API: Deny with feedback
           if (url.pathname === "/api/deny" && req.method === "POST") {
+            if (!claimDecision()) {
+              return Response.json({ ok: true, duplicate: true });
+            }
             let feedback = "Plan rejected by user";
             let planSaveEnabled = true; // default to enabled for backwards compat
             let planSaveCustomPath: string | undefined;
@@ -544,7 +592,6 @@ export async function startPlannotatorServer(
               };
               feedback = body.feedback || feedback;
 
-              // Capture plan save settings
               if (body.planSave !== undefined) {
                 planSaveEnabled = body.planSave.enabled;
                 planSaveCustomPath = body.planSave.customPath;
@@ -553,15 +600,25 @@ export async function startPlannotatorServer(
               // Use default feedback
             }
 
-            // Save annotations and final snapshot (if enabled)
+            // Save annotations and final snapshot (if enabled). Must
+            // reach publishDecision() below regardless — see the matching
+            // comment in the approve handler.
             let savedPath: string | undefined;
             if (planSaveEnabled) {
-              saveAnnotations(slug, feedback, planSaveCustomPath);
-              savedPath = saveFinalSnapshot(slug, "denied", plan, feedback, planSaveCustomPath);
+              try {
+                saveAnnotations(slug, feedback, planSaveCustomPath);
+                savedPath = saveFinalSnapshot(slug, "denied", plan, feedback, planSaveCustomPath);
+              } catch (err) {
+                console.error(`[plan-save] deny persistence failed:`, err);
+              }
             }
 
-            deleteDraft(draftKey);
-            resolveDecision({ approved: false, feedback, savedPath });
+            try {
+              deleteDraft(draftKey);
+            } catch (err) {
+              console.error(`[draft] delete failed:`, err);
+            }
+            publishDecision({ approved: false, feedback, savedPath });
             return Response.json({ ok: true, savedPath });
           }
 
diff --git a/packages/server/review.ts b/packages/server/review.ts
index 4e4c12488..78dd2ee9f 100644
--- a/packages/server/review.ts
+++ b/packages/server/review.ts
@@ -933,9 +933,10 @@ export async function startReviewServer(
           // API: Update user config (write-back to ~/.plannotator/config.json)
           if (url.pathname === "/api/config" && req.method === "POST") {
             try {
-              const body = (await req.json()) as { displayName?: string; diffOptions?: Record<string, unknown>; conventionalComments?: boolean; conventionalLabels?: unknown[] | null };
+              const body = (await req.json()) as { displayName?: string; presenceColor?: string; diffOptions?: Record<string, unknown>; conventionalComments?: boolean; conventionalLabels?: unknown[] | null };
               const toSave: Record<string, unknown> = {};
               if (body.displayName !== undefined) toSave.displayName = body.displayName;
+              if (body.presenceColor !== undefined) toSave.presenceColor = body.presenceColor;
               if (body.diffOptions !== undefined) toSave.diffOptions = body.diffOptions;
               if (body.conventionalComments !== undefined) toSave.conventionalComments = body.conventionalComments;
               if (body.conventionalLabels !== undefined) toSave.conventionalLabels = body.conventionalLabels;
diff --git a/packages/shared/collab/canonical-json.test.ts b/packages/shared/collab/canonical-json.test.ts
new file mode 100644
index 000000000..91815af9d
--- /dev/null
+++ b/packages/shared/collab/canonical-json.test.ts
@@ -0,0 +1,92 @@
+import { describe, expect, test } from 'bun:test';
+import { canonicalJson } from './canonical-json';
+
+describe('canonicalJson', () => {
+  test('serializes null', () => {
+    expect(canonicalJson(null)).toBe('null');
+  });
+
+  test('serializes booleans', () => {
+    expect(canonicalJson(true)).toBe('true');
+    expect(canonicalJson(false)).toBe('false');
+  });
+
+  test('serializes numbers', () => {
+    expect(canonicalJson(42)).toBe('42');
+    expect(canonicalJson(-3.14)).toBe('-3.14');
+    expect(canonicalJson(0)).toBe('0');
+  });
+
+  test('serializes strings', () => {
+    expect(canonicalJson('hello')).toBe('"hello"');
+    expect(canonicalJson('')).toBe('""');
+    expect(canonicalJson('has "quotes"')).toBe('"has \\"quotes\\""');
+  });
+
+  test('serializes arrays preserving order', () => {
+    expect(canonicalJson([3, 1, 2])).toBe('[3,1,2]');
+    expect(canonicalJson([])).toBe('[]');
+    expect(canonicalJson(['b', 'a'])).toBe('["b","a"]');
+  });
+
+  test('sorts object keys lexicographically', () => {
+    expect(canonicalJson({ z: 1, a: 2, m: 3 })).toBe('{"a":2,"m":3,"z":1}');
+  });
+
+  test('sorts nested object keys at every level', () => {
+    const input = { b: { d: 1, c: 2 }, a: { f: 3, e: 4 } };
+    expect(canonicalJson(input)).toBe('{"a":{"e":4,"f":3},"b":{"c":2,"d":1}}');
+  });
+
+  test('omits undefined fields', () => {
+    expect(canonicalJson({ a: 1, b: undefined, c: 3 })).toBe('{"a":1,"c":3}');
+  });
+
+  test('handles undefined as top-level value', () => {
+    expect(canonicalJson(undefined)).toBe('null');
+  });
+
+  test('produces no whitespace', () => {
+    const result = canonicalJson({ key: [1, { nested: true }] });
+    expect(result).not.toContain(' ');
+    expect(result).not.toContain('\n');
+    expect(result).not.toContain('\t');
+  });
+
+  test('throws on NaN', () => {
+    expect(() => canonicalJson(NaN)).toThrow('not serializable');
+  });
+
+  test('throws on Infinity', () => {
+    expect(() => canonicalJson(Infinity)).toThrow('not serializable');
+    expect(() => canonicalJson(-Infinity)).toThrow('not serializable');
+  });
+
+  test('throws on functions', () => {
+    expect(() => canonicalJson(() => {})).toThrow('not serializable');
+  });
+
+  test('throws on symbols', () => {
+    expect(() => canonicalJson(Symbol('test'))).toThrow('not serializable');
+  });
+
+  test('throws on bigint', () => {
+    expect(() => canonicalJson(BigInt(42))).toThrow('not serializable');
+  });
+
+  // Known-output test vectors — security-critical stability tests
+  describe('test vectors', () => {
+    test('AdminCommand room.delete', () => {
+      expect(canonicalJson({ type: 'room.delete' })).toBe('{"type":"room.delete"}');
+    });
+
+    test('same input always produces same output', () => {
+      const input = { type: 'room.delete', reason: 'final' };
+      const first = canonicalJson(input);
+      const second = canonicalJson(input);
+      const third = canonicalJson({ reason: 'final', type: 'room.delete' });
+      expect(first).toBe(second);
+      expect(first).toBe(third);
+    });
+  });
+});
diff --git a/packages/shared/collab/canonical-json.ts b/packages/shared/collab/canonical-json.ts
new file mode 100644
index 000000000..eecaecbd0
--- /dev/null
+++ b/packages/shared/collab/canonical-json.ts
@@ -0,0 +1,48 @@
+/**
+ * Deterministic JSON serialization for HMAC proof binding.
+ *
+ * Lexicographically sorted object keys at every nesting level,
+ * no whitespace, UTF-8 bytes. Arrays preserve order.
+ * undefined fields are omitted. Throws on functions, symbols, NaN, Infinity.
+ *
+ * This function is security-critical: its output is included in admin
+ * command HMAC proofs. Any change to its output for the same input is
+ * a protocol-breaking change.
+ */
+export function canonicalJson(value: unknown): string {
+  if (value === null) return 'null';
+  if (value === undefined) return 'null';
+
+  const t = typeof value;
+
+  if (t === 'boolean') return value ? 'true' : 'false';
+
+  if (t === 'number') {
+    if (!Number.isFinite(value as number)) {
+      throw new Error(`canonicalJson: ${value} is not serializable`);
+    }
+    return JSON.stringify(value);
+  }
+
+  if (t === 'string') return JSON.stringify(value);
+
+  if (t === 'function' || t === 'symbol' || t === 'bigint') {
+    throw new Error(`canonicalJson: ${t} is not serializable`);
+  }
+
+  if (Array.isArray(value)) {
+    const elements = value.map(v => canonicalJson(v));
+    return '[' + elements.join(',') + ']';
+  }
+
+  // Plain object — sort keys lexicographically
+  const obj = value as Record<string, unknown>;
+  const keys = Object.keys(obj).sort();
+  const entries: string[] = [];
+  for (const key of keys) {
+    const v = obj[key];
+    if (v === undefined) continue; // omit undefined fields
+    entries.push(JSON.stringify(key) + ':' + canonicalJson(v));
+  }
+  return '{' + entries.join(',') + '}';
+}
diff --git a/packages/shared/collab/client-runtime/apply-event.test.ts b/packages/shared/collab/client-runtime/apply-event.test.ts
new file mode 100644
index 000000000..c0dab93c2
--- /dev/null
+++ b/packages/shared/collab/client-runtime/apply-event.test.ts
@@ -0,0 +1,243 @@
+import { describe, expect, test } from 'bun:test';
+import { applyAnnotationEvent, annotationsToArray } from './apply-event';
+import type { RoomAnnotation, RoomServerEvent, RoomSnapshot } from '../types';
+
+function makeAnnotation(id: string, extras: Partial<RoomAnnotation> = {}): RoomAnnotation {
+  return {
+    id,
+    blockId: 'b1',
+    startOffset: 0,
+    endOffset: 5,
+    type: 'COMMENT',
+    originalText: 'hello',
+    createdA: 1234567890,
+    ...extras,
+  };
+}
+
+describe('applyAnnotationEvent', () => {
+  test('annotation.add inserts annotations', () => {
+    const map = new Map<string, RoomAnnotation>();
+    const event: RoomServerEvent = {
+      type: 'annotation.add',
+      annotations: [makeAnnotation('a1'), makeAnnotation('a2')],
+    };
+    const result = applyAnnotationEvent(map, event);
+    expect(result.applied).toBe(true);
+    expect(map.size).toBe(2);
+    expect(map.has('a1')).toBe(true);
+    expect(map.has('a2')).toBe(true);
+  });
+
+  test('annotation.update merges patch into existing', () => {
+    const map = new Map<string, RoomAnnotation>();
+    map.set('a1', makeAnnotation('a1', { text: 'original' }));
+    const event: RoomServerEvent = {
+      type: 'annotation.update',
+      id: 'a1',
+      patch: { text: 'updated' },
+    };
+    const result = applyAnnotationEvent(map, event);
+    expect(result.applied).toBe(true);
+    expect(map.get('a1')?.text).toBe('updated');
+  });
+
+  test('annotation.update drops own-property undefined values from patch (normalization)', () => {
+    const map = new Map<string, RoomAnnotation>();
+    map.set('a1', makeAnnotation('a1', { text: 'original', author: 'alice' }));
+    const event: RoomServerEvent = {
+      type: 'annotation.update',
+      id: 'a1',
+      // Direct in-process caller passes undefined — must be dropped, not
+      // stored as an own key with value undefined.
+      patch: { text: 'updated', author: undefined } as Partial<RoomAnnotation>,
+    };
+    applyAnnotationEvent(map, event);
+    const stored = map.get('a1')!;
+    expect(stored.text).toBe('updated');
+    // author must still be 'alice' — the undefined patch must not have erased it.
+    expect(stored.author).toBe('alice');
+    // And own-property check: the stored object must NOT have an own `author: undefined` slot.
+    expect('author' in stored).toBe(true);
+    expect(stored.author).not.toBeUndefined();
+  });
+
+  test('annotation.update rejects when merged final annotation violates cross-field invariants', () => {
+    // Inline annotations (COMMENT/DELETION) must have non-empty blockId. A
+    // patch that sets blockId: '' on a COMMENT passes the patch-level
+    // validator (blockId is just a string) but produces an invalid merged
+    // final annotation. The reducer must validate the merged state and
+    // refuse to store the invalid result.
+    const map = new Map<string, RoomAnnotation>();
+    map.set('a1', makeAnnotation('a1'));  // COMMENT with blockId: 'b1'
+    const originalBlockId = map.get('a1')!.blockId;
+
+    const event: RoomServerEvent = {
+      type: 'annotation.update',
+      id: 'a1',
+      patch: { blockId: '' } as Partial<RoomAnnotation>,
+    };
+    const result = applyAnnotationEvent(map, event);
+    expect(result.applied).toBe(false);
+    expect(result.reason).toContain('failed shape validation');
+    // Stored annotation is untouched — blockId is still non-empty.
+    expect(map.get('a1')!.blockId).toBe(originalBlockId);
+  });
+
+  test('annotation.update rejects when patching type turns existing annotation into an invalid inline (empty blockId)', () => {
+    // A GLOBAL_COMMENT legitimately carries blockId: ''. Patching its type
+    // to COMMENT produces an invalid final state (inline requires non-empty
+    // blockId). Must reject.
+    const map = new Map<string, RoomAnnotation>();
+    map.set('g1', makeAnnotation('g1', { type: 'GLOBAL_COMMENT', blockId: '' }));
+    const event: RoomServerEvent = {
+      type: 'annotation.update',
+      id: 'g1',
+      patch: { type: 'COMMENT' },
+    };
+    const result = applyAnnotationEvent(map, event);
+    expect(result.applied).toBe(false);
+    // Stored annotation type is untouched.
+    expect(map.get('g1')!.type).toBe('GLOBAL_COMMENT');
+  });
+
+  test('annotation.update defensively preserves existing.id even if patch slipped in a mismatched id', () => {
+    // Defense-in-depth against identity-mutation: isRoomAnnotationPatch
+    // already rejects id in patches. The reducer ALSO forces existing.id so
+    // that if a malformed patch ever reached here, we'd still store the
+    // annotation under the correct id.
+    const map = new Map<string, RoomAnnotation>();
+    map.set('a1', makeAnnotation('a1', { text: 'original' }));
+    const event: RoomServerEvent = {
+      type: 'annotation.update',
+      id: 'a1',
+      patch: { id: 'hijacked', text: 'updated' } as Partial<RoomAnnotation>,
+    };
+    const result = applyAnnotationEvent(map, event);
+    expect(result.applied).toBe(true);
+    expect(map.size).toBe(1);
+    expect(map.has('a1')).toBe(true);
+    expect(map.has('hijacked')).toBe(false);
+    const stored = map.get('a1')!;
+    expect(stored.id).toBe('a1');             // internal id unchanged
+    expect(stored.text).toBe('updated');       // other fields still patched
+  });
+
+  test('annotation.update isolates nested startMeta/endMeta between input patch and stored annotation', () => {
+    const map = new Map<string, RoomAnnotation>();
+    map.set('a1', makeAnnotation('a1', {
+      startMeta: { parentTagName: 'p', parentIndex: 0, textOffset: 0 },
+    }));
+    const patch: Partial<RoomAnnotation> = {
+      startMeta: { parentTagName: 'div', parentIndex: 1, textOffset: 5 },
+      endMeta: { parentTagName: 'div', parentIndex: 1, textOffset: 10 },
+    };
+    const event: RoomServerEvent = { type: 'annotation.update', id: 'a1', patch };
+    applyAnnotationEvent(map, event);
+
+    // Mutate the INPUT patch's nested meta objects after apply.
+    patch.startMeta!.parentTagName = 'HIJACKED';
+    patch.endMeta!.textOffset = 999;
+
+    const stored = map.get('a1')!;
+    // Stored annotation must be unaffected.
+    expect(stored.startMeta!.parentTagName).toBe('div');
+    expect(stored.startMeta!.textOffset).toBe(5);
+    expect(stored.endMeta!.textOffset).toBe(10);
+  });
+
+  test('annotation.update on missing id is a no-op', () => {
+    const map = new Map<string, RoomAnnotation>();
+    const event: RoomServerEvent = {
+      type: 'annotation.update',
+      id: 'missing',
+      patch: { text: 'x' },
+    };
+    const result = applyAnnotationEvent(map, event);
+    expect(result.applied).toBe(false);
+    expect(result.reason).toContain('not found');
+    expect(map.size).toBe(0);
+  });
+
+  test('annotation.remove deletes ids', () => {
+    const map = new Map<string, RoomAnnotation>();
+    map.set('a1', makeAnnotation('a1'));
+    map.set('a2', makeAnnotation('a2'));
+    map.set('a3', makeAnnotation('a3'));
+    const event: RoomServerEvent = {
+      type: 'annotation.remove',
+      ids: ['a1', 'a3'],
+    };
+    applyAnnotationEvent(map, event);
+    expect(map.has('a1')).toBe(false);
+    expect(map.has('a2')).toBe(true);
+    expect(map.has('a3')).toBe(false);
+  });
+
+  test('annotation.clear without source clears all', () => {
+    const map = new Map<string, RoomAnnotation>();
+    map.set('a1', makeAnnotation('a1'));
+    map.set('a2', makeAnnotation('a2', { source: 'eslint' }));
+    applyAnnotationEvent(map, { type: 'annotation.clear' });
+    expect(map.size).toBe(0);
+  });
+
+  test('annotation.clear with source only removes matching', () => {
+    const map = new Map<string, RoomAnnotation>();
+    map.set('a1', makeAnnotation('a1'));
+    map.set('a2', makeAnnotation('a2', { source: 'eslint' }));
+    map.set('a3', makeAnnotation('a3', { source: 'eslint' }));
+    applyAnnotationEvent(map, { type: 'annotation.clear', source: 'eslint' });
+    expect(map.has('a1')).toBe(true);
+    expect(map.has('a2')).toBe(false);
+    expect(map.has('a3')).toBe(false);
+  });
+
+  test('snapshot is NOT handled here — production uses CollabRoomClient.handleRoomSnapshot()', () => {
+    // Snapshots must atomically update planMarkdown + seq + annotations,
+    // which this reducer cannot do. The client's snapshot path is the sole
+    // entry point; this reducer returns applied: false so any accidental
+    // caller gets a loud no-op rather than a half-applied snapshot.
+    const map = new Map<string, RoomAnnotation>();
+    map.set('a1', makeAnnotation('a1'));
+    const snapshot: RoomSnapshot = {
+      versionId: 'v1',
+      planMarkdown: '# Plan',
+      annotations: [makeAnnotation('b1'), makeAnnotation('b2')],
+    };
+    const result = applyAnnotationEvent(map, { type: 'snapshot', payload: snapshot, snapshotSeq: 5 });
+    expect(result.applied).toBe(false);
+    expect(result.reason).toContain('snapshot');
+    // Map is untouched.
+    expect(map.size).toBe(1);
+    expect(map.has('a1')).toBe(true);
+  });
+
+  test('presence.update is not handled here', () => {
+    const map = new Map<string, RoomAnnotation>();
+    const result = applyAnnotationEvent(map, {
+      type: 'presence.update',
+      clientId: 'c1',
+      presence: {
+        user: { id: 'u1', name: 'alice', color: '#f00' },
+        cursor: null,
+      },
+    });
+    expect(result.applied).toBe(false);
+  });
+});
+
+describe('annotationsToArray', () => {
+  test('returns array in insertion order', () => {
+    const map = new Map<string, RoomAnnotation>();
+    map.set('a1', makeAnnotation('a1'));
+    map.set('a2', makeAnnotation('a2'));
+    map.set('a3', makeAnnotation('a3'));
+    const arr = annotationsToArray(map);
+    expect(arr.map(a => a.id)).toEqual(['a1', 'a2', 'a3']);
+  });
+
+  test('empty map returns empty array', () => {
+    expect(annotationsToArray(new Map())).toEqual([]);
+  });
+});
diff --git a/packages/shared/collab/client-runtime/apply-event.ts b/packages/shared/collab/client-runtime/apply-event.ts
new file mode 100644
index 000000000..bd35eafbe
--- /dev/null
+++ b/packages/shared/collab/client-runtime/apply-event.ts
@@ -0,0 +1,131 @@
+/**
+ * Pure reducer: applies a decrypted RoomServerEvent to a Map<id, RoomAnnotation>.
+ *
+ * In V1 this runs only on the server-echo path — the client does not apply
+ * annotation ops optimistically. Server echo is authoritative; this reducer
+ * is the single point where annotations enter state.
+ *
+ * Separated from the client class so it can be unit-tested without WebSocket mocks.
+ */
+
+import { isRoomAnnotation, type RoomAnnotation, type RoomServerEvent } from '../types';
+
+/** Shallow + nested-meta clone so stored annotations are isolated from inputs.
+ *  Exported so client.ts and other reducer callers share the same definition —
+ *  avoids the drift risk of two helpers cloning the same nested fields. */
+export function cloneRoomAnnotation(a: RoomAnnotation): RoomAnnotation {
+  return {
+    ...a,
+    startMeta: a.startMeta ? { ...a.startMeta } : undefined,
+    endMeta: a.endMeta ? { ...a.endMeta } : undefined,
+  };
+}
+
+/**
+ * Clone a partial patch, including nested startMeta/endMeta. A direct-event
+ * subscriber mutating the emitted event.patch.startMeta must not reach back
+ * into the stored annotation, and vice versa.
+ */
+export function cloneRoomAnnotationPatch(patch: Partial<RoomAnnotation>): Partial<RoomAnnotation> {
+  const out: Partial<RoomAnnotation> = { ...patch };
+  if (patch.startMeta !== undefined) out.startMeta = { ...patch.startMeta };
+  if (patch.endMeta !== undefined) out.endMeta = { ...patch.endMeta };
+  return out;
+}
+
+/**
+ * Apply an annotation-related event to the annotations map.
+ * Mutates the map in place. Returns a hint for the caller about what happened.
+ *
+ * Annotations from the event are CLONED before being stored. Callers (and
+ * event subscribers) can safely mutate input annotations without reaching
+ * back into the stored map.
+ */
+export function applyAnnotationEvent(
+  annotations: Map<string, RoomAnnotation>,
+  event: RoomServerEvent,
+): { applied: boolean; reason?: string } {
+  switch (event.type) {
+    case 'annotation.add':
+      for (const ann of event.annotations) {
+        annotations.set(ann.id, cloneRoomAnnotation(ann));
+      }
+      return { applied: true };
+
+    case 'annotation.update': {
+      const existing = annotations.get(event.id);
+      if (!existing) {
+        return { applied: false, reason: `annotation ${event.id} not found` };
+      }
+      // `undefined` in a patch means "field absent / no change" — it is NOT
+      // a clear-field signal. We strip own-property undefined values before
+      // the spread so `{ text: undefined }` is treated identically to `{}`
+      // and does not create an own `text` key on the stored annotation.
+      //
+      // Wire-path patches come from JSON (which cannot encode undefined), so
+      // this only matters for direct in-process callers. If clear-field
+      // semantics are ever needed, add them explicitly via `null` or a
+      // dedicated operation; do not repurpose `undefined`.
+      const normalized = Object.fromEntries(
+        Object.entries(event.patch).filter(([, v]) => v !== undefined),
+      ) as Partial<RoomAnnotation>;
+      // Clone nested startMeta/endMeta before merging so a later mutation to
+      // the input patch can't reach back into the stored annotation.
+      const patch = cloneRoomAnnotationPatch(normalized);
+      // Defense-in-depth: isRoomAnnotationPatch rejects `id` in patches, but
+      // we also force `id` back to `existing.id` here. Without this, a patch
+      // that slipped through with a mismatched `id` would store an annotation
+      // under map key `existing.id` whose object reports a different id —
+      // subsequent removes/updates by the visible id would miss it.
+      const merged = { ...existing, ...patch, id: existing.id } as RoomAnnotation;
+      // Validate the MERGED final annotation against the full annotation
+      // validator. Individual patch fields pass their type checks but can
+      // still produce an invalid final state when combined with existing
+      // fields — e.g. a patch { blockId: '' } applied to a COMMENT, or a
+      // patch { type: 'COMMENT' } applied to a GLOBAL_COMMENT that carried
+      // blockId: ''. isRoomAnnotation enforces cross-field invariants
+      // (inline annotations require non-empty blockId, etc.).
+      if (!isRoomAnnotation(merged)) {
+        return { applied: false, reason: `merged annotation ${event.id} failed shape validation` };
+      }
+      annotations.set(event.id, cloneRoomAnnotation(merged));
+      return { applied: true };
+    }
+
+    case 'annotation.remove':
+      for (const id of event.ids) {
+        annotations.delete(id);
+      }
+      return { applied: true };
+
+    case 'annotation.clear': {
+      if (event.source === undefined) {
+        annotations.clear();
+      } else {
+        for (const [id, ann] of annotations) {
+          if (ann.source === event.source) annotations.delete(id);
+        }
+      }
+      return { applied: true };
+    }
+
+    case 'snapshot':
+      // Snapshots are NOT handled by this reducer. A correct snapshot apply
+      // must update planMarkdown, seq, AND the annotations map together;
+      // handling any of those in isolation risks drift. Production clients
+      // use CollabRoomClient.handleRoomSnapshot() for that atomic path.
+      return { applied: false, reason: 'snapshots handled by client snapshot path, not this reducer' };
+
+    case 'presence.update':
+      // Presence is handled separately by the caller — not a snapshot mutation.
+      return { applied: false, reason: 'presence event handled separately' };
+
+    default:
+      return { applied: false, reason: 'unknown event type' };
+  }
+}
+
+/** Return annotations as an ordered array (insertion order preserved). */
+export function annotationsToArray(annotations: Map<string, RoomAnnotation>): RoomAnnotation[] {
+  return [...annotations.values()];
+}
diff --git a/packages/shared/collab/client-runtime/backoff.test.ts b/packages/shared/collab/client-runtime/backoff.test.ts
new file mode 100644
index 000000000..1bc1e3cd9
--- /dev/null
+++ b/packages/shared/collab/client-runtime/backoff.test.ts
@@ -0,0 +1,37 @@
+import { describe, expect, test } from 'bun:test';
+import { computeBackoffMs, DEFAULT_BACKOFF } from './backoff';
+
+describe('computeBackoffMs', () => {
+  // Stable random for deterministic tests
+  const rand05 = () => 0.5;
+  const rand0 = () => 0;
+  const rand1 = () => 0.999999;
+
+  test('attempt 0 uses initial delay (with jitter)', () => {
+    expect(computeBackoffMs(0, {}, rand05)).toBe(Math.floor(0.5 * DEFAULT_BACKOFF.initialDelayMs));
+  });
+
+  test('attempt 1 doubles (factor 2)', () => {
+    expect(computeBackoffMs(1, {}, rand05)).toBe(Math.floor(0.5 * DEFAULT_BACKOFF.initialDelayMs * 2));
+  });
+
+  test('delay caps at maxDelayMs', () => {
+    // Attempt 20 would be 500 * 2^20 = 524,288,000 — capped at 15_000
+    expect(computeBackoffMs(20, {}, rand1)).toBe(Math.floor(0.999999 * 15_000));
+  });
+
+  test('rand=0 produces 0 delay', () => {
+    expect(computeBackoffMs(5, {}, rand0)).toBe(0);
+  });
+
+  test('custom options override defaults', () => {
+    const opts = { initialDelayMs: 100, maxDelayMs: 1000, factor: 3 };
+    expect(computeBackoffMs(0, opts, rand05)).toBe(Math.floor(0.5 * 100));
+    expect(computeBackoffMs(1, opts, rand05)).toBe(Math.floor(0.5 * 300));
+    expect(computeBackoffMs(5, opts, rand1)).toBe(Math.floor(0.999999 * 1000));
+  });
+
+  test('negative attempt treated as 0', () => {
+    expect(computeBackoffMs(-5, {}, rand05)).toBe(Math.floor(0.5 * DEFAULT_BACKOFF.initialDelayMs));
+  });
+});
diff --git a/packages/shared/collab/client-runtime/backoff.ts b/packages/shared/collab/client-runtime/backoff.ts
new file mode 100644
index 000000000..f4b733c45
--- /dev/null
+++ b/packages/shared/collab/client-runtime/backoff.ts
@@ -0,0 +1,34 @@
+/**
+ * Exponential backoff with full jitter, used by auto-reconnect.
+ *
+ * Pure function — all timing/randomness injected so tests can stub.
+ */
+
+export interface BackoffOptions {
+  initialDelayMs?: number;  // default 500
+  maxDelayMs?: number;       // default 15_000
+  factor?: number;           // default 2
+}
+
+export const DEFAULT_BACKOFF: Required<BackoffOptions> = {
+  initialDelayMs: 500,
+  maxDelayMs: 15_000,
+  factor: 2,
+};
+
+/**
+ * Compute the delay (ms) before retry attempt N.
+ *
+ * Uses full jitter: `rand() * min(maxDelayMs, initialDelayMs * factor^attempt)`.
+ * Attempt 0 is the first retry. Attempts are capped at the max delay.
+ */
+export function computeBackoffMs(
+  attempt: number,
+  options: BackoffOptions = {},
+  rand: () => number = Math.random,
+): number {
+  const { initialDelayMs, maxDelayMs, factor } = { ...DEFAULT_BACKOFF, ...options };
+  const rawDelay = initialDelayMs * Math.pow(factor, Math.max(0, attempt));
+  const capped = Math.min(maxDelayMs, rawDelay);
+  return Math.floor(rand() * capped);
+}
diff --git a/packages/shared/collab/client-runtime/client.test.ts b/packages/shared/collab/client-runtime/client.test.ts
new file mode 100644
index 000000000..52090dab0
--- /dev/null
+++ b/packages/shared/collab/client-runtime/client.test.ts
@@ -0,0 +1,2297 @@
+/**
+ * Unit tests for CollabRoomClient using MockWebSocket.
+ *
+ * Scripts the server-side handshake, events, and admin flow deterministically.
+ */
+
+import { describe, expect, test } from 'bun:test';
+import {
+  CollabRoomClient,
+  AdminNotAuthorizedError,
+  NotConnectedError,
+  AdminRejectedError,
+  ConnectTimeoutError,
+  InvalidOutboundPayloadError,
+} from './client';
+import { MockWebSocket } from './mock-websocket';
+import {
+  deriveRoomKeys,
+  deriveAdminKey,
+  computeRoomVerifier,
+  computeAdminVerifier,
+  computeAuthProof,
+  encryptEventOp,
+  encryptPresence,
+  encryptSnapshot,
+  decryptEventPayload,
+} from '../crypto';
+import { generateClientId, generateRoomSecret, generateAdminSecret, generateChallengeId, generateNonce } from '../ids';
+import { ADMIN_ERROR_CODES } from '../constants';
+import type { AuthChallenge, AuthAccepted, RoomSnapshot, ServerEnvelope, RoomTransportMessage, RoomAnnotation, AuthResponse, AdminChallenge, AdminCommandEnvelope } from '../types';
+import type { CollabRoomState, CollabRoomUser } from './types';
+
+// ---------------------------------------------------------------------------
+// Test fixture
+// ---------------------------------------------------------------------------
+
+const USER: CollabRoomUser = { id: 'u1', name: 'alice', color: '#f00' };
+const ROOM_ID = 'ABCDEFGHIJKLMNOPQRSTUv';  // 22 chars
+
+/**
+ * Construct a test auth.challenge including the now-required server-assigned
+ * clientId. Tests that care about the exact clientId can pass it explicitly;
+ * otherwise a fresh one is generated per call.
+ */
+function makeAuthChallenge(overrides: Partial<AuthChallenge> = {}): AuthChallenge {
+  return {
+    type: 'auth.challenge',
+    challengeId: overrides.challengeId ?? generateChallengeId(),
+    nonce: overrides.nonce ?? generateNonce(),
+    expiresAt: overrides.expiresAt ?? Date.now() + 30_000,
+    clientId: overrides.clientId ?? generateClientId(),
+  };
+}
+
+interface TestSetup {
+  client: CollabRoomClient;
+  ws: MockWebSocket;
+  roomSecret: Uint8Array;
+  roomVerifier: string;
+  adminSecret: Uint8Array;
+  adminVerifier: string;
+  eventKey: CryptoKey;
+  presenceKey: CryptoKey;
+  snapshot: RoomSnapshot;
+}
+
+async function setup(options: { withAdmin?: boolean } = {}): Promise<TestSetup> {
+  const roomSecret = generateRoomSecret();
+  const adminSecret = generateAdminSecret();
+  const { authKey, eventKey, presenceKey } = await deriveRoomKeys(roomSecret);
+  const adminKey = options.withAdmin ? await deriveAdminKey(adminSecret) : null;
+  const roomVerifier = await computeRoomVerifier(authKey, ROOM_ID);
+  const adminVerifier = adminKey ? await computeAdminVerifier(adminKey, ROOM_ID) : null;
+
+  const snapshot: RoomSnapshot = {
+    versionId: 'v1',
+    planMarkdown: '# Plan',
+    annotations: [],
+  };
+
+  // Capture the constructed WebSocket for scripting
+  let capturedWs: MockWebSocket | null = null;
+  const WebSocketImpl = class extends MockWebSocket {
+    constructor(url: string | URL, protocols?: string | string[]) {
+      super(url, protocols);
+      capturedWs = this;
+    }
+  } as unknown as typeof WebSocket;
+
+  const client = new CollabRoomClient({
+    roomId: ROOM_ID,
+    baseUrl: 'http://localhost:8787',
+    eventKey,
+    presenceKey,
+    adminKey,
+    roomVerifier,
+    adminVerifier,
+    user: USER,
+    webSocketImpl: WebSocketImpl,
+    connectTimeoutMs: 2000,
+    reconnect: { maxAttempts: 0 }, // disable auto-reconnect in tests unless overridden
+    presenceTtlMs: 50, // short for testing
+    presenceSweepIntervalMs: 20,
+  });
+
+  // Start connect asynchronously so the mock WS gets constructed
+  const connectPromise = client.connect();
+
+  // Wait for ws to be captured
+  await new Promise<void>((r) => {
+    const check = () => {
+      if (capturedWs) r();
+      else queueMicrotask(check);
+    };
+    check();
+  });
+
+  // Complete auth handshake
+  const ws = capturedWs!;
+  // Let the mock ws fire onopen
+  await new Promise(r => queueMicrotask(r));
+  await new Promise(r => queueMicrotask(r));
+
+  const challenge = makeAuthChallenge();
+  ws.peer.sendFromServer(JSON.stringify(challenge));
+
+  // Client responds with auth.response
+  const responseMsg = await ws.peer.expectFromClient();
+  const response = JSON.parse(responseMsg) as AuthResponse;
+  expect(response.type).toBe('auth.response');
+  expect(response.challengeId).toBe(challenge.challengeId);
+
+  // Server sends auth.accepted
+  const accepted: AuthAccepted = {
+    type: 'auth.accepted',
+    seq: 0,
+    snapshotSeq: 0,
+    snapshotAvailable: true,
+  };
+  ws.peer.sendFromServer(JSON.stringify(accepted));
+
+  // Server sends snapshot
+  const snapshotCiphertext = await encryptSnapshot(eventKey, snapshot);
+  const snapshotMsg: RoomTransportMessage = {
+    type: 'room.snapshot',
+    snapshotSeq: 0,
+    snapshotCiphertext,
+  };
+  ws.peer.sendFromServer(JSON.stringify(snapshotMsg));
+
+  await connectPromise;
+  await new Promise(r => setTimeout(r, 10)); // let snapshot decrypt settle
+
+  return {
+    client,
+    ws,
+    roomSecret,
+    roomVerifier,
+    adminSecret,
+    adminVerifier: adminVerifier ?? '',
+    eventKey,
+    presenceKey,
+    snapshot,
+  };
+}
+
+// ---------------------------------------------------------------------------
+// Tests
+// ---------------------------------------------------------------------------
+
+describe('CollabRoomClient — constructor isolates initialSnapshot (P2)', () => {
+  test('caller mutating initialSnapshot.annotations after construction does not affect internal state', async () => {
+    const roomSecret = generateRoomSecret();
+    const { authKey, eventKey, presenceKey } = await deriveRoomKeys(roomSecret);
+    const roomVerifier = await computeRoomVerifier(authKey, ROOM_ID);
+
+    const ann: RoomAnnotation = {
+      id: 'seed-1', blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'original', createdA: 1,
+      startMeta: { parentTagName: 'p', parentIndex: 0, textOffset: 0 },
+    };
+    const initialSnapshot = { versionId: 'v1' as const, planMarkdown: '# P', annotations: [ann] };
+
+    const client = new CollabRoomClient({
+      roomId: ROOM_ID,
+      baseUrl: 'http://localhost:8787',
+      eventKey,
+      presenceKey,
+      adminKey: null,
+      roomVerifier,
+      adminVerifier: null,
+      user: USER,
+      initialSnapshot,
+      webSocketImpl: MockWebSocket as unknown as typeof WebSocket,
+    });
+
+    // Mutate caller's copy.
+    ann.originalText = 'MUTATED';
+    ann.startMeta!.parentTagName = 'HIJACKED';
+    initialSnapshot.annotations.push({ ...ann, id: 'injected' });
+
+    // Client's internal view is unchanged.
+    const snap = client.getState();
+    expect(snap.annotations.length).toBe(1);
+    expect(snap.annotations[0].id).toBe('seed-1');
+    expect(snap.annotations[0].originalText).toBe('original');
+    expect(snap.annotations[0].startMeta!.parentTagName).toBe('p');
+  });
+});
+
+describe('CollabRoomClient — connect', () => {
+  test('authenticates and transitions to authenticated', async () => {
+    const { client } = await setup();
+    expect(client.getState().connectionStatus).toBe('authenticated');
+    client.disconnect();
+  });
+
+  test('getState includes snapshot plan markdown', async () => {
+    const { client } = await setup();
+    expect(client.getState().planMarkdown).toBe('# Plan');
+    client.disconnect();
+  });
+
+  test('hasAdminCapability is true with admin key, false without', async () => {
+    const withAdmin = await setup({ withAdmin: true });
+    expect(withAdmin.client.getState().hasAdminCapability).toBe(true);
+    withAdmin.client.disconnect();
+
+    const noAdmin = await setup();
+    expect(noAdmin.client.getState().hasAdminCapability).toBe(false);
+    noAdmin.client.disconnect();
+  });
+});
+
+describe('CollabRoomClient — concurrent sendOp ordering (P2)', () => {
+  test('concurrent sendAnnotationAdd + sendAnnotationRemove preserves call order on the wire', async () => {
+    const { client, ws, eventKey } = await setup();
+
+    // Sized so the first encrypt (large payload) is slower than the second.
+    const big: RoomAnnotation = {
+      id: 'order-add', blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'x'.repeat(50_000), createdA: 1,
+    };
+
+    // Fire two calls without awaiting between them — the second starts
+    // encryption immediately. Without outbound serialization, the small
+    // remove's ciphertext would finish first and land on the wire BEFORE
+    // the add.
+    const p1 = client.sendAnnotationAdd([big]);
+    const p2 = client.sendAnnotationRemove(['order-add']);
+    await Promise.all([p1, p2]);
+
+    const first = JSON.parse(await ws.peer.expectFromClient()) as ServerEnvelope;
+    const second = JSON.parse(await ws.peer.expectFromClient()) as ServerEnvelope;
+
+    const firstOp = await decryptEventPayload(eventKey, first.ciphertext) as { type: string };
+    const secondOp = await decryptEventPayload(eventKey, second.ciphertext) as { type: string };
+
+    expect(firstOp.type).toBe('annotation.add');
+    expect(secondOp.type).toBe('annotation.remove');
+    client.disconnect();
+  });
+});
+
+describe('CollabRoomClient — sendAnnotationAdd', () => {
+  test('produces encrypted envelope on wire', async () => {
+    const { client, ws, eventKey } = await setup();
+    const ann: RoomAnnotation = {
+      id: 'ann-1',
+      blockId: 'b1',
+      startOffset: 0,
+      endOffset: 5,
+      type: 'COMMENT',
+      originalText: 'hello',
+      createdA: 1234,
+      text: 'my comment',
+    };
+    await client.sendAnnotationAdd([ann]);
+    const sent = await ws.peer.expectFromClient();
+    const envelope = JSON.parse(sent) as ServerEnvelope;
+    expect(envelope.channel).toBe('event');
+    expect(envelope.clientId).toBe(client.getState().clientId);
+
+    // Decrypt the envelope ciphertext to confirm round-trip
+    const decrypted = await decryptEventPayload(eventKey, envelope.ciphertext);
+    expect(decrypted).toEqual({ type: 'annotation.add', annotations: [ann] });
+
+    client.disconnect();
+  });
+
+});
+
+describe('CollabRoomClient — server echo is authoritative', () => {
+  test('our own echoed event applies exactly once', async () => {
+    const { client, ws } = await setup();
+    const ann: RoomAnnotation = {
+      id: 'echo-1',
+      blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'x', createdA: 1,
+    };
+    await client.sendAnnotationAdd([ann]);
+
+    // No optimistic apply — pre-echo count is 0.
+    expect(client.getState().annotations.length).toBe(0);
+
+    const sent = await ws.peer.expectFromClient();
+    const envelope = JSON.parse(sent) as ServerEnvelope;
+
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 1, receivedAt: Date.now(), envelope,
+    }));
+    await new Promise(r => setTimeout(r, 10));
+
+    // Echo applied once; seq advanced.
+    expect(client.getState().annotations.length).toBe(1);
+    expect(client.getState().annotations[0].id).toBe('echo-1');
+    expect(client.getState().seq).toBe(1);
+    client.disconnect();
+  });
+
+  test('event from another client applies normally', async () => {
+    const { client, ws, eventKey } = await setup();
+    const otherAnn: RoomAnnotation = {
+      id: 'other-1',
+      blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'x', createdA: 1,
+    };
+    const ciphertext = await encryptEventOp(eventKey, { type: 'annotation.add', annotations: [otherAnn] });
+    const envelope: ServerEnvelope = {
+      clientId: 'other-client',
+      opId: 'other-op-id',
+      channel: 'event',
+      ciphertext,
+    };
+    const event: RoomTransportMessage = { type: 'room.event', seq: 1, receivedAt: Date.now(), envelope };
+    ws.peer.sendFromServer(JSON.stringify(event));
+    await new Promise(r => setTimeout(r, 10));
+
+    expect(client.getState().annotations.length).toBe(1);
+    expect(client.getState().annotations[0].id).toBe('other-1');
+    client.disconnect();
+  });
+});
+
+describe('CollabRoomClient — admin', () => {
+  test('deleteRoom without admin rejects', async () => {
+    const { client } = await setup(); // no admin
+    await expect(client.deleteRoom()).rejects.toThrow(AdminNotAuthorizedError);
+    client.disconnect();
+  });
+
+  test('deleteRoom sends challenge.request, then admin.command with proof, resolves on terminal socket close', async () => {
+    const { client, ws } = await setup({ withAdmin: true });
+
+    const deletePromise = client.deleteRoom();
+
+    // Client sends admin.challenge.request
+    const req = await ws.peer.expectFromClient();
+    expect(JSON.parse(req).type).toBe('admin.challenge.request');
+
+    // Server sends admin.challenge
+    const adminChallenge: AdminChallenge = {
+      type: 'admin.challenge',
+      challengeId: generateChallengeId(),
+      nonce: generateNonce(),
+      expiresAt: Date.now() + 30_000,
+    };
+    ws.peer.sendFromServer(JSON.stringify(adminChallenge));
+
+    // Client sends admin.command
+    const cmdMsg = await ws.peer.expectFromClient();
+    const cmd = JSON.parse(cmdMsg) as AdminCommandEnvelope;
+    expect(cmd.type).toBe('admin.command');
+    expect(cmd.command.type).toBe('room.delete');
+    expect(cmd.challengeId).toBe(adminChallenge.challengeId);
+    expect(cmd.adminProof.length).toBeGreaterThan(0);
+
+    // Server terminates the socket with the unavailable close — the
+    // single success signal for delete in the simplified protocol.
+    ws.peer.simulateClose(4006, 'Room unavailable');
+
+    await deletePromise; // resolves on terminal close
+    expect(client.getState().roomUnavailable).toBe(true);
+    client.disconnect();
+  });
+
+  test('admin command rejects on room.error', async () => {
+    const { client, ws } = await setup({ withAdmin: true });
+
+    const deletePromise = client.deleteRoom();
+    await ws.peer.expectFromClient(); // admin.challenge.request
+
+    const adminChallenge: AdminChallenge = {
+      type: 'admin.challenge',
+      challengeId: generateChallengeId(),
+      nonce: generateNonce(),
+      expiresAt: Date.now() + 30_000,
+    };
+    ws.peer.sendFromServer(JSON.stringify(adminChallenge));
+    await ws.peer.expectFromClient(); // admin.command
+
+    // Server sends room.error instead of room.status
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.error',
+      code: 'delete_failed',
+      message: 'Cannot delete',
+    }));
+
+    await expect(deletePromise).rejects.toThrow(AdminRejectedError);
+    client.disconnect();
+  });
+
+  test('contract: every code in ADMIN_ERROR_CODES rejects a pending admin command as admin-scoped', async () => {
+    // Contract test for the shared admin-error-code tuple. Iterates every
+    // code declared in `packages/shared/collab/constants.ts` and asserts
+    // that the runtime treats it as admin-scoped (rejects pending admin
+    // with AdminRejectedError, does not fall through to the 5s timeout).
+    //
+    // This is the single gate that prevents the class of drift where a
+    // server adds a new `sendAdminError` call site with a code the
+    // client's rejection Set doesn't recognize — the tuple is the shared
+    // source of truth, so any new code must land in the tuple first,
+    // and this test forces it to route correctly end-to-end.
+    //
+    // If this test fails after adding a new admin code:
+    //   1. Confirm the code is in AdminErrorCode namespace in constants.ts.
+    //   2. Confirm ADMIN_SCOPED_ERROR_CODES in client.ts derives from the
+    //      tuple (not a duplicate literal).
+    //   3. If both are correct, the runtime's rejection path has a bug —
+    //      not a contract bug.
+    for (const code of ADMIN_ERROR_CODES) {
+      const { client, ws } = await setup({ withAdmin: true });
+
+      const deletePromise = client.deleteRoom();
+      await ws.peer.expectFromClient(); // admin.challenge.request
+
+      const start = Date.now();
+      ws.peer.sendFromServer(JSON.stringify({
+        type: 'room.error',
+        code,
+        message: `Server rejected: ${code}`,
+      }));
+
+      await expect(deletePromise).rejects.toThrow(AdminRejectedError);
+      // Reject immediately, not via 5s admin timeout.
+      expect(Date.now() - start).toBeLessThan(500);
+
+      client.disconnect();
+    }
+  });
+
+  test('non-admin room.error (e.g. validation_error from event channel) does NOT reject pending admin', async () => {
+    // Regression: previously ANY room.error rejected the pending admin
+    // command. But room.error is also used for event-channel failures
+    // (validation_error, event_persist_failed). If one of those lands
+    // while a delete command is in flight, we must NOT cancel the
+    // delete — its terminal socket-close may still be on the way.
+    const { client, ws } = await setup({ withAdmin: true });
+
+    const deletePromise = client.deleteRoom();
+    await ws.peer.expectFromClient(); // admin.challenge.request
+    const adminChallenge: AdminChallenge = {
+      type: 'admin.challenge',
+      challengeId: generateChallengeId(),
+      nonce: generateNonce(),
+      expiresAt: Date.now() + 30_000,
+    };
+    ws.peer.sendFromServer(JSON.stringify(adminChallenge));
+    await ws.peer.expectFromClient(); // admin.command
+
+    // Event-channel error lands BEFORE the admin command's status broadcast.
+    // pendingAdmin must stay alive.
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.error',
+      code: 'validation_error',
+      message: 'Malformed annotation payload',
+    }));
+    // Give the error a tick to land.
+    await new Promise(r => setTimeout(r, 20));
+
+    // The terminal delete close arrives now — delete should resolve.
+    ws.peer.simulateClose(4006, 'Room unavailable');
+    await deletePromise;  // resolves (does NOT reject)
+
+    // lastError was still set by the event-channel error for UI consumers.
+    expect(client.getState().lastError?.code).toBe('validation_error');
+  });
+});
+
+describe('CollabRoomClient — NotConnectedError', () => {
+  test('sendAnnotationAdd before connect throws', async () => {
+    const roomSecret = generateRoomSecret();
+    const { authKey, eventKey, presenceKey } = await deriveRoomKeys(roomSecret);
+    const roomVerifier = await computeRoomVerifier(authKey, ROOM_ID);
+
+    const client = new CollabRoomClient({
+      roomId: ROOM_ID,
+      baseUrl: 'http://localhost:8787',
+      eventKey,
+      presenceKey,
+      adminKey: null,
+      roomVerifier,
+      adminVerifier: null,
+      user: USER,
+      webSocketImpl: MockWebSocket as unknown as typeof WebSocket,
+    });
+
+    // Use a valid (non-empty) annotation so the test exercises the
+    // NotConnectedError path rather than tripping outbound validation's
+    // empty-array rejection.
+    const ann: RoomAnnotation = {
+      id: 'nc-1',
+      blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'x', createdA: 1,
+    };
+    await expect(client.sendAnnotationAdd([ann])).rejects.toThrow(NotConnectedError);
+  });
+});
+
+describe('CollabRoomClient — initial connect timeout', () => {
+  test('rejects with ConnectTimeoutError, stays disconnected, does not auto-reconnect', async () => {
+    const roomSecret = generateRoomSecret();
+    const { authKey, eventKey, presenceKey } = await deriveRoomKeys(roomSecret);
+    const roomVerifier = await computeRoomVerifier(authKey, ROOM_ID);
+
+    const constructed: MockWebSocket[] = [];
+    const WebSocketImpl = class extends MockWebSocket {
+      constructor(url: string | URL, protocols?: string | string[]) {
+        super(url, protocols);
+        constructed.push(this);
+      }
+    } as unknown as typeof WebSocket;
+
+    const client = new CollabRoomClient({
+      roomId: ROOM_ID,
+      baseUrl: 'http://localhost:8787',
+      eventKey,
+      presenceKey,
+      adminKey: null,
+      roomVerifier,
+      adminVerifier: null,
+      user: USER,
+      webSocketImpl: WebSocketImpl,
+      connectTimeoutMs: 50,  // very short — server never sends challenge
+      reconnect: { maxAttempts: 5, initialDelayMs: 10, maxDelayMs: 20 },
+    });
+
+    // No server script — let the timeout fire
+    await expect(client.connect()).rejects.toThrow(ConnectTimeoutError);
+
+    // Wait past any potential reconnect delay + close handling
+    await new Promise(r => setTimeout(r, 100));
+
+    expect(client.getState().connectionStatus).toBe('disconnected');
+    expect(constructed.length).toBe(1);  // no auto-reconnect attempt
+  });
+});
+
+describe('CollabRoomClient — every event applies (no echo dedup in V1)', () => {
+  test('opId collision from another client does not drop the event', async () => {
+    // V1 removed echo dedup — every room.event applies, including our own
+    // echoes and any event another client happens to send with the same opId.
+    // This makes the "malicious participant silences our ops by opId reuse"
+    // attack inapplicable.
+    const { client, ws, eventKey } = await setup();
+    const ourAnn: RoomAnnotation = {
+      id: 'ours-1',
+      blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'x', createdA: 1,
+    };
+    await client.sendAnnotationAdd([ourAnn]);
+    const sent = await ws.peer.expectFromClient();
+    const ourEnvelope = JSON.parse(sent) as ServerEnvelope;
+
+    // Server echoes our op (this applies ours-1).
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 1, receivedAt: Date.now(), envelope: ourEnvelope,
+    }));
+
+    // Another client sends an op with the SAME opId. Must still apply.
+    const otherAnn: RoomAnnotation = {
+      id: 'other-1',
+      blockId: 'b2', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'y', createdA: 2,
+    };
+    const spoofCiphertext = await encryptEventOp(eventKey, {
+      type: 'annotation.add', annotations: [otherAnn],
+    });
+    const spoofEnvelope: ServerEnvelope = {
+      clientId: 'attacker',
+      opId: ourEnvelope.opId,  // reused
+      channel: 'event',
+      ciphertext: spoofCiphertext,
+    };
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 2, receivedAt: Date.now(), envelope: spoofEnvelope,
+    }));
+    await new Promise(r => setTimeout(r, 10));
+
+    const ids = client.getState().annotations.map(a => a.id);
+    expect(ids).toContain('ours-1');
+    expect(ids).toContain('other-1');
+    client.disconnect();
+  });
+});
+
+describe('CollabRoomClient — state events fire on status transitions', () => {
+  test('subscribers receive state for connecting/authenticating/authenticated', async () => {
+    const roomSecret = generateRoomSecret();
+    const { authKey, eventKey, presenceKey } = await deriveRoomKeys(roomSecret);
+    const roomVerifier = await computeRoomVerifier(authKey, ROOM_ID);
+
+    let capturedWs: MockWebSocket | null = null;
+    const WebSocketImpl = class extends MockWebSocket {
+      constructor(url: string | URL, protocols?: string | string[]) {
+        super(url, protocols);
+        capturedWs = this;
+      }
+    } as unknown as typeof WebSocket;
+
+    const client = new CollabRoomClient({
+      roomId: ROOM_ID,
+      baseUrl: 'http://localhost:8787',
+      eventKey,
+      presenceKey,
+      adminKey: null,
+      roomVerifier,
+      adminVerifier: null,
+      user: USER,
+      webSocketImpl: WebSocketImpl,
+      connectTimeoutMs: 2000,
+    });
+
+    const statusesFromState: string[] = [];
+    client.on('state', (s) => { statusesFromState.push(s.connectionStatus); });
+
+    const connectPromise = client.connect();
+
+    await new Promise<void>((r) => {
+      const check = () => (capturedWs ? r() : queueMicrotask(check));
+      check();
+    });
+    await new Promise(r => queueMicrotask(r));
+    await new Promise(r => queueMicrotask(r));
+
+    const ws = capturedWs!;
+    const challenge = makeAuthChallenge();
+    ws.peer.sendFromServer(JSON.stringify(challenge));
+    await ws.peer.expectFromClient();  // drain auth.response
+
+    const accepted: AuthAccepted = {
+      type: 'auth.accepted',
+      seq: 0,
+      snapshotSeq: 0,
+      snapshotAvailable: false,
+    };
+    ws.peer.sendFromServer(JSON.stringify(accepted));
+    await connectPromise;
+
+    expect(statusesFromState).toContain('connecting');
+    expect(statusesFromState).toContain('authenticating');
+    expect(statusesFromState).toContain('authenticated');
+    client.disconnect();
+  });
+
+  test('authenticated state is never emitted with stale lastError (P2 ordering)', async () => {
+    const roomSecret = generateRoomSecret();
+    const { authKey, eventKey, presenceKey } = await deriveRoomKeys(roomSecret);
+    const roomVerifier = await computeRoomVerifier(authKey, ROOM_ID);
+
+    let capturedWs: MockWebSocket | null = null;
+    const WebSocketImpl = class extends MockWebSocket {
+      constructor(url: string | URL, protocols?: string | string[]) {
+        super(url, protocols);
+        capturedWs = this;
+      }
+    } as unknown as typeof WebSocket;
+
+    const client = new CollabRoomClient({
+      roomId: ROOM_ID,
+      baseUrl: 'http://localhost:8787',
+      eventKey,
+      presenceKey,
+      adminKey: null,
+      roomVerifier,
+      adminVerifier: null,
+      user: USER,
+      webSocketImpl: WebSocketImpl,
+      connectTimeoutMs: 2000,
+    });
+
+    // Record every state snapshot so we can inspect intermediate values.
+    const snapshots: CollabRoomState[] = [];
+    client.on('state', (s) => { snapshots.push({ ...s }); });
+
+    const connectPromise = client.connect();
+    await new Promise<void>((r) => { const c = () => capturedWs ? r() : queueMicrotask(c); c(); });
+    await new Promise(r => queueMicrotask(r));
+    await new Promise(r => queueMicrotask(r));
+
+    const ws = capturedWs!;
+    ws.peer.sendFromServer(JSON.stringify(makeAuthChallenge()));
+    await ws.peer.expectFromClient();
+
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'auth.accepted',
+      seq: 0, snapshotSeq: 0, snapshotAvailable: false,
+    }));
+    await connectPromise;
+
+    // Every snapshot with connectionStatus === 'authenticated' must have
+    // roomUnavailable === false. If setStatus('authenticated') ever fired
+    // against a terminal flag, this would fail.
+    const authedSnapshots = snapshots.filter(s => s.connectionStatus === 'authenticated');
+    expect(authedSnapshots.length).toBeGreaterThan(0);
+    for (const s of authedSnapshots) {
+      expect(s.roomUnavailable).toBe(false);
+    }
+
+    client.disconnect();
+  });
+});
+
+describe('CollabRoomClient — disconnect', () => {
+  test('disconnect transitions to closed', async () => {
+    const { client } = await setup();
+    client.disconnect();
+    expect(client.getState().connectionStatus).toBe('closed');
+  });
+
+  test('reconnect after disconnect clears userDisconnected', async () => {
+    const { client } = await setup();
+    client.disconnect();
+    expect(client.getState().connectionStatus).toBe('closed');
+
+    // Trying to connect again should not throw immediately (userDisconnected cleared)
+    // We don't fully run the handshake here — just verify the state reset
+    const connectPromise = client.connect();
+    // Cancel by disconnecting again
+    client.disconnect();
+    await expect(connectPromise).rejects.toThrow();
+  });
+});
+
+// ---------------------------------------------------------------------------
+// Regression tests for P1/P2 race fixes
+// ---------------------------------------------------------------------------
+
+describe('CollabRoomClient — auth.accepted does not advance local seq (P1 replay safety)', () => {
+  test('accepted.seq > 0 does not update seq until replay snapshot/event applies', async () => {
+    const roomSecret = generateRoomSecret();
+    const { authKey, eventKey, presenceKey } = await deriveRoomKeys(roomSecret);
+    const roomVerifier = await computeRoomVerifier(authKey, ROOM_ID);
+
+    let capturedWs: MockWebSocket | null = null;
+    const WebSocketImpl = class extends MockWebSocket {
+      constructor(url: string | URL, protocols?: string | string[]) {
+        super(url, protocols);
+        capturedWs = this;
+      }
+    } as unknown as typeof WebSocket;
+
+    const client = new CollabRoomClient({
+      roomId: ROOM_ID,
+      baseUrl: 'http://localhost:8787',
+      eventKey,
+      presenceKey,
+      adminKey: null,
+      roomVerifier,
+      adminVerifier: null,
+      user: USER,
+      webSocketImpl: WebSocketImpl,
+      connectTimeoutMs: 2000,
+    });
+
+    const connectPromise = client.connect();
+    await new Promise<void>((r) => { const c = () => capturedWs ? r() : queueMicrotask(c); c(); });
+    await new Promise(r => queueMicrotask(r));
+    await new Promise(r => queueMicrotask(r));
+    const ws = capturedWs!;
+
+    const challenge = makeAuthChallenge();
+    ws.peer.sendFromServer(JSON.stringify(challenge));
+    await ws.peer.expectFromClient();
+
+    // Server claims seq: 42 in auth.accepted (replay incoming)
+    const accepted: AuthAccepted = {
+      type: 'auth.accepted',
+      seq: 42, snapshotSeq: 40, snapshotAvailable: true,
+    };
+    ws.peer.sendFromServer(JSON.stringify(accepted));
+    await connectPromise;
+
+    // Crucially: BEFORE any snapshot/event arrives, seq must still be 0.
+    expect(client.getState().seq).toBe(0);
+
+    // Now simulate the server delivering the snapshot — only THEN does seq move.
+    const snapshot: RoomSnapshot = { versionId: 'v1', planMarkdown: '# Plan', annotations: [] };
+    const snapshotCiphertext = await encryptSnapshot(eventKey, snapshot);
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.snapshot', snapshotSeq: 40, snapshotCiphertext,
+    }));
+    await new Promise(r => setTimeout(r, 10));
+    expect(client.getState().seq).toBe(40);
+
+    // And a replayed event after the snapshot advances seq further — proving
+    // the "last server seq consumed" contract holds on the event path too.
+    const replayedAnn: RoomAnnotation = {
+      id: 'replay-1',
+      blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'x', createdA: 1,
+    };
+    const replayCipher = await encryptEventOp(eventKey, { type: 'annotation.add', annotations: [replayedAnn] });
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 42, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'replay-op-1', channel: 'event', ciphertext: replayCipher },
+    }));
+    await new Promise(r => setTimeout(r, 10));
+    expect(client.getState().seq).toBe(42);
+    expect(client.getState().annotations.map(a => a.id)).toContain('replay-1');
+
+    client.disconnect();
+  });
+});
+
+describe('CollabRoomClient — disconnect during pending auth (P2)', () => {
+  test('ends in closed, not disconnected', async () => {
+    const roomSecret = generateRoomSecret();
+    const { authKey, eventKey, presenceKey } = await deriveRoomKeys(roomSecret);
+    const roomVerifier = await computeRoomVerifier(authKey, ROOM_ID);
+
+    let capturedWs: MockWebSocket | null = null;
+    const WebSocketImpl = class extends MockWebSocket {
+      constructor(url: string | URL, protocols?: string | string[]) {
+        super(url, protocols);
+        capturedWs = this;
+      }
+    } as unknown as typeof WebSocket;
+
+    const client = new CollabRoomClient({
+      roomId: ROOM_ID,
+      baseUrl: 'http://localhost:8787',
+      eventKey,
+      presenceKey,
+      adminKey: null,
+      roomVerifier,
+      adminVerifier: null,
+      user: USER,
+      webSocketImpl: WebSocketImpl,
+      connectTimeoutMs: 5000,
+    });
+
+    const connectPromise = client.connect();
+    await new Promise<void>((r) => { const c = () => capturedWs ? r() : queueMicrotask(c); c(); });
+    await new Promise(r => queueMicrotask(r));
+    await new Promise(r => queueMicrotask(r));
+
+    // Do NOT complete auth. User calls disconnect() while pendingConnect is live.
+    client.disconnect();
+    await expect(connectPromise).rejects.toThrow();
+
+    // Must be 'closed' (terminal), NOT 'disconnected' — the pending-connect
+    // close branch must respect userDisconnected.
+    expect(client.getState().connectionStatus).toBe('closed');
+  });
+});
+
+describe('CollabRoomClient — sendOp send() throw does not mutate state (P2)', () => {
+  test('synchronous ws.send throw propagates, leaves local state clean, next send works', async () => {
+    const { client, ws } = await setup();
+
+    const sendMock = ws.send.bind(ws);
+    let shouldThrow = true;
+    ws.send = (data: string | ArrayBufferLike | Blob | ArrayBufferView) => {
+      if (shouldThrow) { shouldThrow = false; throw new Error('simulated send failure'); }
+      return sendMock(data);
+    };
+
+    const ann: RoomAnnotation = {
+      id: 'send-fail-1',
+      blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'x', createdA: 1,
+    };
+    const before = client.getState().annotations.length;
+    await expect(client.sendAnnotationAdd([ann])).rejects.toThrow('simulated send failure');
+
+    // Local annotations untouched (V1 has no optimistic apply anyway).
+    expect(client.getState().annotations.length).toBe(before);
+
+    // Subsequent successful send + echo works — no lingering state blocks it.
+    const ann2: RoomAnnotation = {
+      id: 'send-ok-1',
+      blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'y', createdA: 2,
+    };
+    await client.sendAnnotationAdd([ann2]);
+    const sent = await ws.peer.expectFromClient();
+    const env = JSON.parse(sent) as ServerEnvelope;
+
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 1, receivedAt: Date.now(), envelope: env,
+    }));
+    await new Promise(r => setTimeout(r, 10));
+    expect(client.getState().annotations.filter(a => a.id === 'send-ok-1').length).toBe(1);
+
+    client.disconnect();
+  });
+});
+
+async function waitFor(cond: () => boolean, timeoutMs: number): Promise<void> {
+  const start = Date.now();
+  while (!cond()) {
+    if (Date.now() - start > timeoutMs) throw new Error(`waitFor timed out after ${timeoutMs}ms`);
+    await new Promise(r => setTimeout(r, 5));
+  }
+}
+
+describe('CollabRoomClient — auth proof handler handles mid-await rotation (P2)', () => {
+  test('each socket only ever receives auth.response bound to its own challengeId', async () => {
+    // This test pins the invariant that `auth.response` is never sent to a
+    // different socket than the one that issued the challenge. It cannot
+    // deterministically force the specific race where `computeAuthProof`
+    // resolves after a socket rotation without patching Web Crypto internals
+    // (bun's AES-GCM is microtask-fast, rotation happens on a 10ms timer).
+    // What it DOES pin: the guard's observable property — no cross-talk of
+    // auth.response challengeIds between rotated sockets.
+    const constructed: MockWebSocket[] = [];
+    const WebSocketImpl = class extends MockWebSocket {
+      constructor(url: string | URL, protocols?: string | string[]) {
+        super(url, protocols);
+        constructed.push(this);
+      }
+    } as unknown as typeof WebSocket;
+
+    const roomSecret = generateRoomSecret();
+    const { authKey, eventKey, presenceKey } = await deriveRoomKeys(roomSecret);
+    const roomVerifier = await computeRoomVerifier(authKey, ROOM_ID);
+
+    const client = new CollabRoomClient({
+      roomId: ROOM_ID,
+      baseUrl: 'http://localhost:8787',
+      eventKey,
+      presenceKey,
+      adminKey: null,
+      roomVerifier,
+      adminVerifier: null,
+      user: USER,
+      webSocketImpl: WebSocketImpl,
+      connectTimeoutMs: 2000,
+      reconnect: { maxAttempts: 5, initialDelayMs: 10, maxDelayMs: 20 },
+    });
+
+    // First handshake completes.
+    const connectPromise = client.connect();
+    await waitFor(() => constructed.length >= 1, 1000);
+    await new Promise(r => queueMicrotask(r));
+    await new Promise(r => queueMicrotask(r));
+    const firstWs = constructed[0];
+
+    const firstChallengeId = generateChallengeId();
+    firstWs.peer.sendFromServer(JSON.stringify(makeAuthChallenge({ challengeId: firstChallengeId })));
+    await firstWs.peer.expectFromClient();
+    firstWs.peer.sendFromServer(JSON.stringify({
+      type: 'auth.accepted',
+      seq: 0, snapshotSeq: 0, snapshotAvailable: false,
+    }));
+    await connectPromise;
+
+    // Rotate to a second socket via post-auth close.
+    firstWs.peer.simulateClose(1006, 'network hiccup');
+    await waitFor(() => constructed.length >= 2, 2000);
+    const secondWs = constructed[1];
+    await new Promise(r => queueMicrotask(r));
+    await new Promise(r => queueMicrotask(r));
+
+    // Fire challenge + close mid-handshake to force a rotation attempt.
+    const secondChallengeId = generateChallengeId();
+    secondWs.peer.sendFromServer(JSON.stringify(makeAuthChallenge({ challengeId: secondChallengeId })));
+    secondWs.peer.simulateClose(1006, 'rotate mid-handshake');
+
+    await waitFor(() => constructed.length >= 3, 2000);
+    const thirdWs = constructed[2];
+    await new Promise(r => queueMicrotask(r));
+    await new Promise(r => queueMicrotask(r));
+    await new Promise(r => setTimeout(r, 30));
+
+    const thirdChallengeId = generateChallengeId();
+    thirdWs.peer.sendFromServer(JSON.stringify(makeAuthChallenge({ challengeId: thirdChallengeId })));
+    await new Promise(r => setTimeout(r, 30));
+
+    // Collect auth.response messages per socket and check each one only saw
+    // responses for its OWN challengeId (or none, if it rotated before resolving).
+    const responsesFor = (ws: MockWebSocket) => ws.peer.sent
+      .map(s => { try { return JSON.parse(s) as { type?: string; challengeId?: string }; } catch { return null; } })
+      .filter((m): m is { type: string; challengeId: string } => m?.type === 'auth.response');
+
+    const firstResponses = responsesFor(firstWs);
+    const secondResponses = responsesFor(secondWs);
+    const thirdResponses = responsesFor(thirdWs);
+
+    // First socket: only firstChallengeId
+    expect(firstResponses.every(r => r.challengeId === firstChallengeId)).toBe(true);
+    // Second socket: only secondChallengeId (if any — proof may have resolved after rotation and been dropped)
+    expect(secondResponses.every(r => r.challengeId === secondChallengeId)).toBe(true);
+    // Third socket: only thirdChallengeId — crucially NOT secondChallengeId
+    expect(thirdResponses.every(r => r.challengeId === thirdChallengeId)).toBe(true);
+    expect(thirdResponses.some(r => r.challengeId === secondChallengeId)).toBe(false);
+    expect(thirdResponses.some(r => r.challengeId === firstChallengeId)).toBe(false);
+
+    client.disconnect();
+  });
+});
+
+// ---------------------------------------------------------------------------
+// Regression tests for the latest review round
+// ---------------------------------------------------------------------------
+
+describe('CollabRoomClient — presence shape validation (P2)', () => {
+  test('malformed presence payload is rejected with presence_malformed error and not stored', async () => {
+    const { client, ws, presenceKey } = await setup();
+
+    const errors: { code: string; message: string }[] = [];
+    client.on('error', (e) => errors.push(e));
+
+    // Encrypt a payload that decrypts to something that is NOT a valid PresenceState.
+    // Use the presence crypto path (encryptPresence accepts an object) with a
+    // garbage object that is valid encrypted JSON but wrong shape.
+    const malformed = { user: { id: 'x', name: 42 /* not a string */, color: '#f00' }, cursor: null };
+    // encryptPresence is typed to take PresenceState; cast to bypass for this adversarial test.
+    const ciphertext = await encryptPresence(presenceKey, malformed as unknown as import('../types').PresenceState);
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.presence',
+      envelope: { clientId: 'attacker', opId: 'p1', channel: 'presence', ciphertext },
+    }));
+    await new Promise(r => setTimeout(r, 10));
+
+    expect(errors.some(e => e.code === 'presence_malformed')).toBe(true);
+    expect(client.getState().remotePresence.attacker).toBeUndefined();
+    // lastError must reflect the malformed presence so hook consumers see it.
+    expect(client.getState().lastError?.code).toBe('presence_malformed');
+    client.disconnect();
+  });
+
+  test('valid presence payload is stored and emitted', async () => {
+    const { client, ws, presenceKey } = await setup();
+
+    const valid = {
+      user: { id: 'u2', name: 'bob', color: '#0f0' },
+      cursor: { x: 10, y: 20, coordinateSpace: 'document' as const },
+    };
+    const ciphertext = await encryptPresence(presenceKey, valid);
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.presence',
+      envelope: { clientId: 'friend', opId: 'p2', channel: 'presence', ciphertext },
+    }));
+    await new Promise(r => setTimeout(r, 10));
+
+    expect(client.getState().remotePresence.friend).toEqual(valid);
+    client.disconnect();
+  });
+});
+
+describe('CollabRoomClient — snapshot is authoritative baseline (P2)', () => {
+  test('snapshotSeq overrides this.seq even when snapshotSeq < this.seq', async () => {
+    const { client, ws, eventKey } = await setup();
+
+    // Drive seq up with an incoming event.
+    const ann: RoomAnnotation = {
+      id: 'e-1', blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'x', createdA: 1,
+    };
+    const cipher = await encryptEventOp(eventKey, { type: 'annotation.add', annotations: [ann] });
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 10, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'o1', channel: 'event', ciphertext: cipher },
+    }));
+    await waitFor(() => client.getState().seq === 10, 1000);
+
+    // Now the server delivers a snapshot with snapshotSeq=5 (LOWER than local seq).
+    // This simulates the "future claim" fallback where the server's view diverges
+    // from the client's. The snapshot must replace seq unconditionally so future
+    // reconnects don't keep sending the stale higher lastSeq.
+    const snap: RoomSnapshot = { versionId: 'v1', planMarkdown: '# Recovered', annotations: [] };
+    const snapCipher = await encryptSnapshot(eventKey, snap);
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.snapshot', snapshotSeq: 5, snapshotCiphertext: snapCipher,
+    }));
+    await waitFor(() => client.getState().planMarkdown === '# Recovered', 1000);
+
+    expect(client.getState().seq).toBe(5);
+    client.disconnect();
+  });
+});
+
+describe('CollabRoomClient — stale-seq and baseline-invalid guards (P2)', () => {
+  test('stale event (seq <= this.seq) is dropped — no decrypt, no state change, no event emission', async () => {
+    const { client, ws, eventKey } = await setup();
+
+    // Drive seq to 5 with a valid event.
+    const ann: RoomAnnotation = {
+      id: 'guard-1', blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'x', createdA: 1,
+    };
+    const cipher = await encryptEventOp(eventKey, { type: 'annotation.add', annotations: [ann] });
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 5, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'o1', channel: 'event', ciphertext: cipher },
+    }));
+    await waitFor(() => client.getState().seq === 5, 1000);
+    const snapBefore = client.getState();
+    expect(snapBefore.annotations.length).toBe(1);
+
+    // Replay the SAME event (seq 5) — must be dropped entirely.
+    let eventEmissions = 0;
+    client.on('event', () => { eventEmissions++; });
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 5, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'o1-dup', channel: 'event', ciphertext: cipher },
+    }));
+    await new Promise(r => setTimeout(r, 20));
+    expect(eventEmissions).toBe(0);
+    expect(client.getState().seq).toBe(5);
+    expect(client.getState().annotations.length).toBe(1);
+
+    client.disconnect();
+  });
+
+  test('malformed snapshot blocks subsequent event application (baseline invalid)', async () => {
+    const { client, ws, eventKey } = await setup();
+
+    // Deliver a malformed snapshot.
+    const badSnap = { versionId: 'v99', planMarkdown: 'bad', annotations: [] };
+    const badSnapCipher = await encryptSnapshot(eventKey, badSnap as unknown as RoomSnapshot);
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.snapshot', snapshotSeq: 10, snapshotCiphertext: badSnapCipher,
+    }));
+    await waitFor(() => client.getState().lastError?.code === 'snapshot_malformed', 1000);
+    const annsBefore = client.getState().annotations.length;
+
+    // Now a valid event at seq 11 — must NOT apply (baseline is invalid).
+    const ann: RoomAnnotation = {
+      id: 'post-bad-snap', blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'y', createdA: 1,
+    };
+    const cipher = await encryptEventOp(eventKey, { type: 'annotation.add', annotations: [ann] });
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 11, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'o2', channel: 'event', ciphertext: cipher },
+    }));
+    await waitFor(() => client.getState().seq === 11, 1000);
+    // seq advanced for forward-progress, annotations untouched.
+    expect(client.getState().annotations.length).toBe(annsBefore);
+    expect(client.getState().annotations.find(a => a.id === 'post-bad-snap')).toBeUndefined();
+
+    // Delivering a VALID snapshot clears baseline-invalid; subsequent events apply.
+    const goodSnap: RoomSnapshot = {
+      versionId: 'v1',
+      planMarkdown: '# Recovered',
+      annotations: [],
+    };
+    const goodSnapCipher = await encryptSnapshot(eventKey, goodSnap);
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.snapshot', snapshotSeq: 20, snapshotCiphertext: goodSnapCipher,
+    }));
+    await waitFor(() => client.getState().planMarkdown === '# Recovered', 1000);
+
+    const ann2: RoomAnnotation = {
+      id: 'post-good-snap', blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'z', createdA: 1,
+    };
+    const cipher2 = await encryptEventOp(eventKey, { type: 'annotation.add', annotations: [ann2] });
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 21, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'o3', channel: 'event', ciphertext: cipher2 },
+    }));
+    await waitFor(() =>
+      client.getState().annotations.some(a => a.id === 'post-good-snap'),
+      1000,
+    );
+
+    client.disconnect();
+  });
+
+  test('baselineInvalid persists across reconnect: lastSeq omitted, events blocked until valid snapshot', async () => {
+    // 1. Authenticate socket A and consume a valid event to drive seq to 1.
+    const roomSecret = generateRoomSecret();
+    const { authKey, eventKey, presenceKey } = await deriveRoomKeys(roomSecret);
+    const roomVerifier = await computeRoomVerifier(authKey, ROOM_ID);
+
+    const constructed: MockWebSocket[] = [];
+    const WebSocketImpl = class extends MockWebSocket {
+      constructor(url: string | URL, protocols?: string | string[]) {
+        super(url, protocols);
+        constructed.push(this);
+      }
+    } as unknown as typeof WebSocket;
+
+    const client = new CollabRoomClient({
+      roomId: ROOM_ID,
+      baseUrl: 'http://localhost:8787',
+      eventKey,
+      presenceKey,
+      adminKey: null,
+      roomVerifier,
+      adminVerifier: null,
+      user: USER,
+      webSocketImpl: WebSocketImpl,
+      connectTimeoutMs: 2000,
+      reconnect: { maxAttempts: 5, initialDelayMs: 10, maxDelayMs: 20 },
+    });
+
+    const connectPromise = client.connect();
+    await waitFor(() => constructed.length >= 1, 1000);
+    await new Promise(r => queueMicrotask(r));
+    await new Promise(r => queueMicrotask(r));
+    const wsA = constructed[0];
+    wsA.peer.sendFromServer(JSON.stringify(makeAuthChallenge()));
+    await wsA.peer.expectFromClient();
+    wsA.peer.sendFromServer(JSON.stringify({
+      type: 'auth.accepted',
+      seq: 0, snapshotSeq: 0, snapshotAvailable: false,
+    }));
+    await connectPromise;
+
+    // Drive seq to 10 with a malformed snapshot (baselineInvalid = true).
+    const badSnap = { versionId: 'v99', planMarkdown: 'bad', annotations: [] };
+    const badSnapCipher = await encryptSnapshot(eventKey, badSnap as unknown as RoomSnapshot);
+    wsA.peer.sendFromServer(JSON.stringify({
+      type: 'room.snapshot', snapshotSeq: 10, snapshotCiphertext: badSnapCipher,
+    }));
+    await waitFor(() => client.getState().lastError?.code === 'snapshot_malformed', 1000);
+
+    // Deliver a post-snapshot event; it must NOT apply but SEQ must advance.
+    const blockedAnn: RoomAnnotation = {
+      id: 'blocked', blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'should-not-show', createdA: 1,
+    };
+    const blockedCipher = await encryptEventOp(eventKey, { type: 'annotation.add', annotations: [blockedAnn] });
+    wsA.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 11, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'b1', channel: 'event', ciphertext: blockedCipher },
+    }));
+    await waitFor(() => client.getState().seq === 11, 1000);
+    expect(client.getState().annotations.find(a => a.id === 'blocked')).toBeUndefined();
+
+    // 2. Force a reconnect. The new socket's auth.response MUST omit lastSeq
+    //    because baselineInvalid is true — otherwise the server might skip
+    //    snapshot replay and leave us stale forever.
+    wsA.peer.simulateClose(1006, 'reconnect drill');
+    await waitFor(() => constructed.length >= 2, 2000);
+    const wsB = constructed[1];
+    await new Promise(r => queueMicrotask(r));
+    await new Promise(r => queueMicrotask(r));
+
+    wsB.peer.sendFromServer(JSON.stringify(makeAuthChallenge()));
+    const authResponseMsg = await wsB.peer.expectFromClient();
+    const authResp = JSON.parse(authResponseMsg) as { lastSeq?: number };
+    expect(authResp.lastSeq).toBeUndefined();
+
+    wsB.peer.sendFromServer(JSON.stringify({
+      type: 'auth.accepted',
+      seq: 11, snapshotSeq: 11, snapshotAvailable: true,
+    }));
+    // auth.accepted alone must NOT clear baselineInvalid — only a valid
+    // snapshot apply does. Prove by delivering another event BEFORE the
+    // snapshot: it must still not apply.
+    await new Promise(r => setTimeout(r, 20));
+    const stillBlockedAnn: RoomAnnotation = {
+      id: 'still-blocked', blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'still-should-not-show', createdA: 1,
+    };
+    const stillBlockedCipher = await encryptEventOp(eventKey, { type: 'annotation.add', annotations: [stillBlockedAnn] });
+    wsB.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 12, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'b2', channel: 'event', ciphertext: stillBlockedCipher },
+    }));
+    await waitFor(() => client.getState().seq === 12, 1000);
+    expect(client.getState().annotations.find(a => a.id === 'still-blocked')).toBeUndefined();
+
+    // 3. Valid snapshot arrives and clears baselineInvalid — subsequent
+    //    events apply.
+    const goodSnap: RoomSnapshot = {
+      versionId: 'v1',
+      planMarkdown: '# Recovered',
+      annotations: [],
+    };
+    const goodSnapCipher = await encryptSnapshot(eventKey, goodSnap);
+    wsB.peer.sendFromServer(JSON.stringify({
+      type: 'room.snapshot', snapshotSeq: 20, snapshotCiphertext: goodSnapCipher,
+    }));
+    await waitFor(() => client.getState().planMarkdown === '# Recovered', 1000);
+
+    const recoveredAnn: RoomAnnotation = {
+      id: 'recovered', blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'ok', createdA: 1,
+    };
+    const recoveredCipher = await encryptEventOp(eventKey, { type: 'annotation.add', annotations: [recoveredAnn] });
+    wsB.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 21, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'r1', channel: 'event', ciphertext: recoveredCipher },
+    }));
+    await waitFor(() =>
+      client.getState().annotations.some(a => a.id === 'recovered'),
+      1000,
+    );
+
+    client.disconnect();
+  });
+
+  test('reducer-rejected update (merged-annotation invalid) advances seq without mutating state or emitting event', async () => {
+    const { client, ws, eventKey } = await setup();
+
+    // Seed a COMMENT with a valid non-empty blockId.
+    const seed: RoomAnnotation = {
+      id: 'reducer-seed', blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'x', createdA: 1,
+    };
+    const seedCipher = await encryptEventOp(eventKey, { type: 'annotation.add', annotations: [seed] });
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 1, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'seed', channel: 'event', ciphertext: seedCipher },
+    }));
+    await waitFor(() => client.getState().annotations.length === 1, 1000);
+    const stored = client.getState().annotations[0];
+
+    // Patch passes op-level validation (blockId is a string per field rules)
+    // but the merged final annotation violates the cross-field invariant
+    // (COMMENT must have non-empty blockId). The reducer should reject.
+    let eventEmissions = 0;
+    client.on('event', () => { eventEmissions++; });
+
+    const badPatch = { type: 'annotation.update', id: 'reducer-seed', patch: { blockId: '' } };
+    const badCipher = await encryptEventOp(eventKey, badPatch as unknown as import('../types').RoomEventClientOp);
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 2, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'bad-patch', channel: 'event', ciphertext: badCipher },
+    }));
+    await waitFor(() => client.getState().seq === 2, 1000);
+
+    // seq advanced for forward-progress, annotation untouched, lastError set,
+    // no `event` emitted.
+    const after = client.getState().annotations[0];
+    expect(after.blockId).toBe(stored.blockId);
+    expect(client.getState().lastError?.code).toBe('event_rejected_by_reducer');
+    expect(eventEmissions).toBe(0);
+
+    client.disconnect();
+  });
+
+  test('outbound event payload is cloned before encryption — caller mutations cannot alter the wire op', async () => {
+    const { client, ws, eventKey } = await setup();
+
+    const ann: RoomAnnotation = {
+      id: 'clone-1', blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'original', createdA: 1,
+    };
+    const anns = [ann];
+
+    // Synchronously kick off the send, THEN mutate the caller's arrays before
+    // the encryption queue has had a chance to run.
+    const sendPromise = client.sendAnnotationAdd(anns);
+    ann.originalText = 'MUTATED';
+    anns.push({ ...ann, id: 'injected' });
+    await sendPromise;
+
+    const sent = JSON.parse(await ws.peer.expectFromClient()) as ServerEnvelope;
+    const decrypted = await decryptEventPayload(eventKey, sent.ciphertext) as { type: string; annotations: RoomAnnotation[] };
+    expect(decrypted.type).toBe('annotation.add');
+    expect(decrypted.annotations).toHaveLength(1);  // injected push did NOT affect wire
+    expect(decrypted.annotations[0].id).toBe('clone-1');
+    expect(decrypted.annotations[0].originalText).toBe('original');
+
+    client.disconnect();
+  });
+});
+
+describe('CollabRoomClient — event/snapshot shape validation (P2)', () => {
+  test('malformed RoomClientOp is rejected via event_malformed error, does not enter state', async () => {
+    const { client, ws, eventKey } = await setup();
+
+    const errors: { code: string; message: string }[] = [];
+    client.on('error', (e) => errors.push(e));
+
+    // A participant holds the eventKey but ships a structurally bad annotation.
+    const malformed = {
+      type: 'annotation.add',
+      annotations: [{ id: null, blockId: 'b', type: null, originalText: null, startOffset: 0, endOffset: 0, createdA: 0 }],
+    };
+    const ciphertext = await encryptEventOp(eventKey, malformed as unknown as import('../types').RoomEventClientOp);
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 1, receivedAt: Date.now(),
+      envelope: { clientId: 'attacker', opId: 'o1', channel: 'event', ciphertext },
+    }));
+    await new Promise(r => setTimeout(r, 20));
+
+    expect(errors.some(e => e.code === 'event_malformed')).toBe(true);
+    expect(client.getState().annotations.length).toBe(0);
+    // V1 forward-progress: seq MUST advance even though the event was rejected.
+    // If it didn't, reconnect lastSeq would keep replaying the malformed event
+    // forever and block every valid event behind it.
+    expect(client.getState().seq).toBe(1);
+    // Event errors must also surface via state.lastError for hook consumers.
+    expect(client.getState().lastError?.code).toBe('event_malformed');
+    client.disconnect();
+  });
+
+  test('inbound presence.update on event channel is rejected (event/presence split)', async () => {
+    const { client, ws, eventKey } = await setup();
+    const errors: { code: string; message: string }[] = [];
+    client.on('error', (e) => errors.push(e));
+
+    // A participant with the eventKey encrypts a presence.update as if it
+    // were an event-channel op. The narrow event validator must reject it so
+    // presence traffic cannot pollute the durable event log.
+    const presenceOnEvent = {
+      type: 'presence.update',
+      presence: {
+        user: { id: 'u', name: 'x', color: '#f00' },
+        cursor: null,
+      },
+    };
+    const ciphertext = await encryptEventOp(eventKey, presenceOnEvent as unknown as import('../types').RoomEventClientOp);
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 1, receivedAt: Date.now(),
+      envelope: { clientId: 'attacker', opId: 'sneaky', channel: 'event', ciphertext },
+    }));
+    await waitFor(() => client.getState().seq === 1, 1000);
+
+    expect(errors.some(e => e.code === 'event_malformed')).toBe(true);
+    expect(client.getState().annotations.length).toBe(0);
+    client.disconnect();
+  });
+
+  test('malformed event at seq=N does not block valid events at seq>N (forward-progress)', async () => {
+    const { client, ws, eventKey } = await setup();
+
+    // Ship a malformed event at seq=1.
+    const malformed = {
+      type: 'annotation.add',
+      annotations: [{ id: null, blockId: 'b', type: null, originalText: null, startOffset: 0, endOffset: 0, createdA: 0 }],
+    };
+    const badCipher = await encryptEventOp(eventKey, malformed as unknown as import('../types').RoomEventClientOp);
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 1, receivedAt: Date.now(),
+      envelope: { clientId: 'attacker', opId: 'bad', channel: 'event', ciphertext: badCipher },
+    }));
+    await waitFor(() => client.getState().seq === 1, 1000);
+
+    // Ship a valid event at seq=2. It must apply — replay-stream is not poisoned.
+    const goodAnn: RoomAnnotation = {
+      id: 'after-bad',
+      blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'y', createdA: 2,
+    };
+    const goodCipher = await encryptEventOp(eventKey, { type: 'annotation.add', annotations: [goodAnn] });
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 2, receivedAt: Date.now(),
+      envelope: { clientId: 'friend', opId: 'good', channel: 'event', ciphertext: goodCipher },
+    }));
+    await waitFor(() => client.getState().seq === 2, 1000);
+
+    const ids = client.getState().annotations.map(a => a.id);
+    expect(ids).toContain('after-bad');
+    client.disconnect();
+  });
+
+  test('malformed annotation.update patch is rejected (does not corrupt existing annotations)', async () => {
+    const { client, ws, eventKey } = await setup();
+
+    // Seed a real annotation first.
+    const ann: RoomAnnotation = {
+      id: 'real-1',
+      blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'x', createdA: 1,
+    };
+    const addCipher = await encryptEventOp(eventKey, { type: 'annotation.add', annotations: [ann] });
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 1, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'a1', channel: 'event', ciphertext: addCipher },
+    }));
+    await waitFor(() => client.getState().annotations.length === 1, 1000);
+
+    // Malicious update with patch that tries to set type=null (not a valid enum).
+    const malformedPatch = {
+      type: 'annotation.update',
+      id: 'real-1',
+      patch: { type: null, originalText: 42 },
+    };
+    const ciphertext = await encryptEventOp(eventKey, malformedPatch as unknown as import('../types').RoomEventClientOp);
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 2, receivedAt: Date.now(),
+      envelope: { clientId: 'attacker', opId: 'u1', channel: 'event', ciphertext },
+    }));
+    await new Promise(r => setTimeout(r, 20));
+
+    // The existing annotation must be untouched.
+    const stillThere = client.getState().annotations.find(a => a.id === 'real-1');
+    expect(stillThere).toBeDefined();
+    expect(stillThere!.type).toBe('COMMENT');
+    expect(stillThere!.originalText).toBe('x');
+    client.disconnect();
+  });
+
+  test('annotation.update with mismatched id in patch is rejected (identity-mutation attack)', async () => {
+    const { client, ws, eventKey } = await setup();
+
+    // Seed a real annotation via a valid event.
+    const ann: RoomAnnotation = {
+      id: 'stable-id',
+      blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'x', createdA: 1,
+    };
+    const addCipher = await encryptEventOp(eventKey, { type: 'annotation.add', annotations: [ann] });
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 1, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'a1', channel: 'event', ciphertext: addCipher },
+    }));
+    await waitFor(() => client.getState().annotations.length === 1, 1000);
+
+    // Malicious update: patch tries to hijack the id to a new value.
+    // isRoomClientOp must reject this via isRoomAnnotationPatch — event_malformed emitted.
+    const errors: { code: string; message: string }[] = [];
+    client.on('error', (e) => errors.push(e));
+    const hijackPatch = {
+      type: 'annotation.update',
+      id: 'stable-id',
+      patch: { id: 'hijacked-id', text: 'pwned' },
+    };
+    const hijackCipher = await encryptEventOp(
+      eventKey,
+      hijackPatch as unknown as import('../types').RoomEventClientOp,
+    );
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 2, receivedAt: Date.now(),
+      envelope: { clientId: 'attacker', opId: 'hijack', channel: 'event', ciphertext: hijackCipher },
+    }));
+    await waitFor(() => client.getState().seq === 2, 1000);
+
+    expect(errors.some(e => e.code === 'event_malformed')).toBe(true);
+    const ids = client.getState().annotations.map(a => a.id);
+    expect(ids).toContain('stable-id');
+    expect(ids).not.toContain('hijacked-id');
+    // Also confirm no renaming happened under the hood — the annotation at key 'stable-id' is intact.
+    const stored = client.getState().annotations.find(a => a.id === 'stable-id')!;
+    expect(stored.originalText).toBe('x');
+    expect(stored.text).toBeUndefined();  // not patched with 'pwned'
+    client.disconnect();
+  });
+
+  test('malformed snapshot is rejected via snapshot_malformed error, does not corrupt state', async () => {
+    const { client, ws, eventKey } = await setup();
+
+    const errors: { code: string; message: string }[] = [];
+    client.on('error', (e) => errors.push(e));
+
+    // First seed a real annotation via event so we can assert state is unchanged.
+    const ann: RoomAnnotation = {
+      id: 'keep-me',
+      blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'x', createdA: 1,
+    };
+    const addCipher = await encryptEventOp(eventKey, { type: 'annotation.add', annotations: [ann] });
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 1, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'a1', channel: 'event', ciphertext: addCipher },
+    }));
+    await waitFor(() => client.getState().annotations.length === 1, 1000);
+
+    // Now a malformed snapshot: wrong versionId.
+    const malformedSnap = { versionId: 'v99', planMarkdown: 'corrupt', annotations: [] };
+    const snapCipher = await encryptSnapshot(eventKey, malformedSnap as unknown as RoomSnapshot);
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.snapshot', snapshotSeq: 99, snapshotCiphertext: snapCipher,
+    }));
+    await new Promise(r => setTimeout(r, 20));
+
+    expect(errors.some(e => e.code === 'snapshot_malformed')).toBe(true);
+    // Existing state preserved
+    expect(client.getState().annotations.length).toBe(1);
+    expect(client.getState().planMarkdown).toBe('# Plan');  // from setup()
+    // seq not advanced by rejected snapshot
+    expect(client.getState().seq).toBe(1);
+    // Snapshot errors must surface to `state` subscribers via lastError so
+    // hook consumers (which only subscribe to state) can react.
+    expect(client.getState().lastError?.code).toBe('snapshot_malformed');
+    client.disconnect();
+  });
+});
+
+describe('CollabRoomClient — terminal close sets roomUnavailable (P2)', () => {
+  test('close 4006 "Room unavailable" sets roomUnavailable=true and closes the connection', async () => {
+    const { client, ws } = await setup();
+    expect(client.getState().roomUnavailable).toBe(false);
+    ws.peer.simulateClose(4006, 'Room unavailable');
+    await new Promise(r => setTimeout(r, 10));
+    expect(client.getState().roomUnavailable).toBe(true);
+    expect(client.getState().connectionStatus).toBe('closed');
+  });
+
+  test('network drop (code 1006) does NOT set roomUnavailable', async () => {
+    const { client, ws } = await setup();
+    ws.peer.simulateClose(1006, '');
+    await new Promise(r => setTimeout(r, 10));
+    expect(client.getState().roomUnavailable).toBe(false);
+  });
+});
+
+describe('CollabRoomClient — deleteRoom socket-close semantics (P2)', () => {
+  test('deleteRoom rejects with AdminInterruptedError on network drop (not a delete close)', async () => {
+    const { client, ws } = await setup({ withAdmin: true });
+
+    const deletePromise = client.deleteRoom();
+    await ws.peer.expectFromClient();  // admin.challenge.request
+
+    const adminChallenge: AdminChallenge = {
+      type: 'admin.challenge', challengeId: generateChallengeId(),
+      nonce: generateNonce(), expiresAt: Date.now() + 30_000,
+    };
+    ws.peer.sendFromServer(JSON.stringify(adminChallenge));
+    await ws.peer.expectFromClient();  // admin.command
+
+    // Simulate a network drop — NOT the server's delete close.
+    // Code 1006, no reason. Must NOT be treated as successful delete.
+    ws.peer.simulateClose(1006, '');
+
+    await expect(deletePromise).rejects.toThrow(/interrupted/i);
+  });
+
+  test('deleteRoom resolves on server close (code 4006, "Room unavailable")', async () => {
+    const { client, ws } = await setup({ withAdmin: true });
+
+    const deletePromise = client.deleteRoom();
+    await ws.peer.expectFromClient();
+    const adminChallenge: AdminChallenge = {
+      type: 'admin.challenge', challengeId: generateChallengeId(),
+      nonce: generateNonce(), expiresAt: Date.now() + 30_000,
+    };
+    ws.peer.sendFromServer(JSON.stringify(adminChallenge));
+    await ws.peer.expectFromClient();
+
+    // Server's purge-initiated close — the single success signal.
+    ws.peer.simulateClose(4006, 'Room unavailable');
+
+    await deletePromise;
+    expect(client.getState().roomUnavailable).toBe(true);
+  });
+});
+
+describe('CollabRoomClient — stale socket handlers do not clobber current socket (P3)', () => {
+  // Helper: create a client + constructed-sockets array, with configurable reconnect.
+  async function makeClient(opts: { asyncClose?: boolean; reconnect?: { maxAttempts: number; initialDelayMs?: number; maxDelayMs?: number } } = {}) {
+    const prevAsyncMode = MockWebSocket.asyncCloseMode;
+    MockWebSocket.asyncCloseMode = opts.asyncClose ?? false;
+    const constructed: MockWebSocket[] = [];
+    const WebSocketImpl = class extends MockWebSocket {
+      constructor(url: string | URL, protocols?: string | string[]) {
+        super(url, protocols);
+        constructed.push(this);
+      }
+    } as unknown as typeof WebSocket;
+
+    const roomSecret = generateRoomSecret();
+    const { authKey, eventKey, presenceKey } = await deriveRoomKeys(roomSecret);
+    const roomVerifier = await computeRoomVerifier(authKey, ROOM_ID);
+
+    const client = new CollabRoomClient({
+      roomId: ROOM_ID,
+      baseUrl: 'http://localhost:8787',
+      eventKey,
+      presenceKey,
+      adminKey: null,
+      roomVerifier,
+      adminVerifier: null,
+      user: USER,
+      webSocketImpl: WebSocketImpl,
+      connectTimeoutMs: 5000,
+      reconnect: opts.reconnect ?? { maxAttempts: 0 },
+    });
+    return {
+      client, constructed,
+      restore: () => { MockWebSocket.asyncCloseMode = prevAsyncMode; },
+    };
+  }
+
+  async function completeAuth(ws: MockWebSocket, connectPromise: Promise<void>) {
+    await new Promise(r => queueMicrotask(r));
+    await new Promise(r => queueMicrotask(r));
+    ws.peer.sendFromServer(JSON.stringify(makeAuthChallenge()));
+    await ws.peer.expectFromClient();
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'auth.accepted',
+      seq: 0, snapshotSeq: 0, snapshotAvailable: false,
+    }));
+    await connectPromise;
+  }
+
+  test('auto-reconnect + explicit connect() during B: B is retired, C completes auth, late B events are ignored', async () => {
+    // Exact original-race reproduction — NO intervening disconnect():
+    //   1. Authenticate socket A.
+    //   2. Server closes A; auto-reconnect opens socket B.
+    //   3. Caller invokes connect() while B is still in flight.
+    //   4. connect() must rotate: retire B, open socket C.
+    //   5. Fire late onclose / onmessage on B — handlers must no-op, C must not be clobbered.
+    //   6. Complete auth on C — must succeed.
+    const { client, constructed, restore } = await makeClient({
+      reconnect: { maxAttempts: 5, initialDelayMs: 10, maxDelayMs: 20 },
+    });
+
+    try {
+      // 1) Authenticate on socket A.
+      const firstConnect = client.connect();
+      await waitFor(() => constructed.length >= 1, 1000);
+      const socketA = constructed[0];
+      await completeAuth(socketA, firstConnect);
+      expect(client.getState().connectionStatus).toBe('authenticated');
+
+      // 2) Server closes A. Auto-reconnect opens socket B (post-auth, so
+      //    pendingConnect is null and handleSocketClose schedules a reconnect).
+      socketA.peer.simulateClose(1006, 'network flap');
+      await waitFor(() => constructed.length >= 2, 1000);
+      const socketB = constructed[1];
+      // At this point B is the current socket; its handlers are bound; status
+      // should be reconnecting / connecting. pendingConnect is null because
+      // this is auto-reconnect, not initial-connect or explicit connect().
+
+      // 3) Caller invokes connect() DIRECTLY while B is live (no disconnect()).
+      //    This must open socket C and retire socket B.
+      const rotationConnect = client.connect();
+      await waitFor(() => constructed.length >= 3, 1000);
+      const socketC = constructed[2];
+      expect(socketC).not.toBe(socketB);
+
+      // B should be closed by retireSocket (the implementation calls
+      // ws.close() when it adds a socket to retiredSockets).
+      expect(socketB.readyState).toBe(socketB.CLOSED);
+
+      // 4) Fire a late onclose directly on the retired B — the handler
+      //    (bound to B when it was constructed) must short-circuit on the
+      //    retiredSockets check. If the guard is broken, this would re-enter
+      //    handleSocketClose and null out this.ws, orphaning C.
+      socketB.onclose?.(new CloseEvent('close', { code: 1006, reason: 'late B straggler', wasClean: false }));
+      // Also fire a late onmessage on B — must be gated out.
+      socketB.onmessage?.(new MessageEvent('message', { data: '{"type":"room.error","code":"stale","message":"from B"}' }));
+
+      // 5) Complete auth on socket C — if B had clobbered this.ws, this would hang.
+      await completeAuth(socketC, rotationConnect);
+      expect(client.getState().connectionStatus).toBe('authenticated');
+
+      client.disconnect();
+    } finally {
+      restore();
+    }
+  });
+
+  test('async-close mock: intentional disconnect rejects pendingConnect synchronously (does not wait for deferred onclose)', async () => {
+    // In real browsers ws.close() returns immediately and onclose fires in a
+    // later microtask. Previously the client relied on the synchronous onclose
+    // from closeSocket() to reject pendingConnect/pendingAdmin. Under true
+    // async-close semantics, that produced a hang until timeout. This test
+    // pins the fix: disconnect() rejects pendingConnect synchronously.
+    const { client, constructed, restore } = await makeClient({ asyncClose: true });
+
+    try {
+      const connectPromise = client.connect();
+      await waitFor(() => constructed.length === 1, 1000);
+      await new Promise(r => queueMicrotask(r));
+      await new Promise(r => queueMicrotask(r));
+
+      // Do NOT complete auth. Just disconnect while pendingConnect is live.
+      // Under the OLD implementation, this would hang until the 5000ms
+      // connectTimeout fired because the onclose that would reject was
+      // deferred as a microtask AND then gated away by `this.ws !== ws`.
+      // Under the fix, disconnect() rejects synchronously.
+      const start = Date.now();
+      client.disconnect();
+      await expect(connectPromise).rejects.toThrow();
+      const elapsed = Date.now() - start;
+      expect(elapsed).toBeLessThan(500);  // must not wait for 5s timeout
+      expect(client.getState().connectionStatus).toBe('closed');
+    } finally {
+      restore();
+    }
+  });
+
+  test('async-close mock: connect timeout rejects and transitions to disconnected even when onclose is deferred', async () => {
+    const { client, constructed, restore } = await makeClient({ asyncClose: true });
+
+    try {
+      // Reach into the instance to shorten the connect timeout for test speed.
+      // Construct a new client with a short timeout instead.
+      client.disconnect();
+      const roomSecret = generateRoomSecret();
+      const { authKey, eventKey, presenceKey } = await deriveRoomKeys(roomSecret);
+      const roomVerifier = await computeRoomVerifier(authKey, ROOM_ID);
+
+      const WebSocketImpl = class extends MockWebSocket {
+        constructor(url: string | URL, protocols?: string | string[]) {
+          super(url, protocols);
+          constructed.push(this);
+        }
+      } as unknown as typeof WebSocket;
+
+      const fastClient = new CollabRoomClient({
+        roomId: ROOM_ID,
+        baseUrl: 'http://localhost:8787',
+        eventKey,
+        presenceKey,
+        adminKey: null,
+        roomVerifier,
+        adminVerifier: null,
+        user: USER,
+        webSocketImpl: WebSocketImpl,
+        connectTimeoutMs: 50,  // trigger timeout path
+        reconnect: { maxAttempts: 0 },
+      });
+
+      const connectPromise = fastClient.connect();
+      await expect(connectPromise).rejects.toThrow(ConnectTimeoutError);
+
+      // Let the deferred onclose fire (from the timeout's closeSocket call).
+      await new Promise(r => setTimeout(r, 50));
+
+      // Critical assertions: the deferred onclose must not clobber the
+      // already-settled state. Status must be 'disconnected' (not mutated
+      // back by a late handleSocketClose).
+      expect(fastClient.getState().connectionStatus).toBe('disconnected');
+    } finally {
+      restore();
+    }
+  });
+});
+
+describe('CollabRoomClient — getState() returns immutable snapshot (P2)', () => {
+  test('mutating returned annotations / remotePresence does not affect internal state', async () => {
+    const { client, ws, eventKey, presenceKey } = await setup();
+
+    // Seed an annotation via server echo.
+    const ann: RoomAnnotation = {
+      id: 'imm-1',
+      blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'x', createdA: 1,
+      startMeta: { parentTagName: 'p', parentIndex: 0, textOffset: 0 },
+    };
+    const cipher = await encryptEventOp(eventKey, { type: 'annotation.add', annotations: [ann] });
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 1, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'a1', channel: 'event', ciphertext: cipher },
+    }));
+    await waitFor(() => client.getState().annotations.length === 1, 1000);
+
+    // Seed presence.
+    const presence = {
+      user: { id: 'u2', name: 'bob', color: '#0f0' },
+      cursor: { x: 10, y: 20, coordinateSpace: 'document' as const },
+    };
+    const pCipher = await encryptPresence(presenceKey, presence);
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.presence',
+      envelope: { clientId: 'friend', opId: 'p1', channel: 'presence', ciphertext: pCipher },
+    }));
+    await waitFor(() => client.getState().remotePresence.friend !== undefined, 1000);
+
+    // Seed a non-null lastError by pushing a room.error from the server.
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.error', code: 'validation_error', message: 'Test error message',
+    }));
+    await waitFor(() => client.getState().lastError !== null, 1000);
+
+    // Grab the snapshot and MUTATE the returned objects.
+    const snap1 = client.getState();
+    (snap1.annotations[0] as RoomAnnotation).originalText = 'MUTATED';
+    snap1.annotations[0].startMeta!.parentTagName = 'HIJACKED';
+    snap1.remotePresence.friend.user.name = 'MUTATED';
+    snap1.remotePresence.friend.cursor!.x = 9999;
+    snap1.annotations.push({ ...ann, id: 'injected' });
+    snap1.remotePresence.intruder = {
+      user: { id: 'x', name: 'x', color: '#000' },
+      cursor: null,
+    };
+    snap1.lastError!.message = 'MUTATED ERROR';
+
+    // Fresh snapshot must reflect internal state, not the mutations above.
+    const snap2 = client.getState();
+    expect(snap2.annotations.length).toBe(1);
+    expect(snap2.annotations[0].id).toBe('imm-1');
+    expect(snap2.annotations[0].originalText).toBe('x');
+    expect(snap2.annotations[0].startMeta!.parentTagName).toBe('p');
+    expect(snap2.remotePresence.friend.user.name).toBe('bob');
+    expect(snap2.remotePresence.friend.cursor!.x).toBe(10);
+    expect(snap2.remotePresence.intruder).toBeUndefined();
+    expect(snap2.lastError).not.toBeNull();
+    expect(snap2.lastError!.message).toBe('Test error message');
+    expect(snap2.lastError!.code).toBe('validation_error');
+
+    client.disconnect();
+  });
+
+});
+
+// NOTE: the auth-proof failure during auto-reconnect code path (handleAuthChallenge
+// catch branch when pendingConnect === null) is defensive and hard to exercise
+// deterministically without patching WebCrypto. It's covered by code review and the
+// existing initial-connect auth-failure path is tested above.
+
+describe('CollabRoomClient — auth.challenge missing clientId (P3 protocol violation)', () => {
+  test('initial-connect: rejects pendingConnect and transitions to disconnected (does not hang until timeout)', async () => {
+    const roomSecret = generateRoomSecret();
+    const { authKey, eventKey, presenceKey } = await deriveRoomKeys(roomSecret);
+    const roomVerifier = await computeRoomVerifier(authKey, ROOM_ID);
+
+    let capturedWs: MockWebSocket | null = null;
+    const WebSocketImpl = class extends MockWebSocket {
+      constructor(url: string | URL, protocols?: string | string[]) {
+        super(url, protocols);
+        capturedWs = this;
+      }
+    } as unknown as typeof WebSocket;
+
+    const client = new CollabRoomClient({
+      roomId: ROOM_ID,
+      baseUrl: 'http://localhost:8787',
+      eventKey,
+      presenceKey,
+      adminKey: null,
+      roomVerifier,
+      adminVerifier: null,
+      user: USER,
+      webSocketImpl: WebSocketImpl,
+      connectTimeoutMs: 5000,  // intentionally long — test must reject fast
+      reconnect: { maxAttempts: 0 },
+    });
+
+    const connectPromise = client.connect();
+    await waitFor(() => capturedWs !== null, 1000);
+    await new Promise(r => queueMicrotask(r));
+    await new Promise(r => queueMicrotask(r));
+
+    // Send a challenge WITHOUT clientId (simulates old server / malformed).
+    const ws = capturedWs!;
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'auth.challenge',
+      challengeId: generateChallengeId(),
+      nonce: generateNonce(),
+      expiresAt: Date.now() + 30_000,
+      // clientId: missing
+    }));
+
+    const start = Date.now();
+    await expect(connectPromise).rejects.toThrow();
+    const elapsed = Date.now() - start;
+    expect(elapsed).toBeLessThan(500);  // not waiting for connectTimeoutMs
+    expect(client.getState().connectionStatus).toBe('disconnected');
+  });
+});
+
+describe('CollabRoomClient — openSocket synchronous throw is cleaned up (P2)', () => {
+  test('synchronous WebSocket constructor throw: connect rejects, state returns to disconnected, next connect is not blocked', async () => {
+    const roomSecret = generateRoomSecret();
+    const { authKey, eventKey, presenceKey } = await deriveRoomKeys(roomSecret);
+    const roomVerifier = await computeRoomVerifier(authKey, ROOM_ID);
+
+    // First impl throws synchronously from the constructor. Second impl is
+    // a normal MockWebSocket so a follow-up connect() can actually proceed.
+    let attempt = 0;
+    const boom = new Error('WebSocket constructor exploded');
+    const capturedSockets: MockWebSocket[] = [];
+    const WebSocketImpl = class extends MockWebSocket {
+      constructor(url: string | URL, protocols?: string | string[]) {
+        attempt++;
+        if (attempt === 1) {
+          // Throw from the constructor so the `new this.WebSocketImpl(wsUrl)`
+          // expression in openSocket() fails before `this.ws = ws`.
+          super(url, protocols);
+          throw boom;
+        }
+        super(url, protocols);
+        capturedSockets.push(this);
+      }
+    } as unknown as typeof WebSocket;
+
+    const client = new CollabRoomClient({
+      roomId: ROOM_ID,
+      baseUrl: 'http://localhost:8787',
+      eventKey,
+      presenceKey,
+      adminKey: null,
+      roomVerifier,
+      adminVerifier: null,
+      user: USER,
+      webSocketImpl: WebSocketImpl,
+      connectTimeoutMs: 2000,
+      reconnect: { maxAttempts: 0 },
+    });
+
+    // First connect — constructor throws. Must reject quickly with the
+    // underlying error, not sit until connectTimeoutMs.
+    const start = Date.now();
+    await expect(client.connect()).rejects.toThrow('WebSocket constructor exploded');
+    expect(Date.now() - start).toBeLessThan(500);
+
+    // State must be disconnected — not stuck in 'connecting'.
+    expect(client.getState().connectionStatus).toBe('disconnected');
+
+    // A subsequent connect() must NOT be trapped behind stale pendingConnect
+    // state. Drive it to full auth to prove end-to-end that the pending state
+    // was cleaned up.
+    const secondConnect = client.connect();
+    await waitFor(() => capturedSockets.length === 1, 1000);
+    await new Promise(r => queueMicrotask(r));
+    await new Promise(r => queueMicrotask(r));
+
+    const ws = capturedSockets[0];
+    ws.peer.sendFromServer(JSON.stringify(makeAuthChallenge()));
+    await ws.peer.expectFromClient();
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'auth.accepted',
+      seq: 0, snapshotSeq: 0, snapshotAvailable: false,
+    }));
+    await secondConnect;
+    expect(client.getState().connectionStatus).toBe('authenticated');
+    client.disconnect();
+  });
+});
+
+describe('CollabRoomClient — outbound validation (P2)', () => {
+  // Helper: a rejected outbound validation must not push a new message onto the
+  // wire. setup() already drains the auth.response, so compare against baseline.
+  const assertNoNewSend = (ws: MockWebSocket, sentBefore: number) => {
+    expect(ws.peer.sent.length).toBe(sentBefore);
+  };
+
+  test('sendAnnotationAdd rejects annotation with images before encryption/send', async () => {
+    const { client, ws } = await setup();
+    const sentBefore = ws.peer.sent.length;
+    const bad = {
+      id: 'bad-1',
+      blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT' as const, originalText: 'x', createdA: 1,
+      // images is forbidden in V1 RoomAnnotation
+      images: [{ path: '/tmp/x', name: 'x.png' }],
+    } as unknown as RoomAnnotation;
+    await expect(client.sendAnnotationAdd([bad])).rejects.toThrow(InvalidOutboundPayloadError);
+    assertNoNewSend(ws, sentBefore);
+    client.disconnect();
+  });
+
+  test('sendAnnotationAdd rejects annotation with null id before send', async () => {
+    const { client, ws } = await setup();
+    const sentBefore = ws.peer.sent.length;
+    const bad = {
+      id: null,
+      blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'x', createdA: 1,
+    } as unknown as RoomAnnotation;
+    await expect(client.sendAnnotationAdd([bad])).rejects.toThrow(InvalidOutboundPayloadError);
+    assertNoNewSend(ws, sentBefore);
+    client.disconnect();
+  });
+
+  test('sendAnnotationUpdate rejects patch that tries to mutate id', async () => {
+    const { client, ws } = await setup();
+    const sentBefore = ws.peer.sent.length;
+    await expect(
+      client.sendAnnotationUpdate('some-id', { id: 'hijacked' } as Partial<RoomAnnotation>),
+    ).rejects.toThrow(InvalidOutboundPayloadError);
+    assertNoNewSend(ws, sentBefore);
+    client.disconnect();
+  });
+
+  test('sendAnnotationRemove rejects non-string / empty ids', async () => {
+    const { client, ws } = await setup();
+    const sentBefore = ws.peer.sent.length;
+    await expect(
+      client.sendAnnotationRemove(['valid-id', ''] as string[]),
+    ).rejects.toThrow(InvalidOutboundPayloadError);
+    assertNoNewSend(ws, sentBefore);
+    client.disconnect();
+  });
+
+  test('sendPresence rejects non-finite cursor coordinates', async () => {
+    const { client, ws } = await setup();
+    const sentBefore = ws.peer.sent.length;
+    const bad = {
+      user: { id: 'u', name: 'a', color: '#f00' },
+      cursor: { x: Infinity, y: 0, coordinateSpace: 'document' as const },
+    };
+    await expect(client.sendPresence(bad as never)).rejects.toThrow(InvalidOutboundPayloadError);
+    assertNoNewSend(ws, sentBefore);
+    client.disconnect();
+  });
+
+});
+
+describe('createRoom — success body is not parsed (P2)', () => {
+  test('resolves after 201 even when the response body is malformed JSON', async () => {
+    // Adversarial body covers the empty-body case too: createRoom must
+    // never attempt to parse the success body, regardless of content.
+    const { createRoom } = await import('./create-room');
+    const goodSnapshot = {
+      versionId: 'v1' as const,
+      planMarkdown: '# Plan',
+      annotations: [],
+    };
+    const fakeFetch: typeof fetch = async () => new Response('not-json{{{', { status: 201 });
+
+    const result = await createRoom({
+      baseUrl: 'http://localhost:8787',
+      initialSnapshot: goodSnapshot,
+      user: USER,
+      fetchImpl: fakeFetch,
+    });
+
+    expect(result.roomId).toBeTruthy();
+    expect(result.roomSecret).toBeTruthy();
+    expect(result.adminSecret).toBeTruthy();
+    expect(result.joinUrl).toContain(result.roomId);
+    expect(result.adminUrl).toContain(result.roomId);
+    expect(result.client).toBeDefined();
+  });
+});
+
+describe('createRoom — outbound validation (P2)', () => {
+  test('rejects malformed initialSnapshot before any fetch', async () => {
+    const { createRoom } = await import('./create-room');
+    let fetchCalls = 0;
+    const fakeFetch: typeof fetch = async () => {
+      fetchCalls++;
+      return new Response('{}', { status: 201 });
+    };
+    const bad = { versionId: 'v99', planMarkdown: 'x', annotations: [] } as unknown as RoomSnapshot;
+    await expect(createRoom({
+      baseUrl: 'http://localhost:8787',
+      initialSnapshot: bad,
+      user: USER,
+      fetchImpl: fakeFetch,
+    })).rejects.toThrow(InvalidOutboundPayloadError);
+    expect(fetchCalls).toBe(0);
+  });
+
+  test('rejects initialSnapshot containing malformed annotation', async () => {
+    const { createRoom } = await import('./create-room');
+    let fetchCalls = 0;
+    const fakeFetch: typeof fetch = async () => {
+      fetchCalls++;
+      return new Response('{}', { status: 201 });
+    };
+    const badAnn = {
+      id: 'x', blockId: 'b', startOffset: 0, endOffset: 0,
+      type: 'INVALID_TYPE', originalText: 'x', createdA: 1,
+    };
+    const bad = {
+      versionId: 'v1', planMarkdown: '', annotations: [badAnn],
+    } as unknown as RoomSnapshot;
+    await expect(createRoom({
+      baseUrl: 'http://localhost:8787',
+      initialSnapshot: bad,
+      user: USER,
+      fetchImpl: fakeFetch,
+    })).rejects.toThrow(InvalidOutboundPayloadError);
+    expect(fetchCalls).toBe(0);
+  });
+});
+
+describe('CollabRoomClient — runAdminCommand send() failure (P3)', () => {
+  test('synchronous send throw clears pendingAdmin; subsequent admin command works', async () => {
+    const { client, ws } = await setup({ withAdmin: true });
+
+    const sendMock = ws.send.bind(ws);
+    let shouldThrow = true;
+    ws.send = (data: string | ArrayBufferLike | Blob | ArrayBufferView) => {
+      if (shouldThrow) { shouldThrow = false; throw new Error('simulated admin send failure'); }
+      return sendMock(data);
+    };
+
+    await expect(client.deleteRoom()).rejects.toThrow('simulated admin send failure');
+
+    // pendingAdmin should be cleared — a fresh command must not report "Another admin command is pending".
+    // Drive a full successful delete now.
+    const deletePromise = client.deleteRoom();
+    await ws.peer.expectFromClient();  // admin.challenge.request
+
+    const adminChallenge: AdminChallenge = {
+      type: 'admin.challenge',
+      challengeId: generateChallengeId(),
+      nonce: generateNonce(),
+      expiresAt: Date.now() + 30_000,
+    };
+    ws.peer.sendFromServer(JSON.stringify(adminChallenge));
+    await ws.peer.expectFromClient();  // admin.command
+    ws.peer.simulateClose(4006, 'Room unavailable');
+    await deletePromise;
+  });
+});
+
+describe('CollabRoomClient — socket-generation guards drop stale queued messages', () => {
+  // These tests simulate a reconnect that rolls the socket while a queued
+  // snapshot or event is mid-flight. The guard check (gen !== socketGeneration)
+  // must cause the queued handler to return without mutating state. We bump
+  // socketGeneration synchronously between enqueue and queue drain to simulate
+  // a rotation deterministically — the natural race is hard to pin to a single
+  // microtask boundary, but the guard is the same code path either way.
+
+  test('queued room.event from retired socket does not mutate state after generation advances', async () => {
+    const { client, ws, eventKey } = await setup();
+
+    // Sanity: baseline is empty at seq=0.
+    expect(client.getState().annotations.length).toBe(0);
+    expect(client.getState().seq).toBe(0);
+
+    // Inject a valid annotation.add room.event — handleSocketMessage enqueues
+    // handleRoomEvent with the CURRENT socketGeneration captured.
+    const ann: RoomAnnotation = {
+      id: 'stale-ev-1',
+      blockId: 'b1', startOffset: 0, endOffset: 5,
+      type: 'COMMENT', originalText: 'x', createdA: 1,
+      startMeta: { parentTagName: 'p', parentIndex: 0, textOffset: 0 },
+    };
+    const cipher = await encryptEventOp(eventKey, { type: 'annotation.add', annotations: [ann] });
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 1, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'a1', channel: 'event', ciphertext: cipher },
+    }));
+
+    // Synchronously simulate a socket rotation: bump the generation counter
+    // before the queued handler's microtask runs. The next time the handler
+    // compares `gen !== this.socketGeneration`, it must short-circuit.
+    // eslint-disable-next-line @typescript-eslint/no-explicit-any
+    (client as any).socketGeneration = (client as any).socketGeneration + 1;
+
+    // Drain the message queue.
+    await new Promise(r => setTimeout(r, 20));
+
+    // State must be untouched — no annotation applied, seq not advanced.
+    expect(client.getState().annotations.length).toBe(0);
+    expect(client.getState().seq).toBe(0);
+    // lastError should not be a decrypt/shape error either — the handler
+    // short-circuited entirely.
+    expect(client.getState().lastError).toBeNull();
+
+    // After the stale drop, the newer socket must still accept valid events.
+    // Restore the counter so the next message's captured gen matches.
+    // eslint-disable-next-line @typescript-eslint/no-explicit-any
+    (client as any).socketGeneration = (client as any).socketGeneration - 1;
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 1, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'a2', channel: 'event', ciphertext: cipher },
+    }));
+    await new Promise(r => setTimeout(r, 20));
+    expect(client.getState().annotations.length).toBe(1);
+    expect(client.getState().seq).toBe(1);
+
+    client.disconnect();
+  });
+
+  test('queued room.snapshot from retired socket does not replace baseline after generation advances', async () => {
+    const { client, ws, eventKey } = await setup();
+
+    // Seed a single annotation so we can detect unwanted baseline replacement.
+    const seedAnn: RoomAnnotation = {
+      id: 'seed-ann', blockId: 'b1', startOffset: 0, endOffset: 3,
+      type: 'COMMENT', originalText: 'seed', createdA: 1,
+      startMeta: { parentTagName: 'p', parentIndex: 0, textOffset: 0 },
+    };
+    const seedCipher = await encryptEventOp(eventKey, { type: 'annotation.add', annotations: [seedAnn] });
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.event', seq: 1, receivedAt: Date.now(),
+      envelope: { clientId: 'other', opId: 'seed', channel: 'event', ciphertext: seedCipher },
+    }));
+    await new Promise(r => setTimeout(r, 20));
+    expect(client.getState().annotations.length).toBe(1);
+    expect(client.getState().seq).toBe(1);
+
+    // Queue a stale snapshot that WOULD wipe the seed annotation and rewind seq
+    // to 0 if it applied. The generation guard must drop it.
+    const staleSnapshot: RoomSnapshot = { versionId: 'v-stale', planMarkdown: '# stale', annotations: [] };
+    const staleCipher = await encryptSnapshot(eventKey, staleSnapshot);
+    ws.peer.sendFromServer(JSON.stringify({
+      type: 'room.snapshot', snapshotSeq: 0, snapshotCiphertext: staleCipher,
+    }));
+
+    // Synchronously advance the generation before the queued decrypt task runs.
+    // eslint-disable-next-line @typescript-eslint/no-explicit-any
+    (client as any).socketGeneration = (client as any).socketGeneration + 1;
+
+    await new Promise(r => setTimeout(r, 20));
+
+    // Baseline untouched: annotation still present, seq still 1.
+    expect(client.getState().annotations.length).toBe(1);
+    expect(client.getState().annotations[0].id).toBe('seed-ann');
+    expect(client.getState().seq).toBe(1);
+    expect(client.getState().planMarkdown).toBe('# Plan');  // unchanged from setup()
+    // No snapshot-decrypt error surfaced on the newer socket.
+    expect(client.getState().lastError).toBeNull();
+
+    client.disconnect();
+  });
+});
diff --git a/packages/shared/collab/client-runtime/client.ts b/packages/shared/collab/client-runtime/client.ts
new file mode 100644
index 000000000..039f0bea1
--- /dev/null
+++ b/packages/shared/collab/client-runtime/client.ts
@@ -0,0 +1,1548 @@
+/**
+ * CollabRoomClient — the browser/agent runtime for Plannotator Live Rooms.
+ *
+ * Owns WebSocket lifecycle, auth handshake, message dispatch, state management,
+ * auto-reconnect with backoff, and admin command flow.
+ *
+ * V1 state model: server echo is authoritative. Annotation mutations are NOT
+ * applied optimistically — they are only applied when the server echoes them
+ * back via room.event. See sendOp() for the rationale (no opId-correlated
+ * ack/reject in V1, so no safe rollback path).
+ *
+ * Zero-knowledge: decrypts server-provided ciphertext locally; encrypts before send.
+ */
+
+import {
+  computeAuthProof,
+  computeAdminProof,
+  encryptEventOp,
+  decryptEventPayload,
+  encryptPresence,
+  decryptPresence,
+  decryptSnapshot,
+} from '../crypto';
+import { ADMIN_ERROR_CODES, WS_CLOSE_ROOM_UNAVAILABLE } from '../constants';
+import { generateOpId } from '../ids';
+import type {
+  AdminChallenge,
+  AdminCommand,
+  AuthAccepted,
+  AuthChallenge,
+  PresenceState,
+  RoomAnnotation,
+  RoomEventClientOp,
+  RoomServerEvent,
+  RoomTransportMessage,
+  ServerEnvelope,
+} from '../types';
+import { isPresenceState, isRoomEventClientOp, isRoomSnapshot } from '../types';
+// Event channel uses isRoomEventClientOp (event ops ONLY — no presence.update).
+// Presence channel uses isPresenceState (validates raw PresenceState payloads).
+// This split prevents presence.update from leaking into the durable event log.
+import { applyAnnotationEvent, annotationsToArray, cloneRoomAnnotation, cloneRoomAnnotationPatch } from './apply-event';
+import { computeBackoffMs, DEFAULT_BACKOFF } from './backoff';
+import { TypedEventEmitter } from './emitter';
+import type {
+  CollabRoomEvents,
+  CollabRoomState,
+  ConnectionStatus,
+  InternalClientOptions,
+  ReconnectOptions,
+} from './types';
+
+// ---------------------------------------------------------------------------
+// Error types
+// ---------------------------------------------------------------------------
+
+export class ConnectTimeoutError extends Error { constructor() { super('WebSocket connect/auth timed out'); this.name = 'ConnectTimeoutError'; } }
+export class AuthRejectedError extends Error { constructor(msg = 'Auth rejected') { super(msg); this.name = 'AuthRejectedError'; } }
+export class RoomUnavailableError extends Error { constructor(msg = 'Room unavailable') { super(msg); this.name = 'RoomUnavailableError'; } }
+export class NotConnectedError extends Error { constructor() { super('Client is not authenticated'); this.name = 'NotConnectedError'; } }
+export class AdminNotAuthorizedError extends Error { constructor() { super('No admin capability'); this.name = 'AdminNotAuthorizedError'; } }
+export class AdminTimeoutError extends Error { constructor() { super('Admin command timed out'); this.name = 'AdminTimeoutError'; } }
+export class AdminInterruptedError extends Error { constructor() { super('Admin command interrupted by socket close'); this.name = 'AdminInterruptedError'; } }
+export class AdminRejectedError extends Error {
+  constructor(public code: string, message: string) {
+    super(message);
+    this.name = 'AdminRejectedError';
+  }
+}
+
+/**
+ * Thrown by public mutation methods when the payload fails shape validation
+ * BEFORE encryption/send. This catches UI bugs early — without it, a bad
+ * payload would be encrypted, sequenced by the server, echoed, and then
+ * rejected by every client (including the sender) with no clear signal that
+ * the original send was the cause.
+ */
+export class InvalidOutboundPayloadError extends Error {
+  constructor(message: string) {
+    super(message);
+    this.name = 'InvalidOutboundPayloadError';
+  }
+}
+
+// ---------------------------------------------------------------------------
+// Clone helpers for getState() immutability
+//
+// V1 state is server-authoritative: internal annotation/presence objects must
+// only be mutated by decrypted server events. If getState() exposed internal
+// references, UI code could silently corrupt local state by mutating a
+// returned annotation or cursor. These helpers keep the public surface
+// read-only.
+//
+// cloneRoomAnnotation is imported from apply-event.ts (single source of truth
+// for the nested-meta clone rule — avoids drift if a new nested field is
+// added to RoomAnnotation).
+// ---------------------------------------------------------------------------
+
+function clonePresenceState(p: PresenceState): PresenceState {
+  return {
+    ...p,
+    user: { ...p.user },
+    cursor: p.cursor ? { ...p.cursor } : null,
+  };
+}
+
+/** Clone a decoded RoomServerEvent so emission to subscribers is isolated from internal state. */
+/**
+ * Clone an outbound RoomEventClientOp so the payload the client queues for
+ * encryption is immune to caller mutation. Public mutation methods clone
+ * synchronously before validation + queueing; if the caller mutates the
+ * annotation/patch/ids array after the call returns, the queued op stays
+ * pinned to the value at call time.
+ */
+function cloneRoomEventClientOp(op: RoomEventClientOp): RoomEventClientOp {
+  switch (op.type) {
+    case 'annotation.add':
+      return { type: 'annotation.add', annotations: op.annotations.map(cloneRoomAnnotation) };
+    case 'annotation.update':
+      return { type: 'annotation.update', id: op.id, patch: cloneRoomAnnotationPatch(op.patch) };
+    case 'annotation.remove':
+      return { type: 'annotation.remove', ids: [...op.ids] };
+    case 'annotation.clear':
+      return { type: 'annotation.clear', source: op.source };
+  }
+}
+
+function cloneRoomServerEvent(event: RoomServerEvent): RoomServerEvent {
+  switch (event.type) {
+    case 'annotation.add':
+      return { type: 'annotation.add', annotations: event.annotations.map(cloneRoomAnnotation) };
+    case 'annotation.update':
+      return { type: 'annotation.update', id: event.id, patch: cloneRoomAnnotationPatch(event.patch) };
+    case 'annotation.remove':
+      return { type: 'annotation.remove', ids: [...event.ids] };
+    case 'annotation.clear':
+      return { type: 'annotation.clear', source: event.source };
+    case 'snapshot':
+      return {
+        type: 'snapshot',
+        snapshotSeq: event.snapshotSeq,
+        payload: { ...event.payload, annotations: event.payload.annotations.map(cloneRoomAnnotation) },
+      };
+    case 'presence.update':
+      return { type: 'presence.update', clientId: event.clientId, presence: clonePresenceState(event.presence) };
+  }
+}
+
+// ---------------------------------------------------------------------------
+// Constants
+// ---------------------------------------------------------------------------
+
+const DEFAULT_CONNECT_TIMEOUT_MS = 10_000;
+const DEFAULT_PRESENCE_TTL_MS = 30_000;
+const DEFAULT_PRESENCE_SWEEP_INTERVAL_MS = 5_000;
+const ADMIN_COMMAND_TIMEOUT_MS = 5_000;
+
+/**
+ * `room.error` codes that are emitted exclusively from the admin command
+ * path on the server. A pending admin command rejects ONLY when a room.error
+ * with one of these codes arrives; other codes (e.g. `validation_error`
+ * from an event-channel op) are event-channel failures and must not
+ * cancel an in-flight admin command.
+ *
+ * Derived from the shared `ADMIN_ERROR_CODES` tuple so there is exactly
+ * one source of truth across the server (`sendAdminError` call sites in
+ * `room-do.ts`) and this client. Membership check tolerates unknown
+ * strings as non-admin — forward-compatible with servers that add
+ * future codes we don't yet recognize.
+ */
+// Typed as `Set<string>` (not `Set<AdminErrorCode>`) because we call
+// `.has(msg.code)` where `msg.code: string` arrives from the wire —
+// forward-compatibility with unknown future codes is intentional:
+// they fall through as non-admin, not typecheck errors at the
+// membership site.
+const ADMIN_SCOPED_ERROR_CODES: ReadonlySet<string> =
+  new Set<string>(ADMIN_ERROR_CODES);
+
+
+// ---------------------------------------------------------------------------
+// Internal types
+// ---------------------------------------------------------------------------
+
+interface PendingAdmin {
+  command: AdminCommand;
+  resolve: () => void;
+  reject: (err: Error) => void;
+  timeoutHandle: ReturnType<typeof setTimeout>;
+}
+
+interface PendingConnect {
+  resolve: () => void;
+  reject: (err: Error) => void;
+  timeoutHandle: ReturnType<typeof setTimeout>;
+}
+
+// ---------------------------------------------------------------------------
+// Class
+// ---------------------------------------------------------------------------
+
+export class CollabRoomClient {
+  // Identity / keys (stable across reconnects)
+  private readonly roomId: string;
+  private readonly baseUrl: string;
+  private readonly eventKey: CryptoKey;
+  private readonly presenceKey: CryptoKey;
+  private readonly adminKey: CryptoKey | null;
+  private readonly roomVerifier: string;
+  private readonly adminVerifier: string | null;
+
+  // Runtime state
+  private ws: WebSocket | null = null;
+  /**
+   * Monotonic generation counter. Incremented every time openSocket()
+   * installs a new WebSocket. Queued async handlers (room.snapshot,
+   * room.event, room.presence, room.error) capture the
+   * generation at dispatch time and re-check it after any async decrypt
+   * before mutating state — so a late decrypt from a retired socket can
+   * never clobber the newer socket's state, even though the retired
+   * socket's onmessage was already short-circuited by the retiredSockets
+   * gate (the async continuation could still be in flight).
+   */
+  private socketGeneration = 0;
+  /**
+   * Sockets we've actively retired. Their onmessage/onclose/onerror handlers
+   * no-op once a socket is in this set. WeakSet so retired sockets can be
+   * GC'd once they close.
+   *
+   * Two paths add to this set:
+   *   1. openSocket() when REPLACING a prior socket — the replacement retires
+   *      the predecessor so its late events don't clobber the new socket.
+   *   2. closeSocket() for INTENTIONAL closes of the current socket
+   *      (disconnect, connect timeout, auth-proof failure). These callers
+   *      do their own synchronous lifecycle cleanup (reject pendingConnect /
+   *      pendingAdmin, set status, clear presence) BEFORE calling closeSocket,
+   *      so the async onclose does not need to run handleSocketClose — and
+   *      must not, or it could clobber state the caller already settled.
+   *
+   * Network-initiated closes of the current socket (server close, network
+   * drop) do NOT go through closeSocket — they reach onclose directly with
+   * the socket NOT in this set, so handleSocketClose runs as normal and does
+   * the reconnect / pending-rejection logic itself.
+   */
+  private retiredSockets = new WeakSet<WebSocket>();
+  private clientId: string = '';                // regenerated per connect
+  private status: ConnectionStatus = 'disconnected';
+  /**
+   * True after the server closed our socket with the "room unavailable"
+   * terminal code. Replaces the former `roomStatus` tri-state — the
+   * client does not distinguish admin delete, auto-expiry, or
+   * unknown-room. All three produce the same generic terminal UX.
+   */
+  private roomUnavailable: boolean = false;
+  private seq: number = 0;
+  private planMarkdown: string = '';
+  private annotations = new Map<string, RoomAnnotation>();
+  private remotePresence = new Map<string, { presence: PresenceState; lastSeen: number }>();
+  private lastError: { code: string; message: string; scope: 'mutation' | 'admin' | 'event' | 'presence' | 'snapshot' | 'join' } | null = null;
+  /**
+   * Monotonic id bumped on every NEW lastError assignment. Exposed via
+   * `CollabRoomState.lastErrorId` so consumers can dedupe state emissions
+   * without relying on object identity — buildState() clones `lastError`
+   * each call, so identity changes even when the underlying error didn't.
+   * Clearing (lastError = null) does NOT bump — consumers can check
+   * `state.lastError === null` independently.
+   */
+  private lastErrorId: number = 0;
+
+  /**
+   * Centralized setter so every event-channel error assignment bumps
+   * `lastErrorId`. Prefer this over direct `this.lastError = ...`; the
+   * direct form is only appropriate for `= null` resets.
+   */
+  private setLastError(
+    code: string,
+    message: string,
+    scope: 'mutation' | 'admin' | 'event' | 'presence' | 'snapshot' | 'join',
+  ): void {
+    this.lastError = { code, message, scope };
+    this.lastErrorId++;
+  }
+  /**
+   * True when the most-recent snapshot attempt failed (malformed or
+   * decrypt-failed) and a valid baseline has not yet been re-established.
+   * While true, inbound room.events are rejected — applying events on top of
+   * a stale baseline would produce silently-divergent local state. Cleared
+   * when a valid snapshot is applied or the client reconnects.
+   */
+  private baselineInvalid = false;
+
+  // Admin flow
+  private pendingAdmin: PendingAdmin | null = null;
+
+  // Lifecycle state
+  private pendingConnect: PendingConnect | null = null;
+  private pendingConnectPromise: Promise<void> | null = null;
+  private userDisconnected = false;
+
+  // Serialized async message processing queue.
+  // Ensures snapshot/event/presence decrypts apply in wire order regardless
+  // of decrypt latency variance. Prevents the race where an event's decrypt
+  // finishes before a concurrent snapshot's decrypt and then gets clobbered.
+  private messageQueue: Promise<void> = Promise.resolve();
+  /**
+   * Serializes outbound EVENT-channel sends. Encryption is async, so two
+   * concurrent sendAnnotationAdd()/Remove()/Update()/Clear() calls could
+   * otherwise race and send in completion order rather than call order —
+   * a user clicking "add" then "remove" could see remove land first, leaving
+   * the annotation the remove was supposed to delete. Presence is NOT in
+   * this queue — it's lossy by design and throughput matters more than
+   * strict ordering there.
+   */
+  private outboundEventQueue: Promise<unknown> = Promise.resolve();
+  private reconnectAttempt = 0;
+  private reconnectTimer: ReturnType<typeof setTimeout> | null = null;
+  private presenceSweepTimer: ReturnType<typeof setInterval> | null = null;
+  /**
+   * Watchdog for auto-reconnect handshakes. Initial connect() uses
+   * pendingConnect's own connectTimeoutMs; auto-reconnect does not, so
+   * without this a reconnect socket that opens but never authenticates would
+   * hang the client in `connecting` / `authenticating` forever.
+   */
+  private reconnectHandshakeTimer: ReturnType<typeof setTimeout> | null = null;
+
+  // Injected / options
+  private readonly WebSocketImpl: typeof WebSocket;
+  private readonly reconnectOpts: Required<ReconnectOptions>;
+  private readonly connectTimeoutMs: number;
+  private readonly presenceTtlMs: number;
+  private readonly presenceSweepIntervalMs: number;
+
+  // Emitter
+  private readonly emitter = new TypedEventEmitter<CollabRoomEvents>();
+
+  constructor(options: InternalClientOptions) {
+    this.roomId = options.roomId;
+    this.baseUrl = options.baseUrl;
+    this.eventKey = options.eventKey;
+    this.presenceKey = options.presenceKey;
+    this.adminKey = options.adminKey;
+    this.roomVerifier = options.roomVerifier;
+    this.adminVerifier = options.adminVerifier;
+    // options.user is reserved for future use (presence auto-construction); not stored.
+    this.WebSocketImpl = options.webSocketImpl ?? WebSocket;
+    this.reconnectOpts = {
+      initialDelayMs: options.reconnect?.initialDelayMs ?? DEFAULT_BACKOFF.initialDelayMs,
+      maxDelayMs: options.reconnect?.maxDelayMs ?? DEFAULT_BACKOFF.maxDelayMs,
+      factor: options.reconnect?.factor ?? DEFAULT_BACKOFF.factor,
+      maxAttempts: options.reconnect?.maxAttempts ?? Number.POSITIVE_INFINITY,
+    };
+    this.connectTimeoutMs = options.connectTimeoutMs ?? DEFAULT_CONNECT_TIMEOUT_MS;
+    this.presenceTtlMs = options.presenceTtlMs ?? DEFAULT_PRESENCE_TTL_MS;
+    this.presenceSweepIntervalMs = options.presenceSweepIntervalMs ?? DEFAULT_PRESENCE_SWEEP_INTERVAL_MS;
+
+    // Seed initial snapshot if provided (by createRoom). Clone on store so
+    // a caller mutating their snapshot object later can't reach back into
+    // the client's internal annotations map.
+    if (options.initialSnapshot) {
+      this.planMarkdown = options.initialSnapshot.planMarkdown;
+      for (const ann of options.initialSnapshot.annotations) {
+        this.annotations.set(ann.id, cloneRoomAnnotation(ann));
+      }
+    }
+  }
+
+  // ---------------------------------------------------------------------------
+  // Public API
+  // ---------------------------------------------------------------------------
+
+  on<K extends keyof CollabRoomEvents>(
+    name: K,
+    fn: (p: CollabRoomEvents[K]) => void,
+  ): () => void {
+    return this.emitter.on(name, fn);
+  }
+
+  getState(): CollabRoomState {
+    return this.buildState();
+  }
+
+  async connect(): Promise<void> {
+    // Already authenticated → resolved no-op
+    if (this.status === 'authenticated') {
+      return;
+    }
+
+    // Already in-flight → return the existing pending promise (shared by all callers).
+    // Invariant: pendingConnect and pendingConnectPromise are always set/cleared
+    // together. If this fires, it indicates a programming error.
+    if (this.pendingConnect) {
+      if (!this.pendingConnectPromise) {
+        throw new Error('CollabRoomClient connect() invariant violated: pendingConnect set without pendingConnectPromise');
+      }
+      return this.pendingConnectPromise;
+    }
+
+    // Explicit connect clears any poisoned state from prior disconnect/terminal
+    this.userDisconnected = false;
+    this.lastError = null;
+    this.reconnectAttempt = 0;
+    this.clearReconnectTimer();
+
+    // Build the promise FIRST, wire up pendingConnect + pendingConnectPromise,
+    // and only then open the socket. openSocket() calls setStatus('connecting'),
+    // which synchronously emits state. If a listener re-enters connect() during
+    // that emission, both refs must already be consistent — otherwise the
+    // fallback return would hand out a promise that's disconnected from the
+    // actual handshake.
+    let resolve!: () => void;
+    let reject!: (err: Error) => void;
+    const promise = new Promise<void>((res, rej) => { resolve = res; reject = rej; });
+    const timeoutHandle = setTimeout(() => {
+      if (this.pendingConnect) {
+        // Synchronous cleanup: closeSocket retires the socket so its async
+        // onclose won't re-enter handleSocketClose. All lifecycle transitions
+        // happen here.
+        this.pendingConnect = null;
+        this.pendingConnectPromise = null;
+        this.closeSocket(1000, 'connect timeout');
+        this.setStatus('disconnected');
+        reject(new ConnectTimeoutError());
+      }
+    }, this.connectTimeoutMs);
+
+    this.pendingConnect = { resolve, reject, timeoutHandle };
+    this.pendingConnectPromise = promise;
+    // Clean up promise ref when settled — attach BEFORE openSocket so the
+    // handlers exist if an unusual synchronous rejection path fires.
+    promise.then(
+      () => { if (this.pendingConnectPromise === promise) this.pendingConnectPromise = null; },
+      () => { if (this.pendingConnectPromise === promise) this.pendingConnectPromise = null; },
+    );
+
+    // openSocket() runs outside the Promise executor (so pendingConnectPromise
+    // is already assigned before `setStatus('connecting')` emits). That means
+    // a synchronous throw here — e.g. `new URL(baseUrl)` rejecting a bad base,
+    // or a WebSocket constructor throwing — would otherwise leave pendingConnect
+    // and the timeout live, poisoning later connect() calls with a stale
+    // in-flight promise. Catch, clean up, and reject the connect promise.
+    try {
+      this.openSocket();
+    } catch (err) {
+      clearTimeout(timeoutHandle);
+      if (this.pendingConnect?.timeoutHandle === timeoutHandle) {
+        this.pendingConnect = null;
+      }
+      if (this.pendingConnectPromise === promise) {
+        this.pendingConnectPromise = null;
+      }
+      this.setStatus('disconnected');
+      reject(err instanceof Error ? err : new Error(String(err)));
+    }
+    return promise;
+  }
+
+  disconnect(reason?: string): void {
+    this.userDisconnected = true;
+    this.clearReconnectTimer();
+    this.clearReconnectHandshakeTimer();
+    // Synchronous lifecycle cleanup — closeSocket retires the socket, so the
+    // async onclose will NOT run handleSocketClose to do this cleanup for us.
+    if (this.pendingConnect) {
+      clearTimeout(this.pendingConnect.timeoutHandle);
+      const { reject } = this.pendingConnect;
+      this.pendingConnect = null;
+      this.pendingConnectPromise = null;
+      reject(new AuthRejectedError('Disconnected by user'));
+    }
+    if (this.pendingAdmin) {
+      const pending = this.pendingAdmin;
+      this.pendingAdmin = null;
+      clearTimeout(pending.timeoutHandle);
+      pending.reject(new AdminInterruptedError());
+    }
+    this.remotePresence.clear();
+    this.closeSocket(1000, reason ?? 'user disconnect');
+    this.stopPresenceSweep();
+    this.setStatus('closed');
+  }
+
+  // ---------------------------------------------------------------------------
+  // Mutation contract (V1)
+  //
+  // Mutation methods below resolve when the op is SENT, not when local state
+  // has been updated. Local state updates when the server echoes the op back
+  // via room.event — subscribe to the `state` event to observe post-echo
+  // state.annotations. A caller that awaits `sendAnnotationAdd(...)` and then
+  // reads `getState().annotations` may still see pre-echo state.
+  //
+  // Rationale: V1 has no opId-correlated ack/reject (see sendOp comments).
+  // Applying optimistically would be unsafe; requiring a round-trip before
+  // resolution would couple send latency to UI responsiveness. Decoupling the
+  // send ack from the state update matches the wire semantics exactly.
+  // ---------------------------------------------------------------------------
+
+  /** Resolves when queued/sent to the server. State updates arrive via `state` events after echo. */
+  async sendAnnotationAdd(annotations: RoomAnnotation[]): Promise<void> {
+    // Clone SYNCHRONOUSLY before validation + queueing so the payload is
+    // immutable with respect to caller mutations after this call returns.
+    const op = cloneRoomEventClientOp({ type: 'annotation.add', annotations });
+    if (!isRoomEventClientOp(op)) {
+      throw new InvalidOutboundPayloadError('Invalid annotation.add payload');
+    }
+    await this.sendOp(op);
+  }
+
+  /** Resolves when queued/sent to the server. State updates arrive via `state` events after echo. */
+  async sendAnnotationUpdate(id: string, patch: Partial<RoomAnnotation>): Promise<void> {
+    const op = cloneRoomEventClientOp({ type: 'annotation.update', id, patch });
+    if (!isRoomEventClientOp(op)) {
+      throw new InvalidOutboundPayloadError('Invalid annotation.update payload');
+    }
+    await this.sendOp(op);
+  }
+
+  /** Resolves when queued/sent to the server. State updates arrive via `state` events after echo. */
+  async sendAnnotationRemove(ids: string[]): Promise<void> {
+    const op = cloneRoomEventClientOp({ type: 'annotation.remove', ids });
+    if (!isRoomEventClientOp(op)) {
+      throw new InvalidOutboundPayloadError('Invalid annotation.remove payload');
+    }
+    await this.sendOp(op);
+  }
+
+  /** Resolves when queued/sent to the server. State updates arrive via `state` events after echo. */
+  async sendAnnotationClear(source?: string): Promise<void> {
+    const op = cloneRoomEventClientOp({ type: 'annotation.clear', source });
+    if (!isRoomEventClientOp(op)) {
+      throw new InvalidOutboundPayloadError('Invalid annotation.clear payload');
+    }
+    await this.sendOp(op);
+  }
+
+  async sendPresence(presence: PresenceState): Promise<void> {
+    // Shape validation is a real programming error (caller passed an
+    // invalid object); surface it even for fire-and-forget callers.
+    if (!isPresenceState(presence)) {
+      throw new InvalidOutboundPayloadError('Invalid presence payload');
+    }
+    // Presence is lossy by design — a dropped cursor update is fine; the
+    // next mouse move fires another. Swallow disconnect-only failures so
+    // UI code that calls sendPresence() without awaiting (common for cursor
+    // throttles) doesn't log spurious "not connected" errors during brief
+    // reconnect windows. Shape errors above still throw.
+    try {
+      this.assertConnected();
+    } catch {
+      return;
+    }
+    const opId = generateOpId();
+    const ciphertext = await encryptPresence(this.presenceKey, presence);
+
+    // Recheck socket after async encryption — it may have closed.
+    const ws = this.ws;
+    if (this.status !== 'authenticated' || !ws) {
+      return;  // lossy: see comment above
+    }
+
+    const envelope: ServerEnvelope = {
+      clientId: this.clientId,
+      opId,
+      channel: 'presence',
+      ciphertext,
+    };
+    try {
+      ws.send(JSON.stringify(envelope));
+    } catch {
+      // Socket transitioned to closing between the liveness check and send.
+      // Still lossy — drop silently.
+    }
+  }
+
+  async deleteRoom(): Promise<void> {
+    if (!this.adminKey || !this.adminVerifier) throw new AdminNotAuthorizedError();
+    await this.runAdminCommand({ type: 'room.delete' });
+  }
+
+  // ---------------------------------------------------------------------------
+  // Internal: socket lifecycle
+  // ---------------------------------------------------------------------------
+
+  private openSocket(): void {
+    // Reset clientId; the authoritative value will come from auth.challenge.clientId.
+    // We leave a placeholder here for pre-auth logging only.
+    this.clientId = '';
+
+    // If a socket is already in-flight (e.g. auto-reconnect opened one and the
+    // caller immediately invoked connect() again), RETIRE it. Retirement
+    // marks the socket so its handlers no-op when they eventually fire —
+    // otherwise the old socket's late onclose/onmessage could clobber state
+    // belonging to the new socket.
+    if (this.ws) {
+      this.retireSocket(this.ws);
+    }
+
+    const wsUrl = this.buildWebSocketUrl();
+    this.setStatus('connecting');
+
+    // Abort guard: setStatus emits synchronously. A listener could call
+    // disconnect() during that emission, which sets userDisconnected=true
+    // and puts status at 'closed'. If we continue, we'd open a dead socket.
+    // The same applies if another listener cascade rotated status away from
+    // 'connecting'.
+    if (this.userDisconnected || this.status !== 'connecting') {
+      return;
+    }
+
+    const ws = new this.WebSocketImpl(wsUrl);
+    this.ws = ws;
+    this.socketGeneration++;
+
+    // Arm a handshake watchdog when this socket is opened by auto-reconnect
+    // (pendingConnect is null). Initial connect paths already have their own
+    // connectTimeoutMs on pendingConnect, so we don't double-arm there.
+    this.clearReconnectHandshakeTimer();
+    if (!this.pendingConnect) {
+      this.reconnectHandshakeTimer = setTimeout(() => {
+        this.reconnectHandshakeTimer = null;
+        // Only act if this is still the current socket and we're not
+        // authenticated yet — otherwise the watchdog is stale.
+        if (this.ws !== ws || this.status === 'authenticated') return;
+        this.closeSocket(1000, 'reconnect handshake timeout');
+        this.scheduleReconnectAfterSocketFailure();
+      }, this.connectTimeoutMs);
+    }
+
+    // No ws.onopen handler — we transition to 'authenticating' when the
+    // server sends auth.challenge, not when the socket opens.
+
+    // Handlers gate on the retiredSockets set rather than on `this.ws !== ws`.
+    // The reason: network-initiated closes of the current socket must still
+    // reach handleSocketClose() (for reconnect scheduling and pending-promise
+    // rejection), while replaced or intentionally retired sockets must no-op.
+    // A `this.ws !== ws` check would gate out both paths, so we use the
+    // explicit retiredSockets set to distinguish them.
+    ws.onmessage = (ev: MessageEvent) => {
+      if (this.retiredSockets.has(ws)) return;
+      this.handleSocketMessage(ev.data);
+    };
+
+    ws.onclose = (ev: CloseEvent) => {
+      if (this.retiredSockets.has(ws)) return;
+      this.handleSocketClose(ev.code, ev.reason);
+    };
+
+    ws.onerror = () => {
+      if (this.retiredSockets.has(ws)) return;
+      this.emitter.emit('error', { code: 'socket_error', message: 'WebSocket error' });
+    };
+  }
+
+  /**
+   * Retire a socket without touching this.ws. Used by openSocket() when a
+   * replacement is being installed. Stale handlers on this socket no-op.
+   */
+  private retireSocket(ws: WebSocket): void {
+    this.retiredSockets.add(ws);
+    try { ws.close(1000, 'replaced by new connection'); } catch { /* ignore */ }
+  }
+
+  /**
+   * Intentionally close the CURRENT socket (disconnect, connect timeout, auth
+   * failure). Retires the socket so its async onclose will not re-enter
+   * handleSocketClose in a state where this.ws may have been repointed (in
+   * browsers, ws.close() fires onclose asynchronously — if the caller opens
+   * a new socket before that fires, the stale onclose would otherwise clobber
+   * the new socket's state).
+   *
+   * Because onclose is short-circuited after retirement, callers of this
+   * method MUST do their own synchronous lifecycle cleanup — reject
+   * pendingConnect/pendingAdmin, set status, stop presence sweep — BEFORE
+   * calling closeSocket. Do NOT rely on handleSocketClose running as a side
+   * effect of this call.
+   *
+   * Network-initiated closes of the current socket (server close, network
+   * drop) do NOT go through this method and remain handled by handleSocketClose.
+   */
+  private closeSocket(code: number, reason: string): void {
+    if (!this.ws) return;
+    const ws = this.ws;
+    this.retiredSockets.add(ws);
+    this.ws = null;
+    try {
+      ws.close(code, reason);
+    } catch {
+      // ignore
+    }
+  }
+
+  private handleSocketClose(code: number, reason: string): void {
+    this.ws = null;
+    // Socket is gone — any reconnect-handshake watchdog for it is moot.
+    this.clearReconnectHandshakeTimer();
+
+    // Set the terminal flag BEFORE the pendingAdmin and terminal checks
+    // below. Any close with the dedicated "room unavailable" code means
+    // the link no longer resolves — admin delete, auto-expiry, or an
+    // unknown-room connect. We don't distinguish the cause.
+    if (code === WS_CLOSE_ROOM_UNAVAILABLE) {
+      this.roomUnavailable = true;
+    }
+
+    if (this.pendingConnect) {
+      clearTimeout(this.pendingConnect.timeoutHandle);
+      const { reject } = this.pendingConnect;
+      this.pendingConnect = null;
+      // Clear pendingConnectPromise synchronously too — the microtask-scheduled
+      // .then cleanup runs later; during that window the invariant
+      // "pendingConnect <=> pendingConnectPromise" would be broken if read by
+      // a reentrant caller.
+      this.pendingConnectPromise = null;
+      const err = code === WS_CLOSE_ROOM_UNAVAILABLE
+        ? new RoomUnavailableError(reason || 'Room unavailable')
+        : new AuthRejectedError(`Socket closed during auth: ${reason}`);
+      reject(err);
+      // If disconnect() already fired, respect the terminal intent — don't
+      // overwrite 'closed' with 'disconnected' just because auth was pending.
+      if (this.userDisconnected) {
+        this.stopPresenceSweep();
+        this.setStatus('closed');
+      } else {
+        this.setStatus('disconnected');
+      }
+      return;
+    }
+
+    // Reject pending admin if socket closed mid-flight.
+    // For delete: the server closes our socket with WS_CLOSE_ROOM_UNAVAILABLE
+    // as the success signal — purging the room tears down all sockets
+    // (including ours). Any other close (network drop, server error) must
+    // reject so callers don't mistakenly believe a failed/interrupted
+    // delete succeeded.
+    if (this.pendingAdmin) {
+      const pending = this.pendingAdmin;
+      this.pendingAdmin = null;
+      clearTimeout(pending.timeoutHandle);
+      const isSuccessfulDeleteClose =
+        pending.command.type === 'room.delete' &&
+        code === WS_CLOSE_ROOM_UNAVAILABLE;
+      if (isSuccessfulDeleteClose) {
+        pending.resolve();
+      } else {
+        pending.reject(new AdminInterruptedError());
+      }
+    }
+
+    this.remotePresence.clear();
+    this.stopPresenceSweep();
+
+    // Terminal close or user-initiated? Don't reconnect.
+    // (roomUnavailable is set above iff code === WS_CLOSE_ROOM_UNAVAILABLE,
+    // so checking the flag alone covers both.)
+    const isTerminal = this.userDisconnected || this.roomUnavailable;
+
+    if (isTerminal) {
+      // setStatus already emits `state` on a transition; no trailing emitState
+      // needed (would cause a redundant React render).
+      this.setStatus('closed');
+      return;
+    }
+
+    // Auto-reconnect shares implementation with the explicit-failure path.
+    this.scheduleReconnect();
+  }
+
+  /**
+   * Explicit reconnect scheduling without waiting for onclose. Used by code
+   * paths that deterministically close the current socket (e.g. auth-proof
+   * failure during auto-reconnect) and need the client to continue the
+   * reconnect loop rather than sit in the closing state waiting for a
+   * deferred close event.
+   */
+  private scheduleReconnectAfterSocketFailure(): void {
+    this.remotePresence.clear();
+    this.stopPresenceSweep();
+
+    if (this.userDisconnected || this.roomUnavailable) {
+      this.setStatus('closed');
+      return;
+    }
+
+    this.scheduleReconnect();
+  }
+
+  /**
+   * Shared reconnect scheduling: checks max-attempts, transitions to
+   * 'reconnecting' or 'closed', and arms the backoff timer.
+   */
+  private scheduleReconnect(): void {
+    if (this.reconnectAttempt >= this.reconnectOpts.maxAttempts) {
+      this.setStatus('closed');
+      return;
+    }
+    this.setStatus('reconnecting');
+    const delay = computeBackoffMs(this.reconnectAttempt++, this.reconnectOpts);
+    this.reconnectTimer = setTimeout(() => {
+      this.reconnectTimer = null;
+      this.openSocket();
+    }, delay);
+  }
+
+  // ---------------------------------------------------------------------------
+  // Internal: message dispatch
+  // ---------------------------------------------------------------------------
+
+  private handleSocketMessage(raw: unknown): void {
+    let msg: Record<string, unknown>;
+    try {
+      const text = typeof raw === 'string' ? raw : String(raw);
+      msg = JSON.parse(text);
+    } catch {
+      return; // malformed server message — ignore
+    }
+
+    // Auth phase messages
+    if (msg.type === 'auth.challenge') {
+      this.handleAuthChallenge(msg as unknown as AuthChallenge);
+      return;
+    }
+    if (msg.type === 'auth.accepted') {
+      this.handleAuthAccepted(msg as unknown as AuthAccepted);
+      return;
+    }
+
+    // Admin challenge (response to admin.challenge.request)
+    if (msg.type === 'admin.challenge') {
+      this.handleAdminChallenge(msg as unknown as AdminChallenge);
+      return;
+    }
+
+    // Transport messages — serialize via messageQueue so decrypts apply in wire order.
+    // Capture the socket generation at dispatch time. The handlers below
+    // re-check it after any async decrypt and drop the message if the
+    // generation has rolled (reconnect opened a new socket during the
+    // decrypt). This prevents stale messages from clobbering newer state.
+    const gen = this.socketGeneration;
+    if (msg.type === 'room.snapshot') {
+      const snap = msg as unknown as Extract<RoomTransportMessage, { type: 'room.snapshot' }>;
+      this.enqueue(() => this.handleRoomSnapshot(snap, gen));
+      return;
+    }
+    if (msg.type === 'room.event') {
+      const event = msg as unknown as Extract<RoomTransportMessage, { type: 'room.event' }>;
+      this.enqueue(() => this.handleRoomEvent(event, gen));
+      return;
+    }
+    if (msg.type === 'room.presence') {
+      const presence = msg as unknown as Extract<RoomTransportMessage, { type: 'room.presence' }>;
+      this.enqueue(() => this.handleRoomPresence(presence, gen));
+      return;
+    }
+    if (msg.type === 'room.error') {
+      // Route through the queue so an error that references a specific event
+      // (e.g. validation_error for an in-flight op) can't beat the event /
+      // status messages that preceded it in wire order.
+      const err = msg as unknown as Extract<RoomTransportMessage, { type: 'room.error' }>;
+      this.enqueue(async () => { this.handleRoomError(err, gen); });
+      return;
+    }
+    if (msg.type === 'room.participant.left') {
+      // Broadcast from the server when a peer's WebSocket closed.
+      // Drop their presence immediately so the UI doesn't hold a
+      // ghost cursor until the 30s TTL sweep — that stale window
+      // made "refresh to test" show one extra bubble per refresh.
+      //
+      // Route through the queue so the delete observes wire order
+      // against any still-decrypting presence from the same peer.
+      // Without this, wire order presence→left lets the queued
+      // presence decrypt resolve AFTER the synchronous delete and
+      // re-insert the peer — reviving the ghost for a full TTL.
+      //
+      // Protocol validation: require a non-empty string clientId.
+      // Garbage from a non-conforming server or a buggy relay is
+      // ignored rather than corrupting the presence map.
+      const left = msg as unknown as Extract<RoomTransportMessage, { type: 'room.participant.left' }>;
+      this.enqueue(async () => {
+        if (typeof left.clientId === 'string' && left.clientId.length > 0) {
+          if (this.remotePresence.delete(left.clientId)) {
+            this.emitState();
+          }
+        }
+      });
+      return;
+    }
+  }
+
+  private async handleAuthChallenge(challenge: AuthChallenge): Promise<void> {
+    this.setStatus('authenticating');
+    // The server assigns clientId on the challenge; adopt it here so the
+    // proof binds to exactly the value the server will verify. Capturing
+    // `ws` and `clientId` locally lets the post-await guard detect a
+    // rotation (reconnect opened a new socket mid-proof) and drop the
+    // stale response.
+    //
+    // Protocol-shape validation. Missing/malformed challenge fields come from
+    // an old server or malformed message and must fail fast — otherwise the
+    // client would sit in `authenticating` until connectTimeoutMs.
+    const protocolError =
+      (typeof challenge.clientId !== 'string' || challenge.clientId.length === 0)
+        ? 'Missing or invalid clientId in auth.challenge'
+      : (typeof challenge.challengeId !== 'string' || challenge.challengeId.length === 0)
+        ? 'Missing or invalid challengeId in auth.challenge'
+      : (typeof challenge.nonce !== 'string' || challenge.nonce.length === 0)
+        ? 'Missing or invalid nonce in auth.challenge'
+      : (typeof challenge.expiresAt !== 'number' || !Number.isFinite(challenge.expiresAt))
+        ? 'Missing or invalid expiresAt in auth.challenge'
+      : null;
+    if (protocolError) {
+      this.emitter.emit('error', { code: 'auth_error', message: protocolError });
+      const currentWs = this.ws;
+      if (this.pendingConnect) {
+        clearTimeout(this.pendingConnect.timeoutHandle);
+        const { reject } = this.pendingConnect;
+        this.pendingConnect = null;
+        this.pendingConnectPromise = null;
+        this.closeSocket(1000, 'invalid auth.challenge');
+        this.setStatus('disconnected');
+        reject(new AuthRejectedError(protocolError));
+      } else if (currentWs) {
+        // Auto-reconnect path — close and schedule the next attempt.
+        this.closeSocket(1000, 'invalid auth.challenge');
+        this.scheduleReconnectAfterSocketFailure();
+      }
+      return;
+    }
+    this.clientId = challenge.clientId;
+    const ws = this.ws;
+    const clientId = challenge.clientId;
+    try {
+      const proof = await computeAuthProof(
+        this.roomVerifier,
+        this.roomId,
+        clientId,
+        challenge.challengeId,
+        challenge.nonce,
+      );
+      if (this.userDisconnected || !ws || this.ws !== ws || this.clientId !== clientId || this.status !== 'authenticating') {
+        return;  // socket/identity rotated or cleared, or user disconnected during async proof; drop the stale response
+      }
+      const response = {
+        type: 'auth.response',
+        challengeId: challenge.challengeId,
+        clientId,
+        proof,
+        // When baselineInvalid, our local state is unknown relative to the
+        // server. Omit lastSeq so the server falls back to the snapshot path
+        // and re-establishes an authoritative baseline — otherwise it may
+        // "fast-forward" replay, skip the snapshot, and leave us silently
+        // stale forever.
+        lastSeq: !this.baselineInvalid && this.seq > 0 ? this.seq : undefined,
+      };
+      ws.send(JSON.stringify(response));
+    } catch (err) {
+      // Stale-identity drop: mirror the success-path guard. If the socket or
+      // identity rotated during the failed proof computation, the current
+      // pending state belongs to a NEW attempt; acting on it would clobber it.
+      if (this.userDisconnected || !ws || this.ws !== ws || this.clientId !== clientId) {
+        return;
+      }
+      // Reject pendingConnect immediately with the real error rather than waiting for timeout
+      const authErr = new AuthRejectedError(`Auth proof computation failed: ${String(err)}`);
+      this.emitter.emit('error', { code: 'auth_error', message: String(err) });
+      if (this.pendingConnect) {
+        // Initial connect path — reject the caller and transition to disconnected.
+        clearTimeout(this.pendingConnect.timeoutHandle);
+        const { reject } = this.pendingConnect;
+        this.pendingConnect = null;
+        this.pendingConnectPromise = null;
+        // Synchronous cleanup: closeSocket retires the socket so its async
+        // onclose won't re-enter handleSocketClose.
+        this.closeSocket(1000, 'auth proof failed');
+        this.setStatus('disconnected');
+        reject(authErr);
+      } else if (ws && this.ws === ws) {
+        // Auto-reconnect path — pendingConnect is null, but we're still in
+        // `authenticating` from setStatus() above. Without explicit handling,
+        // the client would sit in 'authenticating' until the server eventually
+        // closes the socket.
+        //
+        // Retire the socket synchronously (so its deferred onclose no-ops via
+        // retiredSockets) and explicitly schedule the next reconnect attempt
+        // instead of waiting for the onclose round-trip. This is deterministic
+        // and avoids any double-transition emission.
+        this.closeSocket(1000, 'auth proof failed');
+        this.scheduleReconnectAfterSocketFailure();
+      }
+    }
+  }
+
+  private handleAuthAccepted(_accepted: AuthAccepted): void {
+    // Defense-in-depth: a rotated/disconnected client should not promote
+    // itself to 'authenticated' on a late auth.accepted from a retired socket.
+    if (this.userDisconnected) return;
+    // Handshake complete — disarm any reconnect-phase watchdog.
+    this.clearReconnectHandshakeTimer();
+    // Do NOT clear baselineInvalid here. Authentication itself does not
+    // establish an authoritative baseline — only a valid snapshot apply
+    // does (see handleRoomSnapshot). If the previous session ended with a
+    // bad-snapshot baselineInvalid=true and the reconnect's lastSeq was
+    // (correctly) omitted, the server will send us a snapshot next; that
+    // snapshot's apply is what clears the flag. Clearing here would leave
+    // a window where post-accept events apply on stale local state.
+    // Clear lastError BEFORE transitioning to 'authenticated'. setStatus()
+    // emits the `state` event; if we flipped to 'authenticated' first,
+    // subscribers would briefly see connectionStatus='authenticated' with a
+    // stale lastError — a confusing intermediate state for UI consumers.
+    this.lastError = null;
+    this.setStatus('authenticated');
+    // this.seq means "last server seq consumed by this client".
+    // Valid events advance seq after applying state. Malformed or undecryptable
+    // events may advance seq without state mutation to preserve replay forward
+    // progress (see handleRoomEvent).
+    //
+    // Do NOT advance this.seq from accepted.seq. The server sends the snapshot
+    // and replayed events *after* auth.accepted. If the socket drops between
+    // accepted and those events being consumed, the next reconnect's
+    // auth.response could claim lastSeq = server.seq and skip replay, leaving
+    // local state stale. seq advances only when an event/snapshot has actually
+    // been consumed by this client.
+
+    // Start presence sweep
+    this.startPresenceSweep();
+
+    // Reset reconnect state
+    this.reconnectAttempt = 0;
+
+    // Resolve pending connect
+    if (this.pendingConnect) {
+      clearTimeout(this.pendingConnect.timeoutHandle);
+      const { resolve } = this.pendingConnect;
+      this.pendingConnect = null;
+      // Keep the invariant literally true: clear the promise ref synchronously
+      // alongside pendingConnect rather than waiting for the microtask cleanup.
+      this.pendingConnectPromise = null;
+      resolve();
+    }
+
+    this.emitState();
+  }
+
+  private async handleRoomSnapshot(
+    msg: Extract<RoomTransportMessage, { type: 'room.snapshot' }>,
+    gen: number,
+  ): Promise<void> {
+    // Pre-decrypt socket-generation guard: drop snapshots that arrived on a
+    // now-retired socket BEFORE spending decrypt time on them. Mirrors the
+    // pre-decrypt check in handleRoomEvent/handleRoomPresence.
+    if (gen !== this.socketGeneration) return;
+    try {
+      const snapshot = await decryptSnapshot(this.eventKey, msg.snapshotCiphertext);
+      // Post-decrypt re-check: if reconnect rolled the socket while we were
+      // decrypting, this snapshot belongs to the retired session and must
+      // not mutate current state or the newer socket's baseline.
+      if (gen !== this.socketGeneration) return;
+      // Encryption only proves the sender held the room key. Validate shape
+      // before replacing state — a malformed snapshot would corrupt the view.
+      if (!isRoomSnapshot(snapshot)) {
+        // Snapshot is the highest-impact inbound message (it establishes or
+        // replaces the entire baseline). Surface failures via lastError +
+        // state so hook consumers subscribed only to `state` can react.
+        // Also mark the baseline invalid so subsequent room.events cannot
+        // apply on top of stale local state until a valid snapshot lands.
+        this.baselineInvalid = true;
+        this.setLastError('snapshot_malformed', 'Snapshot payload failed shape validation', 'snapshot');
+        this.emitter.emit('error', { code: 'snapshot_malformed', message: 'Snapshot payload failed shape validation' });
+        this.emitState();
+        return;
+      }
+      // Valid snapshot — baseline is authoritative again.
+      this.baselineInvalid = false;
+      this.planMarkdown = snapshot.planMarkdown;
+      this.annotations.clear();
+      // Defensive clone on store: the decrypted snapshot payload is untrusted
+      // shape-wise AND is a freshly-allocated JSON object that we might also
+      // emit to external subscribers; cloning here guarantees later mutations
+      // to the emitted snapshot cannot reach back into our internal map.
+      for (const ann of snapshot.annotations) {
+        this.annotations.set(ann.id, cloneRoomAnnotation(ann));
+      }
+      // A received snapshot is the authoritative baseline — set seq to
+      // msg.snapshotSeq unconditionally. If we only raised seq when
+      // snapshotSeq > this.seq, a client whose local seq was somehow ahead
+      // (e.g. a corrupted reconnect state or the server's "future claim"
+      // fallback) would keep sending that bad lastSeq on subsequent
+      // reconnects and never self-repair.
+      this.seq = msg.snapshotSeq;
+      // Emit a cloned snapshot so direct event subscribers can mutate freely.
+      this.emitter.emit('snapshot', {
+        ...snapshot,
+        annotations: snapshot.annotations.map(cloneRoomAnnotation),
+      });
+      this.emitState();
+    } catch (err) {
+      // Socket-generation guard: decrypt failed on a stale socket; do not
+      // mark the NEW session's baseline invalid.
+      if (gen !== this.socketGeneration) return;
+      // Baseline establishment failed — block event application until the
+      // next valid snapshot or reconnect clears the flag.
+      this.baselineInvalid = true;
+      const payload = { code: 'snapshot_decrypt_failed', message: String(err) };
+      this.setLastError(payload.code, payload.message, 'snapshot');
+      this.emitter.emit('error', payload);
+      this.emitState();
+    }
+  }
+
+  private async handleRoomEvent(
+    msg: Extract<RoomTransportMessage, { type: 'room.event' }>,
+    gen: number,
+  ): Promise<void> {
+    const { seq, envelope } = msg;
+
+    // Socket-generation guard: drop events that arrived on a now-retired
+    // socket. This must run BEFORE the stale-seq check because a retired
+    // socket might deliver seq values that look valid relative to the
+    // current socket's (possibly-different) seq.
+    if (gen !== this.socketGeneration) return;
+
+    // Stale-event guard: drop anything at-or-below our consumed seq. This
+    // can happen on reconnect replay if the server re-sends events we
+    // already consumed, or on a dup from a server-side hiccup. We must not
+    // decrypt, validate, apply, OR emit — doing any of those would lie
+    // about local state having changed.
+    if (seq <= this.seq) {
+      return;
+    }
+
+    // Baseline-invalid guard: a prior snapshot decrypt/shape failure left
+    // local state in an unknown relation to the server. Applying events on
+    // top of that is silent divergence. Consume the seq for forward progress
+    // and keep surfacing the (already-set) snapshot error via state, but do
+    // not apply.
+    if (this.baselineInvalid) {
+      this.seq = seq;
+      this.emitState();
+      return;
+    }
+
+    // V1: no optimistic apply and no echo dedup. Every room.event (including
+    // our own echoes) is applied here. The server's event log is the authority;
+    // replay after reconnect also funnels through this path.
+    try {
+      const decrypted = await decryptEventPayload(this.eventKey, envelope.ciphertext);
+      // Post-decrypt generation guard — reconnect could have rolled the
+      // socket while we were decrypting.
+      if (gen !== this.socketGeneration) return;
+      // Encryption only proves the sender had the room key. Reject malformed
+      // ops (e.g. annotation.add with null id/type fields) before they hit
+      // applyAnnotationEvent and corrupt state.
+      // Narrow validator: event-channel ops only. presence.update must NOT
+      // be accepted here — it would otherwise land in the durable event log.
+      if (!isRoomEventClientOp(decrypted)) {
+        const err = {
+          code: 'event_malformed',
+          message: `Malformed event op from clientId=${envelope.clientId} at seq=${seq}`,
+        };
+        this.setLastError(err.code, err.message, 'event');  // inbound event malformed
+        this.emitter.emit('error', err);
+        // V1 forward-progress policy: the server has already sequenced and
+        // persisted this event, so NOT advancing this.seq would cause the
+        // same malformed event to replay on every reconnect (and block all
+        // subsequent valid events 43+). Advance seq, apply nothing, emit the
+        // error. This makes a single malformed event lossy but keeps the
+        // replay stream unblocked, and prevents a malicious participant from
+        // poisoning the client's replay state.
+        this.seq = seq;
+        this.emitState();
+        return;
+      }
+      const op = decrypted;
+      const event = this.clientOpToServerEvent(op);
+      const result = applyAnnotationEvent(this.annotations, event);
+      // Consume the seq regardless — forward-progress (same rationale as the
+      // malformed-op branch above).
+      this.seq = seq;
+      if (!result.applied) {
+        // Op was shape-valid but produced an invalid final state (e.g. an
+        // annotation.update merge that violates the cross-field invariants).
+        // Surface as an error on state; do NOT emit `event` — listeners must
+        // not see a notification for an op that didn't actually change state.
+        const err = {
+          code: 'event_rejected_by_reducer',
+          message: `Event at seq=${seq} rejected by reducer: ${result.reason ?? 'unknown'}`,
+        };
+        this.setLastError(err.code, err.message, 'event');  // inbound event reducer-rejected
+        this.emitter.emit('error', err);
+        this.emitState();
+        return;
+      }
+      // Emit a cloned event so direct event subscribers can mutate freely
+      // without reaching into our internal annotations map.
+      this.emitter.emit('event', cloneRoomServerEvent(event));
+      this.emitState();
+    } catch (err) {
+      // Post-decrypt generation guard — don't mutate newer socket's state
+      // from a stale decrypt failure.
+      if (gen !== this.socketGeneration) return;
+      const payload = { code: 'event_decrypt_failed', message: String(err) };
+      this.setLastError(payload.code, payload.message, 'event');  // inbound event decrypt failed
+      this.emitter.emit('error', payload);
+      // Same forward-progress policy as malformed events — the server has
+      // already sequenced this event, so we must advance seq or the same
+      // undecryptable payload will replay on every reconnect indefinitely.
+      // Stale-seq guard at the top of this method already ruled out seq <= this.seq,
+      // so unconditional assignment here is safe.
+      this.seq = seq;
+      this.emitState();
+    }
+  }
+
+  private async handleRoomPresence(
+    msg: Extract<RoomTransportMessage, { type: 'room.presence' }>,
+    gen: number,
+  ): Promise<void> {
+    // Pre-decrypt generation guard: skip presence from retired sockets.
+    if (gen !== this.socketGeneration) return;
+    try {
+      const presence = await decryptPresence(this.presenceKey, msg.envelope.ciphertext);
+      // Post-decrypt generation guard — reconnect could have rolled during decrypt.
+      if (gen !== this.socketGeneration) return;
+      // Encryption only proves the sender has the room key. Validate the shape
+      // before letting it into client state to prevent malformed-presence attacks
+      // from crashing UI render code.
+      if (!isPresenceState(presence)) {
+        const err = {
+          code: 'presence_malformed',
+          message: `Malformed presence from clientId=${msg.envelope.clientId}`,
+        };
+        this.setLastError(err.code, err.message, 'presence');
+        this.emitter.emit('error', err);
+        this.emitState();
+        return;
+      }
+      // Store a clone so subsequent mutations to the decrypted/emitted object
+      // can't reach back into our internal remotePresence map.
+      this.remotePresence.set(msg.envelope.clientId, {
+        presence: clonePresenceState(presence),
+        lastSeen: Date.now(),
+      });
+      this.emitter.emit('presence', {
+        clientId: msg.envelope.clientId,
+        presence: clonePresenceState(presence),
+      });
+      this.emitState();
+    } catch (err) {
+      // Post-decrypt generation guard.
+      if (gen !== this.socketGeneration) return;
+      const payload = { code: 'presence_decrypt_failed', message: String(err) };
+      this.setLastError(payload.code, payload.message, 'presence');
+      this.emitter.emit('error', payload);
+      this.emitState();
+    }
+  }
+
+  private handleRoomError(
+    msg: Extract<RoomTransportMessage, { type: 'room.error' }>,
+    gen: number,
+  ): void {
+    // Drop errors from retired sockets — they reference operations on a
+    // session the client has already moved past.
+    if (gen !== this.socketGeneration) return;
+    // Classify scope from the server code. `admin` errors are consumed
+    // by pendingAdmin handling; everything else from the server is a
+    // rejection of a mutation WE sent (the server only returns room.error
+    // to the originator of the rejected op). The annotation controller
+    // uses `'mutation'` to transition pending → failed.
+    const scope: 'mutation' | 'admin' = ADMIN_SCOPED_ERROR_CODES.has(msg.code) ? 'admin' : 'mutation';
+    this.setLastError(msg.code, msg.message, scope);
+    this.emitter.emit('error', { code: msg.code, message: msg.message });
+
+    // Reject pending admin ONLY for admin-scoped error codes. Event-channel
+    // errors like `validation_error` can land while an admin command is in
+    // flight (e.g. a concurrent annotation op hit a validation failure just
+    // after the admin command was accepted); rejecting pendingAdmin on those
+    // would fail a successful admin command whose terminal status broadcast
+    // is still in-flight. Admin-scoped codes are the ones the server emits
+    // exclusively from the admin command path.
+    if (this.pendingAdmin && scope === 'admin') {
+      const pending = this.pendingAdmin;
+      clearTimeout(pending.timeoutHandle);
+      this.pendingAdmin = null;
+      pending.reject(new AdminRejectedError(msg.code, msg.message));
+    }
+
+    this.emitState();
+  }
+
+  // ---------------------------------------------------------------------------
+  // Internal: sending ops
+  // ---------------------------------------------------------------------------
+
+  private sendOp(op: RoomEventClientOp): Promise<void> {
+    // Synchronous precondition check — fail fast before enqueuing.
+    // `assertConnected` throws if status isn't 'authenticated'; a terminal
+    // close (room-unavailable) flips status to 'closed' in handleSocketClose,
+    // so this catches rooms that have been purged as well.
+    this.assertConnected();
+    // Chain onto the outbound queue so concurrent calls send in CALL order,
+    // not encryption-completion order. Without this, a user adding then
+    // removing an annotation in quick succession could see the remove land
+    // first (empty payloads encrypt faster), leaving the annotation that
+    // the remove was meant to delete.
+    const next = this.outboundEventQueue.then(async () => {
+      // Re-check liveness inside the queue — a disconnect or terminal close
+      // could have landed while we were waiting our turn.
+      this.assertConnected();
+
+      const opId = generateOpId();
+      const ciphertext = await encryptEventOp(this.eventKey, op);
+
+      // Recheck socket after async encryption. A terminal close during the
+      // encrypt would otherwise let us send an op the server will never
+      // receive — the user would see the mutation resolve as "sent" and
+      // only learn from async lastError.
+      const ws = this.ws;
+      if (this.status !== 'authenticated' || !ws) {
+        throw new NotConnectedError();
+      }
+
+      const envelope: ServerEnvelope = {
+        clientId: this.clientId,
+        opId,
+        channel: 'event',
+        ciphertext,
+      };
+
+      // V1 policy: server echo is authoritative. We do NOT apply annotation
+      // ops optimistically. See class header for full rationale.
+      ws.send(JSON.stringify(envelope));
+    });
+    // Keep the chain alive even if this op rejects — later ops must still
+    // serialize. The caller's returned promise surfaces the rejection.
+    this.outboundEventQueue = next.catch(() => { /* swallow; caller sees it */ });
+    return next;
+  }
+
+  // Event-channel ops only. Presence is a separate channel with its own
+  // encryption and dispatch; it never flows through this converter.
+  private clientOpToServerEvent(op: RoomEventClientOp): RoomServerEvent {
+    switch (op.type) {
+      case 'annotation.add':
+        return { type: 'annotation.add', annotations: op.annotations };
+      case 'annotation.update':
+        return { type: 'annotation.update', id: op.id, patch: op.patch };
+      case 'annotation.remove':
+        return { type: 'annotation.remove', ids: op.ids };
+      case 'annotation.clear':
+        return { type: 'annotation.clear', source: op.source };
+    }
+  }
+
+  // ---------------------------------------------------------------------------
+  // Internal: admin flow
+  // ---------------------------------------------------------------------------
+
+  private async runAdminCommand(command: AdminCommand): Promise<void> {
+    this.assertConnected();
+    if (this.pendingAdmin) {
+      throw new Error('Another admin command is pending');
+    }
+
+    return new Promise<void>((resolve, reject) => {
+      const ws = this.ws;
+      if (!ws) {
+        reject(new NotConnectedError());
+        return;
+      }
+
+      const timeoutHandle = setTimeout(() => {
+        if (this.pendingAdmin) {
+          this.pendingAdmin = null;
+          reject(new AdminTimeoutError());
+        }
+      }, ADMIN_COMMAND_TIMEOUT_MS);
+
+      this.pendingAdmin = { command, resolve, reject, timeoutHandle };
+
+      // Request admin challenge. If send() throws synchronously, don't leave
+      // pendingAdmin stuck until timeout — clear it and propagate the error.
+      try {
+        ws.send(JSON.stringify({ type: 'admin.challenge.request' }));
+      } catch (err) {
+        clearTimeout(timeoutHandle);
+        this.pendingAdmin = null;
+        reject(err instanceof Error ? err : new Error(String(err)));
+      }
+    });
+  }
+
+  private async handleAdminChallenge(challenge: AdminChallenge): Promise<void> {
+    const pending = this.pendingAdmin;
+    if (!pending || !this.adminVerifier) return;
+
+    // Capture socket and identity now. Mirror of handleAuthChallenge: if a
+    // rotation happens mid-await, the stale admin proof (bound to the old
+    // clientId) must not be sent on the replacement socket.
+    const ws = this.ws;
+    const clientId = this.clientId;
+
+    try {
+      const proof = await computeAdminProof(
+        this.adminVerifier,
+        this.roomId,
+        clientId,
+        challenge.challengeId,
+        challenge.nonce,
+        pending.command,
+      );
+      if (!ws || this.ws !== ws || this.clientId !== clientId || this.pendingAdmin !== pending) {
+        return;  // socket/identity/pending rotated during async proof; drop stale response
+      }
+      ws.send(JSON.stringify({
+        type: 'admin.command',
+        challengeId: challenge.challengeId,
+        clientId,
+        command: pending.command,
+        adminProof: proof,
+      }));
+      // Promise stays pending — resolves when the server closes the socket
+      // with WS_CLOSE_ROOM_UNAVAILABLE (handled in handleSocketClose).
+    } catch (err) {
+      // Stale-identity drop: mirror the success-path guard. If the socket,
+      // identity, or pending-admin slot rotated during the failed proof, the
+      // current pendingAdmin belongs to a NEW admin command; do not clear it
+      // and do not reject — the original caller's `pending` promise still
+      // gets rejected below so nothing is leaked, but current client state
+      // stays untouched.
+      if (this.userDisconnected || !ws || this.ws !== ws || this.clientId !== clientId || this.pendingAdmin !== pending) {
+        // Still clear the ORIGINAL pending's timeout so it doesn't leak, even
+        // though we're not touching the current pendingAdmin slot (which
+        // belongs to a NEW command after the rotation).
+        clearTimeout(pending.timeoutHandle);
+        pending.reject(err instanceof Error ? err : new Error(String(err)));
+        return;
+      }
+      clearTimeout(pending.timeoutHandle);
+      this.pendingAdmin = null;
+      pending.reject(err instanceof Error ? err : new Error(String(err)));
+    }
+  }
+
+  // ---------------------------------------------------------------------------
+  // Internal: helpers
+  // ---------------------------------------------------------------------------
+
+  private buildWebSocketUrl(): string {
+    const base = new URL(this.baseUrl);
+    const wsScheme = base.protocol === 'https:' ? 'wss:' : 'ws:';
+    return `${wsScheme}//${base.host}/ws/${this.roomId}`;
+  }
+
+  private assertConnected(): void {
+    if (this.status !== 'authenticated' || !this.ws) {
+      throw new NotConnectedError();
+    }
+  }
+
+  private setStatus(status: ConnectionStatus): void {
+    if (this.status === status) return;
+    this.status = status;
+    this.emitter.emit('status', status);
+    // Also emit state so consumers subscribed only to `state` (e.g. useCollabRoom)
+    // see connecting/authenticating/reconnecting transitions.
+    this.emitter.emit('state', this.buildState());
+  }
+
+  private buildState(): CollabRoomState {
+    // Clone every value exposed through getState()/state events. V1's
+    // server-authoritative model means local state mutations must come ONLY
+    // from decrypted server events; if a consumer (UI code) accidentally
+    // mutated a returned annotation or cursor, they'd corrupt local state
+    // with no server echo. Returning fresh clones makes getState() an
+    // isolated snapshot — it is not frozen, but mutation by the caller
+    // does not reach back into the client's internal state.
+    const presence: Record<string, PresenceState> = {};
+    for (const [clientId, entry] of this.remotePresence) {
+      presence[clientId] = clonePresenceState(entry.presence);
+    }
+    return {
+      connectionStatus: this.status,
+      roomUnavailable: this.roomUnavailable,
+      roomId: this.roomId,
+      clientId: this.clientId,
+      seq: this.seq,
+      planMarkdown: this.planMarkdown,
+      annotations: annotationsToArray(this.annotations).map(cloneRoomAnnotation),
+      remotePresence: presence,
+      hasAdminCapability: this.adminKey !== null,
+      lastError: this.lastError ? { ...this.lastError } : null,
+      lastErrorId: this.lastErrorId,
+    };
+  }
+
+  private emitState(): void {
+    this.emitter.emit('state', this.buildState());
+  }
+
+  private startPresenceSweep(): void {
+    if (this.presenceSweepTimer) return;
+    this.presenceSweepTimer = setInterval(() => {
+      const now = Date.now();
+      let pruned = false;
+      for (const [clientId, entry] of this.remotePresence) {
+        if (now - entry.lastSeen > this.presenceTtlMs) {
+          this.remotePresence.delete(clientId);
+          pruned = true;
+        }
+      }
+      if (pruned) this.emitState();
+    }, this.presenceSweepIntervalMs);
+  }
+
+  private stopPresenceSweep(): void {
+    if (this.presenceSweepTimer) {
+      clearInterval(this.presenceSweepTimer);
+      this.presenceSweepTimer = null;
+    }
+  }
+
+  private clearReconnectTimer(): void {
+    if (this.reconnectTimer) {
+      clearTimeout(this.reconnectTimer);
+      this.reconnectTimer = null;
+    }
+  }
+
+  private clearReconnectHandshakeTimer(): void {
+    if (this.reconnectHandshakeTimer) {
+      clearTimeout(this.reconnectHandshakeTimer);
+      this.reconnectHandshakeTimer = null;
+    }
+  }
+
+  /**
+   * Chain an async task on the serialized message queue.
+   *
+   * Two-arg .then(task, task) is intentional: if the previous queue entry
+   * rejected, we still want the NEXT task to run (forward progress — we're
+   * serializing for ordering, not coupling failures). The trailing .catch
+   * then swallows any rejection from the task itself so one failed handler
+   * doesn't permanently poison the chain with an unhandled rejection.
+   * Individual task errors are already surfaced via `error` events inside
+   * the handlers themselves.
+   */
+  private enqueue(task: () => Promise<void>): void {
+    this.messageQueue = this.messageQueue.then(task, task).catch(() => { /* swallow */ });
+  }
+}
diff --git a/packages/shared/collab/client-runtime/create-room.test.ts b/packages/shared/collab/client-runtime/create-room.test.ts
new file mode 100644
index 000000000..2dec3079c
--- /dev/null
+++ b/packages/shared/collab/client-runtime/create-room.test.ts
@@ -0,0 +1,92 @@
+/**
+ * Unit tests for createRoom() — focuses on the timeout + AbortSignal behavior.
+ * Happy-path round-trips are covered by integration.test.ts against wrangler dev.
+ */
+
+import { describe, expect, test } from 'bun:test';
+import { createRoom, CreateRoomError } from './create-room';
+import type { CollabRoomUser } from './types';
+import type { RoomSnapshot } from '../types';
+
+const USER: CollabRoomUser = { id: 'u1', name: 'alice', color: '#f00' };
+const SNAPSHOT: RoomSnapshot = { versionId: 'v1', planMarkdown: '# Plan', annotations: [] };
+
+// A fetch impl that never resolves until its signal aborts. Mirrors the real
+// AbortSignal wiring: when aborted, reject with an AbortError-like error.
+function hangingFetch(): typeof fetch {
+  return ((_input: RequestInfo | URL, init?: RequestInit) => {
+    return new Promise<Response>((_resolve, reject) => {
+      const signal = init?.signal;
+      if (!signal) return;  // without a signal, hang forever (caller bug)
+      if (signal.aborted) {
+        reject(signal.reason ?? new Error('aborted'));
+        return;
+      }
+      signal.addEventListener('abort', () => {
+        reject(signal.reason ?? new Error('aborted'));
+      }, { once: true });
+    });
+  }) as typeof fetch;
+}
+
+describe('createRoom() — timeout and AbortSignal', () => {
+  test('rejects with CreateRoomError when the server does not respond within timeoutMs', async () => {
+    const start = Date.now();
+    const promise = createRoom({
+      baseUrl: 'http://localhost:9',
+      initialSnapshot: SNAPSHOT,
+      user: USER,
+      fetchImpl: hangingFetch(),
+      timeoutMs: 100,
+    });
+
+    // Timeout must fire — no stuck promise. Error message mentions 'timed out'
+    // so callers can distinguish it from a transport failure.
+    await expect(promise).rejects.toBeInstanceOf(CreateRoomError);
+    await expect(promise).rejects.toMatchObject({ message: expect.stringContaining('timed out') });
+
+    const elapsed = Date.now() - start;
+    expect(elapsed).toBeGreaterThanOrEqual(90);    // near timeoutMs
+    expect(elapsed).toBeLessThan(1000);            // definitely not hanging
+  });
+
+  test('rejects immediately when the external signal is already aborted', async () => {
+    const controller = new AbortController();
+    controller.abort();  // pre-aborted
+
+    const start = Date.now();
+    const promise = createRoom({
+      baseUrl: 'http://localhost:9',
+      initialSnapshot: SNAPSHOT,
+      user: USER,
+      fetchImpl: hangingFetch(),
+      signal: controller.signal,
+      timeoutMs: 60_000,  // high — signal must short-circuit well before this
+    });
+
+    await expect(promise).rejects.toBeInstanceOf(CreateRoomError);
+    const elapsed = Date.now() - start;
+    expect(elapsed).toBeLessThan(100);  // synchronous early rejection
+  });
+
+  test('rejects when the external signal aborts mid-fetch', async () => {
+    const controller = new AbortController();
+    const start = Date.now();
+    const promise = createRoom({
+      baseUrl: 'http://localhost:9',
+      initialSnapshot: SNAPSHOT,
+      user: USER,
+      fetchImpl: hangingFetch(),
+      signal: controller.signal,
+      timeoutMs: 60_000,
+    });
+
+    // Abort after a short delay — must interrupt the hanging fetch.
+    setTimeout(() => controller.abort(new Error('user cancelled')), 50);
+
+    await expect(promise).rejects.toBeInstanceOf(CreateRoomError);
+    const elapsed = Date.now() - start;
+    expect(elapsed).toBeGreaterThanOrEqual(40);
+    expect(elapsed).toBeLessThan(1000);
+  });
+});
diff --git a/packages/shared/collab/client-runtime/create-room.ts b/packages/shared/collab/client-runtime/create-room.ts
new file mode 100644
index 000000000..f3dada8d5
--- /dev/null
+++ b/packages/shared/collab/client-runtime/create-room.ts
@@ -0,0 +1,130 @@
+/**
+ * createRoom — HTTP helper that creates a room on room-service and returns
+ * a ready-to-connect CollabRoomClient plus the URLs and raw secrets.
+ *
+ * Client-side only. Runs in browsers, Bun, and direct-agent environments.
+ */
+
+import {
+  deriveRoomKeys,
+  deriveAdminKey,
+  computeRoomVerifier,
+  computeAdminVerifier,
+  encryptSnapshot,
+} from '../crypto';
+import { generateRoomId, generateRoomSecret, generateAdminSecret } from '../ids';
+import { isRoomSnapshot } from '../types';
+import { buildRoomJoinUrl, buildAdminRoomUrl } from '../url';
+import type { CreateRoomRequest } from '../types';
+import { CollabRoomClient, InvalidOutboundPayloadError } from './client';
+import type { CreateRoomOptions, CreateRoomResult } from './types';
+
+export class CreateRoomError extends Error {
+  constructor(public status: number, message: string) {
+    super(message);
+    this.name = 'CreateRoomError';
+  }
+}
+
+export async function createRoom(options: CreateRoomOptions): Promise<CreateRoomResult> {
+  // Validate the initial snapshot BEFORE any network/crypto work. A UI bug
+  // that passes a malformed snapshot should fail immediately and clearly
+  // instead of after a fetch round-trip the server will reject.
+  if (!isRoomSnapshot(options.initialSnapshot)) {
+    throw new InvalidOutboundPayloadError('Invalid initialSnapshot payload');
+  }
+
+  const roomId = generateRoomId();
+  const roomSecret = generateRoomSecret();
+  const adminSecret = generateAdminSecret();
+
+  const { authKey, eventKey, presenceKey } = await deriveRoomKeys(roomSecret);
+  const adminKey = await deriveAdminKey(adminSecret);
+  const roomVerifier = await computeRoomVerifier(authKey, roomId);
+  const adminVerifier = await computeAdminVerifier(adminKey, roomId);
+  const initialSnapshotCiphertext = await encryptSnapshot(eventKey, options.initialSnapshot);
+
+  const body: CreateRoomRequest = {
+    roomId,
+    roomVerifier,
+    adminVerifier,
+    initialSnapshotCiphertext,
+    expiresInDays: options.expiresInDays,
+  };
+
+  const fetchFn = options.fetchImpl ?? fetch;
+  // new URL() handles trailing slashes correctly regardless of caller hygiene.
+  const apiUrl = new URL('/api/rooms', options.baseUrl).toString();
+
+  // Timeout + external-signal cancellation. Without this, a server hang or
+  // a dropped connection would leave createRoom() pending indefinitely, and
+  // the caller has no way to bail. Compose the two signals via AbortController
+  // so either source aborts the fetch.
+  const timeoutMs = options.timeoutMs ?? 10_000;
+  const controller = new AbortController();
+  const timeoutId = setTimeout(() => controller.abort(new CreateRoomError(0, 'createRoom timed out')), timeoutMs);
+  const externalAbort = () => controller.abort(options.signal?.reason);
+  if (options.signal) {
+    if (options.signal.aborted) {
+      clearTimeout(timeoutId);
+      throw new CreateRoomError(0, 'createRoom aborted before start');
+    }
+    options.signal.addEventListener('abort', externalAbort, { once: true });
+  }
+
+  let res: Response;
+  try {
+    res = await fetchFn(apiUrl, {
+      method: 'POST',
+      headers: { 'Content-Type': 'application/json' },
+      body: JSON.stringify(body),
+      signal: controller.signal,
+    });
+  } catch (err) {
+    // Distinguish timeout / external abort / transport failure for the caller.
+    if (controller.signal.aborted) {
+      const reason = controller.signal.reason;
+      throw reason instanceof CreateRoomError
+        ? reason
+        : new CreateRoomError(0, `createRoom aborted: ${String(reason ?? err)}`);
+    }
+    throw new CreateRoomError(0, `createRoom fetch failed: ${String(err)}`);
+  } finally {
+    clearTimeout(timeoutId);
+    options.signal?.removeEventListener('abort', externalAbort);
+  }
+
+  if (res.status !== 201) {
+    let message = `createRoom failed with status ${res.status}`;
+    try {
+      const errBody = await res.json() as { error?: string };
+      if (errBody.error) message = errBody.error;
+    } catch { /* ignore */ }
+    throw new CreateRoomError(res.status, message);
+  }
+
+  // Success. Do NOT parse the response body — we already have everything
+  // needed (roomId, secrets, locally-built URLs, derived keys). Parsing an
+  // empty, malformed, or future-format body could strand the user from a
+  // room that already exists and whose only admin secret lives in memory.
+  // Protocol neatness is less important than not losing recovery material.
+
+  const joinUrl = buildRoomJoinUrl(roomId, roomSecret, options.baseUrl);
+  const adminUrl = buildAdminRoomUrl(roomId, roomSecret, adminSecret, options.baseUrl);
+
+  const client = new CollabRoomClient({
+    roomId,
+    baseUrl: options.baseUrl,
+    eventKey,
+    presenceKey,
+    adminKey,
+    roomVerifier,
+    adminVerifier,
+    user: options.user,
+    initialSnapshot: options.initialSnapshot,
+    webSocketImpl: options.webSocketImpl,
+    reconnect: options.reconnect,
+  });
+
+  return { roomId, roomSecret, adminSecret, joinUrl, adminUrl, client };
+}
diff --git a/packages/shared/collab/client-runtime/emitter.test.ts b/packages/shared/collab/client-runtime/emitter.test.ts
new file mode 100644
index 000000000..17d57ffb8
--- /dev/null
+++ b/packages/shared/collab/client-runtime/emitter.test.ts
@@ -0,0 +1,77 @@
+import { describe, expect, test, mock } from 'bun:test';
+import { TypedEventEmitter } from './emitter';
+
+interface Events {
+  foo: number;
+  bar: { message: string };
+}
+
+describe('TypedEventEmitter', () => {
+  test('emits to subscribed listeners', () => {
+    const e = new TypedEventEmitter<Events>();
+    const fn = mock(() => {});
+    e.on('foo', fn);
+    e.emit('foo', 42);
+    expect(fn).toHaveBeenCalledWith(42);
+  });
+
+  test('unsubscribe function removes listener', () => {
+    const e = new TypedEventEmitter<Events>();
+    const fn = mock(() => {});
+    const unsub = e.on('foo', fn);
+    e.emit('foo', 1);
+    unsub();
+    e.emit('foo', 2);
+    expect(fn).toHaveBeenCalledTimes(1);
+  });
+
+  test('off removes a specific listener', () => {
+    const e = new TypedEventEmitter<Events>();
+    const fn1 = mock(() => {});
+    const fn2 = mock(() => {});
+    e.on('foo', fn1);
+    e.on('foo', fn2);
+    e.off('foo', fn1);
+    e.emit('foo', 1);
+    expect(fn1).not.toHaveBeenCalled();
+    expect(fn2).toHaveBeenCalled();
+  });
+
+  test('isolates listener errors', () => {
+    const e = new TypedEventEmitter<Events>();
+    const fn1 = mock(() => { throw new Error('boom'); });
+    const fn2 = mock(() => {});
+    e.on('foo', fn1);
+    e.on('foo', fn2);
+    // Should not throw
+    e.emit('foo', 1);
+    expect(fn2).toHaveBeenCalled();
+  });
+
+  test('removeAll clears listeners', () => {
+    const e = new TypedEventEmitter<Events>();
+    const fn = mock(() => {});
+    e.on('foo', fn);
+    e.removeAll();
+    e.emit('foo', 1);
+    expect(fn).not.toHaveBeenCalled();
+  });
+
+  test('emitting with no listeners is safe', () => {
+    const e = new TypedEventEmitter<Events>();
+    // Should not throw
+    e.emit('foo', 1);
+  });
+
+  test('supports multiple event types', () => {
+    const e = new TypedEventEmitter<Events>();
+    const fooFn = mock(() => {});
+    const barFn = mock(() => {});
+    e.on('foo', fooFn);
+    e.on('bar', barFn);
+    e.emit('foo', 1);
+    e.emit('bar', { message: 'hi' });
+    expect(fooFn).toHaveBeenCalledWith(1);
+    expect(barFn).toHaveBeenCalledWith({ message: 'hi' });
+  });
+});
diff --git a/packages/shared/collab/client-runtime/emitter.ts b/packages/shared/collab/client-runtime/emitter.ts
new file mode 100644
index 000000000..9ea7da13a
--- /dev/null
+++ b/packages/shared/collab/client-runtime/emitter.ts
@@ -0,0 +1,50 @@
+/**
+ * Tiny typed event emitter for the collab room client runtime.
+ *
+ * Returns an unsubscribe function from `on()` for clean React useEffect teardown.
+ * Wraps listener calls in try/catch so one throwing listener doesn't break others.
+ */
+
+export class TypedEventEmitter<M extends Record<string, unknown>> {
+  private listeners: { [K in keyof M]?: Set<(payload: M[K]) => void> } = {};
+
+  /** Subscribe to an event. Returns an unsubscribe function. */
+  on<K extends keyof M>(name: K, fn: (payload: M[K]) => void): () => void {
+    let set = this.listeners[name];
+    if (!set) {
+      set = new Set();
+      this.listeners[name] = set;
+    }
+    set.add(fn);
+    return () => this.off(name, fn);
+  }
+
+  /** Remove a specific listener. */
+  off<K extends keyof M>(name: K, fn: (payload: M[K]) => void): void {
+    this.listeners[name]?.delete(fn);
+  }
+
+  /** Emit an event. Listener errors are isolated. */
+  emit<K extends keyof M>(name: K, payload: M[K]): void {
+    const set = this.listeners[name];
+    if (!set) return;
+    // Snapshot listeners BEFORE iterating so listeners added during emission
+    // don't fire in the same pass (surprising semantics) and listeners
+    // removed during emission don't throw the iterator.
+    const snapshot = [...set];
+    for (const fn of snapshot) {
+      try {
+        fn(payload);
+      } catch (err) {
+        // Isolate listener errors so one bad listener doesn't break others.
+        // Log but don't re-throw.
+        console.error(`[TypedEventEmitter] listener for "${String(name)}" threw:`, err);
+      }
+    }
+  }
+
+  /** Remove all listeners (useful for teardown). */
+  removeAll(): void {
+    this.listeners = {};
+  }
+}
diff --git a/packages/shared/collab/client-runtime/index.ts b/packages/shared/collab/client-runtime/index.ts
new file mode 100644
index 000000000..f0c89b962
--- /dev/null
+++ b/packages/shared/collab/client-runtime/index.ts
@@ -0,0 +1,20 @@
+/**
+ * Client runtime barrel. Re-exports public API for browser + direct-agent clients.
+ *
+ * Consumers typically import from `@plannotator/shared/collab/client`, which
+ * re-exports this barrel plus base types.
+ */
+
+export * from './client';
+export * from './create-room';
+export * from './join-room';
+export type {
+  ConnectionStatus,
+  CollabRoomUser,
+  CollabRoomState,
+  CollabRoomEvents,
+  CreateRoomOptions,
+  CreateRoomResult,
+  JoinRoomOptions,
+  ReconnectOptions,
+} from './types';
diff --git a/packages/shared/collab/client-runtime/integration.test.ts b/packages/shared/collab/client-runtime/integration.test.ts
new file mode 100644
index 000000000..17b3c7816
--- /dev/null
+++ b/packages/shared/collab/client-runtime/integration.test.ts
@@ -0,0 +1,222 @@
+/**
+ * Integration tests for the collab client runtime against a live wrangler dev Worker.
+ *
+ * Gated by SMOKE_BASE_URL env var. Skipped when unset.
+ *
+ * Usage:
+ *   cd apps/room-service && bunx wrangler dev
+ *   # In another terminal:
+ *   SMOKE_BASE_URL=http://localhost:8787 bun test packages/shared/collab/client-runtime/integration.test.ts
+ */
+
+import { describe, expect, test } from 'bun:test';
+import { createRoom, joinRoom } from './index';
+import type { CollabRoomClient } from './client';
+import type { RoomSnapshot } from '../types';
+
+const BASE_URL = process.env.SMOKE_BASE_URL;
+const shouldRun = !!BASE_URL;
+
+const USER_A = { id: 'user-a', name: 'alice', color: '#f00' };
+const USER_B = { id: 'user-b', name: 'bob', color: '#0f0' };
+
+const describeFn = shouldRun ? describe : describe.skip;
+
+function safeDisconnect(client: CollabRoomClient | null): void {
+  if (!client) return;
+  try { client.disconnect(); } catch { /* ignore — best-effort cleanup */ }
+}
+
+describeFn('CollabRoomClient integration (against wrangler dev)', () => {
+  test('createRoom, two clients exchange event + presence, admin delete', async () => {
+    let creator: CollabRoomClient | null = null;
+    let participant: CollabRoomClient | null = null;
+    let adminClient: CollabRoomClient | null = null;
+
+    try {
+      const snapshot: RoomSnapshot = {
+        versionId: 'v1',
+        planMarkdown: '# Integration test',
+        annotations: [],
+      };
+
+      // Creator creates the room and connects
+      const created = await createRoom({
+        baseUrl: BASE_URL!,
+        initialSnapshot: snapshot,
+        user: USER_A,
+      });
+      creator = created.client;
+      const { joinUrl, adminUrl } = created;
+      await creator.connect();
+      expect(creator.getState().connectionStatus).toBe('authenticated');
+
+      // Second participant joins via joinUrl
+      participant = await joinRoom({
+        url: joinUrl,
+        user: USER_B,
+        autoConnect: true,
+      });
+      expect(participant.getState().connectionStatus).toBe('authenticated');
+
+      // Creator sends an annotation — participant should see it
+      const ann = {
+        id: 'int-ann-1',
+        blockId: 'b1',
+        startOffset: 0,
+        endOffset: 5,
+        type: 'COMMENT' as const,
+        originalText: 'hello',
+        createdA: Date.now(),
+        text: 'from creator',
+      };
+      await creator.sendAnnotationAdd([ann]);
+      await new Promise(r => setTimeout(r, 500));
+      expect(participant.getState().annotations.map(a => a.id)).toContain('int-ann-1');
+
+      // Admin (creator) joins via adminUrl to exercise admin capability
+      adminClient = await joinRoom({ url: adminUrl, user: USER_A, autoConnect: true });
+      expect(adminClient.getState().hasAdminCapability).toBe(true);
+
+      // Admin deletes the room
+      await adminClient.deleteRoom();
+      await new Promise(r => setTimeout(r, 500));
+      expect(adminClient.getState().roomUnavailable).toBe(true);
+    } finally {
+      safeDisconnect(creator);
+      safeDisconnect(participant);
+      safeDisconnect(adminClient);
+    }
+  }, 30_000);
+
+  test('manual reconnect replays events missed while a participant was offline', async () => {
+    // NOTE: this exercises the MANUAL reconnect path — participant calls
+    // disconnect() and then connect() again. The automatic network-drop
+    // reconnect path (auto-reconnect timer with preserved seq) is covered by
+    // the unit-test socket lifecycle suite; a live test of that path would
+    // require simulating a server-side socket close, which wrangler dev does
+    // not cleanly expose.
+    let creator: CollabRoomClient | null = null;
+    let participant: CollabRoomClient | null = null;
+    // Admin URL captured for server-side cleanup in finally. If SMOKE_BASE_URL
+    // ever points at a shared/staging room-service, leaving rooms around until
+    // expiry is noisy; deleting explicitly keeps the target clean.
+    let adminUrl: string | null = null;
+
+    try {
+      const snapshot: RoomSnapshot = {
+        versionId: 'v1',
+        planMarkdown: '# Reconnect replay test',
+        annotations: [],
+      };
+
+      const created = await createRoom({
+        baseUrl: BASE_URL!,
+        initialSnapshot: snapshot,
+        user: USER_A,
+      });
+      creator = created.client;
+      adminUrl = created.adminUrl;
+      await creator.connect();
+      expect(creator.getState().connectionStatus).toBe('authenticated');
+
+      participant = await joinRoom({
+        url: created.joinUrl,
+        user: USER_B,
+        autoConnect: true,
+      });
+      expect(participant.getState().connectionStatus).toBe('authenticated');
+
+      // Both clients see an initial annotation round-trip (baseline sanity).
+      const firstAnn = {
+        id: 'replay-ann-1',
+        blockId: 'b1',
+        startOffset: 0,
+        endOffset: 5,
+        type: 'COMMENT' as const,
+        originalText: 'hello',
+        createdA: Date.now(),
+        text: 'before drop',
+      };
+      await creator.sendAnnotationAdd([firstAnn]);
+      await waitFor(() =>
+        participant!.getState().annotations.some(a => a.id === firstAnn.id),
+        3000,
+      );
+      const seqAtDisconnect = participant.getState().seq;
+      expect(seqAtDisconnect).toBeGreaterThan(0);
+
+      // Participant disconnects. While offline, the creator makes two more ops.
+      participant.disconnect();
+      expect(participant.getState().connectionStatus).toBe('closed');
+
+      const missedAnn1 = {
+        id: 'replay-ann-missed-1',
+        blockId: 'b1',
+        startOffset: 10,
+        endOffset: 15,
+        type: 'COMMENT' as const,
+        originalText: 'missed-1',
+        createdA: Date.now(),
+        text: 'sent while offline',
+      };
+      const missedAnn2 = {
+        id: 'replay-ann-missed-2',
+        blockId: 'b1',
+        startOffset: 20,
+        endOffset: 25,
+        type: 'COMMENT' as const,
+        originalText: 'missed-2',
+        createdA: Date.now(),
+        text: 'also sent while offline',
+      };
+      await creator.sendAnnotationAdd([missedAnn1]);
+      await creator.sendAnnotationAdd([missedAnn2]);
+      await waitFor(() => {
+        const ids = creator!.getState().annotations.map(a => a.id);
+        return ids.includes(missedAnn1.id) && ids.includes(missedAnn2.id);
+      }, 3000);
+
+      // Participant reconnects. The client sends its preserved seq as lastSeq
+      // and the server replays the missed events.
+      await participant.connect();
+      expect(participant.getState().connectionStatus).toBe('authenticated');
+
+      await waitFor(() => {
+        const ids = participant!.getState().annotations.map(a => a.id);
+        return ids.includes(missedAnn1.id) && ids.includes(missedAnn2.id);
+      }, 5000);
+
+      // Participant's seq must have advanced past seqAtDisconnect.
+      expect(participant.getState().seq).toBeGreaterThan(seqAtDisconnect);
+
+      // And the baseline annotation is still there.
+      expect(participant.getState().annotations.map(a => a.id)).toContain(firstAnn.id);
+    } finally {
+      // Server-side cleanup: delete the room so shared/staging SMOKE_BASE_URL
+      // targets don't accumulate smoke rooms until expiry. Disconnect the
+      // participant first — delete will close remaining sockets, but a clean
+      // pre-disconnect avoids noisy AdminInterruptedError on the participant.
+      safeDisconnect(participant);
+      if (adminUrl) {
+        let adminClient: CollabRoomClient | null = null;
+        try {
+          adminClient = await joinRoom({ url: adminUrl, user: USER_A, autoConnect: true });
+          await adminClient.deleteRoom();
+        } catch { /* ignore cleanup errors */ }
+        finally { safeDisconnect(adminClient); }
+      }
+      safeDisconnect(creator);
+    }
+  }, 30_000);
+});
+
+async function waitFor(cond: () => boolean, timeoutMs = 3000): Promise<void> {
+  const start = Date.now();
+  while (!cond()) {
+    if (Date.now() - start > timeoutMs) {
+      throw new Error(`waitFor timed out after ${timeoutMs}ms`);
+    }
+    await new Promise(r => setTimeout(r, 25));
+  }
+}
diff --git a/packages/shared/collab/client-runtime/join-room.test.ts b/packages/shared/collab/client-runtime/join-room.test.ts
new file mode 100644
index 000000000..76518eeaa
--- /dev/null
+++ b/packages/shared/collab/client-runtime/join-room.test.ts
@@ -0,0 +1,65 @@
+/**
+ * Unit tests for joinRoom — focus on admin secret override length validation (P3).
+ */
+
+import { describe, expect, test } from 'bun:test';
+import { joinRoom, InvalidAdminSecretError, InvalidRoomUrlError } from './join-room';
+import { buildRoomJoinUrl } from '../url';
+import { generateRoomSecret } from '../ids';
+import { bytesToBase64url } from '../encoding';
+import type { CollabRoomUser } from './types';
+
+const USER: CollabRoomUser = { id: 'u1', name: 'alice', color: '#f00' };
+
+describe('joinRoom — admin secret override validation (P3)', () => {
+  test('rejects Uint8Array admin override with wrong length', async () => {
+    const roomSecret = generateRoomSecret();
+    const url = buildRoomJoinUrl('roomA', roomSecret);
+    const badAdmin = new Uint8Array(16);  // 16 bytes, not 32
+
+    await expect(joinRoom({ url, adminSecret: badAdmin, user: USER }))
+      .rejects.toThrow(InvalidAdminSecretError);
+  });
+
+  test('rejects string admin override that decodes to wrong length', async () => {
+    const roomSecret = generateRoomSecret();
+    const url = buildRoomJoinUrl('roomA', roomSecret);
+    const badAdminStr = bytesToBase64url(new Uint8Array(16));
+
+    await expect(joinRoom({ url, adminSecret: badAdminStr, user: USER }))
+      .rejects.toThrow(InvalidAdminSecretError);
+  });
+
+  test('rejects malformed base64url admin override', async () => {
+    const roomSecret = generateRoomSecret();
+    const url = buildRoomJoinUrl('roomA', roomSecret);
+
+    await expect(joinRoom({ url, adminSecret: 'not-valid-base64url!', user: USER }))
+      .rejects.toThrow(InvalidAdminSecretError);
+  });
+
+  test('accepts valid 32-byte Uint8Array admin override', async () => {
+    const roomSecret = generateRoomSecret();
+    const url = buildRoomJoinUrl('roomA', roomSecret);
+    const validAdmin = new Uint8Array(32);
+    validAdmin[0] = 1;  // non-zero
+
+    const client = await joinRoom({ url, adminSecret: validAdmin, user: USER });
+    expect(client.getState().hasAdminCapability).toBe(true);
+  });
+
+  test('accepts valid 32-byte string admin override', async () => {
+    const roomSecret = generateRoomSecret();
+    const url = buildRoomJoinUrl('roomA', roomSecret);
+    const validAdminStr = bytesToBase64url(new Uint8Array(32));
+
+    const client = await joinRoom({ url, adminSecret: validAdminStr, user: USER });
+    expect(client.getState().hasAdminCapability).toBe(true);
+  });
+
+  test('InvalidRoomUrlError is still thrown for malformed URL regardless of admin override', async () => {
+    const validAdmin = new Uint8Array(32);
+    await expect(joinRoom({ url: 'not-a-url', adminSecret: validAdmin, user: USER }))
+      .rejects.toThrow(InvalidRoomUrlError);
+  });
+});
diff --git a/packages/shared/collab/client-runtime/join-room.ts b/packages/shared/collab/client-runtime/join-room.ts
new file mode 100644
index 000000000..08040fc68
--- /dev/null
+++ b/packages/shared/collab/client-runtime/join-room.ts
@@ -0,0 +1,100 @@
+/**
+ * joinRoom — factory that parses a room URL, derives keys locally,
+ * and constructs a CollabRoomClient ready to connect.
+ *
+ * Client-side only. The URL fragment is client-private.
+ */
+
+import {
+  deriveRoomKeys,
+  deriveAdminKey,
+  computeRoomVerifier,
+  computeAdminVerifier,
+} from '../crypto';
+import { ADMIN_SECRET_LENGTH_BYTES } from '../constants';
+import { base64urlToBytes } from '../encoding';
+import { parseRoomUrl } from '../url';
+import { CollabRoomClient } from './client';
+import type { JoinRoomOptions } from './types';
+
+export class InvalidRoomUrlError extends Error {
+  constructor() { super('Room URL is malformed or missing required fragment'); this.name = 'InvalidRoomUrlError'; }
+}
+
+export class InvalidAdminSecretError extends Error {
+  constructor(detail: string) {
+    super(`Invalid admin secret override: ${detail}`);
+    this.name = 'InvalidAdminSecretError';
+  }
+}
+
+export async function joinRoom(options: JoinRoomOptions): Promise<CollabRoomClient> {
+  const parsed = parseRoomUrl(options.url);
+  if (!parsed) throw new InvalidRoomUrlError();
+
+  const { roomId, roomSecret } = parsed;
+  const adminSecretBytes = resolveAdminSecret(options.adminSecret, parsed.adminSecret);
+
+  const { authKey, eventKey, presenceKey } = await deriveRoomKeys(roomSecret);
+  const adminKey = adminSecretBytes ? await deriveAdminKey(adminSecretBytes) : null;
+  const roomVerifier = await computeRoomVerifier(authKey, roomId);
+  const adminVerifier = adminKey ? await computeAdminVerifier(adminKey, roomId) : null;
+
+  const baseUrl = originFromUrl(options.url);
+
+  const client = new CollabRoomClient({
+    roomId,
+    baseUrl,
+    eventKey,
+    presenceKey,
+    adminKey,
+    roomVerifier,
+    adminVerifier,
+    user: options.user,
+    webSocketImpl: options.webSocketImpl,
+    reconnect: options.reconnect,
+  });
+
+  if (options.autoConnect) {
+    await client.connect();
+  }
+
+  return client;
+}
+
+function resolveAdminSecret(
+  override: Uint8Array | string | undefined,
+  fromUrl: Uint8Array | undefined,
+): Uint8Array | null {
+  // URL-derived admin secrets are length-validated inside parseRoomUrl().
+  // Overrides bypass that path, so validate explicitly here.
+  if (override instanceof Uint8Array) {
+    if (override.length !== ADMIN_SECRET_LENGTH_BYTES) {
+      throw new InvalidAdminSecretError(
+        `expected ${ADMIN_SECRET_LENGTH_BYTES} bytes, got ${override.length}`,
+      );
+    }
+    return override;
+  }
+  if (typeof override === 'string') {
+    let bytes: Uint8Array;
+    try {
+      bytes = base64urlToBytes(override);
+    } catch (err) {
+      throw new InvalidAdminSecretError(`base64url decode failed: ${String(err)}`);
+    }
+    if (bytes.length !== ADMIN_SECRET_LENGTH_BYTES) {
+      throw new InvalidAdminSecretError(
+        `expected ${ADMIN_SECRET_LENGTH_BYTES} bytes, got ${bytes.length}`,
+      );
+    }
+    return bytes;
+  }
+  if (fromUrl) return fromUrl;
+  return null;
+}
+
+function originFromUrl(url: string): string {
+  const parsed = new URL(url);
+  return parsed.origin;
+}
diff --git a/packages/shared/collab/client-runtime/mock-websocket.ts b/packages/shared/collab/client-runtime/mock-websocket.ts
new file mode 100644
index 000000000..e9c17dfcd
--- /dev/null
+++ b/packages/shared/collab/client-runtime/mock-websocket.ts
@@ -0,0 +1,156 @@
+/**
+ * In-memory WebSocket mock for unit testing the CollabRoomClient.
+ *
+ * Implements enough of the WebSocket interface to satisfy the client runtime.
+ * Exposes a `peer` handle for test code to script server-side behavior:
+ *   - peer.sendFromServer(msg) — simulate a server message
+ *   - peer.expectFromClient() — await next message the client sends
+ *   - peer.simulateClose(code, reason) — simulate server-initiated close
+ *   - peer.simulateError() — trigger onerror
+ */
+
+export interface MockWebSocketPeer {
+  /** Send a message from "the server" to the client. */
+  sendFromServer(message: string): void;
+  /** Await the next message the client sends. Rejects after `timeoutMs`. */
+  expectFromClient(timeoutMs?: number): Promise<string>;
+  /** Close the socket from the server side. */
+  simulateClose(code?: number, reason?: string): void;
+  /** Trigger the onerror handler. */
+  simulateError(): void;
+  /** All messages the client has sent, in order. */
+  readonly sent: string[];
+  /** Whether the client has called close(). */
+  readonly closedByClient: boolean;
+}
+
+interface PendingExpect {
+  resolve: (msg: string) => void;
+  reject: (err: Error) => void;
+  timeoutHandle: ReturnType<typeof setTimeout>;
+}
+
+const OPEN = 1;
+const CLOSING = 2;
+const CLOSED = 3;
+
+export class MockWebSocket implements EventTarget {
+  static CONNECTING = 0;
+  static OPEN = 1;
+  static CLOSING = 2;
+  static CLOSED = 3;
+
+  readonly CONNECTING = 0;
+  readonly OPEN = 1;
+  readonly CLOSING = 2;
+  readonly CLOSED = 3;
+
+  url: string;
+  readyState: number = 0;
+  binaryType: BinaryType = 'blob';
+  bufferedAmount = 0;
+  extensions = '';
+  protocol = '';
+
+  onopen: ((ev: Event) => void) | null = null;
+  onclose: ((ev: CloseEvent) => void) | null = null;
+  onmessage: ((ev: MessageEvent) => void) | null = null;
+  onerror: ((ev: Event) => void) | null = null;
+
+  public readonly peer: MockWebSocketPeer;
+  private readonly sentMessages: string[] = [];
+  private readonly expectQueue: PendingExpect[] = [];
+  private readonly bufferedSent: string[] = [];
+  private isClosedByClient = false;
+
+  constructor(url: string | URL, _protocols?: string | string[]) {
+    this.url = typeof url === 'string' ? url : url.toString();
+
+    const self = this;
+    this.peer = {
+      sendFromServer(message: string) {
+        if (self.readyState !== OPEN) return;
+        self.onmessage?.(new MessageEvent('message', { data: message }));
+      },
+      expectFromClient(timeoutMs = 2000): Promise<string> {
+        if (self.bufferedSent.length > 0) {
+          const msg = self.bufferedSent.shift()!;
+          return Promise.resolve(msg);
+        }
+        return new Promise((resolve, reject) => {
+          const timeoutHandle = setTimeout(() => {
+            const idx = self.expectQueue.findIndex(p => p.resolve === resolve);
+            if (idx >= 0) self.expectQueue.splice(idx, 1);
+            reject(new Error(`expectFromClient timed out after ${timeoutMs}ms`));
+          }, timeoutMs);
+          self.expectQueue.push({ resolve, reject, timeoutHandle });
+        });
+      },
+      simulateClose(code = 1000, reason = '') {
+        if (self.readyState === CLOSED) return;
+        self.readyState = CLOSED;
+        self.onclose?.(new CloseEvent('close', { code, reason, wasClean: true }));
+      },
+      simulateError() {
+        self.onerror?.(new Event('error'));
+      },
+      get sent() { return self.sentMessages; },
+      get closedByClient() { return self.isClosedByClient; },
+    };
+
+    // Open asynchronously (like a real WebSocket)
+    queueMicrotask(() => {
+      if (this.readyState === 0) {
+        this.readyState = OPEN;
+        this.onopen?.(new Event('open'));
+      }
+    });
+  }
+
+  send(data: string | ArrayBufferLike | Blob | ArrayBufferView): void {
+    if (this.readyState !== OPEN) {
+      throw new Error(`MockWebSocket.send called in state ${this.readyState}`);
+    }
+    const msg = typeof data === 'string' ? data : String(data);
+    this.sentMessages.push(msg);
+
+    // Satisfy a pending expectFromClient if any
+    const pending = this.expectQueue.shift();
+    if (pending) {
+      clearTimeout(pending.timeoutHandle);
+      pending.resolve(msg);
+    } else {
+      this.bufferedSent.push(msg);
+    }
+  }
+
+  /**
+   * When true, close() defers the onclose handler to a microtask instead of
+   * firing it synchronously. This mirrors real browser behavior, where
+   * ws.close() returns immediately and onclose fires asynchronously. Set via
+   * `MockWebSocket.asyncCloseMode` to exercise code paths that assume async
+   * close semantics.
+   */
+  static asyncCloseMode = false;
+
+  close(code?: number, reason?: string): void {
+    if (this.readyState === CLOSED) return;
+    this.isClosedByClient = true;
+    this.readyState = CLOSED;
+    const closeEvent = new CloseEvent('close', {
+      code: code ?? 1000,
+      reason: reason ?? '',
+      wasClean: true,
+    });
+    if (MockWebSocket.asyncCloseMode) {
+      queueMicrotask(() => this.onclose?.(closeEvent));
+    } else {
+      this.onclose?.(closeEvent);
+    }
+  }
+
+  // EventTarget stubs (not used by client, but required by type)
+  addEventListener(): void {}
+  removeEventListener(): void {}
+  dispatchEvent(_ev: Event): boolean { return true; }
+}
diff --git a/packages/shared/collab/client-runtime/types.ts b/packages/shared/collab/client-runtime/types.ts
new file mode 100644
index 000000000..f79143057
--- /dev/null
+++ b/packages/shared/collab/client-runtime/types.ts
@@ -0,0 +1,219 @@
+/**
+ * Types for the collab room client runtime.
+ *
+ * Client-side state shape, options, and event map. Distinct from wire protocol
+ * types (which live in ../types.ts).
+ */
+
+import type {
+  PresenceState,
+  RoomAnnotation,
+  RoomServerEvent,
+  RoomSnapshot,
+} from '../types';
+
+// Forward type-only import to break the cycle between types.ts and client.ts.
+// `import type` is erased at compile time — no runtime dependency created.
+import type { CollabRoomClient } from './client';
+
+// ---------------------------------------------------------------------------
+// Connection status
+// ---------------------------------------------------------------------------
+
+export type ConnectionStatus =
+  | 'disconnected'
+  | 'connecting'
+  | 'authenticating'
+  | 'authenticated'
+  | 'reconnecting'
+  | 'closed';
+
+// ---------------------------------------------------------------------------
+// User identity carried in encrypted presence
+// ---------------------------------------------------------------------------
+
+export interface CollabRoomUser {
+  /** Stable across reconnects — lives inside encrypted PresenceState.user.id. */
+  id: string;
+  name: string;
+  color: string;
+}
+
+// ---------------------------------------------------------------------------
+// Client state snapshot
+// ---------------------------------------------------------------------------
+
+export interface CollabRoomState {
+  connectionStatus: ConnectionStatus;
+  /**
+   * True after the server closed the socket with the "room unavailable"
+   * terminal code. Set by the admin-initiated delete, the 30-day alarm
+   * auto-purge, or any connect attempt against a room that no longer
+   * exists. Indistinguishable to the client — all three surface the
+   * same generic "link doesn't resolve" UX.
+   */
+  roomUnavailable: boolean;
+  roomId: string;
+  /** Random per WebSocket connection — not a stable participant identifier. */
+  clientId: string;
+  /**
+   * Last server seq consumed by this client. Valid events advance seq after
+   * applying state. Malformed or undecryptable events also advance seq without
+   * mutating annotation state so reconnect replay does not loop on a bad event.
+   * Used as `lastSeq` on reconnect.
+   */
+  seq: number;
+  planMarkdown: string;
+  /** Ordered view of internal annotations Map. */
+  annotations: RoomAnnotation[];
+  /** Keyed by sender clientId. Stale entries are pruned by lastSeen TTL. */
+  remotePresence: Record<string, PresenceState>;
+  /**
+   * True when this client holds the admin secret. The normal participant
+   * share URL is `#key=...` only; the `#key=...&admin=...` URL is the
+   * sensitive creator/recovery URL and is not intentionally shared with
+   * participants. Admin commands resolve by observing the socket-close
+   * signal that the delete-triggered purge produces; a future multi-admin
+   * surface would need commandId-correlated acks instead.
+   */
+  hasAdminCapability: boolean;
+  /**
+   * Most recent client or server error. `scope` classifies the source so
+   * consumers can react only to the classes they care about:
+   *
+   *   'mutation' — server-sent rejection of a mutation (room.error on an
+   *                annotation op this client sent). The annotation
+   *                controller uses this to transition in-flight pending
+   *                ops to failed. This is the ONLY scope that does so.
+   *   'admin'    — admin-command rejection. Consumed by
+   *                CollabRoomClient.pendingAdmin; never affects pending
+   *                mutations (a failed admin command must not fail a racing add).
+   *   'event'    — inbound event from another participant failed to
+   *                decode locally (malformed payload, decrypt failure,
+   *                reducer rejection). Not a rejection of OUR state.
+   *   'presence' — inbound presence frame failed to decode locally. Not
+   *                a rejection of our state.
+   *   'snapshot' — snapshot replay failed to decode or validate. Not a
+   *                rejection of our state.
+   *   'join'     — connect/join-phase failure surfaced by the hook
+   *                wrapper (mapJoinFailure).
+   *
+   * `id` is a monotonic counter bumped on every NEW error — state clones
+   * rebuild the `lastError` object each emit, so object identity is NOT
+   * a safe "same error" signal; consumers must dedupe on `lastErrorId`.
+   */
+  lastError: { code: string; message: string; scope: 'mutation' | 'admin' | 'event' | 'presence' | 'snapshot' | 'join' } | null;
+  /** Monotonic identifier for `lastError`. 0 when no error has ever occurred. */
+  lastErrorId: number;
+}
+
+// ---------------------------------------------------------------------------
+// Event map (subscribed via CollabRoomClient.on)
+// ---------------------------------------------------------------------------
+
+export type CollabRoomEvents = {
+  status: ConnectionStatus;
+  snapshot: RoomSnapshot;
+  event: RoomServerEvent;
+  presence: { clientId: string; presence: PresenceState };
+  error: { code: string; message: string };
+  /** Fires on any state mutation — React hooks subscribe here. */
+  state: CollabRoomState;
+};
+
+// ---------------------------------------------------------------------------
+// createRoom options + result
+// ---------------------------------------------------------------------------
+
+export interface CreateRoomOptions {
+  /** e.g. https://room.plannotator.ai or http://localhost:8787 (no trailing slash). */
+  baseUrl: string;
+  initialSnapshot: RoomSnapshot;
+  expiresInDays?: number;
+  user: CollabRoomUser;
+  /** Test injection. */
+  webSocketImpl?: typeof WebSocket;
+  /** Test injection. */
+  fetchImpl?: typeof fetch;
+  /** Optional reconnect tuning for the returned client. */
+  reconnect?: ReconnectOptions;
+  /**
+   * Abort the fetch to the room service. If the signal is already aborted
+   * when createRoom() is called, it rejects immediately. If the signal
+   * aborts mid-fetch, the fetch is cancelled and createRoom rejects with
+   * a CreateRoomError.
+   */
+  signal?: AbortSignal;
+  /**
+   * Cap for the room-creation fetch in ms. If neither the signal fires nor
+   * the server responds within this window, createRoom() rejects with a
+   * CreateRoomError. Default: 10_000 ms.
+   */
+  timeoutMs?: number;
+}
+
+export interface CreateRoomResult {
+  roomId: string;
+  /** 32-byte raw secret. Callers may discard after building URLs. */
+  roomSecret: Uint8Array;
+  /** 32-byte raw admin secret. Callers should persist carefully (creator-only). */
+  adminSecret: Uint8Array;
+  /** #key-only URL. Safe to share with participants. */
+  joinUrl: string;
+  /** #key + #admin URL. Creator/recovery only — never the default share target. */
+  adminUrl: string;
+  /** Constructed but NOT connected. Caller invokes client.connect(). */
+  client: CollabRoomClient;
+}
+
+// ---------------------------------------------------------------------------
+// joinRoom options
+// ---------------------------------------------------------------------------
+
+export interface JoinRoomOptions {
+  /** Full room URL including fragment. */
+  url: string;
+  /** Override if admin capability is not in URL fragment. base64url string or raw bytes. */
+  adminSecret?: Uint8Array | string;
+  user: CollabRoomUser;
+  webSocketImpl?: typeof WebSocket;
+  reconnect?: ReconnectOptions;
+  /** If true, awaits connect() before returning. Default: false. */
+  autoConnect?: boolean;
+}
+
+export interface ReconnectOptions {
+  initialDelayMs?: number;
+  maxDelayMs?: number;
+  /** Exponential backoff multiplier per attempt. Default: 2. */
+  factor?: number;
+  /** 0 disables auto-reconnect entirely (useful in tests). Default: Infinity. */
+  maxAttempts?: number;
+}
+
+// ---------------------------------------------------------------------------
+// Internal client constructor options (used by createRoom/joinRoom)
+// ---------------------------------------------------------------------------
+
+export interface InternalClientOptions {
+  roomId: string;
+  baseUrl: string;
+  eventKey: CryptoKey;
+  presenceKey: CryptoKey;
+  adminKey: CryptoKey | null;
+  roomVerifier: string;
+  adminVerifier: string | null;
+  user: CollabRoomUser;
+  /** Seed initial state from known snapshot (used by createRoom). */
+  initialSnapshot?: RoomSnapshot;
+  webSocketImpl?: typeof WebSocket;
+  reconnect?: ReconnectOptions;
+  /** Connect timeout in milliseconds. Default: 10_000. */
+  connectTimeoutMs?: number;
+  /** Presence TTL in milliseconds. Default: 30_000. */
+  presenceTtlMs?: number;
+  /** Presence sweep interval. Default: 5_000. */
+  presenceSweepIntervalMs?: number;
+}
+
+// Note: concrete CollabRoomClient class lives in client.ts to avoid forward-reference cycles.
diff --git a/packages/shared/collab/client.ts b/packages/shared/collab/client.ts
new file mode 100644
index 000000000..419349bd5
--- /dev/null
+++ b/packages/shared/collab/client.ts
@@ -0,0 +1,16 @@
+/**
+ * Plannotator Live Rooms — client barrel export.
+ *
+ * Re-exports the server-safe barrel plus client-only URL helpers.
+ * This is the import path for browser and direct-agent clients:
+ *   import { ..., parseRoomUrl, buildRoomJoinUrl } from '@plannotator/shared/collab/client'
+ */
+
+export * from './index';
+export * from './url';
+
+// Client runtime (WebSocket + stateful client)
+export * from './client-runtime/client';
+export * from './client-runtime/create-room';
+export * from './client-runtime/join-room';
+export * from './client-runtime/types';
diff --git a/packages/shared/collab/constants.ts b/packages/shared/collab/constants.ts
new file mode 100644
index 000000000..02f0634eb
--- /dev/null
+++ b/packages/shared/collab/constants.ts
@@ -0,0 +1,62 @@
+/** Plannotator Live Rooms protocol constants. */
+
+/** Room secret is a 256-bit raw byte value. */
+export const ROOM_SECRET_LENGTH_BYTES = 32;
+
+/** Admin secret is a 256-bit raw byte value. Distinct symbol from the room
+ * secret so the intent at each call site is explicit (even though the V1
+ * protocol uses the same length for both). */
+export const ADMIN_SECRET_LENGTH_BYTES = 32;
+
+/**
+ * WebSocket close code the server uses when the room is no longer available
+ * (deleted by admin, auto-expired at the 30-day mark, or never existed in
+ * the first place). Client code treats this as a terminal close and surfaces
+ * the same "link doesn't resolve" screen for all three cases — the server
+ * does not distinguish them to the client.
+ */
+export const WS_CLOSE_ROOM_UNAVAILABLE = 4006;
+
+/**
+ * Close reason string paired with WS_CLOSE_ROOM_UNAVAILABLE for every
+ * terminal close path (admin delete, auto-expiry, unknown-room connect).
+ * The server logs the specific trigger internally; the client sees only
+ * this one reason.
+ */
+export const WS_CLOSE_REASON_ROOM_UNAVAILABLE = 'Room unavailable';
+
+/**
+ * Admin-scoped error codes — the contract between server emit sites (in
+ * `apps/room-service/core/room-do.ts` admin handlers) and client handling
+ * (in `packages/shared/collab/client-runtime/client.ts` pending-admin
+ * rejection path).
+ *
+ * The server MUST emit admin-command errors only with codes from this
+ * namespace, and the client treats receipt of any of these while an
+ * admin command is pending as a rejection of that command (vs. ignoring
+ * event-channel errors like `validation_error` /
+ * `event_persist_failed` that are not part of the admin contract).
+ *
+ * Adding a new admin error code:
+ *   1. Add a key here.
+ *   2. Emit it server-side via `sendAdminError`.
+ *   3. `ADMIN_ERROR_CODES` and the runtime Set derive from this object
+ *      automatically; the client's contract test (see
+ *      `client-runtime/client.test.ts`) iterates the tuple and asserts
+ *      every code rejects a pending admin promise, so new entries are
+ *      enforced end-to-end.
+ */
+export const AdminErrorCode = {
+  ValidationError: 'admin_validation_error',
+  ClientIdMismatch: 'client_id_mismatch',
+  NoAdminChallenge: 'no_admin_challenge',
+  UnknownAdminChallenge: 'unknown_admin_challenge',
+  AdminChallengeExpired: 'admin_challenge_expired',
+  InvalidAdminProof: 'invalid_admin_proof',
+  DeleteFailed: 'delete_failed',
+} as const;
+
+export type AdminErrorCode = typeof AdminErrorCode[keyof typeof AdminErrorCode];
+
+export const ADMIN_ERROR_CODES: readonly AdminErrorCode[] =
+  Object.values(AdminErrorCode);
diff --git a/packages/shared/collab/crypto.test.ts b/packages/shared/collab/crypto.test.ts
new file mode 100644
index 000000000..17aed3441
--- /dev/null
+++ b/packages/shared/collab/crypto.test.ts
@@ -0,0 +1,347 @@
+import { describe, expect, test } from 'bun:test';
+import {
+  deriveRoomKeys,
+  deriveAdminKey,
+  computeRoomVerifier,
+  computeAdminVerifier,
+  computeAuthProof,
+  verifyAuthProof,
+  computeAdminProof,
+  verifyAdminProof,
+  encryptPayload,
+  decryptPayload,
+  encryptEventOp,
+  decryptEventPayload,
+  encryptPresence,
+  decryptPresence,
+  encryptSnapshot,
+  decryptSnapshot,
+} from './crypto';
+import type { AdminCommand, PresenceState, RoomEventClientOp, RoomSnapshot } from './types';
+
+// Stable test secret (32 bytes)
+const TEST_SECRET = new Uint8Array(32);
+TEST_SECRET.fill(0xab);
+
+const TEST_ADMIN_SECRET = new Uint8Array(32);
+TEST_ADMIN_SECRET.fill(0xcd);
+
+const TEST_ROOM_ID = 'test-room-abc123';
+
+// ---------------------------------------------------------------------------
+// Key Derivation — tested via observable outputs
+// ---------------------------------------------------------------------------
+
+describe('deriveRoomKeys', () => {
+  test('rejects non-256-bit room secrets', async () => {
+    await expect(deriveRoomKeys(new Uint8Array(31))).rejects.toThrow('Invalid room secret');
+    await expect(deriveRoomKeys(new Uint8Array(33))).rejects.toThrow('Invalid room secret');
+  });
+
+  test('same secret produces same verifier (deterministic)', async () => {
+    const keys1 = await deriveRoomKeys(TEST_SECRET);
+    const keys2 = await deriveRoomKeys(TEST_SECRET);
+
+    const v1 = await computeRoomVerifier(keys1.authKey, TEST_ROOM_ID);
+    const v2 = await computeRoomVerifier(keys2.authKey, TEST_ROOM_ID);
+    expect(v1).toBe(v2);
+  });
+
+  test('derives from the Uint8Array view, not the entire backing buffer', async () => {
+    const backing = new Uint8Array(96);
+    backing.fill(0xee);
+    backing.set(TEST_SECRET, 32);
+    const secretView = backing.subarray(32, 64);
+
+    const keys1 = await deriveRoomKeys(TEST_SECRET);
+    const keys2 = await deriveRoomKeys(secretView);
+
+    const v1 = await computeRoomVerifier(keys1.authKey, TEST_ROOM_ID);
+    const v2 = await computeRoomVerifier(keys2.authKey, TEST_ROOM_ID);
+    expect(v1).toBe(v2);
+  });
+
+  test('different secrets produce different verifiers', async () => {
+    const secret2 = new Uint8Array(32);
+    secret2.fill(0x99);
+
+    const keys1 = await deriveRoomKeys(TEST_SECRET);
+    const keys2 = await deriveRoomKeys(secret2);
+
+    const v1 = await computeRoomVerifier(keys1.authKey, TEST_ROOM_ID);
+    const v2 = await computeRoomVerifier(keys2.authKey, TEST_ROOM_ID);
+    expect(v1).not.toBe(v2);
+  });
+
+  test('different labels produce different keys (cross-key isolation)', async () => {
+    const { eventKey, presenceKey } = await deriveRoomKeys(TEST_SECRET);
+
+    // Encrypt with event key, try to decrypt with presence key — should fail
+    const ciphertext = await encryptPayload(eventKey, 'secret message');
+    await expect(decryptPayload(presenceKey, ciphertext)).rejects.toThrow();
+  });
+});
+
+describe('deriveAdminKey', () => {
+  test('rejects non-256-bit admin secrets', async () => {
+    await expect(deriveAdminKey(new Uint8Array(31))).rejects.toThrow('Invalid admin secret');
+    await expect(deriveAdminKey(new Uint8Array(33))).rejects.toThrow('Invalid admin secret');
+  });
+
+  test('same secret produces same admin verifier', async () => {
+    const key1 = await deriveAdminKey(TEST_ADMIN_SECRET);
+    const key2 = await deriveAdminKey(TEST_ADMIN_SECRET);
+
+    const v1 = await computeAdminVerifier(key1, TEST_ROOM_ID);
+    const v2 = await computeAdminVerifier(key2, TEST_ROOM_ID);
+    expect(v1).toBe(v2);
+  });
+
+  test('derives admin key from the Uint8Array view, not the entire backing buffer', async () => {
+    const backing = new Uint8Array(96);
+    backing.fill(0xee);
+    backing.set(TEST_ADMIN_SECRET, 32);
+    const secretView = backing.subarray(32, 64);
+
+    const key1 = await deriveAdminKey(TEST_ADMIN_SECRET);
+    const key2 = await deriveAdminKey(secretView);
+
+    const v1 = await computeAdminVerifier(key1, TEST_ROOM_ID);
+    const v2 = await computeAdminVerifier(key2, TEST_ROOM_ID);
+    expect(v1).toBe(v2);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// Verifiers
+// ---------------------------------------------------------------------------
+
+describe('computeRoomVerifier', () => {
+  test('different roomIds produce different verifiers', async () => {
+    const { authKey } = await deriveRoomKeys(TEST_SECRET);
+    const v1 = await computeRoomVerifier(authKey, 'room-a');
+    const v2 = await computeRoomVerifier(authKey, 'room-b');
+    expect(v1).not.toBe(v2);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// Auth Proofs
+// ---------------------------------------------------------------------------
+
+describe('auth proof', () => {
+  test('compute and verify round-trip', async () => {
+    const { authKey } = await deriveRoomKeys(TEST_SECRET);
+    const verifier = await computeRoomVerifier(authKey, TEST_ROOM_ID);
+
+    const proof = await computeAuthProof(verifier, TEST_ROOM_ID, 'client-1', 'ch_abc', 'nonce123');
+    const valid = await verifyAuthProof(verifier, TEST_ROOM_ID, 'client-1', 'ch_abc', 'nonce123', proof);
+    expect(valid).toBe(true);
+  });
+
+  test('wrong clientId rejects', async () => {
+    const { authKey } = await deriveRoomKeys(TEST_SECRET);
+    const verifier = await computeRoomVerifier(authKey, TEST_ROOM_ID);
+
+    const proof = await computeAuthProof(verifier, TEST_ROOM_ID, 'client-1', 'ch_abc', 'nonce123');
+    const valid = await verifyAuthProof(verifier, TEST_ROOM_ID, 'client-2', 'ch_abc', 'nonce123', proof);
+    expect(valid).toBe(false);
+  });
+
+  test('wrong nonce rejects', async () => {
+    const { authKey } = await deriveRoomKeys(TEST_SECRET);
+    const verifier = await computeRoomVerifier(authKey, TEST_ROOM_ID);
+
+    const proof = await computeAuthProof(verifier, TEST_ROOM_ID, 'client-1', 'ch_abc', 'nonce123');
+    const valid = await verifyAuthProof(verifier, TEST_ROOM_ID, 'client-1', 'ch_abc', 'wrong-nonce', proof);
+    expect(valid).toBe(false);
+  });
+
+  test('wrong verifier rejects', async () => {
+    const { authKey } = await deriveRoomKeys(TEST_SECRET);
+    const verifier = await computeRoomVerifier(authKey, TEST_ROOM_ID);
+
+    const secret2 = new Uint8Array(32);
+    secret2.fill(0x11);
+    const keys2 = await deriveRoomKeys(secret2);
+    const wrongVerifier = await computeRoomVerifier(keys2.authKey, TEST_ROOM_ID);
+
+    const proof = await computeAuthProof(verifier, TEST_ROOM_ID, 'client-1', 'ch_abc', 'nonce123');
+    const valid = await verifyAuthProof(wrongVerifier, TEST_ROOM_ID, 'client-1', 'ch_abc', 'nonce123', proof);
+    expect(valid).toBe(false);
+  });
+
+  test('malformed proof rejects without throwing', async () => {
+    const { authKey } = await deriveRoomKeys(TEST_SECRET);
+    const verifier = await computeRoomVerifier(authKey, TEST_ROOM_ID);
+
+    await expect(verifyAuthProof(verifier, TEST_ROOM_ID, 'client-1', 'ch_abc', 'nonce123', 'A'))
+      .resolves.toBe(false);
+    await expect(verifyAuthProof(verifier, TEST_ROOM_ID, 'client-1', 'ch_abc', 'nonce123', '!!!!'))
+      .resolves.toBe(false);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// Admin Proofs
+// ---------------------------------------------------------------------------
+
+describe('admin proof', () => {
+  test('compute and verify round-trip', async () => {
+    const adminKey = await deriveAdminKey(TEST_ADMIN_SECRET);
+    const verifier = await computeAdminVerifier(adminKey, TEST_ROOM_ID);
+    const command: AdminCommand = { type: 'room.delete' };
+
+    const proof = await computeAdminProof(verifier, TEST_ROOM_ID, 'client-1', 'ch_xyz', 'nonce456', command);
+    const valid = await verifyAdminProof(verifier, TEST_ROOM_ID, 'client-1', 'ch_xyz', 'nonce456', command, proof);
+    expect(valid).toBe(true);
+  });
+
+  test('wrong command rejects (proof is bound to canonicalJson(command))', async () => {
+    // V1 has a single AdminCommand shape (room.delete), so this exercises
+    // the binding via an unsanctioned command type — the proof must not
+    // verify for ANY command whose canonicalJson differs from what the
+    // proof was computed over.
+    const adminKey = await deriveAdminKey(TEST_ADMIN_SECRET);
+    const verifier = await computeAdminVerifier(adminKey, TEST_ROOM_ID);
+    const deleteCommand: AdminCommand = { type: 'room.delete' };
+    const otherCommand = { type: 'room.other' } as unknown as AdminCommand;
+
+    const proof = await computeAdminProof(verifier, TEST_ROOM_ID, 'client-1', 'ch_xyz', 'nonce456', deleteCommand);
+    const valid = await verifyAdminProof(verifier, TEST_ROOM_ID, 'client-1', 'ch_xyz', 'nonce456', otherCommand, proof);
+    expect(valid).toBe(false);
+  });
+
+  test('malformed proof rejects without throwing', async () => {
+    const adminKey = await deriveAdminKey(TEST_ADMIN_SECRET);
+    const verifier = await computeAdminVerifier(adminKey, TEST_ROOM_ID);
+    const command: AdminCommand = { type: 'room.delete' };
+
+    await expect(verifyAdminProof(verifier, TEST_ROOM_ID, 'client-1', 'ch_xyz', 'nonce456', command, 'A'))
+      .resolves.toBe(false);
+    await expect(verifyAdminProof(verifier, TEST_ROOM_ID, 'client-1', 'ch_xyz', 'nonce456', command, '!!!!'))
+      .resolves.toBe(false);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// AES-256-GCM Encrypt / Decrypt
+// ---------------------------------------------------------------------------
+
+describe('encryptPayload / decryptPayload', () => {
+  test('round-trip', async () => {
+    const { eventKey } = await deriveRoomKeys(TEST_SECRET);
+    const plaintext = 'hello, encrypted world!';
+    const ciphertext = await encryptPayload(eventKey, plaintext);
+    const decrypted = await decryptPayload(eventKey, ciphertext);
+    expect(decrypted).toBe(plaintext);
+  });
+
+  test('unique ciphertext per call (fresh IV)', async () => {
+    const { eventKey } = await deriveRoomKeys(TEST_SECRET);
+    const plaintext = 'same input';
+    const ct1 = await encryptPayload(eventKey, plaintext);
+    const ct2 = await encryptPayload(eventKey, plaintext);
+    expect(ct1).not.toBe(ct2);
+  });
+
+  test('wrong key fails', async () => {
+    const keys1 = await deriveRoomKeys(TEST_SECRET);
+    const secret2 = new Uint8Array(32);
+    secret2.fill(0x77);
+    const keys2 = await deriveRoomKeys(secret2);
+
+    const ciphertext = await encryptPayload(keys1.eventKey, 'secret');
+    await expect(decryptPayload(keys2.eventKey, ciphertext)).rejects.toThrow();
+  });
+
+  test('tampered ciphertext fails', async () => {
+    const { eventKey } = await deriveRoomKeys(TEST_SECRET);
+    const ciphertext = await encryptPayload(eventKey, 'secret');
+
+    // Flip a character in the middle
+    const tampered = ciphertext.slice(0, 20) + 'X' + ciphertext.slice(21);
+    await expect(decryptPayload(eventKey, tampered)).rejects.toThrow();
+  });
+});
+
+// ---------------------------------------------------------------------------
+// Channel Wrappers
+// ---------------------------------------------------------------------------
+
+describe('encryptEventOp / decryptEventPayload', () => {
+  test('round-trip with annotation.add', async () => {
+    const { eventKey } = await deriveRoomKeys(TEST_SECRET);
+    const op: RoomEventClientOp = {
+      type: 'annotation.add',
+      annotations: [{
+        id: 'ann-1',
+        blockId: 'b1',
+        startOffset: 0,
+        endOffset: 10,
+        type: 'COMMENT',
+        originalText: 'hello',
+        createdA: Date.now(),
+        text: 'my comment',
+      }],
+    };
+
+    const ciphertext = await encryptEventOp(eventKey, op);
+    const decrypted = await decryptEventPayload(eventKey, ciphertext);
+    expect(decrypted).toEqual(op);
+  });
+});
+
+describe('encryptPresence / decryptPresence', () => {
+  test('round-trip', async () => {
+    const { presenceKey } = await deriveRoomKeys(TEST_SECRET);
+    const presence: PresenceState = {
+      user: { id: 'user-1', name: 'swift-falcon-tater', color: '#ff0000' },
+      cursor: { blockId: 'block-3', x: 100, y: 200, coordinateSpace: 'block' },
+      activeAnnotationId: 'ann-5',
+      idle: false,
+    };
+
+    const ciphertext = await encryptPresence(presenceKey, presence);
+    const decrypted = await decryptPresence(presenceKey, ciphertext);
+    expect(decrypted).toEqual(presence);
+  });
+});
+
+describe('encryptSnapshot / decryptSnapshot', () => {
+  test('round-trip with real RoomSnapshot', async () => {
+    const { eventKey } = await deriveRoomKeys(TEST_SECRET);
+    const snapshot: RoomSnapshot = {
+      versionId: 'v1',
+      planMarkdown: '# My Plan\n\nStep 1: do the thing\nStep 2: profit',
+      annotations: [
+        {
+          id: 'ann-1',
+          blockId: 'b1',
+          startOffset: 0,
+          endOffset: 5,
+          type: 'COMMENT',
+          text: 'nice plan',
+          originalText: 'My Plan',
+          createdA: 1234567890,
+          author: 'alice',
+        },
+        {
+          id: 'ann-2',
+          blockId: 'b2',
+          startOffset: 0,
+          endOffset: 13,
+          type: 'DELETION',
+          originalText: 'do the thing',
+          createdA: 1234567891,
+        },
+      ],
+    };
+
+    const ciphertext = await encryptSnapshot(eventKey, snapshot);
+    const decrypted = await decryptSnapshot(eventKey, ciphertext);
+    expect(decrypted).toEqual(snapshot);
+    expect(decrypted.versionId).toBe('v1');
+    expect(decrypted.annotations.length).toBe(2);
+  });
+});
diff --git a/packages/shared/collab/crypto.ts b/packages/shared/collab/crypto.ts
new file mode 100644
index 000000000..45e6490e4
--- /dev/null
+++ b/packages/shared/collab/crypto.ts
@@ -0,0 +1,308 @@
+/**
+ * Plannotator Live Rooms — cryptographic primitives.
+ *
+ * HKDF key derivation, HMAC verifier/proof generation, and AES-256-GCM
+ * encrypt/decrypt for event, presence, and snapshot channels.
+ *
+ * Uses only Web Crypto API (crypto.subtle) — works in browsers, Bun,
+ * and Cloudflare Workers.
+ *
+ * Protocol decisions:
+ * - HKDF uses SHA-256 with a zero-filled 32-byte salt (standard when
+ *   no application-specific salt is provided).
+ * - HMAC input concatenation uses null byte (\0) separators between
+ *   components to prevent ambiguity.
+ * - AES-GCM uses a 12-byte random IV prepended to ciphertext.
+ */
+
+import { bytesToBase64url, base64urlToBytes } from './encoding';
+import { canonicalJson } from './canonical-json';
+import { ADMIN_SECRET_LENGTH_BYTES, ROOM_SECRET_LENGTH_BYTES } from './constants';
+import type { AdminCommand, PresenceState, RoomEventClientOp, RoomSnapshot } from './types';
+
+// ---------------------------------------------------------------------------
+// Constants
+// ---------------------------------------------------------------------------
+
+const HKDF_SALT = new Uint8Array(32); // zero-filled, per protocol spec
+const IV_LENGTH = 12;
+
+const LABELS = {
+  auth: 'plannotator:v1:room-auth',
+  event: 'plannotator:v1:event',
+  presence: 'plannotator:v1:presence',
+  admin: 'plannotator:v1:room-admin',
+  roomVerifier: 'plannotator:v1:room-verifier:',
+  adminVerifier: 'plannotator:v1:admin-verifier:',
+  authProof: 'plannotator:v1:auth-proof',
+  adminProof: 'plannotator:v1:admin-proof',
+} as const;
+
+// ---------------------------------------------------------------------------
+// Internal helpers
+// ---------------------------------------------------------------------------
+
+const encoder = new TextEncoder();
+const decoder = new TextDecoder();
+
+/** Copy a Uint8Array view into an exact ArrayBuffer for Web Crypto APIs. */
+function toArrayBuffer(bytes: Uint8Array): ArrayBuffer {
+  const copy = new Uint8Array(bytes.byteLength);
+  copy.set(bytes);
+  return copy.buffer;
+}
+
+/** Import raw secret bytes as HKDF key material. */
+async function importKeyMaterial(secret: Uint8Array): Promise<CryptoKey> {
+  return crypto.subtle.importKey('raw', toArrayBuffer(secret), 'HKDF', false, ['deriveKey']);
+}
+
+/** Derive an HMAC-SHA-256 key via HKDF. */
+async function deriveHmacKey(material: CryptoKey, info: string): Promise<CryptoKey> {
+  return crypto.subtle.deriveKey(
+    { name: 'HKDF', hash: 'SHA-256', salt: HKDF_SALT, info: encoder.encode(info) },
+    material,
+    { name: 'HMAC', hash: 'SHA-256' },
+    false,
+    ['sign', 'verify'],
+  );
+}
+
+/** Derive an AES-256-GCM key via HKDF. */
+async function deriveAesKey(material: CryptoKey, info: string): Promise<CryptoKey> {
+  return crypto.subtle.deriveKey(
+    { name: 'HKDF', hash: 'SHA-256', salt: HKDF_SALT, info: encoder.encode(info) },
+    material,
+    { name: 'AES-GCM', length: 256 },
+    false,
+    ['encrypt', 'decrypt'],
+  );
+}
+
+/**
+ * Concatenate string components with null byte separators.
+ * Returns UTF-8 encoded bytes for HMAC input.
+ */
+function concatComponents(...components: string[]): Uint8Array {
+  return encoder.encode(components.join('\0'));
+}
+
+/** Import a base64url-encoded verifier as an HMAC signing key. */
+async function importVerifierAsKey(verifierB64: string): Promise<CryptoKey> {
+  const bytes = base64urlToBytes(verifierB64);
+  return crypto.subtle.importKey(
+    'raw',
+    toArrayBuffer(bytes),
+    { name: 'HMAC', hash: 'SHA-256' },
+    false,
+    ['sign', 'verify'],
+  );
+}
+
+/** HMAC-SHA-256 sign and return base64url. */
+async function hmacSign(key: CryptoKey, data: Uint8Array): Promise<string> {
+  const sig = await crypto.subtle.sign('HMAC', key, toArrayBuffer(data));
+  return bytesToBase64url(new Uint8Array(sig));
+}
+
+/** HMAC-SHA-256 verify. */
+async function hmacVerify(key: CryptoKey, data: Uint8Array, signature: string): Promise<boolean> {
+  const sigBytes = base64urlToBytes(signature);
+  return crypto.subtle.verify('HMAC', key, toArrayBuffer(sigBytes), toArrayBuffer(data));
+}
+
+// ---------------------------------------------------------------------------
+// Key Derivation
+// ---------------------------------------------------------------------------
+
+/** Derive all room keys from a room secret. */
+export async function deriveRoomKeys(roomSecret: Uint8Array): Promise<{
+  authKey: CryptoKey;
+  eventKey: CryptoKey;
+  presenceKey: CryptoKey;
+}> {
+  if (roomSecret.length !== ROOM_SECRET_LENGTH_BYTES) {
+    throw new Error(`Invalid room secret: expected ${ROOM_SECRET_LENGTH_BYTES} bytes`);
+  }
+  const material = await importKeyMaterial(roomSecret);
+  const [authKey, eventKey, presenceKey] = await Promise.all([
+    deriveHmacKey(material, LABELS.auth),
+    deriveAesKey(material, LABELS.event),
+    deriveAesKey(material, LABELS.presence),
+  ]);
+  return { authKey, eventKey, presenceKey };
+}
+
+/** Derive the admin HMAC key from an admin secret. */
+export async function deriveAdminKey(adminSecret: Uint8Array): Promise<CryptoKey> {
+  if (adminSecret.length !== ADMIN_SECRET_LENGTH_BYTES) {
+    throw new Error(`Invalid admin secret: expected ${ADMIN_SECRET_LENGTH_BYTES} bytes`);
+  }
+  const material = await importKeyMaterial(adminSecret);
+  return deriveHmacKey(material, LABELS.admin);
+}
+
+// ---------------------------------------------------------------------------
+// Verifiers
+// ---------------------------------------------------------------------------
+
+/** Compute roomVerifier = HMAC(authKey, "plannotator:v1:room-verifier:" \0 roomId) */
+export async function computeRoomVerifier(authKey: CryptoKey, roomId: string): Promise<string> {
+  return hmacSign(authKey, concatComponents(LABELS.roomVerifier, roomId));
+}
+
+/** Compute adminVerifier = HMAC(adminKey, "plannotator:v1:admin-verifier:" \0 roomId) */
+export async function computeAdminVerifier(adminKey: CryptoKey, roomId: string): Promise<string> {
+  return hmacSign(adminKey, concatComponents(LABELS.adminVerifier, roomId));
+}
+
+// ---------------------------------------------------------------------------
+// Auth Proofs
+// ---------------------------------------------------------------------------
+
+/** Compute auth proof for WebSocket connection. */
+export async function computeAuthProof(
+  roomVerifier: string,
+  roomId: string,
+  clientId: string,
+  challengeId: string,
+  nonce: string,
+): Promise<string> {
+  const key = await importVerifierAsKey(roomVerifier);
+  return hmacSign(key, concatComponents(LABELS.authProof, roomId, clientId, challengeId, nonce));
+}
+
+/** Verify an auth proof against the stored room verifier. */
+export async function verifyAuthProof(
+  roomVerifier: string,
+  roomId: string,
+  clientId: string,
+  challengeId: string,
+  nonce: string,
+  proof: string,
+): Promise<boolean> {
+  try {
+    const key = await importVerifierAsKey(roomVerifier);
+    return await hmacVerify(key, concatComponents(LABELS.authProof, roomId, clientId, challengeId, nonce), proof);
+  } catch {
+    return false;
+  }
+}
+
+// ---------------------------------------------------------------------------
+// Admin Proofs
+// ---------------------------------------------------------------------------
+
+/** Compute admin proof for an admin command. */
+export async function computeAdminProof(
+  adminVerifier: string,
+  roomId: string,
+  clientId: string,
+  challengeId: string,
+  nonce: string,
+  command: AdminCommand,
+): Promise<string> {
+  const key = await importVerifierAsKey(adminVerifier);
+  const data = concatComponents(
+    LABELS.adminProof, roomId, clientId, challengeId, nonce, canonicalJson(command),
+  );
+  return hmacSign(key, data);
+}
+
+/** Verify an admin command proof. */
+export async function verifyAdminProof(
+  adminVerifier: string,
+  roomId: string,
+  clientId: string,
+  challengeId: string,
+  nonce: string,
+  command: AdminCommand,
+  proof: string,
+): Promise<boolean> {
+  try {
+    const key = await importVerifierAsKey(adminVerifier);
+    const data = concatComponents(
+      LABELS.adminProof, roomId, clientId, challengeId, nonce, canonicalJson(command),
+    );
+    return await hmacVerify(key, data, proof);
+  } catch {
+    return false;
+  }
+}
+
+// ---------------------------------------------------------------------------
+// AES-256-GCM Encrypt / Decrypt
+// ---------------------------------------------------------------------------
+
+/** Encrypt plaintext with AES-256-GCM. Returns base64url(IV || ciphertext+tag). */
+export async function encryptPayload(key: CryptoKey, plaintext: string): Promise<string> {
+  const iv = crypto.getRandomValues(new Uint8Array(IV_LENGTH));
+  const encrypted = await crypto.subtle.encrypt(
+    { name: 'AES-GCM', iv },
+    key,
+    encoder.encode(plaintext),
+  );
+  const combined = new Uint8Array(iv.length + encrypted.byteLength);
+  combined.set(iv, 0);
+  combined.set(new Uint8Array(encrypted), iv.length);
+  return bytesToBase64url(combined);
+}
+
+/** Decrypt base64url(IV || ciphertext+tag) with AES-256-GCM. Returns plaintext string. */
+export async function decryptPayload(key: CryptoKey, ciphertext: string): Promise<string> {
+  const combined = base64urlToBytes(ciphertext);
+  const iv = combined.slice(0, IV_LENGTH);
+  const encrypted = combined.slice(IV_LENGTH);
+  const decrypted = await crypto.subtle.decrypt(
+    { name: 'AES-GCM', iv },
+    key,
+    encrypted,
+  );
+  return decoder.decode(decrypted);
+}
+
+// ---------------------------------------------------------------------------
+// Channel convenience wrappers
+// ---------------------------------------------------------------------------
+
+/** Encrypt a RoomEventClientOp for the event channel.
+ *  Presence is intentionally NOT accepted here — the presence channel ships
+ *  a raw PresenceState via encryptPresence(). */
+export async function encryptEventOp(eventKey: CryptoKey, op: RoomEventClientOp): Promise<string> {
+  return encryptPayload(eventKey, JSON.stringify(op));
+}
+
+/** Decrypt an event channel ciphertext. */
+export async function decryptEventPayload(eventKey: CryptoKey, ciphertext: string): Promise<unknown> {
+  const plaintext = await decryptPayload(eventKey, ciphertext);
+  return JSON.parse(plaintext);
+}
+
+/** Encrypt a PresenceState for the presence channel. */
+export async function encryptPresence(presenceKey: CryptoKey, presence: PresenceState): Promise<string> {
+  return encryptPayload(presenceKey, JSON.stringify(presence));
+}
+
+/**
+ * Decrypt a presence channel ciphertext. Returns `unknown` — encryption only
+ * proves the sender had the presence key. Callers MUST validate the shape
+ * (via isPresenceState) before entering state.
+ */
+export async function decryptPresence(presenceKey: CryptoKey, ciphertext: string): Promise<unknown> {
+  const plaintext = await decryptPayload(presenceKey, ciphertext);
+  return JSON.parse(plaintext);
+}
+
+/** Encrypt a RoomSnapshot with the event key. */
+export async function encryptSnapshot(eventKey: CryptoKey, snapshot: RoomSnapshot): Promise<string> {
+  return encryptPayload(eventKey, JSON.stringify(snapshot));
+}
+
+/**
+ * Decrypt a snapshot ciphertext. Returns `unknown` — same reasoning as
+ * decryptPresence. Callers MUST validate via isRoomSnapshot before use.
+ */
+export async function decryptSnapshot(eventKey: CryptoKey, ciphertext: string): Promise<unknown> {
+  const plaintext = await decryptPayload(eventKey, ciphertext);
+  return JSON.parse(plaintext);
+}
diff --git a/packages/shared/collab/encoding.test.ts b/packages/shared/collab/encoding.test.ts
new file mode 100644
index 000000000..7848c31ec
--- /dev/null
+++ b/packages/shared/collab/encoding.test.ts
@@ -0,0 +1,77 @@
+import { describe, expect, test } from 'bun:test';
+import { bytesToBase64url, base64urlToBytes } from './encoding';
+
+describe('bytesToBase64url', () => {
+  test('encodes empty input', () => {
+    expect(bytesToBase64url(new Uint8Array(0))).toBe('');
+  });
+
+  test('encodes single byte', () => {
+    const result = bytesToBase64url(new Uint8Array([0xff]));
+    expect(result).not.toContain('+');
+    expect(result).not.toContain('/');
+    expect(result).not.toContain('=');
+  });
+
+  test('encodes all 256 byte values', () => {
+    const bytes = new Uint8Array(256);
+    for (let i = 0; i < 256; i++) bytes[i] = i;
+    const encoded = bytesToBase64url(bytes);
+    expect(encoded).not.toContain('+');
+    expect(encoded).not.toContain('/');
+    expect(encoded).not.toContain('=');
+  });
+
+  test('handles large payloads (> 65K)', () => {
+    const bytes = new Uint8Array(70_000);
+    crypto.getRandomValues(bytes);
+    const encoded = bytesToBase64url(bytes);
+    expect(encoded.length).toBeGreaterThan(0);
+    // Round-trip
+    const decoded = base64urlToBytes(encoded);
+    expect(decoded).toEqual(bytes);
+  });
+});
+
+describe('base64urlToBytes', () => {
+  test('decodes empty input', () => {
+    expect(base64urlToBytes('')).toEqual(new Uint8Array(0));
+  });
+
+  test('round-trips through encode/decode', () => {
+    const original = new Uint8Array([1, 2, 3, 4, 5, 6, 7, 8]);
+    const encoded = bytesToBase64url(original);
+    const decoded = base64urlToBytes(encoded);
+    expect(decoded).toEqual(original);
+  });
+
+  test('decodes valid unpadded input (length 2 mod 4 = 1 source byte)', () => {
+    // 1 byte -> 2 base64 chars (length % 4 === 2)
+    const original = new Uint8Array([42]);
+    const encoded = bytesToBase64url(original);
+    expect(encoded.length % 4).toBe(2);
+    expect(base64urlToBytes(encoded)).toEqual(original);
+  });
+
+  test('decodes valid unpadded input (length 3 mod 4 = 2 source bytes)', () => {
+    // 2 bytes -> 3 base64 chars (length % 4 === 3)
+    const original = new Uint8Array([42, 99]);
+    const encoded = bytesToBase64url(original);
+    expect(encoded.length % 4).toBe(3);
+    expect(base64urlToBytes(encoded)).toEqual(original);
+  });
+
+  test('rejects length 1 mod 4 as malformed', () => {
+    expect(() => base64urlToBytes('A')).toThrow('Invalid base64url');
+    expect(() => base64urlToBytes('AAAAA')).toThrow('Invalid base64url');
+  });
+
+  test('handles URL-safe characters (- and _)', () => {
+    // Encode bytes that produce + and / in standard base64
+    const original = new Uint8Array([251, 255, 191]);
+    const encoded = bytesToBase64url(original);
+    expect(encoded).toContain('-');
+    const decoded = base64urlToBytes(encoded);
+    expect(decoded).toEqual(original);
+  });
+});
diff --git a/packages/shared/collab/encoding.ts b/packages/shared/collab/encoding.ts
new file mode 100644
index 000000000..2622634eb
--- /dev/null
+++ b/packages/shared/collab/encoding.ts
@@ -0,0 +1,37 @@
+/**
+ * Base64url encode/decode helpers.
+ *
+ * Exported for use by collab crypto, IDs, and URL modules.
+ * Uses only btoa/atob — portable across browsers, Bun, and Cloudflare Workers.
+ */
+
+/** Encode a Uint8Array to a URL-safe base64 string (no padding). */
+export function bytesToBase64url(bytes: Uint8Array): string {
+  // Loop to avoid RangeError on large payloads (>65K args to String.fromCharCode)
+  let binary = '';
+  for (let i = 0; i < bytes.length; i++) {
+    binary += String.fromCharCode(bytes[i]);
+  }
+  return btoa(binary)
+    .replace(/\+/g, '-')
+    .replace(/\//g, '_')
+    .replace(/=/g, '');
+}
+
+/**
+ * Decode a URL-safe base64 string to a Uint8Array.
+ *
+ * Normalizes padding before atob for cross-runtime safety.
+ * Rejects strings whose length is 1 mod 4 (no valid byte count produces that length).
+ */
+export function base64urlToBytes(b64: string): Uint8Array {
+  if (b64.length % 4 === 1) {
+    throw new Error('Invalid base64url: length mod 4 cannot be 1');
+  }
+  // Restore standard base64 characters
+  const base64 = b64.replace(/-/g, '+').replace(/_/g, '/');
+  // Normalize padding
+  const padded = base64 + '==='.slice(0, (4 - base64.length % 4) % 4);
+  const binary = atob(padded);
+  return Uint8Array.from(binary, c => c.charCodeAt(0));
+}
diff --git a/packages/shared/collab/ids.test.ts b/packages/shared/collab/ids.test.ts
new file mode 100644
index 000000000..982e7f6f9
--- /dev/null
+++ b/packages/shared/collab/ids.test.ts
@@ -0,0 +1,73 @@
+import { describe, expect, test } from 'bun:test';
+import {
+  generateRoomId,
+  generateOpId,
+  generateClientId,
+  generateRoomSecret,
+  generateAdminSecret,
+  generateNonce,
+  generateChallengeId,
+} from './ids';
+import { base64urlToBytes } from './encoding';
+
+describe('generateRoomId', () => {
+  test('produces at least 128 bits of entropy', () => {
+    const id = generateRoomId();
+    const bytes = base64urlToBytes(id);
+    expect(bytes.length).toBeGreaterThanOrEqual(16);
+  });
+
+  test('produces unique values', () => {
+    const ids = new Set(Array.from({ length: 100 }, () => generateRoomId()));
+    expect(ids.size).toBe(100);
+  });
+});
+
+describe('generateOpId', () => {
+  test('produces unique values', () => {
+    const ids = new Set(Array.from({ length: 100 }, () => generateOpId()));
+    expect(ids.size).toBe(100);
+  });
+});
+
+describe('generateClientId', () => {
+  test('produces unique values', () => {
+    const ids = new Set(Array.from({ length: 100 }, () => generateClientId()));
+    expect(ids.size).toBe(100);
+  });
+});
+
+describe('generateRoomSecret', () => {
+  test('returns exactly 32 bytes', () => {
+    expect(generateRoomSecret().length).toBe(32);
+  });
+
+  test('returns Uint8Array', () => {
+    expect(generateRoomSecret()).toBeInstanceOf(Uint8Array);
+  });
+});
+
+describe('generateAdminSecret', () => {
+  test('returns exactly 32 bytes', () => {
+    expect(generateAdminSecret().length).toBe(32);
+  });
+});
+
+describe('generateNonce', () => {
+  test('decodes to 32 bytes', () => {
+    const nonce = generateNonce();
+    const bytes = base64urlToBytes(nonce);
+    expect(bytes.length).toBe(32);
+  });
+});
+
+describe('generateChallengeId', () => {
+  test('starts with ch_ prefix', () => {
+    expect(generateChallengeId()).toMatch(/^ch_/);
+  });
+
+  test('produces unique values', () => {
+    const ids = new Set(Array.from({ length: 100 }, () => generateChallengeId()));
+    expect(ids.size).toBe(100);
+  });
+});
diff --git a/packages/shared/collab/ids.ts b/packages/shared/collab/ids.ts
new file mode 100644
index 000000000..e1e331832
--- /dev/null
+++ b/packages/shared/collab/ids.ts
@@ -0,0 +1,47 @@
+/**
+ * High-entropy ID and secret generation for room protocol.
+ *
+ * All functions use crypto.getRandomValues() — portable across
+ * browsers, Bun, and Cloudflare Workers.
+ */
+
+import { bytesToBase64url } from './encoding';
+
+/** Generate a room ID with at least 128 bits of randomness. */
+export function generateRoomId(): string {
+  return bytesToBase64url(crypto.getRandomValues(new Uint8Array(16)));
+}
+
+/** Generate a unique operation ID. */
+export function generateOpId(): string {
+  return bytesToBase64url(crypto.getRandomValues(new Uint8Array(16)));
+}
+
+/** Generate a random client ID for a WebSocket connection. */
+export function generateClientId(): string {
+  return bytesToBase64url(crypto.getRandomValues(new Uint8Array(16)));
+}
+
+/**
+ * Generate a 256-bit room secret.
+ * Returns raw bytes (not base64url) because deriveRoomKeys() takes bytes directly.
+ * The URL helper handles encoding for the fragment.
+ */
+export function generateRoomSecret(): Uint8Array {
+  return crypto.getRandomValues(new Uint8Array(32));
+}
+
+/** Generate a 256-bit admin secret. Returns raw bytes. */
+export function generateAdminSecret(): Uint8Array {
+  return crypto.getRandomValues(new Uint8Array(32));
+}
+
+/** Generate a random nonce for challenge-response. */
+export function generateNonce(): string {
+  return bytesToBase64url(crypto.getRandomValues(new Uint8Array(32)));
+}
+
+/** Generate a challenge ID with "ch_" prefix. */
+export function generateChallengeId(): string {
+  return 'ch_' + bytesToBase64url(crypto.getRandomValues(new Uint8Array(16)));
+}
diff --git a/packages/shared/collab/index.ts b/packages/shared/collab/index.ts
new file mode 100644
index 000000000..afe3936fa
--- /dev/null
+++ b/packages/shared/collab/index.ts
@@ -0,0 +1,20 @@
+/**
+ * Plannotator Live Rooms — server-safe barrel export.
+ *
+ * This is the import path for Worker and Durable Object code:
+ *   import { ... } from '@plannotator/shared/collab'
+ *
+ * NOTE: ./url is intentionally NOT re-exported here — it is client-only.
+ * Browser and direct-agent clients should import from:
+ *   import { ... } from '@plannotator/shared/collab/client'
+ */
+
+export * from './types';
+export * from './constants';
+export * from './encoding';
+export * from './canonical-json';
+export * from './crypto';
+export * from './ids';
+export * from './strip-images';
+export * from './redact-url';
+export * from './validation';
diff --git a/packages/shared/collab/redact-url.test.ts b/packages/shared/collab/redact-url.test.ts
new file mode 100644
index 000000000..3990f8632
--- /dev/null
+++ b/packages/shared/collab/redact-url.test.ts
@@ -0,0 +1,80 @@
+import { describe, expect, test } from 'bun:test';
+import { redactRoomSecrets } from './redact-url';
+
+describe('redactRoomSecrets', () => {
+  test('returns empty string for null / undefined / empty', () => {
+    expect(redactRoomSecrets(null)).toBe('');
+    expect(redactRoomSecrets(undefined)).toBe('');
+    expect(redactRoomSecrets('')).toBe('');
+  });
+
+  test('leaves URLs without secrets untouched', () => {
+    expect(redactRoomSecrets('https://example.com/path')).toBe('https://example.com/path');
+    expect(redactRoomSecrets('https://example.com/?q=1')).toBe('https://example.com/?q=1');
+    expect(redactRoomSecrets('/relative/path#section')).toBe('/relative/path#section');
+  });
+
+  test('strips key from fragment (leading position)', () => {
+    const url = 'https://room.plannotator.ai/c/abc123#key=AAAABBBBCCCC';
+    // Fragment becomes "key=" which is all-scrubbed, so the entire fragment
+    // including the `#` is dropped.
+    expect(redactRoomSecrets(url)).toBe('https://room.plannotator.ai/c/abc123');
+  });
+
+  test('strips admin from fragment (second position)', () => {
+    const url = 'https://room.plannotator.ai/c/abc#key=AAA&admin=BBB';
+    expect(redactRoomSecrets(url)).toBe('https://room.plannotator.ai/c/abc');
+  });
+
+  test('strips key/admin from querystring preserving other params', () => {
+    const url = 'https://example.com/?foo=1&key=SECRET&bar=2&admin=SECRET';
+    expect(redactRoomSecrets(url)).toBe('https://example.com/?foo=1&key=&bar=2&admin=');
+  });
+
+  test('preserves fragment content when only part is secret', () => {
+    // Fragment contains `key=X` AND non-secret content — fragment must be kept.
+    const url = 'https://example.com/page#section-2&key=SECRET';
+    expect(redactRoomSecrets(url)).toBe('https://example.com/page#section-2&key=');
+  });
+
+  test('is case-insensitive on param name', () => {
+    const url = 'https://example.com/#KEY=abc&Admin=def';
+    expect(redactRoomSecrets(url)).toBe('https://example.com/');
+  });
+
+  test('is idempotent', () => {
+    const url = 'https://room.plannotator.ai/c/abc#key=ZZZZ&admin=YYYY';
+    const once = redactRoomSecrets(url);
+    const twice = redactRoomSecrets(once);
+    expect(twice).toBe(once);
+  });
+
+  test('does not falsely match keys that happen to contain "key" or "admin"', () => {
+    const url = 'https://example.com/?apikey=abc&sadmin=def';
+    // "apikey" and "sadmin" must NOT be scrubbed; only exact `key` / `admin`
+    // match the boundary regex.
+    expect(redactRoomSecrets(url)).toBe('https://example.com/?apikey=abc&sadmin=def');
+  });
+
+  test('handles URL where fragment has multiple scrubbed secrets plus a preserved non-secret param', () => {
+    const url = 'https://example.com/#page=3&key=AA&admin=BB';
+    expect(redactRoomSecrets(url)).toBe('https://example.com/#page=3&key=&admin=');
+  });
+
+  test('handles non-URL strings without throwing', () => {
+    expect(redactRoomSecrets('just some text')).toBe('just some text');
+    // Bare "key=..." at start-of-string is intentionally scrubbed — better to
+    // over-redact if a caller hands us an unexpected value than to leak.
+    expect(redactRoomSecrets('key=notaurl')).toBe('key=');
+  });
+
+  test('handles empty fragment and empty query gracefully', () => {
+    expect(redactRoomSecrets('https://example.com/#')).toBe('https://example.com/');
+    expect(redactRoomSecrets('https://example.com/?')).toBe('https://example.com/?');
+  });
+
+  test('non-string input (defensive) returns empty', () => {
+    expect(redactRoomSecrets(42 as unknown as string)).toBe('');
+    expect(redactRoomSecrets({} as unknown as string)).toBe('');
+  });
+});
diff --git a/packages/shared/collab/redact-url.ts b/packages/shared/collab/redact-url.ts
new file mode 100644
index 000000000..5418d3f39
--- /dev/null
+++ b/packages/shared/collab/redact-url.ts
@@ -0,0 +1,81 @@
+/**
+ * Scrub room credentials (`key` / `admin`) from any URL before it is handed to
+ * telemetry, error reporting, referrer headers, or logs.
+ *
+ * Threat model: the URL fragment `#key=<roomSecret>` is the product's access
+ * token. We intentionally keep the fragment in the visible URL bar so
+ * refresh + copy-address-bar keep working. That means any code path that
+ * captures `window.location.href` or `document.referrer` for reporting must
+ * route through this helper first. Missing one capture site would ship room
+ * secrets to third-party systems.
+ *
+ * Rules:
+ * - Remove `key` and `admin` params wherever they appear in the URL — query
+ *   and fragment, before or after any other keys. Preserve other params.
+ * - Values are replaced with the empty string rather than the key being
+ *   deleted entirely. That keeps downstream URL parsers from silently
+ *   mis-interpreting a missing key as "default roomSecret" (a mistake would
+ *   fail loudly instead of silently authing) and leaves the URL shape
+ *   identical — so logs that dedupe by URL still dedupe consistently.
+ * - If a fragment becomes empty after scrubbing, strip the leading `#` so
+ *   the URL doesn't grow a dangling separator.
+ * - Idempotent: redact(redact(x)) === redact(x).
+ * - Safe on non-URLs and non-string inputs. Never throws.
+ *
+ * We avoid the URL constructor here because:
+ *   1. Fragments containing `key=...&admin=...` are not part of URL's
+ *      searchParams API — fragments are opaque strings per WHATWG URL spec.
+ *   2. Relative URLs without a base would throw; we must tolerate them.
+ *   3. Manual regex-level substitution preserves exact non-secret formatting
+ *      (trailing slashes, encoded characters) which matters when the caller
+ *      diffs URLs for deduplication.
+ */
+
+const SECRET_PARAM_NAMES = ['key', 'admin'] as const;
+
+// Match `<name>=<value>` where value runs to the next `&` or end of string.
+// `\b` would miss `&key=...` at position 0 of a fragment; we match by explicit
+// boundary instead (start-of-string, `?`, `&`, or `#`). Capture the boundary
+// so we can put it back unchanged. Hoisted: the pattern is constant.
+const SECRET_REGEX = new RegExp(
+  `(^|[?&#])(${SECRET_PARAM_NAMES.join('|')})=[^&#]*`,
+  'gi',
+);
+
+export function redactRoomSecrets(url: string | null | undefined): string {
+  if (typeof url !== 'string' || url.length === 0) return '';
+
+  // String.prototype.replace with a global regex does NOT use lastIndex
+  // for iteration — it always starts from index 0. So the hoisted regex
+  // is safe to reuse without resetting lastIndex between calls.
+  const re = SECRET_REGEX;
+  let out = url.replace(re, (_match, boundary: string, name: string) => {
+    return `${boundary}${name}=`;
+  });
+
+  // If the fragment is now just `#` or `#&` or `#&&`, strip it. A stripped
+  // fragment is a cleaner reporting artifact; carrying empty `#` into a log
+  // can mask legitimate "same URL, different fragment" signal.
+  const hashIdx = out.indexOf('#');
+  if (hashIdx !== -1) {
+    const fragment = out.slice(hashIdx + 1);
+    // Fragment is "empty" if every param's value is blank AND no non-secret
+    // content remains. We look for any char that's not `&`, `=`, or a known
+    // scrubbed-secret-name token.
+    const onlyScrubbedSecrets = fragment
+      .split('&')
+      .every((part) => {
+        if (part === '') return true;
+        const eq = part.indexOf('=');
+        if (eq === -1) return false;  // non-kv token = real content
+        const key = part.slice(0, eq).toLowerCase();
+        const value = part.slice(eq + 1);
+        return SECRET_PARAM_NAMES.includes(key as (typeof SECRET_PARAM_NAMES)[number]) && value === '';
+      });
+    if (onlyScrubbedSecrets) {
+      out = out.slice(0, hashIdx);
+    }
+  }
+
+  return out;
+}
diff --git a/packages/shared/collab/strip-images.test.ts b/packages/shared/collab/strip-images.test.ts
new file mode 100644
index 000000000..c50698154
--- /dev/null
+++ b/packages/shared/collab/strip-images.test.ts
@@ -0,0 +1,142 @@
+import { describe, expect, test } from 'bun:test';
+import { toRoomAnnotation, stripRoomAnnotationImages } from './strip-images';
+
+describe('toRoomAnnotation', () => {
+  test('strips images field', () => {
+    const annotation = {
+      id: 'ann-1',
+      blockId: 'block-1',
+      startOffset: 0,
+      endOffset: 10,
+      type: 'COMMENT' as const,
+      text: 'a comment',
+      originalText: 'some text',
+      createdA: Date.now(),
+      images: [{ path: '/tmp/image.png', name: 'screenshot' }],
+    };
+
+    const room = toRoomAnnotation(annotation);
+    expect(room.id).toBe('ann-1');
+    expect(room.text).toBe('a comment');
+    expect(room.originalText).toBe('some text');
+    expect('images' in room).toBe(false);
+  });
+
+  test('preserves all non-image fields', () => {
+    const annotation = {
+      id: 'ann-2',
+      blockId: 'block-2',
+      startOffset: 5,
+      endOffset: 15,
+      type: 'DELETION' as const,
+      originalText: 'deleted text',
+      createdA: 1234567890,
+      author: 'swift-falcon-tater',
+      source: 'eslint',
+      isQuickLabel: true,
+      diffContext: 'added' as const,
+      images: [{ path: '/tmp/a.png', name: 'a' }],
+    };
+
+    const room = toRoomAnnotation(annotation);
+    expect(room.author).toBe('swift-falcon-tater');
+    expect(room.source).toBe('eslint');
+    expect(room.isQuickLabel).toBe(true);
+    expect(room.diffContext).toBe('added');
+  });
+
+  test('works on annotation without images', () => {
+    const annotation = {
+      id: 'ann-3',
+      blockId: 'block-3',
+      startOffset: 0,
+      endOffset: 5,
+      type: 'GLOBAL_COMMENT' as const,
+      text: 'global note',
+      originalText: '',
+      createdA: Date.now(),
+    };
+
+    const room = toRoomAnnotation(annotation);
+    expect(room.id).toBe('ann-3');
+    expect(room.text).toBe('global note');
+    expect('images' in room).toBe(false);
+  });
+
+  test('serialized output has no images key', () => {
+    const annotation = {
+      id: 'ann-4',
+      type: 'COMMENT' as const,
+      images: [{ path: '/tmp/x.png', name: 'x' }],
+    };
+    const room = toRoomAnnotation(annotation);
+    const json = JSON.stringify(room);
+    expect(json).not.toContain('images');
+  });
+});
+
+// Batch conversion (`toRoomAnnotations`) is module-private; it's
+// exercised transitively through `stripRoomAnnotationImages` below.
+
+describe('stripRoomAnnotationImages', () => {
+  test('returns clean annotations with images removed', () => {
+    const annotations = [
+      { id: '1', type: 'COMMENT' as const, images: [{ path: '/a', name: 'a' }] },
+      { id: '2', type: 'DELETION' as const },
+    ];
+    const { clean, strippedCount } = stripRoomAnnotationImages(annotations);
+    expect(clean.length).toBe(2);
+    for (const a of clean) expect('images' in a).toBe(false);
+    expect(strippedCount).toBe(1);
+  });
+
+  test('counts only annotations with non-empty images arrays', () => {
+    const annotations = [
+      { id: '1', images: [{ path: '/a', name: 'a' }] },               // counts
+      { id: '2', images: [{ path: '/b', name: 'b' }, { path: '/c', name: 'c' }] }, // counts
+      { id: '3', images: [] },                                         // does NOT count (empty)
+      { id: '4' },                                                     // does NOT count (undefined)
+    ];
+    const { strippedCount } = stripRoomAnnotationImages(annotations);
+    expect(strippedCount).toBe(2);
+  });
+
+  test('returns 0 count for empty input', () => {
+    const { clean, strippedCount } = stripRoomAnnotationImages([]);
+    expect(clean).toEqual([]);
+    expect(strippedCount).toBe(0);
+  });
+
+  test('returns 0 count when no annotations carry images', () => {
+    const annotations = [
+      { id: '1', type: 'COMMENT' as const },
+      { id: '2', type: 'DELETION' as const, images: undefined },
+    ];
+    const { strippedCount } = stripRoomAnnotationImages(annotations);
+    expect(strippedCount).toBe(0);
+  });
+
+  test('strippedCount includes globalAttachments length', () => {
+    const annotations = [
+      { id: '1', type: 'COMMENT' as const, images: [{ path: '/a', name: 'a' }] },
+      { id: '2', type: 'DELETION' as const },
+    ];
+    const globals = [
+      { path: '/g1', name: 'g1' },
+      { path: '/g2', name: 'g2' },
+    ];
+    const { clean, strippedCount } = stripRoomAnnotationImages(annotations, globals);
+    // 1 image-bearing annotation + 2 globals = 3 items not traveling.
+    expect(strippedCount).toBe(3);
+    // clean still only reflects annotation shape, no globals merged in.
+    expect(clean.length).toBe(2);
+  });
+
+  test('omitting globalAttachments defaults to 0 (back-compat with callers)', () => {
+    const annotations = [
+      { id: '1', type: 'COMMENT' as const, images: [{ path: '/a', name: 'a' }] },
+    ];
+    const { strippedCount } = stripRoomAnnotationImages(annotations);
+    expect(strippedCount).toBe(1);
+  });
+});
diff --git a/packages/shared/collab/strip-images.ts b/packages/shared/collab/strip-images.ts
new file mode 100644
index 000000000..2d2abde89
--- /dev/null
+++ b/packages/shared/collab/strip-images.ts
@@ -0,0 +1,58 @@
+/**
+ * Image stripping for converting Annotation objects into RoomAnnotation.
+ *
+ * Uses a generic approach to avoid importing Annotation from @plannotator/ui.
+ * Callers in packages/ui or packages/editor pass Annotation values; this
+ * helper strips the images field.
+ */
+
+/** Strip the images field from an annotation-like object. */
+export function toRoomAnnotation<T extends { images?: unknown }>(
+  annotation: T,
+): Omit<T, 'images'> {
+  const { images: _, ...rest } = annotation;
+  return rest;
+}
+
+/**
+ * Batch conversion. Module-private — the public entry for room-bound
+ * annotations is `stripRoomAnnotationImages`, which returns both the
+ * `clean` batch and the total `strippedCount`. Direct callers should
+ * use `toRoomAnnotation` for a single annotation or
+ * `stripRoomAnnotationImages` for a batch; this internal helper is
+ * intentionally not exported so the count reporting stays centralized.
+ */
+function toRoomAnnotations<T extends { images?: unknown }>(
+  annotations: T[],
+): Omit<T, 'images'>[] {
+  return annotations.map(toRoomAnnotation);
+}
+
+/**
+ * Batch conversion + count of how many local items will NOT travel to
+ * the room.
+ *
+ * Used by the creator flow to decide whether to show an "N items
+ * stripped" notice before creating a room. The count combines:
+ *   - annotations with a non-empty `images` array (per-annotation
+ *     attachments — only `clean` carries forward), and
+ *   - the length of an optional `globalAttachments` list (separate
+ *     top-level attachments; room snapshots don't carry these at all).
+ *
+ * An annotation counts as image-bearing only if `images` is a non-empty
+ * array — a bare `undefined` field or `[]` does not trigger the notice.
+ * The notice text, the URL `&stripped=N` handoff, and any future
+ * analytics all read from `strippedCount`, so there's exactly one
+ * definition of "how many images won't travel".
+ */
+export function stripRoomAnnotationImages<T extends { images?: unknown }>(
+  annotations: T[],
+  globalAttachments: readonly unknown[] = [],
+): { clean: Omit<T, 'images'>[]; strippedCount: number } {
+  let strippedCount = globalAttachments.length;
+  for (const a of annotations) {
+    const imgs = (a as { images?: unknown }).images;
+    if (Array.isArray(imgs) && imgs.length > 0) strippedCount++;
+  }
+  return { clean: toRoomAnnotations(annotations), strippedCount };
+}
diff --git a/packages/shared/collab/types.test.ts b/packages/shared/collab/types.test.ts
new file mode 100644
index 000000000..c260beb83
--- /dev/null
+++ b/packages/shared/collab/types.test.ts
@@ -0,0 +1,355 @@
+/**
+ * Unit tests for runtime validators — isPresenceState, isRoomAnnotation,
+ * isRoomAnnotationPatch, isRoomClientOp, isRoomSnapshot.
+ *
+ * These validators run on the client after decryption to reject structurally
+ * malformed payloads before they enter client state. Coverage focuses on
+ * edge cases that could crash UI render paths.
+ */
+
+import { describe, expect, test } from 'bun:test';
+import {
+  isPresenceState,
+  isRoomAnnotation,
+  isRoomAnnotationPatch,
+  isRoomClientOp,
+  isRoomSnapshot,
+  type RoomAnnotation,
+} from './types';
+
+const GOOD_ANN: RoomAnnotation = {
+  id: 'ann-1',
+  blockId: 'b1',
+  startOffset: 0,
+  endOffset: 5,
+  type: 'COMMENT',
+  originalText: 'hello',
+  createdA: 1234,
+};
+
+describe('isRoomAnnotation', () => {
+  test('accepts a minimal valid annotation', () => {
+    expect(isRoomAnnotation(GOOD_ANN)).toBe(true);
+  });
+
+  test('accepts an annotation with all optional fields', () => {
+    expect(isRoomAnnotation({
+      ...GOOD_ANN,
+      text: 'my comment',
+      author: 'alice',
+      source: 'eslint',
+      isQuickLabel: true,
+      quickLabelTip: 'tip',
+      diffContext: 'added',
+      startMeta: { parentTagName: 'p', parentIndex: 0, textOffset: 3 },
+      endMeta: { parentTagName: 'p', parentIndex: 0, textOffset: 8 },
+    })).toBe(true);
+  });
+
+  test.each([
+    ['null', null],
+    ['undefined', undefined],
+    ['string', 'not-an-obj'],
+    ['number', 42],
+    ['array', [GOOD_ANN]],
+  ])('rejects non-object: %s', (_label, input) => {
+    expect(isRoomAnnotation(input)).toBe(false);
+  });
+
+  test('rejects null id', () => {
+    expect(isRoomAnnotation({ ...GOOD_ANN, id: null })).toBe(false);
+  });
+
+  test('rejects empty id', () => {
+    expect(isRoomAnnotation({ ...GOOD_ANN, id: '' })).toBe(false);
+  });
+
+  test('rejects null type', () => {
+    expect(isRoomAnnotation({ ...GOOD_ANN, type: null })).toBe(false);
+  });
+
+  test('rejects unknown type enum', () => {
+    expect(isRoomAnnotation({ ...GOOD_ANN, type: 'SOMETHING_ELSE' })).toBe(false);
+  });
+
+  test('rejects non-string originalText', () => {
+    expect(isRoomAnnotation({ ...GOOD_ANN, originalText: 42 })).toBe(false);
+    expect(isRoomAnnotation({ ...GOOD_ANN, originalText: null })).toBe(false);
+  });
+
+  test('rejects non-finite offsets', () => {
+    expect(isRoomAnnotation({ ...GOOD_ANN, startOffset: NaN })).toBe(false);
+    expect(isRoomAnnotation({ ...GOOD_ANN, endOffset: Infinity })).toBe(false);
+  });
+
+  test('rejects wrong-typed optionals', () => {
+    expect(isRoomAnnotation({ ...GOOD_ANN, text: 42 })).toBe(false);
+    expect(isRoomAnnotation({ ...GOOD_ANN, author: true })).toBe(false);
+    expect(isRoomAnnotation({ ...GOOD_ANN, isQuickLabel: 'yes' })).toBe(false);
+    expect(isRoomAnnotation({ ...GOOD_ANN, diffContext: 'unexpected' })).toBe(false);
+  });
+
+  test('rejects malformed startMeta', () => {
+    expect(isRoomAnnotation({
+      ...GOOD_ANN,
+      startMeta: { parentTagName: 'p', parentIndex: 'x', textOffset: 3 },
+    })).toBe(false);
+  });
+
+  test('rejects presence of images field (V1 room annotations have no images)', () => {
+    expect(isRoomAnnotation({ ...GOOD_ANN, images: [{ path: '/t', name: 'n' }] })).toBe(false);
+  });
+
+  test('inline annotations (COMMENT, DELETION) require non-empty blockId', () => {
+    expect(isRoomAnnotation({ ...GOOD_ANN, type: 'COMMENT', blockId: '' })).toBe(false);
+    expect(isRoomAnnotation({ ...GOOD_ANN, type: 'DELETION', blockId: '' })).toBe(false);
+  });
+
+  test('GLOBAL_COMMENT is allowed to carry blockId: "" (matches existing UI convention)', () => {
+    expect(isRoomAnnotation({
+      ...GOOD_ANN,
+      type: 'GLOBAL_COMMENT',
+      blockId: '',
+    })).toBe(true);
+  });
+});
+
+describe('isRoomAnnotationPatch', () => {
+  test('rejects empty patch (no defined allowed fields — would burn a seq for a no-op)', () => {
+    expect(isRoomAnnotationPatch({})).toBe(false);
+  });
+
+  test('rejects patch where every field is explicitly undefined', () => {
+    expect(isRoomAnnotationPatch({ text: undefined })).toBe(false);
+    expect(isRoomAnnotationPatch({ text: undefined, author: undefined })).toBe(false);
+  });
+
+  test('accepts single-field patches', () => {
+    expect(isRoomAnnotationPatch({ text: 'new' })).toBe(true);
+    expect(isRoomAnnotationPatch({ type: 'DELETION' })).toBe(true);
+    expect(isRoomAnnotationPatch({ diffContext: 'modified' })).toBe(true);
+  });
+
+  test('rejects patch that sets required field to invalid value', () => {
+    expect(isRoomAnnotationPatch({ type: null })).toBe(false);
+    expect(isRoomAnnotationPatch({ originalText: 42 })).toBe(false);
+    expect(isRoomAnnotationPatch({ startOffset: NaN })).toBe(false);
+  });
+
+  test('rejects patch that tries to mutate annotation id (identity-mutation attack)', () => {
+    // Even a well-formed string id is rejected — an annotation.update must
+    // never change the id of an existing annotation.
+    expect(isRoomAnnotationPatch({ id: 'other-id' })).toBe(false);
+    expect(isRoomAnnotationPatch({ id: '' })).toBe(false);
+  });
+
+  test('rejects patch that tries to add images field', () => {
+    expect(isRoomAnnotationPatch({ images: [{ path: '/x', name: 'x' }] })).toBe(false);
+  });
+});
+
+describe('isRoomClientOp', () => {
+  test('accepts annotation.add with valid annotations', () => {
+    expect(isRoomClientOp({ type: 'annotation.add', annotations: [GOOD_ANN] })).toBe(true);
+  });
+
+  test('rejects annotation.add with malformed annotation', () => {
+    expect(isRoomClientOp({
+      type: 'annotation.add',
+      annotations: [{ ...GOOD_ANN, type: null }],
+    })).toBe(false);
+  });
+
+  test('rejects annotation.add with non-array annotations', () => {
+    expect(isRoomClientOp({ type: 'annotation.add', annotations: GOOD_ANN })).toBe(false);
+  });
+
+  test('rejects annotation.add with empty array (no-op would burn a seq)', () => {
+    expect(isRoomClientOp({ type: 'annotation.add', annotations: [] })).toBe(false);
+  });
+
+  test('rejects annotation.remove with empty ids array (no-op would burn a seq)', () => {
+    expect(isRoomClientOp({ type: 'annotation.remove', ids: [] })).toBe(false);
+  });
+
+  test('accepts annotation.update with valid patch', () => {
+    expect(isRoomClientOp({
+      type: 'annotation.update', id: 'ann-1', patch: { text: 'new' },
+    })).toBe(true);
+  });
+
+  test('rejects annotation.update with empty id', () => {
+    expect(isRoomClientOp({
+      type: 'annotation.update', id: '', patch: {},
+    })).toBe(false);
+  });
+
+  test('rejects annotation.update with invalid patch', () => {
+    expect(isRoomClientOp({
+      type: 'annotation.update', id: 'ann-1', patch: { type: 'BAD' },
+    })).toBe(false);
+  });
+
+  test('accepts annotation.remove with string ids', () => {
+    expect(isRoomClientOp({ type: 'annotation.remove', ids: ['a', 'b'] })).toBe(true);
+  });
+
+  test('rejects annotation.remove with empty-string id', () => {
+    expect(isRoomClientOp({ type: 'annotation.remove', ids: [''] })).toBe(false);
+  });
+
+  test('accepts annotation.clear with and without source', () => {
+    expect(isRoomClientOp({ type: 'annotation.clear' })).toBe(true);
+    expect(isRoomClientOp({ type: 'annotation.clear', source: 'eslint' })).toBe(true);
+  });
+
+  test('rejects unknown op type', () => {
+    expect(isRoomClientOp({ type: 'annotation.explode' })).toBe(false);
+  });
+
+  test('accepts presence.update with valid PresenceState', () => {
+    expect(isRoomClientOp({
+      type: 'presence.update',
+      presence: { user: { id: 'u', name: 'n', color: '#f00' }, cursor: null },
+    })).toBe(true);
+  });
+
+  test('rejects presence.update with malformed presence', () => {
+    expect(isRoomClientOp({
+      type: 'presence.update',
+      presence: { user: { id: 'u', name: 42, color: '#f00' }, cursor: null },
+    })).toBe(false);
+  });
+});
+
+describe('isRoomSnapshot', () => {
+  test('accepts a minimal valid snapshot', () => {
+    expect(isRoomSnapshot({ versionId: 'v1', planMarkdown: '# Plan', annotations: [] })).toBe(true);
+  });
+
+  test('accepts a snapshot with annotations', () => {
+    expect(isRoomSnapshot({
+      versionId: 'v1', planMarkdown: '# Plan', annotations: [GOOD_ANN],
+    })).toBe(true);
+  });
+
+  test('rejects wrong versionId', () => {
+    expect(isRoomSnapshot({ versionId: 'v2', planMarkdown: '', annotations: [] })).toBe(false);
+    expect(isRoomSnapshot({ versionId: null, planMarkdown: '', annotations: [] })).toBe(false);
+  });
+
+  test('rejects non-string planMarkdown', () => {
+    expect(isRoomSnapshot({ versionId: 'v1', planMarkdown: 42, annotations: [] })).toBe(false);
+  });
+
+  test('rejects non-array annotations', () => {
+    expect(isRoomSnapshot({ versionId: 'v1', planMarkdown: '', annotations: 'not-array' })).toBe(false);
+  });
+
+  test('rejects if any annotation is malformed', () => {
+    expect(isRoomSnapshot({
+      versionId: 'v1', planMarkdown: '', annotations: [{ ...GOOD_ANN, type: null }],
+    })).toBe(false);
+  });
+
+  test('rejects snapshot with unknown top-level keys', () => {
+    expect(isRoomSnapshot({
+      versionId: 'v1', planMarkdown: '', annotations: [], future: 'smuggled',
+    })).toBe(false);
+  });
+});
+
+describe('isPresenceState', () => {
+  test('accepts minimal presence (null cursor)', () => {
+    expect(isPresenceState({
+      user: { id: 'u', name: 'alice', color: '#f00' }, cursor: null,
+    })).toBe(true);
+  });
+
+  test('accepts presence with cursor', () => {
+    expect(isPresenceState({
+      user: { id: 'u', name: 'alice', color: '#f00' },
+      cursor: { x: 1, y: 2, coordinateSpace: 'document' },
+    })).toBe(true);
+  });
+
+  test('rejects non-string name', () => {
+    expect(isPresenceState({
+      user: { id: 'u', name: 42, color: '#f00' }, cursor: null,
+    })).toBe(false);
+  });
+
+  test('rejects payload missing required user field', () => {
+    expect(isPresenceState({ cursor: null })).toBe(false);
+  });
+
+  test('rejects payload missing required cursor field (must be explicit, not absent)', () => {
+    expect(isPresenceState({ user: { id: 'u', name: 'a', color: '#f00' } })).toBe(false);
+  });
+
+  test('rejects cursor without required fields', () => {
+    expect(isPresenceState({
+      user: { id: 'u', name: 'a', color: '#f00' },
+      cursor: { x: 1 },
+    })).toBe(false);
+  });
+
+  test('rejects cursor with unknown coordinateSpace', () => {
+    expect(isPresenceState({
+      user: { id: 'u', name: 'a', color: '#f00' },
+      cursor: { x: 1, y: 2, coordinateSpace: 'galaxy' },
+    })).toBe(false);
+  });
+
+  test('rejects non-finite cursor coordinates', () => {
+    const base = { user: { id: 'u', name: 'a', color: '#f00' } };
+    expect(isPresenceState({ ...base, cursor: { x: Infinity, y: 2, coordinateSpace: 'document' } })).toBe(false);
+    expect(isPresenceState({ ...base, cursor: { x: -Infinity, y: 2, coordinateSpace: 'document' } })).toBe(false);
+    expect(isPresenceState({ ...base, cursor: { x: NaN, y: 2, coordinateSpace: 'document' } })).toBe(false);
+    expect(isPresenceState({ ...base, cursor: { x: 1, y: Infinity, coordinateSpace: 'document' } })).toBe(false);
+    expect(isPresenceState({ ...base, cursor: { x: 1, y: NaN, coordinateSpace: 'document' } })).toBe(false);
+  });
+
+  test('rejects unknown top-level keys', () => {
+    expect(isPresenceState({
+      user: { id: 'u', name: 'a', color: '#f00' },
+      cursor: null,
+      extra: 'smuggled',
+    })).toBe(false);
+  });
+
+  test('rejects unknown keys on user', () => {
+    expect(isPresenceState({
+      user: { id: 'u', name: 'a', color: '#f00', email: 'leak@example.com' },
+      cursor: null,
+    })).toBe(false);
+  });
+
+  test('rejects unknown keys on cursor', () => {
+    expect(isPresenceState({
+      user: { id: 'u', name: 'a', color: '#f00' },
+      cursor: { x: 1, y: 2, coordinateSpace: 'document', z: 3 },
+    })).toBe(false);
+  });
+});
+
+describe('nested annotation meta — strict key allowlist', () => {
+  test('rejects annotation meta with unknown keys', () => {
+    expect(isRoomAnnotation({
+      ...GOOD_ANN,
+      startMeta: { parentTagName: 'p', parentIndex: 0, textOffset: 0, sneaky: true },
+    })).toBe(false);
+    expect(isRoomAnnotation({
+      ...GOOD_ANN,
+      endMeta: { parentTagName: 'p', parentIndex: 0, textOffset: 0, sneaky: true },
+    })).toBe(false);
+  });
+
+  test('accepts annotation meta with exactly the allowlisted keys', () => {
+    expect(isRoomAnnotation({
+      ...GOOD_ANN,
+      startMeta: { parentTagName: 'p', parentIndex: 0, textOffset: 3 },
+      endMeta: { parentTagName: 'p', parentIndex: 0, textOffset: 8 },
+    })).toBe(true);
+  });
+});
diff --git a/packages/shared/collab/types.ts b/packages/shared/collab/types.ts
new file mode 100644
index 000000000..3e2d8161b
--- /dev/null
+++ b/packages/shared/collab/types.ts
@@ -0,0 +1,515 @@
+/**
+ * Plannotator Live Rooms — canonical protocol types.
+ *
+ * RoomAnnotation is a structural copy of the Annotation type from
+ * packages/ui/types.ts with the `images` field excluded (V1 rooms
+ * do not support image attachments). If Annotation gains new fields,
+ * they must be manually added here when they should be part of the
+ * room protocol.
+ *
+ * RoomState is intentionally NOT defined here — it contains server-only
+ * fields (roomVerifier, adminVerifier, event log) and belongs in
+ * apps/room-service.
+ */
+
+// ---------------------------------------------------------------------------
+// Room Annotation
+// ---------------------------------------------------------------------------
+
+/** Annotation type values matching AnnotationType enum in packages/ui/types.ts */
+export type RoomAnnotationType = 'DELETION' | 'COMMENT' | 'GLOBAL_COMMENT';
+
+/**
+ * Room-safe annotation. Structurally matches Annotation from packages/ui/types.ts
+ * minus the images field. V1 rooms do not support image attachments.
+ */
+export interface RoomAnnotation {
+  id: string;
+  blockId: string;
+  startOffset: number;
+  endOffset: number;
+  type: RoomAnnotationType;
+  text?: string;
+  originalText: string;
+  /**
+   * Creation timestamp in ms. Field name intentionally mirrors the existing
+   * UI `Annotation.createdA` (see `packages/ui/types.ts`). DO NOT rename —
+   * existing UI code, existing annotations persisted to disk, and share-URL
+   * payloads all use this exact key.
+   */
+  createdA: number;
+  author?: string;
+  source?: string;
+  isQuickLabel?: boolean;
+  quickLabelTip?: string;
+  diffContext?: 'added' | 'removed' | 'modified';
+  startMeta?: { parentTagName: string; parentIndex: number; textOffset: number };
+  endMeta?: { parentTagName: string; parentIndex: number; textOffset: number };
+  images?: never;
+}
+
+const ANNOTATION_META_KEYS = new Set(['parentTagName', 'parentIndex', 'textOffset']);
+function isAnnotationMeta(x: unknown): boolean {
+  if (x === null || typeof x !== 'object') return false;
+  const m = x as Record<string, unknown>;
+  // Strict boundary: reject unknown nested keys so the validator doesn't drift.
+  for (const key of Object.keys(m)) {
+    if (!ANNOTATION_META_KEYS.has(key)) return false;
+  }
+  return (
+    typeof m.parentTagName === 'string' &&
+    typeof m.parentIndex === 'number' && Number.isFinite(m.parentIndex) &&
+    typeof m.textOffset === 'number' && Number.isFinite(m.textOffset)
+  );
+}
+
+/**
+ * Centralized per-field validators for RoomAnnotation. Both isRoomAnnotation
+ * and isRoomAnnotationPatch delegate to this so field definitions don't drift
+ * when annotation fields are added. Each entry returns true if the value is
+ * acceptable for that field (either as a full-annotation required field or as
+ * a patch override, depending on the caller).
+ *
+ * The `satisfies` constraint forces this map to cover every RoomAnnotation key
+ * except `images` (which V1 rejects outright). Adding a new field to
+ * RoomAnnotation without a matching validator here is a compile error.
+ */
+const ROOM_ANNOTATION_FIELD_VALIDATORS = {
+  id: (v) => typeof v === 'string' && v.length > 0,
+  blockId: (v) => typeof v === 'string',
+  startOffset: (v) => typeof v === 'number' && Number.isFinite(v),
+  endOffset: (v) => typeof v === 'number' && Number.isFinite(v),
+  type: (v) => v === 'DELETION' || v === 'COMMENT' || v === 'GLOBAL_COMMENT',
+  originalText: (v) => typeof v === 'string',
+  createdA: (v) => typeof v === 'number' && Number.isFinite(v),
+  text: (v) => typeof v === 'string',
+  author: (v) => typeof v === 'string',
+  source: (v) => typeof v === 'string',
+  isQuickLabel: (v) => typeof v === 'boolean',
+  quickLabelTip: (v) => typeof v === 'string',
+  diffContext: (v) => v === 'added' || v === 'removed' || v === 'modified',
+  startMeta: isAnnotationMeta,
+  endMeta: isAnnotationMeta,
+} satisfies Record<Exclude<keyof RoomAnnotation, 'images'>, (v: unknown) => boolean>;
+
+const ROOM_ANNOTATION_KNOWN_FIELDS = new Set<string>([
+  ...Object.keys(ROOM_ANNOTATION_FIELD_VALIDATORS),
+  'images',  // known-but-forbidden
+]);
+
+const ROOM_ANNOTATION_REQUIRED_FIELDS = [
+  'id', 'blockId', 'startOffset', 'endOffset', 'type', 'originalText', 'createdA',
+] as const;
+
+/** Fast membership check for optional-field iteration in isRoomAnnotation. */
+const ROOM_ANNOTATION_REQUIRED_FIELD_SET = new Set<string>(ROOM_ANNOTATION_REQUIRED_FIELDS);
+
+/**
+ * Fields that are NOT accepted in an annotation.update patch. `id` is the
+ * critical one: letting a patch replace the id lets a malicious sender store
+ * an annotation under map key `old-id` whose object reports `id: "new-id"`.
+ * Later removes/updates by the visible id would miss it. `images` is excluded
+ * because V1 room annotations cannot carry images.
+ */
+const ROOM_ANNOTATION_PATCH_FORBIDDEN_FIELDS = new Set(['id', 'images']);
+
+/**
+ * Runtime validator for a decrypted RoomAnnotation. Encryption proves only
+ * that the sender held the room key; payload shape is not proven. Any room
+ * participant can encrypt arbitrary JSON, so annotations that are about to
+ * enter client state must be shape-checked first. Without this, malformed
+ * annotations can crash UI render paths that assume well-formed fields.
+ */
+export function isRoomAnnotation(x: unknown): x is RoomAnnotation {
+  if (x === null || typeof x !== 'object') return false;
+  const a = x as Record<string, unknown>;
+  // Strict boundary: reject unknown keys. The validators are the contract —
+  // anything outside ROOM_ANNOTATION_KNOWN_FIELDS would silently pass through
+  // otherwise, defeating the purpose of the validation pass.
+  for (const key of Object.keys(a)) {
+    if (!ROOM_ANNOTATION_KNOWN_FIELDS.has(key)) return false;
+  }
+  // Single pass over the validator map: required fields must pass validation
+  // regardless of value; optional fields only run validation when present.
+  for (const [field, validate] of Object.entries(ROOM_ANNOTATION_FIELD_VALIDATORS)) {
+    const required = ROOM_ANNOTATION_REQUIRED_FIELD_SET.has(field);
+    if (required) {
+      if (!validate(a[field])) return false;
+    } else if (a[field] !== undefined) {
+      if (!validate(a[field])) return false;
+    }
+  }
+  // Cross-field invariant: inline annotations (COMMENT, DELETION) must have a
+  // non-empty blockId — they attach to a block in the rendered plan. Only
+  // GLOBAL_COMMENT is allowed to carry blockId: '' (it's a top-level comment
+  // with no block anchor, matching the existing UI convention).
+  if ((a.type === 'COMMENT' || a.type === 'DELETION') && (a.blockId as string).length === 0) {
+    return false;
+  }
+  // images must be absent in V1 room annotations
+  if ('images' in a && a.images !== undefined) return false;
+  return true;
+}
+
+/**
+ * Runtime validator for a partial RoomAnnotation patch (annotation.update).
+ * Allows any subset of fields but each present field must be well-typed.
+ * Forbids mutating required fields into invalid values (e.g. type=null) and
+ * forbids the `id` and `images` fields entirely (see
+ * ROOM_ANNOTATION_PATCH_FORBIDDEN_FIELDS for rationale).
+ */
+export function isRoomAnnotationPatch(x: unknown): x is Partial<RoomAnnotation> {
+  if (x === null || typeof x !== 'object') return false;
+  const p = x as Record<string, unknown>;
+  // Strict boundary: reject unknown keys. Patches must not smuggle in
+  // fields the type doesn't know about.
+  for (const key of Object.keys(p)) {
+    if (!ROOM_ANNOTATION_KNOWN_FIELDS.has(key)) return false;
+  }
+  for (const forbidden of ROOM_ANNOTATION_PATCH_FORBIDDEN_FIELDS) {
+    if (forbidden in p && p[forbidden] !== undefined) return false;
+  }
+  // Reject effectively-empty patches. A patch with no allowed/defined fields
+  // (including `{}` and `{ text: undefined }`) would burn a durable seq for
+  // a guaranteed no-op when sent — avoidable log noise with no effect.
+  let hasDefinedAllowedField = false;
+  for (const [field, validate] of Object.entries(ROOM_ANNOTATION_FIELD_VALIDATORS)) {
+    if (ROOM_ANNOTATION_PATCH_FORBIDDEN_FIELDS.has(field)) continue;
+    if (p[field] === undefined) continue;
+    if (!validate(p[field])) return false;
+    hasDefinedAllowedField = true;
+  }
+  if (!hasDefinedAllowedField) return false;
+  return true;
+}
+
+// ---------------------------------------------------------------------------
+// Presence
+// ---------------------------------------------------------------------------
+
+export interface CursorState {
+  blockId?: string;
+  x: number;
+  y: number;
+  coordinateSpace: 'block' | 'document' | 'viewport';
+}
+
+export interface PresenceState {
+  user: { id: string; name: string; color: string };
+  cursor: CursorState | null;
+  activeAnnotationId?: string | null;
+  idle?: boolean;
+}
+
+/**
+ * Runtime validator for decrypted PresenceState. Encryption only proves the
+ * sender holds the room key; it does not prove payload shape. Without this,
+ * a malicious participant could ship a valid-encrypted but malformed presence
+ * and crash UI render code that assumes `user.name` is a string, etc.
+ */
+const PRESENCE_STATE_KEYS = new Set(['user', 'cursor', 'activeAnnotationId', 'idle']);
+const PRESENCE_USER_KEYS = new Set(['id', 'name', 'color']);
+const CURSOR_STATE_KEYS = new Set(['blockId', 'x', 'y', 'coordinateSpace']);
+
+export function isPresenceState(x: unknown): x is PresenceState {
+  if (x === null || typeof x !== 'object') return false;
+  const p = x as Record<string, unknown>;
+
+  // Required-field intent made explicit (previously relied on subsequent
+  // typeof checks to reject missing fields via undefined).
+  if (!('user' in p) || !('cursor' in p)) return false;
+
+  // Strict boundary: reject unknown top-level keys.
+  for (const key of Object.keys(p)) {
+    if (!PRESENCE_STATE_KEYS.has(key)) return false;
+  }
+
+  const user = p.user;
+  if (user === null || typeof user !== 'object') return false;
+  const u = user as Record<string, unknown>;
+  for (const key of Object.keys(u)) {
+    if (!PRESENCE_USER_KEYS.has(key)) return false;
+  }
+  if (typeof u.id !== 'string' || typeof u.name !== 'string' || typeof u.color !== 'string') return false;
+
+  // cursor: null OR CursorState
+  if (p.cursor !== null) {
+    if (p.cursor === undefined || typeof p.cursor !== 'object') return false;
+    const c = p.cursor as Record<string, unknown>;
+    for (const key of Object.keys(c)) {
+      if (!CURSOR_STATE_KEYS.has(key)) return false;
+    }
+    // Require finite coordinates — JSON can encode Infinity/NaN via non-standard
+    // parsers or adversarial payloads, and non-finite cursors would corrupt
+    // remote-cursor rendering math downstream.
+    if (typeof c.x !== 'number' || !Number.isFinite(c.x)) return false;
+    if (typeof c.y !== 'number' || !Number.isFinite(c.y)) return false;
+    if (c.coordinateSpace !== 'block' && c.coordinateSpace !== 'document' && c.coordinateSpace !== 'viewport') return false;
+    if (c.blockId !== undefined && typeof c.blockId !== 'string') return false;
+  }
+
+  if (p.activeAnnotationId !== undefined && p.activeAnnotationId !== null && typeof p.activeAnnotationId !== 'string') return false;
+  if (p.idle !== undefined && typeof p.idle !== 'boolean') return false;
+
+  return true;
+}
+
+// ---------------------------------------------------------------------------
+// Server Envelope
+// ---------------------------------------------------------------------------
+
+/**
+ * Server-visible message wrapper. The DO can read clientId, opId, and channel
+ * but cannot read the encrypted ciphertext.
+ *
+ * clientId is random per WebSocket connection — not a stable user identity.
+ * Stable identity lives inside the encrypted PresenceState.user.id.
+ */
+export interface ServerEnvelope {
+  clientId: string;
+  opId: string;
+  channel: 'event' | 'presence';
+  ciphertext: string;
+}
+
+// ---------------------------------------------------------------------------
+// Client Operations (encrypted inside envelope ciphertext)
+//
+// Event channel payloads are annotation ops only. Presence is encrypted as a
+// raw PresenceState on the presence channel (the wire envelope's `channel`
+// field already discriminates). Keeping presence OUT of the event-channel
+// type and validator prevents clients from writing durable no-op presence
+// events into the sequenced event log.
+// ---------------------------------------------------------------------------
+
+/** Ops valid on the event channel. */
+export type RoomEventClientOp =
+  | { type: 'annotation.add'; annotations: RoomAnnotation[] }
+  | { type: 'annotation.update'; id: string; patch: Partial<RoomAnnotation> }
+  | { type: 'annotation.remove'; ids: string[] }
+  | { type: 'annotation.clear'; source?: string };
+
+/**
+ * Superset union retained for protocol-level typing and tests that want one
+ * client-op union. Runtime event-channel code uses RoomEventClientOp; presence
+ * is sent as raw PresenceState on the presence channel.
+ */
+export type RoomClientOp =
+  | RoomEventClientOp
+  | { type: 'presence.update'; presence: PresenceState };
+
+/**
+ * Runtime validator for a decrypted EVENT-channel op. Does NOT accept
+ * presence.update — presence ops flow through the presence channel with a
+ * raw PresenceState payload validated by isPresenceState.
+ */
+export function isRoomEventClientOp(x: unknown): x is RoomEventClientOp {
+  if (x === null || typeof x !== 'object') return false;
+  const op = x as Record<string, unknown>;
+  switch (op.type) {
+    case 'annotation.add':
+      // Empty-array adds would burn a durable seq for a no-op; reject.
+      return (
+        Array.isArray(op.annotations) &&
+        op.annotations.length > 0 &&
+        op.annotations.every(isRoomAnnotation)
+      );
+    case 'annotation.update':
+      return (
+        typeof op.id === 'string' && op.id.length > 0 &&
+        isRoomAnnotationPatch(op.patch)
+      );
+    case 'annotation.remove':
+      // Empty-array removes would burn a durable seq for a no-op; reject.
+      return (
+        Array.isArray(op.ids) &&
+        op.ids.length > 0 &&
+        op.ids.every((id: unknown) => typeof id === 'string' && id.length > 0)
+      );
+    case 'annotation.clear':
+      return op.source === undefined || typeof op.source === 'string';
+    default:
+      return false;
+  }
+}
+
+/**
+ * Superset validator — accepts event-channel ops OR presence.update. Not
+ * currently used by the runtime (outbound mutation methods validate event
+ * ops via isRoomEventClientOp, and presence via isPresenceState directly).
+ * Retained for completeness; inbound event-channel validation should always
+ * use isRoomEventClientOp so presence.update cannot pollute the durable log.
+ */
+export function isRoomClientOp(x: unknown): x is RoomClientOp {
+  if (isRoomEventClientOp(x)) return true;
+  if (x === null || typeof x !== 'object') return false;
+  const op = x as Record<string, unknown>;
+  return op.type === 'presence.update' && isPresenceState(op.presence);
+}
+
+// ---------------------------------------------------------------------------
+// Server Events (decrypted by client from envelope ciphertext)
+// ---------------------------------------------------------------------------
+
+export type RoomServerEvent =
+  | { type: 'snapshot'; payload: RoomSnapshot; snapshotSeq: number }
+  | { type: 'annotation.add'; annotations: RoomAnnotation[] }
+  | { type: 'annotation.update'; id: string; patch: Partial<RoomAnnotation> }
+  | { type: 'annotation.remove'; ids: string[] }
+  | { type: 'annotation.clear'; source?: string }
+  | { type: 'presence.update'; clientId: string; presence: PresenceState };
+
+// ---------------------------------------------------------------------------
+// Snapshot
+// ---------------------------------------------------------------------------
+
+export interface RoomSnapshot {
+  versionId: 'v1';
+  planMarkdown: string;
+  annotations: RoomAnnotation[];
+}
+
+/**
+ * Runtime validator for a decrypted RoomSnapshot. A malformed snapshot must
+ * not enter client state — it clears and re-seeds the annotations map plus
+ * planMarkdown, so garbage here corrupts the whole view.
+ */
+const ROOM_SNAPSHOT_KEYS = new Set(['versionId', 'planMarkdown', 'annotations']);
+
+export function isRoomSnapshot(x: unknown): x is RoomSnapshot {
+  if (x === null || typeof x !== 'object') return false;
+  const s = x as Record<string, unknown>;
+  // Strict boundary: reject unknown keys so future protocol drift fails
+  // loudly instead of silently slipping fields past the validator.
+  for (const key of Object.keys(s)) {
+    if (!ROOM_SNAPSHOT_KEYS.has(key)) return false;
+  }
+  if (s.versionId !== 'v1') return false;
+  if (typeof s.planMarkdown !== 'string') return false;
+  if (!Array.isArray(s.annotations)) return false;
+  return s.annotations.every(isRoomAnnotation);
+}
+
+// ---------------------------------------------------------------------------
+// Transport Messages (server-to-client, pre-decryption)
+// ---------------------------------------------------------------------------
+
+export type RoomTransportMessage =
+  | { type: 'room.snapshot'; snapshotSeq: number; snapshotCiphertext: string }
+  | { type: 'room.event'; seq: number; receivedAt: number; envelope: ServerEnvelope }
+  | { type: 'room.presence'; envelope: ServerEnvelope }
+  | { type: 'room.error'; code: string; message: string }
+  /**
+   * Peer left the room. Broadcast by the room service on a
+   * WebSocket close so other participants can drop the peer's
+   * presence (cursor, avatar) immediately rather than waiting for
+   * the client-side presence TTL sweep to expire the entry.
+   *
+   * `clientId` is the server-assigned id from the peer's
+   * auth.challenge; the server knows it from the socket's
+   * attachment. No encrypted payload — nothing here that a
+   * receiver couldn't have inferred from absence anyway.
+   */
+  | { type: 'room.participant.left'; clientId: string };
+
+// ---------------------------------------------------------------------------
+// Sequenced Envelope (for event log storage)
+// ---------------------------------------------------------------------------
+
+export interface SequencedEnvelope {
+  seq: number;
+  receivedAt: number;
+  envelope: ServerEnvelope;
+}
+
+// ---------------------------------------------------------------------------
+// Auth
+// ---------------------------------------------------------------------------
+
+export interface AuthChallenge {
+  type: 'auth.challenge';
+  challengeId: string;
+  nonce: string;
+  expiresAt: number;
+  /**
+   * Server-assigned ephemeral clientId for this WebSocket. Binding the auth
+   * proof to it prevents a malicious participant from choosing another active
+   * connection's visible clientId and overwriting their presence slot after
+   * auth. Clients MUST use this value as their clientId for the connection
+   * (not self-generate one).
+   */
+  clientId: string;
+}
+
+export interface AuthResponse {
+  type: 'auth.response';
+  challengeId: string;
+  /** Must equal the server-assigned clientId from the corresponding AuthChallenge. */
+  clientId: string;
+  proof: string;
+  lastSeq?: number;
+}
+
+export interface AuthAccepted {
+  type: 'auth.accepted';
+  seq: number;
+  snapshotSeq?: number;
+  snapshotAvailable: boolean;
+}
+
+// ---------------------------------------------------------------------------
+// Admin
+// ---------------------------------------------------------------------------
+
+export type AdminCommand =
+  | { type: 'room.delete' };
+
+export interface AdminChallengeRequest {
+  type: 'admin.challenge.request';
+}
+
+export interface AdminChallenge {
+  type: 'admin.challenge';
+  challengeId: string;
+  nonce: string;
+  expiresAt: number;
+}
+
+export interface AdminCommandEnvelope {
+  type: 'admin.command';
+  challengeId: string;
+  clientId: string;
+  command: AdminCommand;
+  adminProof: string;
+}
+
+// ---------------------------------------------------------------------------
+// Room Creation
+// ---------------------------------------------------------------------------
+
+export interface CreateRoomRequest {
+  roomId: string;
+  roomVerifier: string;
+  adminVerifier: string;
+  initialSnapshotCiphertext: string;
+  expiresInDays?: number;
+}
+
+export interface CreateRoomResponse {
+  roomId: string;
+  seq: 0;
+  snapshotSeq: 0;
+  joinUrl: string;
+  websocketUrl: string;
+}
+
+// ---------------------------------------------------------------------------
+// Agent-Readable State
+// ---------------------------------------------------------------------------
+
+export interface AgentReadableRoomState {
+  roomId: string;
+  versionId: 'v1';
+  planMarkdown: string;
+  annotations: RoomAnnotation[];
+}
diff --git a/packages/shared/collab/url.test.ts b/packages/shared/collab/url.test.ts
new file mode 100644
index 000000000..80c20a489
--- /dev/null
+++ b/packages/shared/collab/url.test.ts
@@ -0,0 +1,167 @@
+import { describe, expect, test } from 'bun:test';
+import { parseRoomUrl, buildRoomJoinUrl, buildAdminRoomUrl } from './url';
+import { generateRoomSecret, generateAdminSecret, generateRoomId } from './ids';
+
+describe('parseRoomUrl', () => {
+  test('parses valid room URL', () => {
+    const secret = generateRoomSecret();
+    const roomId = 'test-room-123';
+    const url = buildRoomJoinUrl(roomId, secret);
+
+    const parsed = parseRoomUrl(url);
+    expect(parsed).not.toBeNull();
+    expect(parsed!.roomId).toBe(roomId);
+    expect(parsed!.roomSecret).toEqual(secret);
+  });
+
+  test('returns null for missing fragment', () => {
+    expect(parseRoomUrl('https://room.plannotator.ai/c/abc123')).toBeNull();
+  });
+
+  test('returns null for missing key parameter', () => {
+    expect(parseRoomUrl('https://room.plannotator.ai/c/abc123#other=value')).toBeNull();
+  });
+
+  test('returns null for wrong path', () => {
+    expect(parseRoomUrl('https://room.plannotator.ai/p/abc123#key=AAAA')).toBeNull();
+  });
+
+  test('returns null for missing roomId', () => {
+    expect(parseRoomUrl('https://room.plannotator.ai/c/#key=AAAA')).toBeNull();
+  });
+
+  test('returns null for empty key value', () => {
+    expect(parseRoomUrl('https://room.plannotator.ai/c/abc123#key=')).toBeNull();
+  });
+
+  test('returns null for non-256-bit room secrets', () => {
+    expect(parseRoomUrl('https://room.plannotator.ai/c/abc123#key=AQ')).toBeNull();
+    expect(parseRoomUrl('https://room.plannotator.ai/c/abc123#key=AAAA')).toBeNull();
+  });
+
+  test('returns null for completely invalid URL', () => {
+    expect(parseRoomUrl('not a url')).toBeNull();
+  });
+
+  test('returns null for empty string', () => {
+    expect(parseRoomUrl('')).toBeNull();
+  });
+});
+
+describe('buildRoomJoinUrl', () => {
+  test('constructs URL with default base', () => {
+    const secret = generateRoomSecret();
+    const url = buildRoomJoinUrl('my-room', secret);
+    expect(url).toMatch(/^https:\/\/room\.plannotator\.ai\/c\/my-room#key=/);
+  });
+
+  test('constructs URL with custom base', () => {
+    const secret = generateRoomSecret();
+    const url = buildRoomJoinUrl('my-room', secret, 'http://localhost:8787');
+    expect(url).toMatch(/^http:\/\/localhost:8787\/c\/my-room#key=/);
+  });
+
+  test('rejects non-256-bit room secrets', () => {
+    expect(() => buildRoomJoinUrl('my-room', new Uint8Array(31))).toThrow('Invalid room secret');
+    expect(() => buildRoomJoinUrl('my-room', new Uint8Array(33))).toThrow('Invalid room secret');
+  });
+});
+
+describe('round-trip', () => {
+  test('parse(build(id, secret)) recovers same values', () => {
+    const roomId = generateRoomId();
+    const secret = generateRoomSecret();
+    const url = buildRoomJoinUrl(roomId, secret);
+    const parsed = parseRoomUrl(url);
+
+    expect(parsed).not.toBeNull();
+    expect(parsed!.roomId).toBe(roomId);
+    expect(parsed!.roomSecret).toEqual(secret);
+  });
+
+  test('round-trip with custom base URL', () => {
+    const roomId = 'custom-room';
+    const secret = generateRoomSecret();
+    const url = buildRoomJoinUrl(roomId, secret, 'https://custom.example.com');
+    const parsed = parseRoomUrl(url);
+
+    expect(parsed).not.toBeNull();
+    expect(parsed!.roomId).toBe(roomId);
+    expect(parsed!.roomSecret).toEqual(secret);
+  });
+});
+
+describe('buildAdminRoomUrl', () => {
+  test('constructs URL with both key and admin', () => {
+    const secret = generateRoomSecret();
+    const adminSecret = generateAdminSecret();
+    const url = buildAdminRoomUrl('my-room', secret, adminSecret);
+    expect(url).toContain('/c/my-room#key=');
+    expect(url).toContain('&admin=');
+  });
+
+  test('rejects non-32-byte admin secret', () => {
+    expect(() => buildAdminRoomUrl('room', generateRoomSecret(), new Uint8Array(31)))
+      .toThrow('Invalid admin secret');
+  });
+
+  test('rejects non-32-byte room secret', () => {
+    expect(() => buildAdminRoomUrl('room', new Uint8Array(31), generateAdminSecret()))
+      .toThrow('Invalid room secret');
+  });
+
+  test('round-trip: parseRoomUrl recovers admin secret', () => {
+    const roomId = generateRoomId();
+    const secret = generateRoomSecret();
+    const adminSecret = generateAdminSecret();
+    const url = buildAdminRoomUrl(roomId, secret, adminSecret);
+    const parsed = parseRoomUrl(url);
+
+    expect(parsed).not.toBeNull();
+    expect(parsed!.roomId).toBe(roomId);
+    expect(parsed!.roomSecret).toEqual(secret);
+    expect(parsed!.adminSecret).toEqual(adminSecret);
+  });
+
+  test('parseRoomUrl without admin leaves adminSecret undefined', () => {
+    const secret = generateRoomSecret();
+    const url = buildRoomJoinUrl('room-abc', secret);
+    const parsed = parseRoomUrl(url);
+    expect(parsed!.adminSecret).toBeUndefined();
+  });
+
+  test('parseRoomUrl rejects malformed admin (wrong length)', () => {
+    // Manually construct URL with 1-byte admin
+    const secret = generateRoomSecret();
+    const url = buildRoomJoinUrl('room', secret) + '&admin=AQ';
+    expect(parseRoomUrl(url)).toBeNull();
+  });
+});
+
+describe('URL building — trailing slash hygiene (P3)', () => {
+  test('buildRoomJoinUrl strips trailing slash from baseUrl', () => {
+    const roomSecret = generateRoomSecret();
+    const withSlash = buildRoomJoinUrl('room-42', roomSecret, 'https://example.com/');
+    const withoutSlash = buildRoomJoinUrl('room-42', roomSecret, 'https://example.com');
+    expect(withSlash).toBe(withoutSlash);
+    expect(withSlash).not.toContain('com//c/');
+  });
+
+  test('buildAdminRoomUrl strips trailing slash from baseUrl', () => {
+    const roomSecret = generateRoomSecret();
+    const adminSecret = generateAdminSecret();
+    const withSlash = buildAdminRoomUrl('r', roomSecret, adminSecret, 'https://example.com/');
+    const withoutSlash = buildAdminRoomUrl('r', roomSecret, adminSecret, 'https://example.com');
+    expect(withSlash).toBe(withoutSlash);
+  });
+
+  test('round-trips the constructed URL through parseRoomUrl regardless of trailing slash', () => {
+    const roomSecret = generateRoomSecret();
+    const roomId = generateRoomId();
+    const url = buildRoomJoinUrl(roomId, roomSecret, 'https://example.com/');
+    const parsed = parseRoomUrl(url);
+    expect(parsed).not.toBeNull();
+    expect(parsed!.roomId).toBe(roomId);
+    expect(parsed!.roomSecret).toEqual(roomSecret);
+  });
+});
diff --git a/packages/shared/collab/url.ts b/packages/shared/collab/url.ts
new file mode 100644
index 000000000..38057c163
--- /dev/null
+++ b/packages/shared/collab/url.ts
@@ -0,0 +1,114 @@
+/**
+ * @module CLIENT-ONLY
+ *
+ * Room URL parsing and construction for browser and direct-agent clients.
+ *
+ * The Worker and Durable Object must NEVER import this module.
+ * They never receive URL fragments and must not parse full room URLs.
+ * They receive only roomId via /api/rooms request bodies or /ws/<roomId>
+ * routes, plus verifiers/proofs in request or WebSocket message bodies.
+ */
+
+import { bytesToBase64url, base64urlToBytes } from './encoding';
+import { ADMIN_SECRET_LENGTH_BYTES, ROOM_SECRET_LENGTH_BYTES } from './constants';
+
+const DEFAULT_BASE_URL = 'https://room.plannotator.ai';
+
+/** Strip a single trailing slash from a base URL so path concatenation is safe. */
+function normalizeBaseUrl(baseUrl: string): string {
+  return baseUrl.endsWith('/') ? baseUrl.slice(0, -1) : baseUrl;
+}
+
+export interface ParsedRoomUrl {
+  roomId: string;
+  roomSecret: Uint8Array;
+  /** Present only if the URL fragment includes `&admin=...` (creator/recovery URLs). */
+  adminSecret?: Uint8Array;
+}
+
+/**
+ * Parse a room join URL. Extracts roomId, roomSecret, and optional adminSecret.
+ * Returns null if the URL is malformed.
+ *
+ * Expected formats:
+ *   https://room.plannotator.ai/c/<roomId>#key=<base64url-roomSecret>
+ *   https://room.plannotator.ai/c/<roomId>#key=<base64url-roomSecret>&admin=<base64url-adminSecret>
+ *
+ * If `admin=` is present but malformed (wrong length, bad encoding), returns null.
+ */
+export function parseRoomUrl(url: string): ParsedRoomUrl | null {
+  try {
+    const parsed = new URL(url);
+
+    // Extract roomId from pathname /c/<roomId>
+    const match = parsed.pathname.match(/^\/c\/([^/]+)$/);
+    if (!match) return null;
+
+    const roomId = match[1];
+    if (!roomId) return null;
+
+    // Extract key from fragment
+    const hash = parsed.hash.startsWith('#') ? parsed.hash.slice(1) : parsed.hash;
+    if (!hash) return null;
+
+    const params = new URLSearchParams(hash);
+    const keyParam = params.get('key');
+    if (!keyParam) return null;
+
+    const roomSecret = base64urlToBytes(keyParam);
+    if (roomSecret.length !== ROOM_SECRET_LENGTH_BYTES) return null;
+
+    const result: ParsedRoomUrl = { roomId, roomSecret };
+
+    // Optional admin capability
+    const adminParam = params.get('admin');
+    if (adminParam !== null) {
+      const adminSecret = base64urlToBytes(adminParam);
+      if (adminSecret.length !== ADMIN_SECRET_LENGTH_BYTES) return null;
+      result.adminSecret = adminSecret;
+    }
+
+    return result;
+  } catch {
+    return null;
+  }
+}
+
+/**
+ * Construct a #key-only room join URL (safe to share with participants).
+ *
+ * @param roomId - The room identifier
+ * @param roomSecret - The 256-bit room secret (raw bytes)
+ * @param baseUrl - Base URL (defaults to "https://room.plannotator.ai")
+ */
+export function buildRoomJoinUrl(
+  roomId: string,
+  roomSecret: Uint8Array,
+  baseUrl: string = DEFAULT_BASE_URL,
+): string {
+  if (roomSecret.length !== ROOM_SECRET_LENGTH_BYTES) {
+    throw new Error(`Invalid room secret: expected ${ROOM_SECRET_LENGTH_BYTES} bytes`);
+  }
+  return `${normalizeBaseUrl(baseUrl)}/c/${roomId}#key=${bytesToBase64url(roomSecret)}`;
+}
+
+/**
+ * Construct a room URL that includes admin capability (creator-only / recovery).
+ *
+ * WARNING: adminUrl grants delete capability. It must NOT be the default
+ * share target. Use `buildRoomJoinUrl()` for normal participant sharing.
+ */
+export function buildAdminRoomUrl(
+  roomId: string,
+  roomSecret: Uint8Array,
+  adminSecret: Uint8Array,
+  baseUrl: string = DEFAULT_BASE_URL,
+): string {
+  if (roomSecret.length !== ROOM_SECRET_LENGTH_BYTES) {
+    throw new Error(`Invalid room secret: expected ${ROOM_SECRET_LENGTH_BYTES} bytes`);
+  }
+  if (adminSecret.length !== ADMIN_SECRET_LENGTH_BYTES) {
+    throw new Error(`Invalid admin secret: expected ${ADMIN_SECRET_LENGTH_BYTES} bytes`);
+  }
+  return `${normalizeBaseUrl(baseUrl)}/c/${roomId}#key=${bytesToBase64url(roomSecret)}&admin=${bytesToBase64url(adminSecret)}`;
+}
diff --git a/packages/shared/collab/validation.test.ts b/packages/shared/collab/validation.test.ts
new file mode 100644
index 000000000..fdbc128a3
--- /dev/null
+++ b/packages/shared/collab/validation.test.ts
@@ -0,0 +1,57 @@
+import { describe, expect, test } from 'bun:test';
+import {
+  BASE64URL_32_BYTE_RE,
+  isBase64Url32ByteString,
+  isValidPermissionMode,
+} from './validation';
+
+describe('isBase64Url32ByteString', () => {
+  const valid43 = 'A'.repeat(43);
+  test('accepts a 43-character base64url string', () => {
+    expect(isBase64Url32ByteString(valid43)).toBe(true);
+    expect(isBase64Url32ByteString('abcdefghij_ABCDEFGHIJ-klmnopqrst_KLMNOPQRST')).toBe(true);
+  });
+  test('rejects wrong-length strings', () => {
+    expect(isBase64Url32ByteString('A'.repeat(42))).toBe(false);
+    expect(isBase64Url32ByteString('A'.repeat(44))).toBe(false);
+    expect(isBase64Url32ByteString('')).toBe(false);
+  });
+  test('rejects base64url-invalid characters', () => {
+    expect(isBase64Url32ByteString('A'.repeat(42) + '/')).toBe(false);  // '/' not base64url
+    expect(isBase64Url32ByteString('A'.repeat(42) + '+')).toBe(false);  // '+' not base64url
+    expect(isBase64Url32ByteString('A'.repeat(42) + '=')).toBe(false);  // padding not expected
+    expect(isBase64Url32ByteString('A'.repeat(42) + ' ')).toBe(false);
+  });
+  test('rejects non-string values', () => {
+    expect(isBase64Url32ByteString(null)).toBe(false);
+    expect(isBase64Url32ByteString(undefined)).toBe(false);
+    expect(isBase64Url32ByteString(42)).toBe(false);
+    expect(isBase64Url32ByteString({})).toBe(false);
+  });
+  test('regex constant matches helper behavior', () => {
+    expect(BASE64URL_32_BYTE_RE.test(valid43)).toBe(true);
+    expect(BASE64URL_32_BYTE_RE.test('A'.repeat(44))).toBe(false);
+  });
+});
+
+describe('isValidPermissionMode', () => {
+  test('accepts bypassPermissions', () => {
+    expect(isValidPermissionMode('bypassPermissions')).toBe(true);
+  });
+  test('accepts acceptEdits', () => {
+    expect(isValidPermissionMode('acceptEdits')).toBe(true);
+  });
+  test('accepts default', () => {
+    expect(isValidPermissionMode('default')).toBe(true);
+  });
+  test('rejects unknown strings', () => {
+    expect(isValidPermissionMode('admin')).toBe(false);
+    expect(isValidPermissionMode('')).toBe(false);
+  });
+  test('rejects non-string values', () => {
+    expect(isValidPermissionMode(42)).toBe(false);
+    expect(isValidPermissionMode(null)).toBe(false);
+    expect(isValidPermissionMode(undefined)).toBe(false);
+    expect(isValidPermissionMode(true)).toBe(false);
+  });
+});
diff --git a/packages/shared/collab/validation.ts b/packages/shared/collab/validation.ts
new file mode 100644
index 000000000..fe5c3428b
--- /dev/null
+++ b/packages/shared/collab/validation.ts
@@ -0,0 +1,30 @@
+/**
+ * Shape validators shared between AppRoot (admin-secret fragments)
+ * and the Bun / Pi servers (`/api/approve` permission-mode bodies).
+ */
+
+/**
+ * 43-character base64url pattern for a 32-byte random value.
+ *
+ * Live Rooms uses this shape for admin secrets
+ * (`ADMIN_SECRET_LENGTH_BYTES === 32`; see `./constants.ts`).
+ */
+export const BASE64URL_32_BYTE_RE = /^[A-Za-z0-9_-]{43}$/;
+
+export function isBase64Url32ByteString(value: unknown): value is string {
+  return typeof value === 'string' && BASE64URL_32_BYTE_RE.test(value);
+}
+
+const VALID_PERMISSION_MODES = new Set(['bypassPermissions', 'acceptEdits', 'default']);
+
+/**
+ * Accepts the three Claude Code permission-mode tokens. Used by the
+ * local `/api/approve` handlers in both servers to validate the
+ * request body's `permissionMode` field before forwarding it into
+ * the hook result.
+ */
+export function isValidPermissionMode(
+  value: unknown,
+): value is 'bypassPermissions' | 'acceptEdits' | 'default' {
+  return typeof value === 'string' && VALID_PERMISSION_MODES.has(value);
+}
diff --git a/packages/shared/config.test.ts b/packages/shared/config.test.ts
new file mode 100644
index 000000000..98544ad69
--- /dev/null
+++ b/packages/shared/config.test.ts
@@ -0,0 +1,94 @@
+import { afterEach, describe, expect, test } from 'bun:test';
+import { existsSync, rmSync } from 'fs';
+import { join } from 'path';
+import { tmpdir } from 'os';
+
+/**
+ * The config module reads `homedir()` at import time to fix its
+ * CONFIG_DIR, so we re-import it in a subprocess per scenario with
+ * HOME pointed at a tmp dir — matches the pattern already used in
+ * `improvement-hooks.test.ts`. We're only validating that
+ * `presenceColor` now rides the same save/load/getServerConfig path
+ * as `displayName`; those APIs used to silently drop the field.
+ */
+
+const TEST_HOME = join(tmpdir(), `config-test-${Date.now()}`);
+
+afterEach(() => {
+  if (existsSync(TEST_HOME)) {
+    rmSync(TEST_HOME, { recursive: true, force: true });
+  }
+});
+
+async function runScript(script: string): Promise<string> {
+  const proc = Bun.spawn(
+    ['bun', '-e', script],
+    {
+      env: { ...process.env, HOME: TEST_HOME },
+      cwd: join(import.meta.dir, '../..'),
+      stdout: 'pipe',
+      stderr: 'pipe',
+    },
+  );
+  const stdout = await new Response(proc.stdout).text();
+  const exit = await proc.exited;
+  if (exit !== 0) {
+    const stderr = await new Response(proc.stderr).text();
+    throw new Error(`Subprocess failed (exit ${exit}): ${stderr}`);
+  }
+  return stdout.trim();
+}
+
+describe('config — presenceColor save/load roundtrip', () => {
+  test('saveConfig({presenceColor}) persists and loadConfig reads it back', async () => {
+    const script = `
+      import { saveConfig, loadConfig } from "./packages/shared/config";
+      saveConfig({ displayName: "alice", presenceColor: "#10b981" });
+      const reloaded = loadConfig();
+      console.log(JSON.stringify(reloaded));
+    `;
+    const out = await runScript(script);
+    const cfg = JSON.parse(out);
+    expect(cfg.displayName).toBe('alice');
+    expect(cfg.presenceColor).toBe('#10b981');
+  });
+
+  test('getServerConfig includes presenceColor when set', async () => {
+    const script = `
+      import { saveConfig, getServerConfig } from "./packages/shared/config";
+      saveConfig({ presenceColor: "#f97316" });
+      console.log(JSON.stringify(getServerConfig(null)));
+    `;
+    const out = await runScript(script);
+    const sc = JSON.parse(out);
+    expect(sc.presenceColor).toBe('#f97316');
+  });
+
+  test('getServerConfig omits presenceColor when not set', async () => {
+    const script = `
+      import { saveConfig, getServerConfig } from "./packages/shared/config";
+      // Only displayName written; presenceColor should not appear in
+      // the serverConfig payload so clients don't override their
+      // local cookie with undefined.
+      saveConfig({ displayName: "bob" });
+      console.log(JSON.stringify(getServerConfig(null)));
+    `;
+    const out = await runScript(script);
+    const sc = JSON.parse(out);
+    expect(sc.displayName).toBe('bob');
+    expect('presenceColor' in sc).toBe(false);
+  });
+
+  test('partial saveConfig updates only the fields given', async () => {
+    const script = `
+      import { saveConfig, loadConfig } from "./packages/shared/config";
+      saveConfig({ displayName: "carol", presenceColor: "#ec4899" });
+      saveConfig({ presenceColor: "#06b6d4" });
+      console.log(JSON.stringify(loadConfig()));
+    `;
+    const out = await runScript(script);
+    const cfg = JSON.parse(out);
+    expect(cfg.displayName).toBe('carol');
+    expect(cfg.presenceColor).toBe('#06b6d4');
+  });
+});
diff --git a/packages/shared/config.ts b/packages/shared/config.ts
index f37fc9001..8da391732 100644
--- a/packages/shared/config.ts
+++ b/packages/shared/config.ts
@@ -97,6 +97,15 @@ export function mergePromptConfig(
 
 export interface PlannotatorConfig {
   displayName?: string;
+  /**
+   * Presence color (`#RRGGBB`) used in Live Rooms — the color peers
+   * see on remote cursors/avatars. Stored alongside `displayName` so
+   * identity (name + color) persists through the config file, not
+   * only through the origin-scoped browser cookie. Without this,
+   * color would be lost on machine move, profile restore, cookie
+   * wipe, or when running against a non-default local port.
+   */
+  presenceColor?: string;
   diffOptions?: DiffOptions;
   prompts?: PromptConfig;
   conventionalComments?: boolean;
@@ -188,6 +197,7 @@ export function detectGitUser(): string | null {
  */
 export function getServerConfig(gitUser: string | null): {
   displayName?: string;
+  presenceColor?: string;
   diffOptions?: DiffOptions;
   gitUser?: string;
   conventionalComments?: boolean;
@@ -196,6 +206,7 @@ export function getServerConfig(gitUser: string | null): {
   const cfg = loadConfig();
   return {
     displayName: cfg.displayName,
+    ...(cfg.presenceColor !== undefined && { presenceColor: cfg.presenceColor }),
     diffOptions: cfg.diffOptions,
     gitUser: gitUser ?? undefined,
     ...(cfg.conventionalComments !== undefined && { conventionalComments: cfg.conventionalComments }),
diff --git a/packages/shared/package.json b/packages/shared/package.json
index 9159965d4..54fb776d9 100644
--- a/packages/shared/package.json
+++ b/packages/shared/package.json
@@ -36,6 +36,10 @@
     "./html-to-markdown": "./html-to-markdown.ts",
     "./url-to-markdown": "./url-to-markdown.ts",
     "./tour": "./tour.ts",
+    "./collab": "./collab/index.ts",
+    "./collab/client": "./collab/client.ts",
+    "./collab/constants": "./collab/constants.ts",
+    "./collab/validation": "./collab/validation.ts",
     "./annotate-args": "./annotate-args.ts",
     "./at-reference": "./at-reference.ts"
   },
diff --git a/packages/shared/url-to-markdown.ts b/packages/shared/url-to-markdown.ts
index b6c96f554..ef04f0f4f 100644
--- a/packages/shared/url-to-markdown.ts
+++ b/packages/shared/url-to-markdown.ts
@@ -101,19 +101,29 @@ export async function urlToMarkdown(
     }
   }
 
+  let jinaError: Error | undefined;
   if (options.useJina && !local) {
     try {
       const markdown = await fetchViaJina(url);
       return { markdown, source: "jina" };
     } catch (err) {
-      process.stderr.write(
-        `[plannotator] Warning: Jina Reader failed (${err instanceof Error ? err.message : String(err)}), falling back to direct fetch...\n`,
+      jinaError = err instanceof Error ? err : new Error(String(err));
+      console.warn(
+        `[plannotator] Jina Reader failed (${jinaError.message}), falling back to direct fetch`,
       );
     }
   }
 
-  const markdown = await fetchViaTurndown(url);
-  return { markdown, source: "fetch+turndown" };
+  try {
+    const markdown = await fetchViaTurndown(url);
+    return { markdown, source: "fetch+turndown" };
+  } catch (err) {
+    const turndownMsg = err instanceof Error ? err.message : String(err);
+    if (jinaError) {
+      throw new Error(`Jina Reader failed: ${jinaError.message}`);
+    }
+    throw new Error(turndownMsg);
+  }
 }
 
 /** Read response body with a size limit. Throws if the body exceeds MAX_BODY_BYTES. */
@@ -149,7 +159,13 @@ async function readBodyWithLimit(res: Response): Promise<string> {
     }
     chunks.push(value);
   }
-  return new TextDecoder().decode(Buffer.concat(chunks));
+  const merged = new Uint8Array(totalBytes);
+  let offset = 0;
+  for (const chunk of chunks) {
+    merged.set(chunk, offset);
+    offset += chunk.byteLength;
+  }
+  return new TextDecoder().decode(merged);
 }
 
 /**
@@ -265,7 +281,7 @@ async function fetchViaJina(url: string): Promise<string> {
     Accept: "text/plain",
   };
 
-  const apiKey = process.env.JINA_API_KEY;
+  const apiKey = typeof process !== 'undefined' ? process.env?.JINA_API_KEY : undefined;
   if (apiKey) {
     headers.Authorization = `Bearer ${apiKey}`;
   }
diff --git a/packages/ui/bunfig.toml b/packages/ui/bunfig.toml
new file mode 100644
index 000000000..9e75dd230
--- /dev/null
+++ b/packages/ui/bunfig.toml
@@ -0,0 +1,2 @@
+[test]
+preload = ["./test-setup.ts"]
diff --git a/packages/ui/components/AnnotationPanel.tsx b/packages/ui/components/AnnotationPanel.tsx
index 2d8922c84..ef5eb6d0e 100644
--- a/packages/ui/components/AnnotationPanel.tsx
+++ b/packages/ui/components/AnnotationPanel.tsx
@@ -1,4 +1,4 @@
-import React, { useState, useRef, useEffect } from 'react';
+import React, { useState, useRef, useEffect, useMemo } from 'react';
 import { Annotation, AnnotationType, Block, type CodeAnnotation, type EditorAnnotation } from '../types';
 import { isCurrentUser } from '../utils/identity';
 import { ImageThumbnail } from './ImageThumbnail';
@@ -27,6 +27,27 @@ interface PanelProps {
   onShare?: () => void;
   otherFileAnnotations?: { count: number; files: number };
   onOtherFileAnnotationsClick?: () => void;
+  /**
+   * Room-mode sync state. `pendingIds` are annotations sent but not yet
+   * echoed; `failedIds` are sends that rejected and need Retry/Discard;
+   * `pendingAdditions` are optimistic ADD rows to render inline for
+   * "Sending…" feedback before server echo. They are NOT part of the
+   * `annotations` prop so the canonical feed to approve/deny/export
+   * stays server-authoritative.
+   * All five props are optional — local mode consumers don't pass them.
+   */
+  pendingIds?: ReadonlySet<string>;
+  failedIds?: ReadonlyMap<string, { kind: string; error: string }>;
+  pendingAdditions?: ReadonlyMap<string, Annotation>;
+  onRetry?: (id: string) => void;
+  onDiscard?: (id: string) => void;
+  /**
+   * When set, "(me)" and the muted-color treatment match this value
+   * instead of the cookie-backed `getIdentity()` used by `isCurrentUser`.
+   * In room mode App passes the joined display name so the panel
+   * matches remote cursor labels.
+   */
+  authorOverride?: string;
 }
 
 export const AnnotationPanel: React.FC<PanelProps> = ({
@@ -50,17 +71,39 @@ export const AnnotationPanel: React.FC<PanelProps> = ({
   onShare,
   otherFileAnnotations,
   onOtherFileAnnotationsClick,
+  pendingIds,
+  failedIds,
+  pendingAdditions,
+  onRetry,
+  onDiscard,
+  authorOverride,
 }) => {
+  // Unified "is this the current user?" check. Room mode passes the
+  // joined display name via authorOverride; local mode falls through
+  // to the cookie-backed isCurrentUser.
+  const isMe = (author: string | undefined): boolean =>
+    author !== undefined && (authorOverride !== undefined
+      ? author === authorOverride
+      : isCurrentUser(author));
   const isMobile = useIsMobile();
   const [copiedText, setCopiedText] = useState(false);
   const listRef = useRef<HTMLDivElement>(null);
-  const sortedAnnotations = [...annotations].sort((a, b) => a.createdA - b.createdA);
+  const renderAnnotations = useMemo(() => {
+    if (!pendingAdditions || pendingAdditions.size === 0) return annotations;
+    const seen = new Set(annotations.map(a => a.id));
+    const extra: Annotation[] = [];
+    for (const [id, a] of pendingAdditions) {
+      if (!seen.has(id)) extra.push(a);
+    }
+    return extra.length > 0 ? [...annotations, ...extra] : annotations;
+  }, [annotations, pendingAdditions]);
+  const sortedAnnotations = [...renderAnnotations].sort((a, b) => a.createdA - b.createdA);
   const sortedCodeAnnotations = [...codeAnnotations].sort((a, b) => a.createdAt - b.createdAt);
   const timelineEntries = [
     ...sortedAnnotations.map(annotation => ({ kind: 'plan' as const, ts: annotation.createdA, annotation })),
     ...sortedCodeAnnotations.map(annotation => ({ kind: 'code' as const, ts: annotation.createdAt, annotation })),
   ].sort((a, b) => a.ts - b.ts);
-  const totalCount = annotations.length + codeAnnotations.length + (editorAnnotations?.length ?? 0);
+  const totalCount = renderAnnotations.length + codeAnnotations.length + (editorAnnotations?.length ?? 0);
 
   // Scroll selected annotation card into view
   useEffect(() => {
@@ -131,27 +174,68 @@ export const AnnotationPanel: React.FC<PanelProps> = ({
           </div>
         ) : (
           <>
-            {timelineEntries.map(entry => (
-              entry.kind === 'plan' ? (
-                <AnnotationCard
-                  key={entry.annotation.id}
-                  annotation={entry.annotation}
-                  isSelected={selectedId === entry.annotation.id}
-                  onSelect={() => onSelect(entry.annotation.id)}
-                  onDelete={() => onDelete(entry.annotation.id)}
-                  onEdit={onEdit ? (updates: Partial<Annotation>) => onEdit(entry.annotation.id, updates) : undefined}
-                />
-              ) : (
-                <CodeAnnotationCard
-                  key={entry.annotation.id}
-                  annotation={entry.annotation}
-                  isSelected={selectedId === entry.annotation.id}
-                  onSelect={() => onSelectCodeAnnotation?.(entry.annotation.id)}
-                  onDelete={() => onDeleteCodeAnnotation?.(entry.annotation.id)}
-                  onEdit={onEditCodeAnnotation ? (updates: Partial<CodeAnnotation>) => onEditCodeAnnotation(entry.annotation.id, updates) : undefined}
-                />
-              )
-            ))}
+            {timelineEntries.map(entry => {
+              if (entry.kind === 'code') {
+                return (
+                  <CodeAnnotationCard
+                    key={entry.annotation.id}
+                    annotation={entry.annotation}
+                    isSelected={selectedId === entry.annotation.id}
+                    onSelect={() => onSelectCodeAnnotation?.(entry.annotation.id)}
+                    onDelete={() => onDeleteCodeAnnotation?.(entry.annotation.id)}
+                    onEdit={onEditCodeAnnotation ? (updates: Partial<CodeAnnotation>) => onEditCodeAnnotation(entry.annotation.id, updates) : undefined}
+                  />
+                );
+              }
+              const ann = entry.annotation;
+              const isPending = pendingIds?.has(ann.id) ?? false;
+              const failure = failedIds?.get(ann.id);
+              return (
+                <div
+                  key={ann.id}
+                  className={
+                    failure
+                      ? 'border-l-2 border-destructive pl-1'
+                      : isPending
+                      ? 'opacity-70'
+                      : ''
+                  }
+                  data-testid={
+                    failure ? `annotation-failed-${ann.id}` : isPending ? `annotation-pending-${ann.id}` : undefined
+                  }
+                >
+                  <AnnotationCard
+                    annotation={ann}
+                    isSelected={selectedId === ann.id}
+                    isMe={isMe}
+                    onSelect={() => onSelect(ann.id)}
+                    onDelete={
+                      isPending || failure
+                        ? undefined
+                        : () => onDelete(ann.id)
+                    }
+                    onEdit={
+                      !onEdit || isPending || failure
+                        ? undefined
+                        : (updates: Partial<Annotation>) => onEdit(ann.id, updates)
+                    }
+                  />
+                  {failure && onRetry && onDiscard && (
+                    <div
+                      className="text-[10px] text-destructive flex items-center gap-2 px-2 py-1"
+                      role="alert"
+                    >
+                      <span className="flex-1">Failed to {failure.kind}: {failure.error}</span>
+                      <button type="button" className="underline" onClick={() => onRetry(ann.id)} data-testid={`annotation-retry-${ann.id}`}>Retry</button>
+                      <button type="button" className="underline" onClick={() => onDiscard(ann.id)} data-testid={`annotation-discard-${ann.id}`}>Discard</button>
+                    </div>
+                  )}
+                  {isPending && !failure && (
+                    <div className="text-[10px] text-muted-foreground px-2 py-0.5">Sending…</div>
+                  )}
+                </div>
+              );
+            })}
             {editorAnnotations && editorAnnotations.length > 0 && (
               <>
                 {timelineEntries.length > 0 && (
@@ -255,10 +339,19 @@ function formatTimestamp(ts: number): string {
 const AnnotationCard: React.FC<{
   annotation: Annotation;
   isSelected: boolean;
+  /**
+   * "Is this annotation authored by the current user?" — passed in
+   * from AnnotationPanel so the helper can bake in the room-mode
+   * override (the joined display name instead of the cookie Tater).
+   * Taking it as a prop rather than closing over the parent's local
+   * helper keeps AnnotationCard module-scoped.
+   */
+  isMe: (author: string | undefined) => boolean;
   onSelect: () => void;
-  onDelete: () => void;
+  /** Undefined = hide delete button (e.g. row is pending or failed). */
+  onDelete?: () => void;
   onEdit?: (updates: Partial<Annotation>) => void;
-}> = ({ annotation, isSelected, onSelect, onDelete, onEdit }) => {
+}> = ({ annotation, isSelected, isMe, onSelect, onDelete, onEdit }) => {
   const [isEditing, setIsEditing] = useState(false);
   const [editText, setEditText] = useState(annotation.text || '');
   const textareaRef = useRef<HTMLTextAreaElement>(null);
@@ -277,6 +370,17 @@ const AnnotationCard: React.FC<{
     }
   }, [annotation.text, isEditing]);
 
+  // Cancel in-progress edits when `onEdit` disappears — happens when
+  // the row flips into pending/failed room-sync state mid-edit.
+  // Without this the textarea would persist visually; Save would
+  // silently no-op because onEdit is now undefined, confusing the
+  // user.
+  useEffect(() => {
+    if (!onEdit && isEditing) {
+      setIsEditing(false);
+    }
+  }, [onEdit, isEditing]);
+
   const handleStartEdit = (e: React.MouseEvent) => {
     e.stopPropagation();
     setEditText(annotation.text || '');
@@ -364,11 +468,11 @@ const AnnotationCard: React.FC<{
     >
       {/* Author */}
       {annotation.author && (
-        <div className={`flex items-center gap-1.5 text-[10px] font-mono truncate mb-1.5 ${isCurrentUser(annotation.author) ? 'text-muted-foreground/60' : 'text-muted-foreground'}`}>
+        <div className={`flex items-center gap-1.5 text-[10px] font-mono truncate mb-1.5 ${isMe(annotation.author) ? 'text-muted-foreground/60' : 'text-muted-foreground'}`}>
           <svg className="w-3 h-3 flex-shrink-0" fill="none" viewBox="0 0 24 24" stroke="currentColor" strokeWidth={2}>
             <path strokeLinecap="round" strokeLinejoin="round" d="M16 7a4 4 0 11-8 0 4 4 0 018 0zM12 14a7 7 0 00-7 7h14a7 7 0 00-7-7z" />
           </svg>
-          <span className="truncate">{annotation.author}{isCurrentUser(annotation.author) && ' (me)'}</span>
+          <span className="truncate">{annotation.author}{isMe(annotation.author) && ' (me)'}</span>
         </div>
       )}
 
@@ -404,15 +508,17 @@ const AnnotationCard: React.FC<{
               </svg>
             </button>
           )}
-          <button
-            onClick={(e: React.MouseEvent<HTMLButtonElement>) => { e.stopPropagation(); onDelete(); }}
-            className="p-1 rounded hover:bg-destructive/10 text-muted-foreground hover:text-destructive transition-all"
-            title="Delete annotation"
-          >
-            <svg className="w-3 h-3" fill="none" viewBox="0 0 24 24" stroke="currentColor" strokeWidth={2}>
-              <path strokeLinecap="round" strokeLinejoin="round" d="M6 18L18 6M6 6l12 12" />
-            </svg>
-          </button>
+          {onDelete && (
+            <button
+              onClick={(e: React.MouseEvent<HTMLButtonElement>) => { e.stopPropagation(); onDelete(); }}
+              className="p-1 rounded hover:bg-destructive/10 text-muted-foreground hover:text-destructive transition-all"
+              title="Delete annotation"
+            >
+              <svg className="w-3 h-3" fill="none" viewBox="0 0 24 24" stroke="currentColor" strokeWidth={2}>
+                <path strokeLinecap="round" strokeLinejoin="round" d="M6 18L18 6M6 6l12 12" />
+              </svg>
+            </button>
+          )}
         </div>
       </div>
 
diff --git a/packages/ui/components/BlockRenderer.tsx b/packages/ui/components/BlockRenderer.tsx
index f0c7bbb29..f4639718b 100644
--- a/packages/ui/components/BlockRenderer.tsx
+++ b/packages/ui/components/BlockRenderer.tsx
@@ -19,8 +19,9 @@ export const BlockRenderer: React.FC<{
   orderedIndex?: number | null;
   githubRepo?: string;
   headingAnchorId?: string;
+  localDocLinksEnabled?: boolean;
   onNavigateAnchor?: (hash: string) => void;
-}> = ({ block, onOpenLinkedDoc, onOpenCodeFile, imageBaseDir, onImageClick, onToggleCheckbox, checkboxOverrides, orderedIndex, githubRepo, headingAnchorId, onNavigateAnchor }) => {
+}> = ({ block, onOpenLinkedDoc, onOpenCodeFile, imageBaseDir, onImageClick, onToggleCheckbox, checkboxOverrides, orderedIndex, githubRepo, headingAnchorId, localDocLinksEnabled, onNavigateAnchor }) => {
   switch (block.type) {
     case 'heading': {
       const Tag = `h${block.level || 1}` as React.ElementType;
@@ -36,7 +37,7 @@ export const BlockRenderer: React.FC<{
           data-block-id={block.id}
           data-block-type="heading"
         >
-          <InlineMarkdown imageBaseDir={imageBaseDir} onImageClick={onImageClick} text={block.content} onOpenLinkedDoc={onOpenLinkedDoc} onOpenCodeFile={onOpenCodeFile} githubRepo={githubRepo} onNavigateAnchor={onNavigateAnchor} />
+          <InlineMarkdown imageBaseDir={imageBaseDir} onImageClick={onImageClick} text={block.content} onOpenLinkedDoc={onOpenLinkedDoc} onOpenCodeFile={onOpenCodeFile} localDocLinksEnabled={localDocLinksEnabled} githubRepo={githubRepo} onNavigateAnchor={onNavigateAnchor} />
         </Tag>
       );
     }
@@ -50,6 +51,7 @@ export const BlockRenderer: React.FC<{
             body={block.content}
             onOpenLinkedDoc={onOpenLinkedDoc}
             onOpenCodeFile={onOpenCodeFile}
+            localDocLinksEnabled={localDocLinksEnabled}
             imageBaseDir={imageBaseDir}
             onImageClick={onImageClick}
             githubRepo={githubRepo}
@@ -67,7 +69,7 @@ export const BlockRenderer: React.FC<{
         >
           {paragraphs.map((para, i) => (
             <p key={i} className={i > 0 ? 'mt-2' : ''}>
-              <InlineMarkdown imageBaseDir={imageBaseDir} onImageClick={onImageClick} text={para} onOpenLinkedDoc={onOpenLinkedDoc} onOpenCodeFile={onOpenCodeFile} githubRepo={githubRepo} onNavigateAnchor={onNavigateAnchor} />
+              <InlineMarkdown imageBaseDir={imageBaseDir} onImageClick={onImageClick} text={para} onOpenLinkedDoc={onOpenLinkedDoc} onOpenCodeFile={onOpenCodeFile} localDocLinksEnabled={localDocLinksEnabled} githubRepo={githubRepo} onNavigateAnchor={onNavigateAnchor} />
             </p>
           ))}
         </blockquote>
@@ -83,7 +85,7 @@ export const BlockRenderer: React.FC<{
       const isInteractive = isCheckbox && !!onToggleCheckbox;
       const textClass = `text-sm leading-relaxed ${isCheckbox && isChecked ? 'text-muted-foreground line-through' : 'text-foreground/90'}`;
       const paragraphs = block.content.split(/\n\n+/);
-      const inlineProps = { imageBaseDir, onImageClick, onOpenLinkedDoc, onOpenCodeFile, githubRepo, onNavigateAnchor };
+      const inlineProps = { imageBaseDir, onImageClick, onOpenLinkedDoc, onOpenCodeFile, localDocLinksEnabled, githubRepo, onNavigateAnchor };
       return (
         <div
           className="flex items-start gap-3 my-1.5"
@@ -126,6 +128,7 @@ export const BlockRenderer: React.FC<{
           onImageClick={onImageClick}
           onOpenLinkedDoc={onOpenLinkedDoc}
           onOpenCodeFile={onOpenCodeFile}
+          localDocLinksEnabled={localDocLinksEnabled}
           githubRepo={githubRepo}
           onNavigateAnchor={onNavigateAnchor}
         />
@@ -149,6 +152,7 @@ export const BlockRenderer: React.FC<{
           kindAttribute={kind}
           onOpenLinkedDoc={onOpenLinkedDoc}
           onOpenCodeFile={onOpenCodeFile}
+          localDocLinksEnabled={localDocLinksEnabled}
           imageBaseDir={imageBaseDir}
           onImageClick={onImageClick}
           githubRepo={githubRepo}
@@ -163,7 +167,7 @@ export const BlockRenderer: React.FC<{
           className="mb-4 leading-relaxed text-foreground/90 text-[15px]"
           data-block-id={block.id}
         >
-          <InlineMarkdown imageBaseDir={imageBaseDir} onImageClick={onImageClick} text={block.content} onOpenLinkedDoc={onOpenLinkedDoc} onOpenCodeFile={onOpenCodeFile} githubRepo={githubRepo} onNavigateAnchor={onNavigateAnchor} />
+          <InlineMarkdown imageBaseDir={imageBaseDir} onImageClick={onImageClick} text={block.content} onOpenLinkedDoc={onOpenLinkedDoc} onOpenCodeFile={onOpenCodeFile} localDocLinksEnabled={localDocLinksEnabled} githubRepo={githubRepo} onNavigateAnchor={onNavigateAnchor} />
         </p>
       );
   }
diff --git a/packages/ui/components/CommentPopover.tsx b/packages/ui/components/CommentPopover.tsx
index 4baa11750..e2f4ad496 100644
--- a/packages/ui/components/CommentPopover.tsx
+++ b/packages/ui/components/CommentPopover.tsx
@@ -20,6 +20,14 @@ interface CommentPopoverProps {
   onSubmit: (text: string, images?: ImageAttachment[]) => void;
   /** Called when popover is closed/cancelled */
   onClose: () => void;
+  /**
+   * Default true. Set false in room mode: Live Rooms V1 strips image
+   * attachments at room-create time and doesn't carry them over the
+   * wire for new annotations either, so the attachments UI would
+   * either silently drop images or fail validation at send. Hiding
+   * the affordance is the honest surface.
+   */
+  attachmentsEnabled?: boolean;
 }
 
 const MAX_POPOVER_WIDTH = 384;
@@ -48,6 +56,7 @@ export const CommentPopover: React.FC<CommentPopoverProps> = ({
   initialText = '',
   onSubmit,
   onClose,
+  attachmentsEnabled = true,
 }) => {
   const [mode, setMode] = useState<'popover' | 'dialog'>('popover');
   const [text, setText] = useState(initialText);
@@ -200,12 +209,14 @@ export const CommentPopover: React.FC<CommentPopoverProps> = ({
           {/* Footer */}
           <div className="flex items-center justify-between px-4 py-3 border-t border-border/50">
             <div className="flex items-center gap-2">
-              <AttachmentsButton
-                images={images}
-                onAdd={(img) => setImages((prev) => [...prev, img])}
-                onRemove={(path) => setImages((prev) => prev.filter((i) => i.path !== path))}
-                variant="inline"
-              />
+              {attachmentsEnabled && (
+                <AttachmentsButton
+                  images={images}
+                  onAdd={(img) => setImages((prev) => [...prev, img])}
+                  onRemove={(path) => setImages((prev) => prev.filter((i) => i.path !== path))}
+                  variant="inline"
+                />
+              )}
             </div>
             <div className="flex items-center gap-3">
               <span className="text-[10px] text-muted-foreground">{submitHint}</span>
@@ -296,12 +307,14 @@ export const CommentPopover: React.FC<CommentPopoverProps> = ({
       {/* Footer */}
       <div className="flex items-center justify-between px-3 py-2 border-t border-border/50">
         <div className="flex items-center gap-2">
-          <AttachmentsButton
-            images={images}
-            onAdd={(img) => setImages((prev) => [...prev, img])}
-            onRemove={(path) => setImages((prev) => prev.filter((i) => i.path !== path))}
-            variant="inline"
-          />
+          {attachmentsEnabled && (
+            <AttachmentsButton
+              images={images}
+              onAdd={(img) => setImages((prev) => [...prev, img])}
+              onRemove={(path) => setImages((prev) => prev.filter((i) => i.path !== path))}
+              variant="inline"
+            />
+          )}
         </div>
         <div className="flex items-center gap-3">
           <span className="text-[10px] text-muted-foreground">{submitHint}</span>
diff --git a/packages/ui/components/ExportModal.tsx b/packages/ui/components/ExportModal.tsx
index 251001f00..1b4f1da2e 100644
--- a/packages/ui/components/ExportModal.tsx
+++ b/packages/ui/components/ExportModal.tsx
@@ -33,6 +33,13 @@ interface ExportModalProps {
   markdown?: string;
   isApiMode?: boolean;
   initialTab?: Tab;
+  /**
+   * Optional. When present, the Share tab surfaces a primary
+   * "Start live room" CTA above the existing static-share links. Absent
+   * → the existing UI is unchanged (local mode with no room backend
+   * configured).
+   */
+  onStartLiveRoom?: () => void;
 }
 
 type Tab = 'share' | 'annotations' | 'notes';
@@ -56,6 +63,7 @@ export const ExportModal: React.FC<ExportModalProps> = ({
   markdown,
   isApiMode = false,
   initialTab,
+  onStartLiveRoom,
 }) => {
   const defaultTab = initialTab || (sharingEnabled ? 'share' : 'annotations');
   const [activeTab, setActiveTab] = useState<Tab>(defaultTab);
@@ -254,6 +262,27 @@ export const ExportModal: React.FC<ExportModalProps> = ({
           {/* Tab content */}
           {activeTab === 'share' && sharingEnabled ? (
             <div className="space-y-4">
+              {onStartLiveRoom && (
+                <div className="p-3 rounded-lg border border-accent/40 bg-accent/5 space-y-2">
+                  <div className="text-sm font-medium">Start a live room</div>
+                  <p className="text-xs text-muted-foreground">
+                    Real-time collaborative review. The link you share is participant-only;
+                    admin controls stay with you.
+                  </p>
+                  <button
+                    onClick={() => { onStartLiveRoom(); onClose(); }}
+                    className="w-full px-3 py-1.5 text-sm rounded bg-foreground text-background"
+                    data-testid="share-tab-start-live-room"
+                  >
+                    Start live room…
+                  </button>
+                </div>
+              )}
+              {onStartLiveRoom && (
+                <div className="text-xs text-muted-foreground uppercase tracking-wide pt-1">
+                  Static share
+                </div>
+              )}
               {/* Short URL — primary copy target when available */}
               {shortShareUrl ? (
                 <div>
diff --git a/packages/ui/components/InlineMarkdown.tsx b/packages/ui/components/InlineMarkdown.tsx
index 1871a86c7..b89a561e3 100644
--- a/packages/ui/components/InlineMarkdown.tsx
+++ b/packages/ui/components/InlineMarkdown.tsx
@@ -393,7 +393,8 @@ export const InlineMarkdown: React.FC<{
   imageBaseDir?: string;
   onImageClick?: (src: string, alt: string) => void;
   githubRepo?: string;
-}> = ({ text, onOpenLinkedDoc, onOpenCodeFile, onNavigateAnchor, imageBaseDir, onImageClick, githubRepo }) => {
+  localDocLinksEnabled?: boolean;
+}> = ({ text, onOpenLinkedDoc, onOpenCodeFile, onNavigateAnchor, imageBaseDir, onImageClick, githubRepo, localDocLinksEnabled = true }) => {
   const validation = useCodePathValidation();
   const parts: React.ReactNode[] = [];
   let remaining = text;
@@ -497,6 +498,7 @@ export const InlineMarkdown: React.FC<{
             text={match[1]}
             onOpenLinkedDoc={onOpenLinkedDoc}
             onOpenCodeFile={onOpenCodeFile}
+            localDocLinksEnabled={localDocLinksEnabled}
             onNavigateAnchor={onNavigateAnchor}
             githubRepo={githubRepo}
           />
@@ -519,6 +521,7 @@ export const InlineMarkdown: React.FC<{
               text={match[1]}
               onOpenLinkedDoc={onOpenLinkedDoc}
               onOpenCodeFile={onOpenCodeFile}
+              localDocLinksEnabled={localDocLinksEnabled}
               onNavigateAnchor={onNavigateAnchor}
               githubRepo={githubRepo}
             />
@@ -541,6 +544,7 @@ export const InlineMarkdown: React.FC<{
             text={match[1]}
             onOpenLinkedDoc={onOpenLinkedDoc}
             onOpenCodeFile={onOpenCodeFile}
+            localDocLinksEnabled={localDocLinksEnabled}
             onNavigateAnchor={onNavigateAnchor}
             githubRepo={githubRepo}
           />
@@ -562,6 +566,7 @@ export const InlineMarkdown: React.FC<{
             text={match[1]}
             onOpenLinkedDoc={onOpenLinkedDoc}
             onOpenCodeFile={onOpenCodeFile}
+            localDocLinksEnabled={localDocLinksEnabled}
             onNavigateAnchor={onNavigateAnchor}
             githubRepo={githubRepo}
           />
@@ -584,6 +589,7 @@ export const InlineMarkdown: React.FC<{
             text={match[1]}
             onOpenLinkedDoc={onOpenLinkedDoc}
             onOpenCodeFile={onOpenCodeFile}
+            localDocLinksEnabled={localDocLinksEnabled}
             onNavigateAnchor={onNavigateAnchor}
             githubRepo={githubRepo}
           />
@@ -721,7 +727,11 @@ export const InlineMarkdown: React.FC<{
         ? target
         : `${target}.md`;
 
-      if (onOpenLinkedDoc) {
+      // `localDocLinksEnabled === false` pins the wikilink to plain
+      // text regardless of handler presence — room mode uses this so
+      // a click doesn't attempt to resolve a local path on the room
+      // origin (which has no `/api/doc` or Obsidian endpoint).
+      if (onOpenLinkedDoc && localDocLinksEnabled) {
         parts.push(
           <a
             key={key++}
@@ -859,7 +869,7 @@ export const InlineMarkdown: React.FC<{
             {linkText}
           </a>,
         );
-      } else if (isLocalDoc && onOpenLinkedDoc) {
+      } else if (isLocalDoc && onOpenLinkedDoc && localDocLinksEnabled) {
         parts.push(
           <a
             key={key++}
@@ -888,6 +898,10 @@ export const InlineMarkdown: React.FC<{
             </svg>
           </a>,
         );
+      } else if (isLocalDoc && !localDocLinksEnabled) {
+        parts.push(
+          <span key={key++} className="text-primary">{linkText}</span>,
+        );
       } else if (isCodeFile && onOpenCodeFile) {
         parts.push(
           <a
@@ -905,7 +919,9 @@ export const InlineMarkdown: React.FC<{
           </a>,
         );
       } else if (isLocalDoc) {
-        // No handler — render as plain link (e.g., in shared/portal views)
+        // No handler (e.g. shared/portal views) — render as a plain
+        // `<a>`. Clicking navigates to `<current-origin>/<path>`,
+        // which may or may not resolve depending on deployment.
         parts.push(
           <a
             key={key++}
@@ -944,6 +960,7 @@ export const InlineMarkdown: React.FC<{
             text={before}
             onOpenLinkedDoc={onOpenLinkedDoc}
             onOpenCodeFile={onOpenCodeFile}
+            localDocLinksEnabled={localDocLinksEnabled}
             onNavigateAnchor={onNavigateAnchor}
             githubRepo={githubRepo}
             imageBaseDir={imageBaseDir}
diff --git a/packages/ui/components/PlanHeaderMenu.tsx b/packages/ui/components/PlanHeaderMenu.tsx
index 85baf34b9..d0a6edee9 100644
--- a/packages/ui/components/PlanHeaderMenu.tsx
+++ b/packages/ui/components/PlanHeaderMenu.tsx
@@ -18,6 +18,12 @@ interface PlanHeaderMenuProps {
   onPrint: () => void;
   onCopyShareLink: () => void;
   onOpenImport: () => void;
+  /**
+   * Opens the Start-live-room modal. Optional so existing consumers
+   * (build-time and tests) don't need to thread the prop; when omitted
+   * the menu item is hidden.
+   */
+  onStartLiveRoom?: () => void;
   onSaveToObsidian: () => void;
   onSaveToBear: () => void;
   onSaveToOctarine: () => void;
@@ -38,6 +44,7 @@ export const PlanHeaderMenu: React.FC<PlanHeaderMenuProps> = ({
   onPrint,
   onCopyShareLink,
   onOpenImport,
+  onStartLiveRoom,
   onSaveToObsidian,
   onSaveToBear,
   onSaveToOctarine,
@@ -156,6 +163,19 @@ export const PlanHeaderMenu: React.FC<PlanHeaderMenuProps> = ({
               label="Copy Share Link"
             />
           )}
+          {onStartLiveRoom && (
+            <ActionMenuItem
+              onClick={() => {
+                closeMenu();
+                onStartLiveRoom();
+              }}
+              // 👥 (people) distinguishes "Start live room" from the
+              // visually-similar "Copy Share Link" entry above, which
+              // keeps its chain-link icon for static sharing.
+              icon={<span aria-hidden>👥</span>}
+              label="Start live room…"
+            />
+          )}
           {sharingEnabled && (
             <ActionMenuItem
               onClick={() => {
@@ -294,3 +314,4 @@ const NoteIcon = () => (
   </svg>
 );
 
+
diff --git a/packages/ui/components/Settings.tsx b/packages/ui/components/Settings.tsx
index e2982315b..321ee2669 100644
--- a/packages/ui/components/Settings.tsx
+++ b/packages/ui/components/Settings.tsx
@@ -5,7 +5,8 @@ import type { DiffLineBgIntensity } from '@plannotator/shared/config';
 import { configStore, useConfigValue } from '../config';
 import { loadDiffFont } from '../utils/diffFonts';
 import { TaterSpritePullup } from './TaterSpritePullup';
-import { getIdentity, regenerateIdentity, setCustomIdentity } from '../utils/identity';
+import { getIdentity, regenerateIdentity, setCustomIdentity, getPresenceColor, setPresenceColor } from '../utils/identity';
+import { PRESENCE_SWATCHES } from '../utils/presenceColor';
 import { GitUser } from '../icons/GitUser';
 import {
   getObsidianSettings,
@@ -613,6 +614,7 @@ export const Settings: React.FC<SettingsProps> = ({ taterMode, onTaterModeChange
   }, [themePreview]);
   const [activeTab, setActiveTab] = useState<SettingsTab>('general');
   const [identity, setIdentity] = useState('');
+  const [presenceColor, setPresenceColorState] = useState<string>(PRESENCE_SWATCHES[0]);
   const [obsidian, setObsidian] = useState<ObsidianSettings>({
     enabled: false,
     vaultPath: '',
@@ -686,6 +688,7 @@ export const Settings: React.FC<SettingsProps> = ({ taterMode, onTaterModeChange
   useEffect(() => {
     if (showDialog) {
       setIdentity(getIdentity())
+      setPresenceColorState(getPresenceColor());
       setObsidian(getObsidianSettings());
       setBear(getBearSettings());
       setOctarine(getOctarineSettings());
@@ -833,6 +836,12 @@ export const Settings: React.FC<SettingsProps> = ({ taterMode, onTaterModeChange
     handleIdentitySave(gitUser);
   };
 
+  const handlePresenceColorChange = (color: string) => {
+    if (color === presenceColor) return;
+    const saved = setPresenceColor(color);
+    setPresenceColorState(saved);
+  };
+
   return (
     <>
       <button
@@ -977,6 +986,26 @@ export const Settings: React.FC<SettingsProps> = ({ taterMode, onTaterModeChange
                           </svg>
                         </button>
                       </div>
+                      {/*
+                        Presence color lives next to the name as part
+                        of identity. The Live Rooms create/join gates
+                        read the same preference, so editing here
+                        updates what peers see on the next room join.
+                      */}
+                      <div className="flex items-center gap-1 pt-1">
+                        {PRESENCE_SWATCHES.map(s => (
+                          <button
+                            key={s}
+                            type="button"
+                            onClick={() => handlePresenceColorChange(s)}
+                            onMouseDown={(e) => e.preventDefault()}
+                            className={`w-6 h-6 rounded-full border-2 ${presenceColor === s ? 'border-foreground' : 'border-transparent'}`}
+                            style={{ backgroundColor: s }}
+                            aria-label={`Presence color ${s}`}
+                            title={`Presence color ${s}`}
+                          />
+                        ))}
+                      </div>
                     </div>
 
                     {/* Permission Mode (Claude Code only) */}
diff --git a/packages/ui/components/Viewer.tsx b/packages/ui/components/Viewer.tsx
index 6f5c917e9..94e9ae1bc 100644
--- a/packages/ui/components/Viewer.tsx
+++ b/packages/ui/components/Viewer.tsx
@@ -96,6 +96,43 @@ interface ViewerProps {
   // Checkbox toggle props
   onToggleCheckbox?: (blockId: string, checked: boolean) => void;
   checkboxOverrides?: Map<string, boolean>;
+  /**
+   * When set, newly-created annotations stamp `author` with this
+   * value instead of the cookie-backed `getIdentity()`. Threaded
+   * from App in room mode so annotations carry the display name
+   * the participant typed into the JoinRoomGate — matches the
+   * name peers see on remote cursors/avatars.
+   */
+  authorOverride?: string;
+  /**
+   * Default true. Passed to CommentPopover to hide the attachments
+   * UI when false. Used by App in room mode: Live Rooms V1 strips
+   * image attachments at room-create time and doesn't carry new
+   * attachments over the wire, so offering the affordance would
+   * silently drop the user's image.
+   */
+  attachmentsEnabled?: boolean;
+  /**
+   * When false, links to local documents (wikilinks like `[[foo]]`
+   * and markdown links to `*.md`/`*.mdx`/`*.html`) render as plain
+   * text instead of clickable anchors. Used by room mode because
+   * `room.plannotator.ai` has no `/api/doc` or Obsidian endpoint —
+   * clicking such a link would either trigger a broken fetch or
+   * navigate the room tab to a non-existent room-origin path.
+   * Non-local links (http/https) are unaffected.
+   */
+  localDocLinksEnabled?: boolean;
+  /**
+   * Notifies the parent that the internal highlight surface has been
+   * (re)initialized or cleared. Fires once on initial highlighter
+   * construction and on each `clearAllHighlights()` call.
+   *
+   * The callback is a bare event — it carries no number. The parent
+   * owns the monotonic generation counter so a Viewer remount (which
+   * resets any Viewer-local state) still produces a fresh value that
+   * `setState` won't dedupe as a no-op.
+   */
+  onHighlightSurfaceReset?: () => void;
 }
 
 export interface ViewerHandle {
@@ -170,6 +207,10 @@ export const Viewer = forwardRef<ViewerHandle, ViewerProps>(({
   sourceInfo,
   onToggleCheckbox,
   checkboxOverrides,
+  authorOverride,
+  attachmentsEnabled = true,
+  localDocLinksEnabled = true,
+  onHighlightSurfaceReset,
 }, ref) => {
   const [copied, setCopied] = useState(false);
   const [lightbox, setLightbox] = useState<{ src: string; alt: string } | null>(null);
@@ -238,6 +279,8 @@ export const Viewer = forwardRef<ViewerHandle, ViewerProps>(({
     onSelectAnnotation,
     selectedAnnotationId,
     mode,
+    authorOverride,
+    onSurfaceReset: onHighlightSurfaceReset,
   });
 
   // Refs for code block annotation path
@@ -438,7 +481,7 @@ export const Viewer = forwardRef<ViewerHandle, ViewerProps>(({
       text,
       originalText: codeText,
       createdA: Date.now(),
-      author: getIdentity(),
+      author: authorOverride ?? getIdentity(),
       images,
       ...(isQuickLabel ? { isQuickLabel: true } : {}),
       ...(quickLabelTip ? { quickLabelTip } : {}),
@@ -499,7 +542,7 @@ export const Viewer = forwardRef<ViewerHandle, ViewerProps>(({
         text: text.trim(),
         originalText: '',
         createdA: Date.now(),
-        author: getIdentity(),
+        author: authorOverride ?? getIdentity(),
         images,
       };
       onAddAnnotation(newAnnotation);
@@ -624,6 +667,7 @@ export const Viewer = forwardRef<ViewerHandle, ViewerProps>(({
                       orderedIndex={indices[i]}
                       onOpenLinkedDoc={onOpenLinkedDoc}
                       onOpenCodeFile={onOpenCodeFile}
+                      localDocLinksEnabled={localDocLinksEnabled}
                       onToggleCheckbox={onToggleCheckbox}
                       checkboxOverrides={checkboxOverrides}
                       githubRepo={repoInfo?.display}
@@ -699,7 +743,7 @@ export const Viewer = forwardRef<ViewerHandle, ViewerProps>(({
               isHovered={inputMethod !== 'pinpoint' && hoveredCodeBlock?.block.id === group.block.id}
             />
           ) : (
-            <BlockRenderer imageBaseDir={imageBaseDir} onImageClick={(src, alt) => setLightbox({ src, alt })} key={group.block.id} block={group.block} onOpenLinkedDoc={onOpenLinkedDoc} onOpenCodeFile={onOpenCodeFile} onNavigateAnchor={scrollToAnchor} onToggleCheckbox={onToggleCheckbox} checkboxOverrides={checkboxOverrides} githubRepo={repoInfo?.display} headingAnchorId={headingSlugMap.get(group.block.id)} />
+            <BlockRenderer imageBaseDir={imageBaseDir} onImageClick={(src, alt) => setLightbox({ src, alt })} key={group.block.id} block={group.block} onOpenLinkedDoc={onOpenLinkedDoc} onOpenCodeFile={onOpenCodeFile} localDocLinksEnabled={localDocLinksEnabled} onNavigateAnchor={scrollToAnchor} onToggleCheckbox={onToggleCheckbox} checkboxOverrides={checkboxOverrides} githubRepo={repoInfo?.display} headingAnchorId={headingSlugMap.get(group.block.id)} />
           )
         )}
 
@@ -797,6 +841,7 @@ export const Viewer = forwardRef<ViewerHandle, ViewerProps>(({
             onOpenLinkedDoc={onOpenLinkedDoc}
             onOpenCodeFile={onOpenCodeFile}
             githubRepo={repoInfo?.display}
+            localDocLinksEnabled={localDocLinksEnabled}
             onNavigateAnchor={scrollToAnchor}
           />
         )}
@@ -813,6 +858,7 @@ export const Viewer = forwardRef<ViewerHandle, ViewerProps>(({
             contextText={hookCommentPopover.contextText}
             isGlobal={false}
             initialText={hookCommentPopover.initialText}
+            attachmentsEnabled={attachmentsEnabled}
             onSubmit={hookCommentSubmit}
             onClose={hookCommentClose}
           />
@@ -823,6 +869,7 @@ export const Viewer = forwardRef<ViewerHandle, ViewerProps>(({
             contextText={viewerCommentPopover.contextText}
             isGlobal={viewerCommentPopover.isGlobal}
             initialText={viewerCommentPopover.initialText}
+            attachmentsEnabled={attachmentsEnabled}
             onSubmit={handleViewerCommentSubmit}
             onClose={handleViewerCommentClose}
           />
diff --git a/packages/ui/components/blocks/AlertBlock.tsx b/packages/ui/components/blocks/AlertBlock.tsx
index 793b190f5..fbfc7b10f 100644
--- a/packages/ui/components/blocks/AlertBlock.tsx
+++ b/packages/ui/components/blocks/AlertBlock.tsx
@@ -11,6 +11,7 @@ interface AlertBlockProps {
   imageBaseDir?: string;
   onImageClick?: (src: string, alt: string) => void;
   githubRepo?: string;
+  localDocLinksEnabled?: boolean;
   onNavigateAnchor?: (hash: string) => void;
 }
 
@@ -39,7 +40,7 @@ const Icon: React.FC<{ kind: AlertKind }> = ({ kind }) => {
 };
 
 export const AlertBlock: React.FC<AlertBlockProps> = ({
-  blockId, kind, body, onOpenLinkedDoc, onOpenCodeFile, imageBaseDir, onImageClick, githubRepo, onNavigateAnchor,
+  blockId, kind, body, onOpenLinkedDoc, onOpenCodeFile, imageBaseDir, onImageClick, githubRepo, localDocLinksEnabled, onNavigateAnchor,
 }) => {
   return (
     <div
@@ -52,7 +53,7 @@ export const AlertBlock: React.FC<AlertBlockProps> = ({
         <Icon kind={kind} />
         <span>{TITLE[kind]}</span>
       </div>
-      {renderProseBody({ body, imageBaseDir, onImageClick, onOpenLinkedDoc, onOpenCodeFile, onNavigateAnchor, githubRepo })}
+      {renderProseBody({ body, imageBaseDir, onImageClick, onOpenLinkedDoc, onOpenCodeFile, onNavigateAnchor, githubRepo, localDocLinksEnabled })}
     </div>
   );
 };
diff --git a/packages/ui/components/blocks/Callout.tsx b/packages/ui/components/blocks/Callout.tsx
index b71b7759d..ad4bf4485 100644
--- a/packages/ui/components/blocks/Callout.tsx
+++ b/packages/ui/components/blocks/Callout.tsx
@@ -13,6 +13,7 @@ interface CalloutProps {
   imageBaseDir?: string;
   onImageClick?: (src: string, alt: string) => void;
   githubRepo?: string;
+  localDocLinksEnabled?: boolean;
   onNavigateAnchor?: (hash: string) => void;
 }
 
@@ -28,6 +29,7 @@ export const Callout: React.FC<CalloutProps> = ({
   imageBaseDir,
   onImageClick,
   githubRepo,
+  localDocLinksEnabled,
   onNavigateAnchor,
 }) => {
   const kindAttr =
@@ -54,6 +56,7 @@ export const Callout: React.FC<CalloutProps> = ({
         onOpenCodeFile,
         onNavigateAnchor,
         githubRepo,
+        localDocLinksEnabled,
       })}
     </div>
   );
diff --git a/packages/ui/components/blocks/TableBlock.tsx b/packages/ui/components/blocks/TableBlock.tsx
index 81388b819..926381334 100644
--- a/packages/ui/components/blocks/TableBlock.tsx
+++ b/packages/ui/components/blocks/TableBlock.tsx
@@ -12,6 +12,7 @@ interface TableBlockProps {
   imageBaseDir?: string;
   onImageClick?: (src: string, alt: string) => void;
   githubRepo?: string;
+  localDocLinksEnabled?: boolean;
 }
 
 // Parse pipe-delimited markdown table content into headers + rows.
@@ -87,6 +88,7 @@ export const TableBlock: React.FC<TableBlockProps> = ({
   imageBaseDir,
   onImageClick,
   githubRepo,
+  localDocLinksEnabled,
 }) => {
   const containerRef = useRef<HTMLDivElement>(null);
   const { headers, rows } = parseTableContent(block.content);
@@ -116,6 +118,7 @@ export const TableBlock: React.FC<TableBlockProps> = ({
                   onOpenCodeFile={onOpenCodeFile}
                   onNavigateAnchor={onNavigateAnchor}
                   githubRepo={githubRepo}
+                  localDocLinksEnabled={localDocLinksEnabled}
                 />
               </th>
             ))}
@@ -134,6 +137,7 @@ export const TableBlock: React.FC<TableBlockProps> = ({
                     onOpenCodeFile={onOpenCodeFile}
                     onNavigateAnchor={onNavigateAnchor}
                     githubRepo={githubRepo}
+                    localDocLinksEnabled={localDocLinksEnabled}
                   />
                 </td>
               ))}
diff --git a/packages/ui/components/blocks/TablePopout.tsx b/packages/ui/components/blocks/TablePopout.tsx
index e4c650862..88f7334d7 100644
--- a/packages/ui/components/blocks/TablePopout.tsx
+++ b/packages/ui/components/blocks/TablePopout.tsx
@@ -27,6 +27,7 @@ interface TablePopoutProps {
   imageBaseDir?: string;
   onImageClick?: (src: string, alt: string) => void;
   githubRepo?: string;
+  localDocLinksEnabled?: boolean;
 }
 
 type Row = Record<string, string>;
@@ -42,6 +43,7 @@ const TablePopoutImpl: React.FC<TablePopoutProps> = ({
   imageBaseDir,
   onImageClick,
   githubRepo,
+  localDocLinksEnabled,
 }) => {
   const { headers, rows } = useMemo(() => parseTableContent(block.content), [block.content]);
 
@@ -82,11 +84,12 @@ const TablePopoutImpl: React.FC<TablePopoutProps> = ({
             onOpenCodeFile={onOpenCodeFile}
             onNavigateAnchor={onNavigateAnchor}
             githubRepo={githubRepo}
+            localDocLinksEnabled={localDocLinksEnabled}
           />
         ),
       }),
     );
-  }, [columnIds, headers, imageBaseDir, onImageClick, onOpenLinkedDoc, onNavigateAnchor, githubRepo]);
+  }, [columnIds, headers, imageBaseDir, onImageClick, onOpenLinkedDoc, onNavigateAnchor, githubRepo, localDocLinksEnabled]);
 
   const [sorting, setSorting] = useState<SortingState>([]);
   const [globalFilter, setGlobalFilter] = useState('');
diff --git a/packages/ui/components/blocks/proseBody.tsx b/packages/ui/components/blocks/proseBody.tsx
index 04fe3e2fc..e301a4421 100644
--- a/packages/ui/components/blocks/proseBody.tsx
+++ b/packages/ui/components/blocks/proseBody.tsx
@@ -19,6 +19,7 @@ export function renderProseBody(args: {
   onOpenCodeFile?: (path: string) => void;
   onNavigateAnchor?: (hash: string) => void;
   githubRepo?: string;
+  localDocLinksEnabled?: boolean;
 }): React.ReactNode {
   const {
     body,
@@ -30,6 +31,7 @@ export function renderProseBody(args: {
     onOpenCodeFile,
     onNavigateAnchor,
     githubRepo,
+    localDocLinksEnabled,
   } = args;
 
   const inline = (text: string) => (
@@ -41,6 +43,7 @@ export function renderProseBody(args: {
       onOpenCodeFile={onOpenCodeFile}
       onNavigateAnchor={onNavigateAnchor}
       githubRepo={githubRepo}
+      localDocLinksEnabled={localDocLinksEnabled}
     />
   );
 
diff --git a/packages/ui/components/collab/ImageStripNotice.tsx b/packages/ui/components/collab/ImageStripNotice.tsx
new file mode 100644
index 000000000..e234a5e8c
--- /dev/null
+++ b/packages/ui/components/collab/ImageStripNotice.tsx
@@ -0,0 +1,43 @@
+import React from 'react';
+
+/**
+ * Dismissible banner shown after room creation when one or more local
+ * annotations carried images that were stripped for the shared snapshot.
+ * Text annotations are preserved; only the image attachments are dropped.
+ *
+ * Presentational only — parent controls mount/unmount and dismissal.
+ */
+
+export interface ImageStripNoticeProps {
+  strippedCount: number;
+  onDismiss(): void;
+  className?: string;
+}
+
+export function ImageStripNotice({
+  strippedCount,
+  onDismiss,
+  className = '',
+}: ImageStripNoticeProps): React.ReactElement | null {
+  if (strippedCount <= 0) return null;
+  return (
+    <div
+      role="status"
+      className={`flex items-start gap-2 p-3 rounded border border-warning/20 bg-warning/10 text-warning text-sm ${className}`}
+      data-testid="image-strip-notice"
+    >
+      <div className="flex-1">
+        <strong>Images stripped.</strong>{' '}
+        {strippedCount} item{strippedCount === 1 ? '' : 's'} with image attachments {strippedCount === 1 ? 'was' : 'were'} removed before sharing — text comments are preserved. Your local copies are unchanged.
+      </div>
+      <button
+        type="button"
+        onClick={onDismiss}
+        className="text-xs underline opacity-80 hover:opacity-100"
+        aria-label="Dismiss image-strip notice"
+      >
+        Dismiss
+      </button>
+    </div>
+  );
+}
diff --git a/packages/ui/components/collab/JoinRoomGate.tsx b/packages/ui/components/collab/JoinRoomGate.tsx
new file mode 100644
index 000000000..892778143
--- /dev/null
+++ b/packages/ui/components/collab/JoinRoomGate.tsx
@@ -0,0 +1,122 @@
+import React, { useState } from 'react';
+import type { ConnectionStatus } from '@plannotator/shared/collab/client';
+import { PRESENCE_SWATCHES } from '@plannotator/ui/utils/presenceColor';
+
+/**
+ * Pre-connect identity gate for room participants. Parent mounts this
+ * BEFORE connecting — captures a display name + color, then calls
+ * `onJoin` with the settled identity. While connecting, this same
+ * component also surfaces status messages (connecting / authenticating)
+ * so the user has constant feedback.
+ *
+ * Both `initialDisplayName` and `initialColor` should come from the
+ * user's Plannotator preferences (`getIdentity()` / `getPresenceColor()`).
+ * Parent persists edits back via the corresponding setters after the
+ * user submits; the gate itself is pure presentation.
+ *
+ * Fatal failure states (malformed URL / access denied / room deleted)
+ * are rendered by the parent as a full-screen replacement — this gate
+ * handles only the happy-path and the in-flight connection states.
+ */
+
+export interface JoinRoomSubmit {
+  displayName: string;
+  color: string;
+}
+
+export interface JoinRoomGateProps {
+  initialDisplayName?: string;
+  initialColor?: string;
+  connectionStatus: ConnectionStatus;
+  onJoin(submit: JoinRoomSubmit): void;
+}
+
+function statusMessage(s: ConnectionStatus): string | null {
+  switch (s) {
+    case 'connecting':     return 'Connecting to room…';
+    case 'authenticating': return 'Verifying access…';
+    case 'reconnecting':   return 'Reconnecting…';
+    default:               return null;
+  }
+}
+
+export function JoinRoomGate({
+  initialDisplayName = '',
+  initialColor = PRESENCE_SWATCHES[0],
+  connectionStatus,
+  onJoin,
+}: JoinRoomGateProps): React.ReactElement {
+  const [displayName, setDisplayName] = useState(initialDisplayName);
+  const [color, setColor] = useState(initialColor);
+  const [submitted, setSubmitted] = useState(false);
+
+  const showStatus = submitted && statusMessage(connectionStatus);
+
+  function handleSubmit(e: React.FormEvent) {
+    e.preventDefault();
+    const trimmed = displayName.trim();
+    if (!trimmed) return;
+    setSubmitted(true);
+    onJoin({ displayName: trimmed, color });
+  }
+
+  return (
+    <div
+      className="fixed inset-0 z-[100] flex items-center justify-center bg-background/80 backdrop-blur-sm p-4"
+      data-testid="join-room-gate"
+    >
+      <form
+        onSubmit={handleSubmit}
+        className="bg-card border border-border rounded-xl shadow-2xl w-[380px] max-w-[90vw] p-5 space-y-4"
+      >
+        <h2 className="text-base font-semibold">Join live review</h2>
+
+        <div className="space-y-2">
+          <label className="text-xs font-medium uppercase text-muted-foreground">Display name</label>
+          <input
+            type="text"
+            value={displayName}
+            onChange={e => setDisplayName(e.target.value)}
+            disabled={submitted}
+            className="w-full px-2 py-1 border rounded text-sm"
+            placeholder="Your name"
+            autoFocus
+          />
+        </div>
+
+        <div className="space-y-2">
+          <label className="text-xs font-medium uppercase text-muted-foreground">Color</label>
+          <div className="flex items-center gap-1">
+            {PRESENCE_SWATCHES.map(s => (
+              <button
+                key={s}
+                type="button"
+                disabled={submitted}
+                onClick={() => setColor(s)}
+                className={`w-6 h-6 rounded-full border-2 ${color === s ? 'border-foreground' : 'border-transparent'}`}
+                style={{ backgroundColor: s }}
+                aria-label={`Color ${s}`}
+              />
+            ))}
+          </div>
+        </div>
+
+        {showStatus && (
+          <div className="text-sm text-muted-foreground" data-testid="join-status">
+            {showStatus}
+          </div>
+        )}
+
+        <div className="flex items-center justify-end pt-2">
+          <button
+            type="submit"
+            disabled={submitted || !displayName.trim()}
+            className="px-3 py-1.5 text-sm rounded bg-foreground text-background disabled:opacity-50"
+          >
+            {submitted ? 'Joining…' : 'Join'}
+          </button>
+        </div>
+      </form>
+    </div>
+  );
+}
diff --git a/packages/ui/components/collab/LandingPage.tsx b/packages/ui/components/collab/LandingPage.tsx
new file mode 100644
index 000000000..ab0a0a246
--- /dev/null
+++ b/packages/ui/components/collab/LandingPage.tsx
@@ -0,0 +1,479 @@
+import React, { useState, useRef, useCallback, useEffect, useMemo, lazy, Suspense } from 'react';
+import { PRESENCE_SWATCHES } from '@plannotator/ui/utils/presenceColor';
+import { getIdentity, getPresenceColor } from '@plannotator/ui/utils/identity';
+import { useLandingCreateRoom } from '@plannotator/ui/hooks/collab/useLandingCreateRoom';
+import type { LandingCreateRoomSubmit } from '@plannotator/ui/hooks/collab/useLandingCreateRoom';
+
+const MarkdownPreview = lazy(() => import('./LandingPreview'));
+
+// Sprite: 59x96 native, 24 frames
+const SPRITE_NATIVE_W = 59;
+const SPRITE_NATIVE_H = 96;
+const SPRITE_DISPLAY_H = 96;
+const SPRITE_SCALE = SPRITE_DISPLAY_H / SPRITE_NATIVE_H;
+const SPRITE_DISPLAY_W = SPRITE_NATIVE_W * SPRITE_SCALE;
+const SPRITE_TOTAL_FRAMES = 24;
+const SPRITE_SKIP_FRAMES = 4;
+const SPRITE_PLAY_FRAMES = SPRITE_TOTAL_FRAMES - SPRITE_SKIP_FRAMES;
+const SPRITE_FRAME_DURATION = 2;
+const SPRITE_SHEET_W = SPRITE_NATIVE_W * SPRITE_TOTAL_FRAMES * SPRITE_SCALE;
+const SPRITE_OFFSET = SPRITE_NATIVE_W * SPRITE_SKIP_FRAMES * SPRITE_SCALE;
+const SPRITE_PLAY_W = SPRITE_NATIVE_W * SPRITE_PLAY_FRAMES * SPRITE_SCALE;
+const SPRITE_RISE_DURATION = 8;
+
+function FloatingSprite({ side, delay }: { side: 'left' | 'right'; delay: number }) {
+  const [visible, setVisible] = useState(false);
+  const x = useMemo(() => {
+    const min = side === 'left' ? 5 : 55;
+    const max = side === 'left' ? 40 : 90;
+    return min + Math.random() * (max - min);
+  }, [side]);
+
+  useEffect(() => {
+    const show = setTimeout(() => setVisible(true), delay);
+    const hide = setTimeout(() => setVisible(false), delay + SPRITE_RISE_DURATION * 1000);
+    return () => { clearTimeout(show); clearTimeout(hide); };
+  }, [delay]);
+
+  if (!visible) return null;
+
+  return (
+    <div
+      className="fixed pointer-events-none z-50 hidden md:block"
+      style={{
+        left: `${x}%`,
+        bottom: -SPRITE_DISPLAY_H,
+        width: SPRITE_DISPLAY_W,
+        height: SPRITE_DISPLAY_H,
+        backgroundImage: 'url(/sprite.png)',
+        backgroundSize: `${SPRITE_SHEET_W}px ${SPRITE_DISPLAY_H}px`,
+        backgroundPosition: `-${SPRITE_OFFSET}px center`,
+        imageRendering: 'pixelated',
+        transform: side === 'right' ? 'scaleX(-1)' : undefined,
+        animation: `landing-sprite-play ${SPRITE_FRAME_DURATION}s steps(${SPRITE_PLAY_FRAMES}) infinite, landing-sprite-rise ${SPRITE_RISE_DURATION}s linear forwards`,
+      }}
+    />
+  );
+}
+
+const MAX_FILE_SIZE = 500 * 1024;
+const ALLOWED_EXTENSIONS = new Set(['md', 'txt', 'markdown', 'html', 'htm']);
+const HTML_EXTENSIONS = new Set(['html', 'htm']);
+
+const DEMOS: readonly { label: string; url?: string; staticPath?: string }[] = [
+  { label: 'Attention is all you need', staticPath: '/demo-aiayn.md' },
+  { label: 'Kimi Paper', staticPath: '/demo-kimi.md' },
+  { label: 'Cloudflare Artifacts', url: 'https://developers.cloudflare.com/artifacts/get-started/workers/index.md' },
+];
+
+type InputMode = 'upload' | 'paste' | 'url';
+
+export function LandingPage(): React.ReactElement {
+  const [markdown, setMarkdown] = useState('');
+  const [fileName, setFileName] = useState<string | null>(null);
+  const [inputMode, setInputMode] = useState<InputMode>('upload');
+  const [dragOver, setDragOver] = useState(false);
+  const [displayName, setDisplayName] = useState(() => getIdentity() || '');
+  const [color, setColor] = useState<string>(() => getPresenceColor() || PRESENCE_SWATCHES[0]);
+  const [expiresInDays, setExpiresInDays] = useState<0 | 1 | 7 | 30>(7);
+  const [fileError, setFileError] = useState('');
+  const fileInputRef = useRef<HTMLInputElement>(null);
+
+  const hasContent = markdown.trim().length > 0;
+
+  const { inFlight, error, handleCreate, handleCancel } = useLandingCreateRoom({ markdown });
+
+  const [urlInput, setUrlInput] = useState('');
+  const [urlLoading, setUrlLoading] = useState(false);
+  const [showDemos, setShowDemos] = useState(false);
+
+  const loadFile = useCallback(async (file: File) => {
+    setFileError('');
+    const ext = file.name.split('.').pop()?.toLowerCase() ?? '';
+    if (!ALLOWED_EXTENSIONS.has(ext)) {
+      setFileError(`Unsupported file type (.${ext}). Use .md, .txt, .html, or .markdown.`);
+      if (fileInputRef.current) fileInputRef.current.value = '';
+      return;
+    }
+    if (file.size > MAX_FILE_SIZE) {
+      setFileError(`File too large (${(file.size / 1024).toFixed(0)} KB). Maximum is 500 KB.`);
+      if (fileInputRef.current) fileInputRef.current.value = '';
+      return;
+    }
+    try {
+      const text = await file.text();
+      if (HTML_EXTENSIONS.has(ext)) {
+        const { htmlToMarkdown } = await import('@plannotator/shared/html-to-markdown');
+        setMarkdown(htmlToMarkdown(text));
+      } else {
+        setMarkdown(text);
+      }
+      setFileName(file.name);
+    } catch {
+      setFileError('Could not read file. Try again or paste the content instead.');
+    }
+  }, []);
+
+  const fetchUrl = useCallback(async (url: string) => {
+    setUrlLoading(true);
+    setFileError('');
+    try {
+      const res = await fetch('/api/fetch-markdown', {
+        method: 'POST',
+        headers: { 'Content-Type': 'application/json' },
+        body: JSON.stringify({ url }),
+      });
+      const data = await res.json() as { markdown?: string; source?: string; error?: string };
+      if (!res.ok || !data.markdown) {
+        throw new Error(data.error || 'Failed to fetch URL');
+      }
+      setMarkdown(data.markdown);
+      setFileName(url);
+    } catch (err) {
+      setFileError(err instanceof Error ? err.message : 'Failed to fetch URL');
+    } finally {
+      setUrlLoading(false);
+    }
+  }, []);
+
+  const handleFileInput = useCallback((e: React.ChangeEvent<HTMLInputElement>) => {
+    const file = e.target.files?.[0];
+    if (file) loadFile(file);
+  }, [loadFile]);
+
+  const handleDrop = useCallback((e: React.DragEvent) => {
+    e.preventDefault();
+    setDragOver(false);
+    const file = e.dataTransfer.files?.[0];
+    if (file) loadFile(file);
+  }, [loadFile]);
+
+  const handleUrlSubmit = useCallback((e: React.FormEvent) => {
+    e.preventDefault();
+    const trimmed = urlInput.trim();
+    if (!trimmed || urlLoading) return;
+    if (!/^https:\/\//i.test(trimmed)) {
+      setFileError('Enter a valid URL starting with https://');
+      return;
+    }
+    fetchUrl(trimmed);
+  }, [urlInput, urlLoading, fetchUrl]);
+
+  const handleSubmit = useCallback((e: React.FormEvent) => {
+    e.preventDefault();
+    if (inFlight || !displayName.trim()) return;
+    const submit: LandingCreateRoomSubmit = {
+      displayName: displayName.trim(),
+      color,
+      expiresInDays,
+    };
+    handleCreate(submit);
+  }, [inFlight, displayName, color, expiresInDays, handleCreate]);
+
+  const clearContent = useCallback(() => {
+    setMarkdown('');
+    setFileName(null);
+    setFileError('');
+    setUrlInput('');
+    if (fileInputRef.current) fileInputRef.current.value = '';
+  }, []);
+
+  return (
+    <div className="h-screen flex flex-col bg-background text-foreground overflow-hidden">
+      <style>{`
+        @keyframes landing-sprite-play { from { background-position: -${SPRITE_OFFSET}px 0; } to { background-position: -${SPRITE_OFFSET + SPRITE_PLAY_W}px 0; } }
+        @keyframes landing-sprite-rise { from { bottom: -${SPRITE_DISPLAY_H}px; } to { bottom: 110vh; } }
+      `}</style>
+      <FloatingSprite side="left" delay={500} />
+      <FloatingSprite side="right" delay={2000} />
+      {/* Ghost header bar */}
+      <div className="h-12 border-b border-border/30 bg-card/30 backdrop-blur-sm flex items-center px-4 shrink-0">
+        <div className="flex items-center gap-2 text-sm text-foreground/60">
+          <a href="https://github.com/backnotprop/plannotator" target="_blank" rel="noopener noreferrer" className="font-semibold hover:text-foreground/80 transition-colors">
+            Plannotator
+          </a>
+          <span className="text-foreground/20">|</span>
+          <a href="https://github.com/backnotprop/plannotator" target="_blank" rel="noopener noreferrer" className="flex items-center gap-1 hover:text-foreground/80 transition-colors">
+            <svg className="w-3.5 h-3.5" viewBox="0 0 1024 1024" fill="currentColor" aria-hidden>
+              <path fillRule="evenodd" clipRule="evenodd" d="M8 0C3.58 0 0 3.58 0 8C0 11.54 2.29 14.53 5.47 15.59C5.87 15.66 6.02 15.42 6.02 15.21C6.02 15.02 6.01 14.39 6.01 13.72C4 14.09 3.48 13.23 3.32 12.78C3.23 12.55 2.84 11.84 2.5 11.65C2.22 11.5 1.82 11.13 2.49 11.12C3.12 11.11 3.57 11.7 3.72 11.94C4.44 13.15 5.59 12.81 6.05 12.6C6.12 12.08 6.33 11.73 6.56 11.53C4.78 11.33 2.92 10.64 2.92 7.58C2.92 6.71 3.23 5.99 3.74 5.43C3.66 5.23 3.38 4.41 3.82 3.31C3.82 3.31 4.49 3.1 6.02 4.13C6.66 3.95 7.34 3.86 8.02 3.86C8.7 3.86 9.38 3.95 10.02 4.13C11.55 3.09 12.22 3.31 12.22 3.31C12.66 4.41 12.38 5.23 12.3 5.43C12.81 5.99 13.12 6.7 13.12 7.58C13.12 10.65 11.25 11.33 9.47 11.53C9.76 11.78 10.01 12.26 10.01 13.01C10.01 14.08 10 14.94 10 15.21C10 15.42 10.15 15.67 10.55 15.59C13.71 14.53 16 11.53 16 8C16 3.58 12.42 0 8 0Z" transform="scale(64)" />
+            </svg>
+            <span className="text-xs">Open Source</span>
+          </a>
+          <span className="text-foreground/20">|</span>
+          <span className="text-xs px-1.5 py-0.5 rounded bg-foreground/10 text-foreground/50 font-medium">Beta</span>
+        </div>
+      </div>
+
+      {/* Workspace area */}
+      <div className="flex-1 min-h-0">
+        {/* Grid surface with card + overlay */}
+        <div className="h-full bg-grid relative overflow-auto">
+          {/* Ghost plan card */}
+          <div className="absolute inset-0 flex justify-center pt-16 pointer-events-none">
+            <div className="w-full max-w-[832px] mx-8">
+              <div className="bg-card/5 border border-border/10 rounded-xl h-[600px]" />
+            </div>
+          </div>
+
+          {/* Foreground: upload form as floating card */}
+          <div className="relative z-10 flex justify-center pt-12 pb-12 px-4">
+            <div className="w-full max-w-xl space-y-6">
+              {/* Main card */}
+              <div className="bg-card border border-border/50 rounded-xl shadow-2xl overflow-hidden backdrop-blur-sm">
+                <img src="/banner_lite.webp" alt="" className="w-full h-40 object-cover" />
+                <div className="p-6 space-y-5">
+                <div className="text-center space-y-1">
+                  <h1 className="text-lg font-semibold tracking-tight">Start a live review room</h1>
+                  <p className="text-xs text-muted-foreground">
+                    Upload a plan, invite collaborators, annotate together
+                  </p>
+                </div>
+
+                {/* Input mode toggle */}
+                <div className="flex items-center justify-center gap-2 flex-wrap">
+                  {(['upload', 'paste', 'url'] as const).map(mode => (
+                    <button
+                      key={mode}
+                      type="button"
+                      onClick={() => { setInputMode(mode); setShowDemos(false); }}
+                      className={`px-3 py-1 text-xs rounded-full transition-colors ${
+                        inputMode === mode && !showDemos
+                          ? 'bg-foreground text-background'
+                          : 'bg-muted text-muted-foreground hover:bg-muted/80'
+                      }`}
+                    >
+                      {mode === 'upload' ? 'Upload file' : mode === 'paste' ? 'Paste markdown' : 'From URL'}
+                    </button>
+                  ))}
+                  {!hasContent && (
+                    <button
+                      type="button"
+                      onClick={() => setShowDemos(!showDemos)}
+                      className={`px-3 py-1 text-xs rounded-full transition-colors ${
+                        showDemos
+                          ? 'bg-foreground text-background'
+                          : 'bg-muted text-muted-foreground hover:bg-muted/80'
+                      }`}
+                    >
+                      Try a demo
+                    </button>
+                  )}
+                </div>
+
+                {/* Demo options */}
+                {showDemos && !hasContent && (
+                  <div className="flex items-center justify-center gap-2 flex-wrap">
+                    {DEMOS.map(demo => (
+                      <button
+                        key={demo.label}
+                        type="button"
+                        onClick={() => {
+                          setShowDemos(false);
+                          if (demo.staticPath) {
+                            setUrlLoading(true);
+                            setFileError('');
+                            fetch(demo.staticPath).then(r => {
+                              if (!r.ok) throw new Error('Failed to load demo');
+                              return r.text();
+                            }).then(text => {
+                              setMarkdown(text);
+                              setFileName(demo.label);
+                            }).catch(err => {
+                              setFileError(err instanceof Error ? err.message : 'Failed to load demo');
+                            }).finally(() => setUrlLoading(false));
+                          } else if (demo.url) {
+                            setInputMode('url');
+                            setUrlInput(demo.url);
+                            fetchUrl(demo.url);
+                          }
+                        }}
+                        disabled={urlLoading}
+                        className="px-2.5 py-1 text-xs rounded-full border border-border/50 text-muted-foreground hover:bg-muted/50 hover:text-foreground transition-colors disabled:opacity-50"
+                      >
+                        {demo.label}
+                      </button>
+                    ))}
+                  </div>
+                )}
+
+                {/* Upload zone */}
+                {inputMode === 'upload' && !hasContent && (
+                  <div
+                    onDragOver={e => { e.preventDefault(); setDragOver(true); }}
+                    onDragLeave={() => setDragOver(false)}
+                    onDrop={handleDrop}
+                    onClick={() => fileInputRef.current?.click()}
+                    className={`border-2 border-dashed rounded-lg p-8 text-center cursor-pointer transition-colors ${
+                      dragOver
+                        ? 'border-foreground/50 bg-muted/50'
+                        : 'border-border hover:border-foreground/30'
+                    }`}
+                  >
+                    <p className="text-sm text-muted-foreground">
+                      Drop a file here, or click to browse
+                    </p>
+                    <p className="text-xs text-muted-foreground/60 mt-1">
+                      .md, .txt, .html, .markdown
+                    </p>
+                    <input
+                      ref={fileInputRef}
+                      type="file"
+                      accept=".md,.txt,.markdown,.html,.htm"
+                      onChange={handleFileInput}
+                      className="hidden"
+                    />
+                  </div>
+                )}
+
+                {/* Paste textarea */}
+                {inputMode === 'paste' && (
+                  <textarea
+                    value={markdown}
+                    onChange={e => setMarkdown(e.target.value)}
+                    placeholder="Paste or type your markdown here..."
+                    className="w-full h-32 px-3 py-2 bg-background border border-border rounded-lg text-sm font-mono resize-y focus:outline-none focus:ring-1 focus:ring-foreground/20"
+                  />
+                )}
+
+                {/* URL input */}
+                {inputMode === 'url' && !hasContent && (
+                  <form onSubmit={handleUrlSubmit} className="flex gap-2">
+                    <input
+                      type="text"
+                      value={urlInput}
+                      onChange={e => setUrlInput(e.target.value)}
+                      disabled={urlLoading}
+                      placeholder="https://example.com/document"
+                      className="flex-1 px-3 py-2 bg-background border border-border rounded-lg text-sm focus:outline-none focus:ring-1 focus:ring-foreground/20"
+                    />
+                    <button
+                      type="submit"
+                      disabled={urlLoading || !urlInput.trim()}
+                      className="px-4 py-2 text-xs font-medium rounded-lg bg-foreground text-background disabled:opacity-50"
+                    >
+                      {urlLoading ? 'Fetching...' : 'Fetch'}
+                    </button>
+                  </form>
+                )}
+
+                {fileError && (
+                  <div className="text-xs bg-destructive/10 text-destructive p-2 rounded" role="alert">
+                    {fileError}
+                  </div>
+                )}
+
+                {/* Compact preview with fade */}
+                {hasContent && (
+                  <div className="relative rounded-lg border border-border overflow-y-auto max-h-32">
+                    <Suspense fallback={null}>
+                      <MarkdownPreview markdown={markdown} fileName={null} onClear={clearContent} />
+                    </Suspense>
+                    <div
+                      className="pointer-events-none absolute bottom-0 left-0 right-0 h-12 bg-background"
+                      style={{
+                        WebkitMaskImage: 'linear-gradient(to top, white, transparent)',
+                        maskImage: 'linear-gradient(to top, white, transparent)',
+                      }}
+                    />
+                  </div>
+                )}
+
+                {/* Room settings */}
+                <form onSubmit={handleSubmit} className="space-y-3 pt-1">
+                  <div className="grid grid-cols-2 gap-3">
+                    <div className="space-y-1.5">
+                      <label className="text-xs font-medium uppercase text-muted-foreground">Name</label>
+                      <input
+                        type="text"
+                        value={displayName}
+                        onChange={e => setDisplayName(e.target.value)}
+                        disabled={inFlight}
+                        className="w-full px-2.5 py-1.5 bg-background border border-border rounded text-sm focus:outline-none focus:ring-1 focus:ring-foreground/20"
+                        placeholder="Your name"
+                        autoComplete="off"
+                      />
+                    </div>
+                    <div className="space-y-1.5">
+                      <label className="text-xs font-medium uppercase text-muted-foreground">Expires</label>
+                      <select
+                        value={expiresInDays}
+                        onChange={e => setExpiresInDays(Number(e.target.value) as 0 | 1 | 7 | 30)}
+                        disabled={inFlight}
+                        className="w-full px-2.5 py-1.5 bg-background border border-border rounded text-sm"
+                      >
+                        <option value={1}>1 day</option>
+                        <option value={7}>7 days</option>
+                        <option value={30}>30 days</option>
+                        <option value={0}>Never</option>
+                      </select>
+                    </div>
+                  </div>
+
+                  <div className="space-y-1.5">
+                    <label className="text-xs font-medium uppercase text-muted-foreground">Color</label>
+                    <div className="flex items-center gap-1.5">
+                      {PRESENCE_SWATCHES.map(s => (
+                        <button
+                          key={s}
+                          type="button"
+                          disabled={inFlight}
+                          onClick={() => setColor(s)}
+                          className={`w-5 h-5 rounded-full border-2 transition-all ${
+                            color === s ? 'border-foreground scale-110' : 'border-transparent'
+                          }`}
+                          style={{ backgroundColor: s }}
+                          aria-label={`Color ${s}`}
+                        />
+                      ))}
+                    </div>
+                  </div>
+
+                  {error && (
+                    <div className="text-xs bg-destructive/10 text-destructive p-2 rounded" role="alert">
+                      {error}
+                    </div>
+                  )}
+
+                  <div className="flex items-center justify-between pt-1">
+                    <p className="text-xs text-muted-foreground/70">
+                      {hasContent ? 'Encrypted end-to-end' : 'Upload or paste a document to get started'}
+                    </p>
+                    <div className="flex items-center gap-2">
+                      {inFlight && (
+                        <button
+                          type="button"
+                          onClick={handleCancel}
+                          className="px-3 py-1.5 text-xs rounded hover:bg-muted"
+                        >
+                          Cancel
+                        </button>
+                      )}
+                      <button
+                        type="submit"
+                        disabled={inFlight || !displayName.trim() || !hasContent}
+                        className="px-4 py-1.5 text-xs font-medium rounded bg-foreground text-background disabled:opacity-50"
+                      >
+                        {inFlight ? 'Creating...' : 'Create room'}
+                      </button>
+                    </div>
+                  </div>
+                </form>
+                </div>
+              {/* Trust footer */}
+              <div className="text-center px-6 pb-4 pt-2 space-y-1">
+                <p className="text-xs text-muted-foreground/50">
+                  All content is end-to-end encrypted on your device. The server only stores ciphertext.
+                  Rooms are deleted after their expiry period, or by the creator at any time.
+                </p>
+                <a href="https://plannotator.ai/privacy/" target="_blank" rel="noopener noreferrer" className="text-[10px] text-muted-foreground/40 hover:text-muted-foreground/60 transition-colors">
+                  Privacy Policy
+                </a>
+              </div>
+              </div>
+            </div>
+          </div>
+        </div>
+      </div>
+    </div>
+  );
+}
diff --git a/packages/ui/components/collab/LandingPreview.tsx b/packages/ui/components/collab/LandingPreview.tsx
new file mode 100644
index 000000000..da2e7df1e
--- /dev/null
+++ b/packages/ui/components/collab/LandingPreview.tsx
@@ -0,0 +1,25 @@
+import React, { useMemo } from 'react';
+import { parseMarkdownToBlocks } from '@plannotator/ui/utils/parser';
+import { BlockRenderer } from '@plannotator/ui/components/BlockRenderer';
+
+interface LandingPreviewProps {
+  markdown: string;
+  /** Unused — kept for future header/breadcrumb display. */
+  fileName: string | null;
+  /** Unused — kept for future clear-from-preview affordance. */
+  onClear: () => void;
+}
+
+export default function LandingPreview({ markdown }: LandingPreviewProps): React.ReactElement {
+  const blocks = useMemo(() => parseMarkdownToBlocks(markdown), [markdown]);
+
+  return (
+    <div className="p-4">
+      <div className="prose prose-sm dark:prose-invert max-w-none">
+        {blocks.map(block => (
+          <BlockRenderer key={block.id} block={block} />
+        ))}
+      </div>
+    </div>
+  );
+}
diff --git a/packages/ui/components/collab/ParticipantAvatars.test.tsx b/packages/ui/components/collab/ParticipantAvatars.test.tsx
new file mode 100644
index 000000000..37a8d5f94
--- /dev/null
+++ b/packages/ui/components/collab/ParticipantAvatars.test.tsx
@@ -0,0 +1,85 @@
+import { describe, expect, test } from 'bun:test';
+import { render } from '@testing-library/react';
+import { ParticipantAvatars } from './ParticipantAvatars';
+import type { PresenceState } from '@plannotator/shared/collab';
+
+function peer(name: string, color = '#abc'): PresenceState {
+  return {
+    user: { id: name.toLowerCase(), name, color },
+    cursor: null,
+  };
+}
+
+describe('ParticipantAvatars', () => {
+  test('returns null with no peers', () => {
+    const { container } = render(<ParticipantAvatars remotePresence={{}} />);
+    expect(container.querySelector('[data-testid="participant-avatars"]')).toBeNull();
+  });
+
+  test('renders one avatar per peer with correct initial', () => {
+    const { container } = render(
+      <ParticipantAvatars remotePresence={{ c1: peer('Alice'), c2: peer('Bob') }} />,
+    );
+    const avatars = container.querySelectorAll('[data-participant-id]');
+    expect(avatars.length).toBe(2);
+    const initials = Array.from(avatars).map(a => a.textContent);
+    expect(initials).toEqual(['A', 'B']);  // sorted by name
+  });
+
+  test('collapses extras above maxVisible into "+N"', () => {
+    const presence: Record<string, PresenceState> = {};
+    for (let i = 0; i < 6; i++) {
+      presence[`c${i}`] = peer(String.fromCharCode(65 + i));
+    }
+    const { container } = render(
+      <ParticipantAvatars remotePresence={presence} maxVisible={3} />,
+    );
+    expect(container.querySelectorAll('[data-participant-id]').length).toBe(3);
+    const overflow = container.querySelector('[data-testid="participant-overflow"]');
+    expect(overflow?.textContent).toBe('+3');
+  });
+
+  test('overflow title lists names not shown', () => {
+    const presence = {
+      c1: peer('Alice'), c2: peer('Bob'), c3: peer('Charlie'), c4: peer('Dana'), c5: peer('Eve'),
+    };
+    const { container } = render(
+      <ParticipantAvatars remotePresence={presence} maxVisible={2} />,
+    );
+    const overflow = container.querySelector('[data-testid="participant-overflow"]');
+    expect(overflow?.getAttribute('title')).toBe('Charlie, Dana, Eve');
+  });
+
+  test('falls back to "?" initial when name is blank', () => {
+    const { container } = render(
+      <ParticipantAvatars remotePresence={{ c1: peer('') }} />,
+    );
+    const avatars = container.querySelectorAll('[data-participant-id]');
+    expect(avatars[0].textContent).toBe('G');  // falls through to "Guest" → "G"
+  });
+
+  test('marks agent peers with the agent indicator', () => {
+    const { container } = render(
+      <ParticipantAvatars
+        remotePresence={{
+          human: peer('Alice'),
+          bot: peer('alice-agent-claude'),
+        }}
+      />,
+    );
+    const avatars = container.querySelectorAll<HTMLElement>('[data-participant-id]');
+    const kinds = Array.from(avatars).map(a => a.dataset.participantKind);
+    // deriveParticipants sorts by name; 'Alice' < 'alice-agent-claude' (case-insensitive localeCompare)
+    expect(kinds).toEqual(['human', 'agent']);
+
+    // The agent avatar has the marker; the human avatar does not.
+    const humanMarker = avatars[0].querySelector('[data-testid="participant-agent-marker"]');
+    const agentMarker = avatars[1].querySelector('[data-testid="participant-agent-marker"]');
+    expect(humanMarker).toBeNull();
+    expect(agentMarker).not.toBeNull();
+
+    // Agent tooltip includes the type.
+    expect(avatars[1].getAttribute('title')).toContain('agent');
+    expect(avatars[1].getAttribute('title')).toContain('claude');
+  });
+});
diff --git a/packages/ui/components/collab/ParticipantAvatars.tsx b/packages/ui/components/collab/ParticipantAvatars.tsx
new file mode 100644
index 000000000..e36199812
--- /dev/null
+++ b/packages/ui/components/collab/ParticipantAvatars.tsx
@@ -0,0 +1,105 @@
+import React, { useMemo } from 'react';
+import type { PresenceState } from '@plannotator/shared/collab';
+import { isAgentIdentity, getAgentType } from '@plannotator/ui/utils/agentIdentity';
+
+/**
+ * Pure avatar stack for room participants. Reads from `remotePresence`
+ * (keyed by clientId) and renders one colored initial per peer. Does NOT
+ * include the local user — callers render their own user elsewhere.
+ *
+ * Overflow: show at most `maxVisible` avatars; the rest are summarized
+ * as "+N" with a tooltip listing the extra names.
+ *
+ * Agent peers (identity ending in `-agent-<type>`) render with a small
+ * marker overlay so observers can tell them apart from human peers.
+ * Detection is purely identity-based via `isAgentIdentity` — no other
+ * protocol fields are consulted.
+ */
+
+export interface ParticipantAvatarsProps {
+  remotePresence: Record<string, PresenceState>;
+  maxVisible?: number;
+  className?: string;
+}
+
+interface Participant {
+  clientId: string;
+  name: string;
+  color: string;
+  initial: string;
+  isAgent: boolean;
+  agentType: string | undefined;
+}
+
+function deriveParticipants(
+  remotePresence: Record<string, PresenceState>,
+): Participant[] {
+  const out: Participant[] = [];
+  for (const [clientId, p] of Object.entries(remotePresence)) {
+    const name = (p.user?.name ?? '').trim() || 'Guest';
+    const color = p.user?.color ?? '#888';
+    const initial = name.charAt(0).toUpperCase() || '?';
+    const isAgent = isAgentIdentity(name);
+    const agentType = getAgentType(name);
+    out.push({ clientId, name, color, initial, isAgent, agentType });
+  }
+  // Stable sort by name so order doesn't thrash when presence maps rehydrate.
+  out.sort((a, b) => a.name.localeCompare(b.name));
+  return out;
+}
+
+export function ParticipantAvatars({
+  remotePresence,
+  maxVisible = 4,
+  className = '',
+}: ParticipantAvatarsProps): React.ReactElement | null {
+  const participants = useMemo(() => deriveParticipants(remotePresence), [remotePresence]);
+  if (participants.length === 0) return null;
+
+  const visible = participants.slice(0, maxVisible);
+  const overflow = participants.slice(maxVisible);
+  const overflowTitle = overflow.map(p => p.name).join(', ');
+
+  return (
+    <div
+      className={`inline-flex items-center -space-x-1 ${className}`}
+      data-testid="participant-avatars"
+    >
+      {visible.map(p => (
+        <span
+          key={p.clientId}
+          // Tooltip distinguishes agents so hover reveals the type; the
+          // marker itself is the glyph at the corner of the avatar chip.
+          title={p.isAgent ? `${p.name} (agent · ${p.agentType ?? 'unknown'})` : p.name}
+          className="relative inline-flex items-center justify-center w-6 h-6 rounded-full text-[10px] font-medium text-white ring-2 ring-background"
+          style={{ backgroundColor: p.color }}
+          data-participant-id={p.clientId}
+          data-participant-kind={p.isAgent ? 'agent' : 'human'}
+        >
+          {p.initial}
+          {p.isAgent && (
+            <span
+              aria-hidden
+              // Small ⚙ marker pinned to the bottom-right corner. Theme
+              // tokens so it stays legible on both light and dark
+              // themes; no color prop needed.
+              className="absolute -bottom-0.5 -right-0.5 inline-flex items-center justify-center w-3 h-3 rounded-full text-[8px] leading-none bg-background text-foreground ring-1 ring-border"
+              data-testid="participant-agent-marker"
+            >
+              ⚙
+            </span>
+          )}
+        </span>
+      ))}
+      {overflow.length > 0 && (
+        <span
+          className="inline-flex items-center justify-center w-6 h-6 rounded-full text-[10px] font-medium bg-muted text-muted-foreground ring-2 ring-background"
+          title={overflowTitle}
+          data-testid="participant-overflow"
+        >
+          +{overflow.length}
+        </span>
+      )}
+    </div>
+  );
+}
diff --git a/packages/ui/components/collab/RemoteCursorLayer.tsx b/packages/ui/components/collab/RemoteCursorLayer.tsx
new file mode 100644
index 000000000..30a738c71
--- /dev/null
+++ b/packages/ui/components/collab/RemoteCursorLayer.tsx
@@ -0,0 +1,460 @@
+import React, { useEffect, useMemo, useRef } from 'react';
+import type { PresenceState, CursorState } from '@plannotator/shared/collab';
+import { isAgentIdentity } from '@plannotator/ui/utils/agentIdentity';
+
+/**
+ * Absolute-positioned overlay that renders remote cursor flags. Parent
+ * mounts this as a sibling of the Viewer inside the scroll viewport so
+ * cursors scroll with content without any extra math.
+ *
+ * Rendering model:
+ *   - One `<div>` per remote client; mount/unmount is React-driven so
+ *     adds/removes during a session update cleanly.
+ *   - Position is NOT React state. A single `requestAnimationFrame`
+ *     loop reads the latest target from `remotePresence`/`containerRect`
+ *     refs, lerps each cursor's current position toward its target, and
+ *     mutates `transform` on the DOM node directly. This matches the
+ *     industry pattern used by Figma-style / Liveblocks-style cursor
+ *     systems — avoids React reconciliation on every frame (~60Hz * N
+ *     cursors would otherwise churn the scheduler for nothing) and
+ *     leans on the GPU compositor for `translate3d`.
+ *
+ * Smoothing:
+ *   - Latest-wins target per clientId. On each frame: lerp toward target
+ *     with a fixed alpha (~0.3 feels responsive without overshoot).
+ *   - Snap (bypass lerp) when:
+ *       1. First frame for a clientId — avoid sliding from (0,0).
+ *       2. Cursor reappears after going null/idle — treat like first.
+ *       3. Single-frame distance > SNAP_THRESHOLD — usually a
+ *          coordinate-space flip (block ↔ viewport) or scroll jump,
+ *          where animating the "swoosh" would look worse than snapping.
+ *
+ * Offscreen indicators:
+ *   - When a cursor's resolved position falls outside the overlay
+ *     container rect, the same element is repurposed as a small edge
+ *     label (`↑ Alice` / `↓ Alice`) pinned to the nearest edge and
+ *     clamped horizontally. Tells the reader "they're somewhere else
+ *     in the doc" instead of letting the cursor vanish.
+ *
+ * Coordinate model (matches the protocol's `CursorState`):
+ *   - `coordinateSpace: 'document'` — (x, y) in scroll-document coords.
+ *     Render at (x - scrollX, y - scrollY) within the viewport.
+ *   - `coordinateSpace: 'viewport'` — (x, y) in viewport coords.
+ *     Rendered as-is minus the container offset.
+ *   - `coordinateSpace: 'block'` — relative to the block's bounding
+ *     rect, identified by `blockId`. Resolved via `[data-block-id=…]`.
+ *
+ * Local cursor is NOT rendered — that cursor is the browser's own caret.
+ */
+
+export interface RemoteCursorLayerProps {
+  remotePresence: Record<string, PresenceState>;
+  /**
+   * Bounding rect of the overlay container in viewport coords. Used to
+   * translate viewport-space cursor coords into overlay-local coords
+   * and to decide whether a cursor is onscreen vs. pinned to an edge.
+   */
+  containerRect: DOMRect | null;
+  /** ParentNode to search within for block elements. Defaults to document. */
+  root?: ParentNode;
+  className?: string;
+}
+
+interface CursorRenderState {
+  displayX: number;
+  displayY: number;
+  /** True once we've ever painted this cursor; toggled off on idle. */
+  everRendered: boolean;
+}
+
+function findBlockRect(blockId: string, root: ParentNode): DOMRect | null {
+  // `blockId` arrives as decrypted remote presence. The bundled UI only
+  // emits real `data-block-id` values, but anything holding the room URL +
+  // key (direct WebSocket client, modified console, agent) can send an
+  // arbitrary string. A newline or other CSS-invalid character makes the
+  // selector throw `SyntaxError` during render, taking the whole cursor
+  // layer down for every participant. Escape safely and swallow any
+  // residual selector failures so bad remote input just drops the cursor.
+  try {
+    const escaped =
+      typeof CSS !== 'undefined' && typeof CSS.escape === 'function'
+        ? CSS.escape(blockId)
+        : blockId.replace(/["\\]/g, '\\$&');
+    const el = root.querySelector(`[data-block-id="${escaped}"]`) as HTMLElement | null;
+    return el ? el.getBoundingClientRect() : null;
+  } catch {
+    return null;
+  }
+}
+
+/**
+ * Find the plan's scroll viewport element. App tags it with
+ * `data-plan-scroll-viewport` when the OverlayScrollbars instance
+ * settles. Used to resolve `document`-space cursors (protocol supports
+ * all three coordinate spaces) — the bundled UI's LocalPresenceEmitter
+ * emits `block`-space with a sticky anchor, but a direct-agent or
+ * future client could still use `document`, and the layer handles
+ * both uniformly via `resolveCursor` below.
+ *
+ * Fall-through to `null` is safe — the caller skips rendering when
+ * `resolveCursor` returns null, so the cursor waits for the scroll
+ * area to mount instead of rendering at a garbage position.
+ */
+function findScrollViewport(): HTMLElement | null {
+  return typeof document !== 'undefined'
+    ? document.querySelector<HTMLElement>('[data-plan-scroll-viewport]')
+    : null;
+}
+
+function resolveCursor(
+  cursor: CursorState,
+  root: ParentNode,
+): { viewportX: number; viewportY: number } | null {
+  switch (cursor.coordinateSpace) {
+    case 'viewport':
+      return { viewportX: cursor.x, viewportY: cursor.y };
+    case 'document': {
+      // Content-space: cursor.(x, y) is relative to the scroll
+      // container's inner content origin. Map to this viewer's
+      // viewport by re-applying their scroll container rect and
+      // current scroll position.
+      const vp = findScrollViewport();
+      if (!vp) return null;
+      const rect = vp.getBoundingClientRect();
+      return {
+        viewportX: rect.left + cursor.x - vp.scrollLeft,
+        viewportY: rect.top  + cursor.y - vp.scrollTop,
+      };
+    }
+    case 'block': {
+      // The bundled UI's LocalPresenceEmitter writes block-space with
+      // a sticky anchor (same block until the pointer crosses into a
+      // new one), so this is the hot path for same-app peers. Also
+      // honors direct-agent clients that send block coords.
+      if (!cursor.blockId) return null;
+      const blockRect = findBlockRect(cursor.blockId, root);
+      if (!blockRect) return null;
+      return {
+        viewportX: blockRect.left + cursor.x,
+        viewportY: blockRect.top + cursor.y,
+      };
+    }
+    default:
+      return null;
+  }
+}
+
+// Line-height fallback for cursor caret — we don't know the remote
+// user's line-height at the cursor, and resolving per-block metrics on
+// every update would be expensive. 18px covers standard body copy.
+const CURSOR_HEIGHT_PX = 18;
+
+// Smoothing tuning. See component docstring.
+const LERP_ALPHA = 0.3;
+const SNAP_THRESHOLD_PX = 600;
+
+/**
+ * Inset applied when clamping an offscreen cursor to the container
+ * edge. Keeps the pinned glyph fully visible instead of clipping half
+ * of it against the edge.
+ */
+const EDGE_INSET_PX = 8;
+
+export function RemoteCursorLayer({
+  remotePresence,
+  containerRect,
+  root = typeof document !== 'undefined' ? document : undefined as unknown as ParentNode,
+  className = '',
+}: RemoteCursorLayerProps): React.ReactElement | null {
+  // Refs the rAF loop reads. React updates these on every prop change;
+  // the loop picks up the latest values on its next frame without
+  // depending on React render cycles for motion.
+  const presenceRef = useRef(remotePresence);
+  presenceRef.current = remotePresence;
+  const containerRectRef = useRef(containerRect);
+  containerRectRef.current = containerRect;
+  const rootRef = useRef(root);
+  rootRef.current = root;
+
+  const renderStatesRef = useRef<Map<string, CursorRenderState>>(new Map());
+  const nodeRefsRef = useRef<Map<string, HTMLDivElement>>(new Map());
+
+  // Gate the animation loop on actually having remote cursors to draw.
+  // Solo rooms (the common case) would otherwise run a 60Hz no-op loop
+  // for every session. Effect restarts only when this boolean flips
+  // empty↔non-empty, so continuous cursor updates during a busy session
+  // don't retear the loop down.
+  const hasRemoteCursors = Object.keys(remotePresence).length > 0;
+
+  useEffect(() => {
+    if (!hasRemoteCursors) return;
+    let rafId = 0;
+
+    const tick = () => {
+      const presence = presenceRef.current;
+      const rect = containerRectRef.current;
+      const rootEl = rootRef.current ?? (typeof document !== 'undefined' ? document : null);
+      if (!rootEl) {
+        rafId = requestAnimationFrame(tick);
+        return;
+      }
+
+      const states = renderStatesRef.current;
+      const nodes = nodeRefsRef.current;
+
+      // Drop render state for cursors no longer in presence. The node
+      // itself is unmounted by React on the next render — we just
+      // release our tracking so a rejoin starts fresh (snap).
+      for (const id of Array.from(states.keys())) {
+        if (!(id in presence)) {
+          states.delete(id);
+        }
+      }
+
+      for (const [clientId, p] of Object.entries(presence)) {
+        const node = nodes.get(clientId);
+        if (!node) continue;  // React hasn't committed the element yet.
+
+        const resolved = p.cursor ? resolveCursor(p.cursor, rootEl) : null;
+        if (!resolved) {
+          // Null / unresolvable cursor — mark idle and hide. Next
+          // non-null packet snaps back in from the new position instead
+          // of sliding from wherever the ghost was left.
+          node.style.display = 'none';
+          const prev = states.get(clientId);
+          if (prev) prev.everRendered = false;
+          continue;
+        }
+
+        // Target in overlay-local space.
+        const targetX = resolved.viewportX - (rect?.left ?? 0);
+        const targetY = resolved.viewportY - (rect?.top ?? 0);
+
+        let state = states.get(clientId);
+        if (!state || !state.everRendered) {
+          // First paint for this clientId (or just came back from
+          // idle): snap so we don't see a slide from (0,0) or the
+          // previous stale position.
+          state = { displayX: targetX, displayY: targetY, everRendered: true };
+          states.set(clientId, state);
+        } else {
+          const dx = targetX - state.displayX;
+          const dy = targetY - state.displayY;
+          if (Math.hypot(dx, dy) > SNAP_THRESHOLD_PX) {
+            // Huge single-frame jump — usually a block↔viewport
+            // coordinate flip or a scroll that moved the block rect
+            // hundreds of pixels. Animating it looks like a
+            // full-screen swoosh; snap instead.
+            state.displayX = targetX;
+            state.displayY = targetY;
+          } else {
+            state.displayX += dx * LERP_ALPHA;
+            state.displayY += dy * LERP_ALPHA;
+          }
+        }
+
+        // Onscreen check against the overlay container bounds. The
+        // container IS the editor viewport in our current layout, so
+        // "outside container" == "outside visible editor" == pin to
+        // the nearest edge.
+        const containerWidth = rect?.width ?? (typeof window !== 'undefined' ? window.innerWidth : 0);
+        const containerHeight = rect?.height ?? (typeof window !== 'undefined' ? window.innerHeight : 0);
+        const above = state.displayY < 0;
+        const below = state.displayY > containerHeight;
+        const leftOf = state.displayX < 0;
+        const rightOf = state.displayX > containerWidth;
+        const offscreen = above || below || leftOf || rightOf;
+
+        let renderX = state.displayX;
+        let renderY = state.displayY;
+        let edgeDirection: 'none' | 'above' | 'below' | 'left' | 'right' = 'none';
+        if (offscreen) {
+          // Clamp to the nearest edge with a small inset so the glyph
+          // stays fully visible. Direction picks vertical over
+          // horizontal because most scrolling is vertical; a corner-
+          // case cursor gets the vertical indicator with horizontal
+          // clamping applied for position.
+          renderX = Math.max(EDGE_INSET_PX, Math.min(containerWidth - EDGE_INSET_PX, state.displayX));
+          renderY = Math.max(EDGE_INSET_PX, Math.min(containerHeight - EDGE_INSET_PX, state.displayY));
+          edgeDirection = above ? 'above' : below ? 'below' : leftOf ? 'left' : 'right';
+        }
+
+        node.style.display = '';
+        node.style.transform = `translate3d(${renderX}px, ${renderY}px, 0)`;
+
+        // Toggle the visual via dataset — CSS (below) swaps caret vs.
+        // edge indicator based on `data-edge-direction`.
+        if (node.dataset.edgeDirection !== edgeDirection) {
+          node.dataset.edgeDirection = edgeDirection;
+        }
+      }
+
+      rafId = requestAnimationFrame(tick);
+    };
+
+    rafId = requestAnimationFrame(tick);
+    return () => cancelAnimationFrame(rafId);
+  }, [hasRemoteCursors]);
+
+  // React owns the set of mounted cursor nodes (keyed by clientId).
+  // The rAF loop positions them. Recomputed each render — trivial cost
+  // and keeps the list stable in key order so React doesn't reorder
+  // DOM nodes when presence iteration order shifts.
+  const clientIds = useMemo(
+    () => Object.keys(remotePresence).sort(),
+    // `remotePresence` is a new object each state emit, but its key
+    // set changes rarely; depending on the whole object is fine given
+    // the sort is O(n log n) on tiny n.
+    [remotePresence],
+  );
+
+  if (clientIds.length === 0) return null;
+
+  return (
+    <div
+      className={`pointer-events-none absolute inset-0 ${className}`}
+      data-testid="remote-cursor-layer"
+      aria-hidden
+    >
+      {/*
+        Self-contained style block. Keeps the swap between onscreen
+        caret and offscreen edge-pin pure CSS, driven by the
+        `data-edge-direction` attribute the rAF loop mutates on each
+        cursor node.
+        .remote-cursor-offscreen is default-hidden via CSS here
+        (NOT via inline `style={{ display: 'flex' }}` on the element)
+        because inline styles beat stylesheet rules — with an inline
+        default of flex, the `data-edge-direction="none"` rule that
+        tries to hide the pill would lose and both variants would
+        paint on every cursor.
+      */}
+      <style>{`
+        .remote-cursor-offscreen {
+          display: none;
+          align-items: center;
+          gap: 2px;
+        }
+        .remote-cursor:not([data-edge-direction="none"]) .remote-cursor-onscreen { display: none; }
+        .remote-cursor:not([data-edge-direction="none"]) .remote-cursor-offscreen { display: flex; }
+        .remote-cursor[data-edge-direction="above"] .remote-cursor-arrow::before { content: "↑"; }
+        .remote-cursor[data-edge-direction="below"] .remote-cursor-arrow::before { content: "↓"; }
+        .remote-cursor[data-edge-direction="left"]  .remote-cursor-arrow::before { content: "←"; }
+        .remote-cursor[data-edge-direction="right"] .remote-cursor-arrow::before { content: "→"; }
+      `}</style>
+      {clientIds.map(clientId => {
+        const p = remotePresence[clientId];
+        const name = p?.user?.name ?? 'Guest';
+        const color = p?.user?.color ?? '#888';
+        const isAgent = isAgentIdentity(p?.user?.name);
+        return (
+          <RemoteCursor
+            key={clientId}
+            clientId={clientId}
+            name={name}
+            color={color}
+            isAgent={isAgent}
+            nodeRefsRef={nodeRefsRef}
+          />
+        );
+      })}
+    </div>
+  );
+}
+
+/**
+ * Single cursor glyph. Position is NEVER set here — the parent's rAF
+ * loop mutates `transform` and `data-edge-direction` on the node
+ * directly via the shared ref map. This component only owns the
+ * static-per-client bits: color, name, and the SVG/label markup.
+ *
+ * Contains both the normal caret+label and the offscreen edge-pin
+ * variants in the DOM; CSS selectors on the parent's `data-edge-*`
+ * dataset decide which is visible. Keeps motion allocation-free
+ * since the DOM structure never changes during animation.
+ */
+function RemoteCursor({
+  clientId,
+  name,
+  color,
+  isAgent,
+  nodeRefsRef,
+}: {
+  clientId: string;
+  name: string;
+  color: string;
+  isAgent: boolean;
+  nodeRefsRef: React.RefObject<Map<string, HTMLDivElement>>;
+}): React.ReactElement {
+  // Callback ref keyed by clientId. Each mount/unmount registers or
+  // releases in the shared ref map that the rAF loop reads.
+  const setRef = (el: HTMLDivElement | null) => {
+    const map = nodeRefsRef.current;
+    if (!map) return;
+    if (el) map.set(clientId, el);
+    else map.delete(clientId);
+  };
+
+  return (
+    <div
+      ref={setRef}
+      data-client-id={clientId}
+      data-client-kind={isAgent ? 'agent' : 'human'}
+      data-edge-direction="none"
+      className="remote-cursor absolute top-0 left-0 will-change-transform"
+      style={{ display: 'none' }}  // hidden until the first rAF tick resolves position
+    >
+      {/* Onscreen: vertical caret bar + name label. */}
+      <div className="remote-cursor-onscreen">
+        <div
+          style={{
+            width: 2,
+            height: CURSOR_HEIGHT_PX,
+            backgroundColor: color,
+          }}
+        />
+        <div
+          style={{
+            position: 'absolute',
+            top: 0,
+            left: 4,
+            backgroundColor: color,
+            color: '#fff',
+            fontSize: 10,
+            padding: '1px 4px',
+            borderRadius: 2,
+            whiteSpace: 'nowrap',
+            lineHeight: 1.2,
+          }}
+        >
+          {isAgent && <span aria-hidden style={{ marginRight: 3 }}>⚙</span>}
+          {name}
+        </div>
+      </div>
+      {/* Offscreen: single colored pill with directional arrow. CSS
+          hides this when `data-edge-direction="none"` and swaps the
+          arrow glyph based on direction. */}
+      <div
+        className="remote-cursor-offscreen"
+        // `display` deliberately OMITTED from inline style — it's
+        // owned by the stylesheet block in the parent layer so the
+        // `data-edge-direction` swap can win. Other visual props
+        // remain inline (color is dynamic per peer, rest is layout).
+        style={{
+          backgroundColor: color,
+          color: '#fff',
+          fontSize: 10,
+          padding: '2px 6px',
+          borderRadius: 10,
+          whiteSpace: 'nowrap',
+          lineHeight: 1.2,
+        }}
+      >
+        <span className="remote-cursor-arrow" aria-hidden>
+          {/* Placeholder; CSS rewrites via ::before based on direction. */}
+        </span>
+        {isAgent && <span aria-hidden style={{ marginRight: 3 }}>⚙</span>}
+        <span>{name}</span>
+      </div>
+    </div>
+  );
+}
diff --git a/packages/ui/components/collab/RoomAdminErrorToast.tsx b/packages/ui/components/collab/RoomAdminErrorToast.tsx
new file mode 100644
index 000000000..dc8a0b7f4
--- /dev/null
+++ b/packages/ui/components/collab/RoomAdminErrorToast.tsx
@@ -0,0 +1,63 @@
+import React, { useEffect } from 'react';
+import type { AdminAction } from '../../hooks/collab/useRoomAdminActions';
+
+/**
+ * Bottom-right toast for admin command failures (currently delete).
+ * Replaces the inline error banner that used to live inside
+ * `RoomPanel`. A transient toast matches the action-is-rare-and-
+ * retriable shape of admin commands better than a sticky panel
+ * element: the user clicks, nothing happens if it failed, they see
+ * the toast, click Dismiss or let it auto-dismiss, and click again.
+ *
+ * Auto-dismiss is 8s — long enough for the user to read a short
+ * error message, short enough that a forgotten toast doesn't linger
+ * across sessions. Manual dismiss is always available.
+ */
+
+export interface RoomAdminErrorToastProps {
+  action: AdminAction;
+  message: string;
+  onDismiss(): void;
+}
+
+const AUTO_DISMISS_MS = 8_000;
+
+function actionLabel(action: AdminAction): string {
+  switch (action) {
+    case 'delete': return 'Failed to delete room';
+  }
+}
+
+export function RoomAdminErrorToast({
+  action,
+  message,
+  onDismiss,
+}: RoomAdminErrorToastProps): React.ReactElement {
+  useEffect(() => {
+    const t = setTimeout(onDismiss, AUTO_DISMISS_MS);
+    return () => clearTimeout(t);
+    // Dep on message + action so a fresh error resets the timer.
+  }, [action, message, onDismiss]);
+
+  return (
+    <div
+      role="alert"
+      className="fixed bottom-4 right-4 z-[60] max-w-sm px-3 py-2 rounded-lg text-xs font-medium shadow-lg bg-destructive/15 text-destructive border border-destructive/30 flex items-start gap-2"
+      data-testid="room-admin-error-toast"
+    >
+      <div className="flex-1">
+        <div className="font-semibold">{actionLabel(action)}</div>
+        {message && <div className="opacity-80 mt-0.5 break-words">{message}</div>}
+      </div>
+      <button
+        type="button"
+        onClick={onDismiss}
+        className="text-[11px] underline opacity-80 hover:opacity-100"
+        aria-label="Dismiss error"
+        data-testid="room-admin-error-toast-dismiss"
+      >
+        Dismiss
+      </button>
+    </div>
+  );
+}
diff --git a/packages/ui/components/collab/RoomHeaderControls.tsx b/packages/ui/components/collab/RoomHeaderControls.tsx
new file mode 100644
index 000000000..5ba70e942
--- /dev/null
+++ b/packages/ui/components/collab/RoomHeaderControls.tsx
@@ -0,0 +1,80 @@
+import React from 'react';
+import type { ConnectionStatus } from '@plannotator/shared/collab/client';
+import type { PresenceState } from '@plannotator/shared/collab';
+import { RoomStatusBadge } from './RoomStatusBadge';
+import { ParticipantAvatars } from './ParticipantAvatars';
+import { RoomMenu } from './RoomMenu';
+import type { AdminAction } from '../../hooks/collab/useRoomAdminActions';
+
+/**
+ * Compact header cluster that replaces the floating RoomPanel.
+ * Renders inline in the editor header next to the existing PlanHeaderMenu
+ * whenever the editor is in room mode.
+ *
+ * Layout (left → right):
+ *   [conditional status pill] [peer avatars] [Room actions ▾]
+ *
+ * The status pill is only shown when the connection isn't authenticated
+ * (reconnecting / connecting / offline). A healthy "Live" connection
+ * shows nothing here, keeping the header quiet on the common case.
+ * Terminal states (room gone) don't appear here — the caller swaps to
+ * `RoomUnavailableScreen` instead of rendering the header at all.
+ *
+ * All mutations (delete, link copy, feedback copy) are owned by
+ * the caller. This component is a pure surface.
+ */
+
+export interface RoomHeaderControlsProps {
+  connectionStatus: ConnectionStatus;
+  remotePresence: Record<string, PresenceState>;
+  isAdmin: boolean;
+  adminUrl?: string;
+  pendingAdminAction?: AdminAction;
+  onCopyParticipantUrl(): void;
+  onCopyAdminUrl(): void;
+  onCopyConsolidatedFeedback(): void;
+  onCopyAgentInstructions(): void;
+  onDelete(): void;
+  className?: string;
+}
+
+export function RoomHeaderControls({
+  connectionStatus,
+  remotePresence,
+  isAdmin,
+  adminUrl,
+  pendingAdminAction,
+  onCopyParticipantUrl,
+  onCopyAdminUrl,
+  onCopyConsolidatedFeedback,
+  onCopyAgentInstructions,
+  onDelete,
+  className = '',
+}: RoomHeaderControlsProps): React.ReactElement {
+  const showStatus = connectionStatus !== 'authenticated';
+  const hasPeers = Object.keys(remotePresence).length > 0;
+
+  return (
+    <div
+      className={`flex items-center gap-2 ${className}`}
+      data-testid="room-header-controls"
+    >
+      {showStatus && (
+        <RoomStatusBadge connectionStatus={connectionStatus} />
+      )}
+      {hasPeers && (
+        <ParticipantAvatars remotePresence={remotePresence} />
+      )}
+      <RoomMenu
+        isAdmin={isAdmin}
+        adminUrl={adminUrl}
+        pendingAdminAction={pendingAdminAction}
+        onCopyParticipantUrl={onCopyParticipantUrl}
+        onCopyAdminUrl={onCopyAdminUrl}
+        onCopyConsolidatedFeedback={onCopyConsolidatedFeedback}
+        onCopyAgentInstructions={onCopyAgentInstructions}
+        onDelete={onDelete}
+      />
+    </div>
+  );
+}
diff --git a/packages/ui/components/collab/RoomMenu.tsx b/packages/ui/components/collab/RoomMenu.tsx
new file mode 100644
index 000000000..e4699991f
--- /dev/null
+++ b/packages/ui/components/collab/RoomMenu.tsx
@@ -0,0 +1,191 @@
+import React, { useState } from 'react';
+import { ActionMenu, ActionMenuDivider, ActionMenuItem } from '../ActionMenu';
+import type { AdminAction } from '../../hooks/collab/useRoomAdminActions';
+
+/**
+ * Room actions dropdown, anchored in the editor header next to the
+ * participant avatars. Replaces the floating `RoomPanel` — copy links,
+ * copy consolidated feedback, and (for admins) delete and the admin
+ * recovery link disclosure all live behind one click.
+ *
+ * Click-outside / Esc close is handled by the shared `ActionMenu`
+ * primitive. The trigger is a pill-shaped button with a link icon and
+ * chevron, visually grouped with the avatar cluster but semantically
+ * its own click target (avatars stay tooltip-only per the agreed UX).
+ */
+
+export interface RoomMenuProps {
+  isAdmin: boolean;
+  /** Non-null when the caller holds admin capability. */
+  adminUrl?: string;
+  /** Set while an admin command is in flight; disables the Delete item. */
+  pendingAdminAction?: AdminAction;
+  onCopyParticipantUrl(): void;
+  onCopyConsolidatedFeedback(): void;
+  onCopyAgentInstructions(): void;
+  onCopyAdminUrl(): void;
+  onDelete(): void;
+}
+
+// Small inline icons, same stroke + size convention as PlanHeaderMenu.
+const ICON_CLASS = 'w-3.5 h-3.5';
+const LinkIcon = (
+  <svg className={ICON_CLASS} fill="none" viewBox="0 0 24 24" stroke="currentColor" strokeWidth={2} aria-hidden>
+    <path strokeLinecap="round" strokeLinejoin="round" d="M13.828 10.172a4 4 0 00-5.656 0l-4 4a4 4 0 105.656 5.656l1.102-1.101m-.758-4.899a4 4 0 005.656 0l4-4a4 4 0 00-5.656-5.656l-1.1 1.1" />
+  </svg>
+);
+const CopyIcon = (
+  <svg className={ICON_CLASS} fill="none" viewBox="0 0 24 24" stroke="currentColor" strokeWidth={2} aria-hidden>
+    <path strokeLinecap="round" strokeLinejoin="round" d="M8 16H6a2 2 0 01-2-2V6a2 2 0 012-2h8a2 2 0 012 2v2m-6 12h8a2 2 0 002-2v-8a2 2 0 00-2-2h-8a2 2 0 00-2 2v8a2 2 0 002 2z" />
+  </svg>
+);
+const DeleteIcon = (
+  <svg className={ICON_CLASS} fill="none" viewBox="0 0 24 24" stroke="currentColor" strokeWidth={2} aria-hidden>
+    <path strokeLinecap="round" strokeLinejoin="round" d="M19 7l-.867 12.142A2 2 0 0116.138 21H7.862a2 2 0 01-1.995-1.858L5 7m5 4v6m4-6v6M1 7h22M10 7V3a1 1 0 011-1h2a1 1 0 011 1v4" />
+  </svg>
+);
+const KeyIcon = (
+  <svg className={ICON_CLASS} fill="none" viewBox="0 0 24 24" stroke="currentColor" strokeWidth={2} aria-hidden>
+    <path strokeLinecap="round" strokeLinejoin="round" d="M15 7a2 2 0 012 2m4 0a6 6 0 01-7.743 5.743L11 17H9v2H7v2H4a1 1 0 01-1-1v-2.586a1 1 0 01.293-.707l5.964-5.964A6 6 0 1121 9z" />
+  </svg>
+);
+const RobotIcon = (
+  <svg className={ICON_CLASS} fill="none" viewBox="0 0 24 24" stroke="currentColor" strokeWidth={2} aria-hidden>
+    <path strokeLinecap="round" strokeLinejoin="round" d="M9.75 17L9 20l-1 1h8l-1-1-.75-3M3 13h2m14 0h2M5 17h14a2 2 0 002-2V7a2 2 0 00-2-2H5a2 2 0 00-2 2v8a2 2 0 002 2zM9 10h.01M15 10h.01M10 14h4" />
+  </svg>
+);
+const ChevronIcon = (
+  <svg className="w-3 h-3 opacity-60" fill="none" viewBox="0 0 24 24" stroke="currentColor" strokeWidth={2} aria-hidden>
+    <path strokeLinecap="round" strokeLinejoin="round" d="M19 9l-7 7-7-7" />
+  </svg>
+);
+
+export function RoomMenu({
+  isAdmin,
+  adminUrl,
+  pendingAdminAction,
+  onCopyParticipantUrl,
+  onCopyConsolidatedFeedback,
+  onCopyAgentInstructions,
+  onCopyAdminUrl,
+  onDelete,
+}: RoomMenuProps): React.ReactElement {
+  // Admin recovery link is disclosure-gated inside the menu, same as
+  // the prior RoomPanel design — revealing the full admin URL behind a
+  // click makes accidental copy-paste into the participant channel
+  // harder.
+  const [adminDisclosed, setAdminDisclosed] = useState(false);
+
+  return (
+    <ActionMenu
+      renderTrigger={({ isOpen, toggleMenu }) => (
+        <button
+          type="button"
+          onClick={toggleMenu}
+          className={`inline-flex items-center gap-1 px-2 py-1 rounded-md text-xs font-medium transition-colors ${
+            isOpen
+              ? 'bg-muted text-foreground'
+              : 'text-muted-foreground hover:text-foreground hover:bg-muted'
+          }`}
+          title="Room actions"
+          aria-haspopup="menu"
+          aria-expanded={isOpen}
+          data-testid="room-menu-trigger"
+        >
+          {/*
+            Intentional visual distinction from "Copy participant link"
+            inside the dropdown: the trigger uses 👥 (room / people),
+            the link item inside uses the chain icon (a URL). Sharing
+            the link icon on both was ambiguous — the reviewer flagged
+            the trigger as reading like another "copy link" button.
+          */}
+          <span aria-hidden>👥</span>
+          <span className="hidden sm:inline">Room</span>
+          {ChevronIcon}
+        </button>
+      )}
+      panelClassName="absolute top-full right-0 mt-1 w-60 rounded-lg border border-border bg-popover py-1 shadow-xl z-[70]"
+    >
+      {({ closeMenu }) => (
+        <>
+          <ActionMenuItem
+            icon={LinkIcon}
+            label="Copy participant link"
+            onClick={() => {
+              closeMenu();
+              onCopyParticipantUrl();
+            }}
+          />
+          {/*
+            "Copy agent instructions" — the clipboard payload teaches
+            an AI agent (Claude Code, Codex, etc.) how to join THIS
+            room via the collab-agent CLI and post comments as a
+            first-class peer. The payload pre-fills this room's URL
+            and the current user's identity so the agent doesn't
+            have to extract them from a separate message.
+          */}
+          <ActionMenuItem
+            icon={RobotIcon}
+            label="Copy agent instructions"
+            onClick={() => {
+              closeMenu();
+              onCopyAgentInstructions();
+            }}
+          />
+
+          {isAdmin && (
+            <>
+              <ActionMenuDivider />
+              {/*
+                Admin recovery link: keep the two-step disclosure so a
+                creator can't accidentally paste it into the same
+                channel they share the participant link on. Menu stays
+                open on toggle so the Copy button inside is reachable.
+              */}
+              <button
+                type="button"
+                onClick={() => setAdminDisclosed(v => !v)}
+                className="flex w-full items-center gap-2 px-3 py-2 text-left text-xs text-muted-foreground transition-colors hover:bg-muted"
+                data-testid="admin-disclosure-toggle"
+              >
+                <span className="text-muted-foreground">{KeyIcon}</span>
+                <span className="flex-1">
+                  {adminDisclosed ? 'Hide admin recovery link' : 'Show admin recovery link'}
+                </span>
+              </button>
+              {adminDisclosed && adminUrl && (
+                <div className="px-3 pb-2 space-y-1">
+                  <p className="text-[10px] text-amber-900 dark:text-amber-200 leading-tight">
+                    Grants full admin control. Keep it private; do not share.
+                  </p>
+                  <button
+                    type="button"
+                    onClick={() => {
+                      closeMenu();
+                      onCopyAdminUrl();
+                    }}
+                    className="w-full px-2 py-1.5 text-xs rounded bg-destructive/10 text-destructive hover:bg-destructive/20"
+                    data-testid="copy-admin-url"
+                  >
+                    Copy admin link
+                  </button>
+                </div>
+              )}
+
+              <ActionMenuDivider />
+              <ActionMenuItem
+                icon={<span className="text-destructive">{DeleteIcon}</span>}
+                label={pendingAdminAction === 'delete' ? 'Deleting…' : 'Delete room'}
+                onClick={() => {
+                  if (pendingAdminAction) return;
+                  closeMenu();
+                  onDelete();
+                }}
+              />
+            </>
+          )}
+        </>
+      )}
+    </ActionMenu>
+  );
+}
diff --git a/packages/ui/components/collab/RoomStatusBadge.test.tsx b/packages/ui/components/collab/RoomStatusBadge.test.tsx
new file mode 100644
index 000000000..89eb2774d
--- /dev/null
+++ b/packages/ui/components/collab/RoomStatusBadge.test.tsx
@@ -0,0 +1,42 @@
+import { describe, expect, test } from 'bun:test';
+import { render } from '@testing-library/react';
+import { RoomStatusBadge } from './RoomStatusBadge';
+
+function label(el: HTMLElement): string {
+  const badge = el.querySelector('[data-testid="room-status-badge"]');
+  return badge?.getAttribute('data-status-label') ?? '';
+}
+
+describe('RoomStatusBadge', () => {
+  test('renders "Live" when authenticated', () => {
+    const { container } = render(
+      <RoomStatusBadge connectionStatus="authenticated" />,
+    );
+    expect(label(container)).toBe('Live');
+  });
+
+  test('renders "Connecting" during connecting/authenticating', () => {
+    const { container, rerender } = render(
+      <RoomStatusBadge connectionStatus="connecting" />,
+    );
+    expect(label(container)).toBe('Connecting');
+    rerender(<RoomStatusBadge connectionStatus="authenticating" />);
+    expect(label(container)).toBe('Connecting');
+  });
+
+  test('renders "Reconnecting" during reconnect', () => {
+    const { container } = render(
+      <RoomStatusBadge connectionStatus="reconnecting" />,
+    );
+    expect(label(container)).toBe('Reconnecting');
+  });
+
+  test('renders "Offline" when disconnected or closed', () => {
+    const { container, rerender } = render(
+      <RoomStatusBadge connectionStatus="disconnected" />,
+    );
+    expect(label(container)).toBe('Offline');
+    rerender(<RoomStatusBadge connectionStatus="closed" />);
+    expect(label(container)).toBe('Offline');
+  });
+});
diff --git a/packages/ui/components/collab/RoomStatusBadge.tsx b/packages/ui/components/collab/RoomStatusBadge.tsx
new file mode 100644
index 000000000..f6037924f
--- /dev/null
+++ b/packages/ui/components/collab/RoomStatusBadge.tsx
@@ -0,0 +1,55 @@
+import React from 'react';
+import type { ConnectionStatus } from '@plannotator/shared/collab/client';
+
+/**
+ * Pure status-pill for the live room. Renders a single label based on
+ * connection health. Terminal states (room gone) no longer have a badge —
+ * the caller transitions to `RoomUnavailableScreen` instead. No side
+ * effects; identity driven entirely by props so memoization is trivial.
+ *
+ * Labels: reconnecting / connecting / offline / Live (default when
+ * authenticated).
+ */
+
+export interface RoomStatusBadgeProps {
+  connectionStatus: ConnectionStatus;
+  className?: string;
+}
+
+interface Variant {
+  label: string;
+  dotClass: string;
+  /** Bg/text utility class bundle for the pill itself. */
+  pillClass: string;
+}
+
+function deriveVariant(connectionStatus: ConnectionStatus): Variant {
+  if (connectionStatus === 'reconnecting') {
+    return { label: 'Reconnecting', dotClass: 'bg-warning animate-pulse', pillClass: 'bg-warning/10 text-warning' };
+  }
+  if (connectionStatus === 'connecting' || connectionStatus === 'authenticating') {
+    return { label: 'Connecting', dotClass: 'bg-primary animate-pulse', pillClass: 'bg-primary/10 text-primary' };
+  }
+  if (connectionStatus === 'disconnected' || connectionStatus === 'closed') {
+    return { label: 'Offline', dotClass: 'bg-muted-foreground', pillClass: 'bg-muted text-muted-foreground' };
+  }
+  return { label: 'Live', dotClass: 'bg-success', pillClass: 'bg-success/10 text-success' };
+}
+
+export function RoomStatusBadge({
+  connectionStatus,
+  className = '',
+}: RoomStatusBadgeProps): React.ReactElement {
+  const variant = deriveVariant(connectionStatus);
+  return (
+    <span
+      className={`inline-flex items-center gap-1.5 px-2 py-0.5 rounded-full text-xs font-medium ${variant.pillClass} ${className}`}
+      aria-live="polite"
+      data-testid="room-status-badge"
+      data-status-label={variant.label}
+    >
+      <span className={`w-1.5 h-1.5 rounded-full ${variant.dotClass}`} aria-hidden />
+      {variant.label}
+    </span>
+  );
+}
diff --git a/packages/ui/components/collab/RoomUnavailableScreen.tsx b/packages/ui/components/collab/RoomUnavailableScreen.tsx
new file mode 100644
index 000000000..4d75a5c93
--- /dev/null
+++ b/packages/ui/components/collab/RoomUnavailableScreen.tsx
@@ -0,0 +1,25 @@
+import React from 'react';
+
+/**
+ * Terminal screen shown when a room URL no longer resolves. Covers every
+ * "link doesn't work" case: admin-initiated delete, auto-expiry at the
+ * 30-day mark, or a request against a room that never existed / has
+ * already been purged. The server does not surface the cause to the
+ * client; the user experience is the same for all three.
+ *
+ * Minimal on purpose — this is the web-standard "gone resource" UX,
+ * not a branded "session has ended" memorial.
+ */
+export function RoomUnavailableScreen(): React.ReactElement {
+  return (
+    <div
+      className="fixed inset-0 flex items-center justify-center bg-background"
+      data-testid="room-unavailable-screen"
+    >
+      <div className="text-center space-y-2 max-w-sm">
+        <h2 className="text-lg font-semibold">This link doesn't go anywhere</h2>
+        <p className="text-sm text-muted-foreground">Ask for a new one.</p>
+      </div>
+    </div>
+  );
+}
diff --git a/packages/ui/components/collab/StartRoomModal.tsx b/packages/ui/components/collab/StartRoomModal.tsx
new file mode 100644
index 000000000..296eadaf6
--- /dev/null
+++ b/packages/ui/components/collab/StartRoomModal.tsx
@@ -0,0 +1,163 @@
+import React, { useState } from 'react';
+import { PRESENCE_SWATCHES } from '@plannotator/ui/utils/presenceColor';
+
+/**
+ * Pure create-room dialog. Collects display name, color, expiry, and
+ * confirms the image-strip consequence when relevant. Emits one callback
+ * (`onStart`) with the settled options; the parent (`App.tsx`'s
+ * `handleConfirmStartRoom`) calls `createRoom()` directly because the
+ * flow needs a synchronous `window.open()` inside the click handler's
+ * user-activation window — a React hook boundary between click and open
+ * would get the popup blocked in most browsers.
+ *
+ * Identity is a confirmation step, not a setup step: callers pass
+ * `initialDisplayName` and `initialColor` from the user's existing
+ * Plannotator preferences (`getIdentity()` / `getPresenceColor()`), and
+ * the parent persists any edits back via `setCustomIdentity` /
+ * `setPresenceColor` after submit. Peers see the submitted color via
+ * presence.
+ *
+ * Not a controlled modal — parent decides when to mount. Dismiss via the
+ * Cancel button (not Esc-only) so the caller can abort an in-flight
+ * createRoom via AbortController.
+ */
+
+export interface StartRoomSubmit {
+  displayName: string;
+  color: string;
+  expiresInDays: 0 | 1 | 7 | 30;
+}
+
+export interface StartRoomModalProps {
+  initialDisplayName?: string;
+  initialColor?: string;
+  imageAnnotationsToStrip?: number;
+  inFlight?: boolean;
+  errorMessage?: string;
+  onStart(submit: StartRoomSubmit): void;
+  onCancel(): void;
+}
+
+export function StartRoomModal({
+  initialDisplayName = '',
+  initialColor = PRESENCE_SWATCHES[0],
+  imageAnnotationsToStrip = 0,
+  inFlight = false,
+  errorMessage,
+  onStart,
+  onCancel,
+}: StartRoomModalProps): React.ReactElement {
+  const [displayName, setDisplayName] = useState(initialDisplayName);
+  const [color, setColor] = useState(initialColor);
+  const [expiresInDays, setExpiresInDays] = useState<0 | 1 | 7 | 30>(7);
+
+  const strips = imageAnnotationsToStrip > 0;
+  const ctaLabel = inFlight
+    ? 'Creating…'
+    : strips ? 'Strip images and start' : 'Start room';
+
+  function handleSubmit(e: React.FormEvent) {
+    e.preventDefault();
+    if (inFlight) return;
+    const trimmed = displayName.trim();
+    if (!trimmed) return;
+    onStart({ displayName: trimmed, color, expiresInDays });
+  }
+
+  return (
+    <div
+      className="fixed inset-0 z-[100] flex items-center justify-center bg-background/80 backdrop-blur-sm p-4"
+      data-testid="start-room-modal"
+    >
+      <form
+        onSubmit={handleSubmit}
+        className="bg-card border border-border rounded-xl shadow-2xl w-[420px] max-w-[90vw] p-5 space-y-4"
+      >
+        <div>
+          <h2 className="text-base font-semibold">Start a live review session</h2>
+          <p className="text-sm text-muted-foreground mt-1">
+            Share a link. Collaborators see your plan and annotations in real time.
+            Their changes sync to you.
+          </p>
+        </div>
+
+        <div className="space-y-2">
+          <label className="text-xs font-medium uppercase text-muted-foreground">Display name</label>
+          <input
+            type="text"
+            value={displayName}
+            onChange={e => setDisplayName(e.target.value)}
+            disabled={inFlight}
+            className="w-full px-2 py-1 border rounded text-sm"
+            placeholder="Your name"
+            autoFocus
+          />
+        </div>
+
+        <div className="space-y-2">
+          <label className="text-xs font-medium uppercase text-muted-foreground">Color</label>
+          <div className="flex items-center gap-1">
+            {PRESENCE_SWATCHES.map(s => (
+              <button
+                key={s}
+                type="button"
+                disabled={inFlight}
+                onClick={() => setColor(s)}
+                className={`w-6 h-6 rounded-full border-2 ${color === s ? 'border-foreground' : 'border-transparent'}`}
+                style={{ backgroundColor: s }}
+                aria-label={`Color ${s}`}
+              />
+            ))}
+          </div>
+        </div>
+
+        <div className="space-y-2">
+          <label className="text-xs font-medium uppercase text-muted-foreground">Expires</label>
+          <select
+            value={expiresInDays}
+            onChange={e => setExpiresInDays(Number(e.target.value) as 0 | 1 | 7 | 30)}
+            disabled={inFlight}
+            className="w-full px-2 py-1 border rounded text-sm"
+          >
+            <option value={1}>1 day</option>
+            <option value={7}>7 days (default)</option>
+            <option value={30}>30 days</option>
+            <option value={0}>Never</option>
+          </select>
+        </div>
+
+        {strips && (
+          <div className="text-xs bg-amber-50 text-amber-900 dark:bg-amber-900/20 dark:text-amber-200 p-2 rounded">
+            <strong>Images won't travel.</strong>{' '}
+            {imageAnnotationsToStrip} item{imageAnnotationsToStrip === 1 ? '' : 's'} with image attachments will be stripped before sharing. Your local copies stay intact.
+          </div>
+        )}
+
+        {errorMessage && (
+          <div className="text-xs bg-destructive/10 text-destructive p-2 rounded" role="alert">
+            {errorMessage}
+          </div>
+        )}
+
+        <div className="flex items-center justify-end gap-2 pt-2">
+          <button
+            type="button"
+            onClick={onCancel}
+            // Cancel must remain enabled during in-flight so the user can
+            // abort createRoom via the AbortController the parent wired.
+            className="px-3 py-1.5 text-sm rounded hover:bg-muted"
+          >
+            Cancel
+          </button>
+          <button
+            type="submit"
+            disabled={inFlight || !displayName.trim()}
+            className="px-3 py-1.5 text-sm rounded bg-foreground text-background disabled:opacity-50"
+          >
+            {ctaLabel}
+          </button>
+        </div>
+      </form>
+    </div>
+  );
+}
diff --git a/packages/ui/components/plan-diff/VSCodeIcon.tsx b/packages/ui/components/plan-diff/VSCodeIcon.tsx
index 129f11113..31ce0eb36 100644
--- a/packages/ui/components/plan-diff/VSCodeIcon.tsx
+++ b/packages/ui/components/plan-diff/VSCodeIcon.tsx
@@ -9,7 +9,10 @@ export const VSCodeIcon: React.FC<{ className?: string }> = ({ className }) => (
   >
     <mask
       id="mask0"
-      {...{ 'mask-type': 'alpha' }}
+      // `maskType` is a valid SVG presentation attribute but missing
+      // from React's SVGMaskElement typing. Apply via the CSS `mask-type`
+      // property (the DOM representation is identical) so tsc is happy.
+      style={{ maskType: 'alpha' }}
       maskUnits="userSpaceOnUse"
       x="0"
       y="0"
diff --git a/packages/ui/components/types.d.ts b/packages/ui/components/types.d.ts
index 76c6549de..5aab779ef 100644
--- a/packages/ui/components/types.d.ts
+++ b/packages/ui/components/types.d.ts
@@ -1,7 +1,9 @@
 // Vite globals injected at build time
 declare const __APP_VERSION__: string;
 
-// declare webp
+// Asset imports — declared as side-effect-safe so bundler-resolved
+// imports don't fail typecheck. Value imports are typed as `string`
+// (Vite resolves them to public URLs).
 
 declare module "*.webp" {
   const content: string;
@@ -12,3 +14,8 @@ declare module "*.png" {
   const content: string;
   export default content;
 }
+
+// CSS side-effect imports (e.g. `import 'highlight.js/styles/github-dark.css'`).
+// Viewer and several components rely on these at runtime via Vite; the
+// type declaration is just so typecheck stops complaining.
+declare module "*.css" {}
diff --git a/packages/ui/config/settings.ts b/packages/ui/config/settings.ts
index 01f6d0cac..086ed7764 100644
--- a/packages/ui/config/settings.ts
+++ b/packages/ui/config/settings.ts
@@ -12,6 +12,7 @@
 import type { DiffLineBgIntensity } from '@plannotator/shared/config';
 import { storage } from '../utils/storage';
 import { generateIdentity } from '../utils/generateIdentity';
+import { hashNameToSwatch, isValidPresenceColor, normalizePresenceColor } from '../utils/presenceColor';
 
 const DIFF_LINE_BG_INTENSITY_VALUES = ['subtle', 'normal', 'strong'] as const;
 function isDiffLineBgIntensity(v: unknown): v is DiffLineBgIntensity {
@@ -20,12 +21,19 @@ function isDiffLineBgIntensity(v: unknown): v is DiffLineBgIntensity {
 
 export interface SettingDef<T> {
   defaultValue: T | (() => T);
-  fromCookie: () => T | undefined;
-  toCookie: (value: T) => void;
+  // Method signatures (not arrow-typed properties) so TypeScript compares
+  // parameter types bivariantly. SETTINGS entries declare concrete
+  // parameter types (e.g. `toCookie: (v: string) => void`); with
+  // arrow-typed properties those are contravariantly incompatible with
+  // the generic's default inference as `unknown`. Method signatures
+  // admit the intended usage without forcing every entry to declare its
+  // generic parameter explicitly.
+  fromCookie(): T | undefined;
+  toCookie(value: T): void;
   /** If set, this setting syncs to server via POST /api/config */
   serverKey?: string;
-  fromServer?: (serverConfig: Record<string, unknown>) => T | undefined;
-  toServer?: (value: T) => Record<string, unknown>;
+  fromServer?(serverConfig: Record<string, unknown>): T | undefined;
+  toServer?(value: T): Record<string, unknown>;
 }
 
 export const SETTINGS = {
@@ -39,6 +47,37 @@ export const SETTINGS = {
     toServer: (v: string) => ({ displayName: v }),
   },
 
+  /**
+   * Presence color for Live Rooms. Surfaced in Settings, StartRoomModal,
+   * and JoinRoomGate; peers see it via the presence channel.
+   *
+   * Default: hash of the current displayName to a swatch index, so a
+   * first-time user gets a stable distinct color without opening the
+   * picker. Depends on `displayName`'s cookie being populated first;
+   * declaration order in this object is the resolution order in
+   * `ConfigStore.constructor`, so `displayName` above is guaranteed
+   * to have written its cookie before this default runs.
+   */
+  presenceColor: {
+    defaultValue: () => {
+      const name = storage.getItem('plannotator-identity') ?? '';
+      return hashNameToSwatch(name);
+    },
+    fromCookie: () => {
+      const v = storage.getItem('plannotator-presence-color');
+      return v && isValidPresenceColor(v) ? normalizePresenceColor(v) : undefined;
+    },
+    toCookie: (v: string) => storage.setItem('plannotator-presence-color', v),
+    serverKey: 'presenceColor',
+    fromServer: (sc: Record<string, unknown>) => {
+      const v = sc.presenceColor;
+      return typeof v === 'string' && isValidPresenceColor(v)
+        ? normalizePresenceColor(v)
+        : undefined;
+    },
+    toServer: (v: string) => ({ presenceColor: v }),
+  },
+
   // --- Diff display options (namespaced under diffOptions in config.json) ---
 
   defaultDiffType: {
diff --git a/packages/ui/hooks/collab/useCollabRoom.test.tsx b/packages/ui/hooks/collab/useCollabRoom.test.tsx
new file mode 100644
index 000000000..6659ee462
--- /dev/null
+++ b/packages/ui/hooks/collab/useCollabRoom.test.tsx
@@ -0,0 +1,56 @@
+import { describe, expect, test } from 'bun:test';
+import { renderHook, waitFor } from '@testing-library/react';
+import { useCollabRoom } from './useCollabRoom';
+import type { CollabRoomUser } from '@plannotator/shared/collab/client';
+
+const USER: CollabRoomUser = { id: 'u1', name: 'alice', color: '#f00' };
+
+/**
+ * `lastErrorId` contract check for the join-phase error path.
+ *
+ * The shared client owns `lastErrorId` for client-internal errors, but join
+ * failures happen before the client is wired up — the hook surfaces them via
+ * its own branch. Without a hook-owned counter, that branch would spread
+ * DISCONNECTED_STATE (`lastErrorId: 0`) and callers dedupe-ing on id would
+ * silently ignore join errors.
+ */
+describe('useCollabRoom — join error id', () => {
+  test('first join failure surfaces a positive lastErrorId', async () => {
+    // Malformed URL triggers InvalidRoomUrlError in joinRoom() before any
+    // network contact — deterministic failure, no timing.
+    const { result } = renderHook(() =>
+      useCollabRoom({
+        url: 'not-a-room-url',
+        user: USER,
+      }),
+    );
+
+    await waitFor(() => {
+      expect(result.current.lastError).not.toBeNull();
+    });
+    expect(result.current.lastError?.scope).toBe('join');
+    expect(result.current.lastErrorId).toBeGreaterThan(0);
+  });
+
+  test('a second join failure bumps lastErrorId', async () => {
+    let url = 'not-a-room-url';
+    const { result, rerender } = renderHook(
+      () => useCollabRoom({ url, user: USER }),
+    );
+
+    await waitFor(() => {
+      expect(result.current.lastErrorId).toBeGreaterThan(0);
+    });
+    const firstId = result.current.lastErrorId;
+
+    // Change the url so the effect tears down and re-runs with a fresh
+    // failing URL; the hook should issue a new error id.
+    url = 'also-not-a-room-url';
+    rerender();
+
+    await waitFor(() => {
+      expect(result.current.lastError).not.toBeNull();
+      expect(result.current.lastErrorId).toBeGreaterThan(firstId);
+    });
+  });
+});
diff --git a/packages/ui/hooks/collab/useCollabRoom.ts b/packages/ui/hooks/collab/useCollabRoom.ts
new file mode 100644
index 000000000..f5e42371f
--- /dev/null
+++ b/packages/ui/hooks/collab/useCollabRoom.ts
@@ -0,0 +1,322 @@
+/**
+ * React hook wrapping CollabRoomClient for editor/component consumption.
+ *
+ * Usage:
+ *   const room = useCollabRoom({ url, user, adminSecret? });
+ *   room.addAnnotations([ann]);
+ *
+ * Effect deps: [url, adminSecret, user.id, enabled]. Change any and the hook
+ * tears down the client and creates a new one. For stable connections, consumers
+ * should memoize `user` (used by value) and avoid mutating `url`/`adminSecret`.
+ *
+ * Changes to user.name/color propagate via the next sendPresence() call without
+ * reconnecting.
+ *
+ * === Key-gated client ===
+ * The effect runs AFTER the render commits. So when url/adminSecret/user.id/
+ * enabled change, React could otherwise return a render of the previous
+ * authenticated state and old client before the effect fires. To prevent a
+ * click in that window sending to the wrong room, every read (state +
+ * requireClient) compares the CURRENT render's prop key against the key the
+ * stored client was created for. Mismatch returns DISCONNECTED_STATE /
+ * client: null / mutations throw unavailable-client.
+ *
+ * === Mutation contract (V1) ===
+ * Mutation methods (`addAnnotations`, `updateAnnotation`, `removeAnnotations`,
+ * `clearAnnotations`) resolve when the op is SENT to the server, not when
+ * local state has been updated. The returned `annotations` array reflects
+ * server-echoed state — awaiting `addAnnotations(...)` and then reading
+ * `annotations` synchronously may still show pre-echo state.
+ *
+ * For reactive UI, render from the returned `annotations` field; it updates
+ * via React state when the server echo arrives and is applied by the client.
+ * This mirrors `CollabRoomClient`'s `state` event contract.
+ */
+
+import { useCallback, useEffect, useRef, useState } from 'react';
+import {
+  joinRoom,
+  InvalidRoomUrlError,
+  InvalidAdminSecretError,
+  ConnectTimeoutError,
+  AuthRejectedError,
+  RoomUnavailableError,
+  type CollabRoomClient,
+  type CollabRoomState,
+  type CollabRoomUser,
+  type ConnectionStatus,
+} from '@plannotator/shared/collab/client';
+import type {
+  PresenceState,
+  RoomAnnotation,
+} from '@plannotator/shared/collab';
+
+export interface UseCollabRoomOptions {
+  /** Full room URL including #key= fragment. */
+  url: string;
+  /** base64url admin secret if not carried in URL. Hook does NOT persist. */
+  adminSecret?: string;
+  /** User identity. Consumer should memoize for stable reconnect behavior. */
+  user: CollabRoomUser;
+  /** Default true. When false, no connection is established. */
+  enabled?: boolean;
+}
+
+export interface UseCollabRoomReturn {
+  connectionStatus: ConnectionStatus;
+  /** True once the server closed our socket with the terminal "room unavailable" signal. */
+  roomUnavailable: boolean;
+  planMarkdown: string;
+  annotations: RoomAnnotation[];
+  /**
+   * Last server seq applied locally. Advances monotonically for every
+   * server-admitted op. Pending-op reconciliation in useAnnotationController
+   * uses this to detect "the server has processed past my send" without
+   * needing opId-level echo matching.
+   */
+  seq: number;
+  remotePresence: Record<string, PresenceState>;
+  hasAdminCapability: boolean;
+  lastError: { code: string; message: string; scope: 'mutation' | 'admin' | 'event' | 'presence' | 'snapshot' | 'join' } | null;
+  /**
+   * Monotonic id bumped on every NEW server-side error. Consumers that
+   * react to errors (e.g. annotation controller rejecting in-flight
+   * pending ops) MUST dedupe on this id — object identity is unstable
+   * across state emissions because the client clones `lastError`.
+   */
+  lastErrorId: number;
+
+  addAnnotations: (a: RoomAnnotation[]) => Promise<void>;
+  updateAnnotation: (id: string, patch: Partial<RoomAnnotation>) => Promise<void>;
+  removeAnnotations: (ids: string[]) => Promise<void>;
+  clearAnnotations: (source?: string) => Promise<void>;
+  updatePresence: (p: PresenceState) => Promise<void>;
+
+  deleteRoom: () => Promise<void>;
+
+  /**
+   * Escape hatch for advanced consumers. May be non-null before authentication
+   * completes (e.g. during the `connecting` / `authenticating` window); gate
+   * mutations on `connectionStatus === 'authenticated'` rather than on this
+   * field being non-null.
+   *
+   * Additionally, the hook key-gates this reference — if the current render's
+   * props (url/adminSecret/user.id/enabled) don't match the props the stored
+   * client was created for, this returns null to prevent sending to a stale
+   * room between render and the next effect run.
+   */
+  client: CollabRoomClient | null;
+}
+
+const DISCONNECTED_STATE: CollabRoomState = {
+  connectionStatus: 'disconnected',
+  roomUnavailable: false,
+  roomId: '',
+  clientId: '',
+  seq: 0,
+  planMarkdown: '',
+  annotations: [],
+  remotePresence: {},
+  hasAdminCapability: false,
+  lastError: null,
+  lastErrorId: 0,
+};
+
+/**
+ * Map joinRoom() / connect() errors to stable, UI-friendly codes so consumers
+ * can render actionable messages without string-matching `err.message`.
+ *
+ * Scope is 'join': these are join/connect-phase failures surfaced by the
+ * hook wrapper itself, not client-internal mutation or admin rejections.
+ * Consumers (annotation controller, RoomApp error banner) dedupe on
+ * `lastErrorId` and branch on `scope === 'join'` to distinguish
+ * "couldn't get into the room" from "server rejected my op."
+ */
+function mapJoinFailure(err: unknown): {
+  code: string;
+  message: string;
+  scope: 'mutation' | 'admin' | 'event' | 'presence' | 'snapshot' | 'join';
+} {
+  const scope = 'join' as const;
+  if (err instanceof InvalidRoomUrlError) return { code: 'invalid_room_url', message: err.message, scope };
+  if (err instanceof InvalidAdminSecretError) return { code: 'invalid_admin_secret', message: err.message, scope };
+  if (err instanceof ConnectTimeoutError) return { code: 'connect_timeout', message: err.message, scope };
+  if (err instanceof AuthRejectedError) return { code: 'auth_rejected', message: err.message, scope };
+  if (err instanceof RoomUnavailableError) return { code: 'room_unavailable', message: err.message, scope };
+  return { code: 'join_failed', message: err instanceof Error ? err.message : String(err), scope };
+}
+
+/**
+ * Serializable identity of the current hook props for comparison.
+ * JSON-array encoding avoids ambiguity around delimiters in url/user.id —
+ * this key is the ONLY barrier preventing a stale-room send, so it must be
+ * collision-proof regardless of what the caller passes.
+ */
+function roomKeyFor(url: string, adminSecret: string | undefined, userId: string, enabled: boolean): string {
+  return JSON.stringify([enabled, userId, adminSecret ?? null, url]);
+}
+
+export function useCollabRoom(options: UseCollabRoomOptions): UseCollabRoomReturn {
+  const { url, adminSecret, user, enabled = true } = options;
+  const currentKey = roomKeyFor(url, adminSecret, user.id, enabled);
+
+  const [state, setState] = useState<CollabRoomState>(DISCONNECTED_STATE);
+  const [stateKey, setStateKey] = useState<string>('');  // key the state belongs to
+  const clientRef = useRef<CollabRoomClient | null>(null);
+  const clientKeyRef = useRef<string>('');  // key the stored client was created for
+
+  // Keep user in a ref so mutation callbacks see latest name/color without
+  // triggering a reconnect. Reconnect only fires when user.id changes.
+  const userRef = useRef(user);
+  userRef.current = user;
+
+  // Monotonic counter for join-phase errors surfaced by this hook. The
+  // underlying client increments its own id for client-internal errors
+  // (mutation, admin, event, ...); join failures never reach that path
+  // because they happen before the client is wired up. Without a hook-owned
+  // counter, the failure branch would spread DISCONNECTED_STATE and leave
+  // `lastErrorId` at 0 — violating the contract that 0 means "no error has
+  // ever occurred" and breaking consumers that dedupe errors on id.
+  const joinErrorIdRef = useRef(0);
+
+  useEffect(() => {
+    // Reset synchronously on every dep change BEFORE any async setup. Between
+    // render and the async setup completing, key-gated reads below see
+    // DISCONNECTED_STATE / client: null for the new key so consumers can't
+    // send to the previous room.
+    clientRef.current = null;
+    clientKeyRef.current = '';
+    setState(DISCONNECTED_STATE);
+    setStateKey(currentKey);
+
+    if (!enabled) {
+      return;
+    }
+
+    const effectKey = currentKey;
+    let cancelled = false;
+    let unsubscribe: (() => void) | null = null;
+    let createdClient: CollabRoomClient | null = null;
+
+    (async () => {
+      try {
+        const client = await joinRoom({
+          url,
+          adminSecret,
+          user: userRef.current,
+          autoConnect: false,
+        });
+        createdClient = client;
+
+        if (cancelled) {
+          client.disconnect();
+          return;
+        }
+
+        clientRef.current = client;
+        clientKeyRef.current = effectKey;
+        unsubscribe = client.on('state', (s) => {
+          // React Strict Mode runs effects twice in dev: mount → cleanup → mount.
+          // The outgoing cleanup sets `cancelled = true` but does not unsubscribe
+          // listeners from the previous client synchronously before disconnect,
+          // and disconnect() may emit a final 'closed' state event on this
+          // listener's tick. Without this guard, that late emission would call
+          // React setters on a cleaned-up effect and produce noisy state/flicker
+          // (and is a teardown race under unmount-during-reconnect in prod too).
+          if (cancelled) return;
+          setState(s);
+          setStateKey(effectKey);
+        });
+
+        // Push initial state
+        setState(client.getState());
+        setStateKey(effectKey);
+
+        await client.connect();
+      } catch (err) {
+        // Unsubscribe BEFORE disconnecting so we don't receive a spurious
+        // 'closed' state event during teardown between the failure and the
+        // error surface below.
+        unsubscribe?.();
+        unsubscribe = null;
+        if (createdClient) {
+          try { createdClient.disconnect(); } catch { /* ignore */ }
+          if (clientRef.current === createdClient) {
+            clientRef.current = null;
+            clientKeyRef.current = '';
+          }
+        }
+        if (!cancelled) {
+          joinErrorIdRef.current += 1;
+          setState({
+            ...DISCONNECTED_STATE,
+            lastError: mapJoinFailure(err),
+            lastErrorId: joinErrorIdRef.current,
+          });
+          setStateKey(effectKey);
+        }
+      }
+    })();
+
+    return () => {
+      cancelled = true;
+      unsubscribe?.();
+      clientRef.current?.disconnect();
+      clientRef.current = null;
+      clientKeyRef.current = '';
+    };
+    // eslint-disable-next-line react-hooks/exhaustive-deps
+  }, [url, adminSecret, user.id, enabled]);
+
+  const requireClient = useCallback((): CollabRoomClient => {
+    const c = clientRef.current;
+    if (!c || clientKeyRef.current !== currentKey) {
+      throw new Error('Collab room client is not available (disabled, not yet connected, or room identity changed)');
+    }
+    return c;
+  }, [currentKey]);
+
+  const addAnnotations = useCallback(async (a: RoomAnnotation[]) => {
+    await requireClient().sendAnnotationAdd(a);
+  }, [requireClient]);
+  const updateAnnotation = useCallback(async (id: string, patch: Partial<RoomAnnotation>) => {
+    await requireClient().sendAnnotationUpdate(id, patch);
+  }, [requireClient]);
+  const removeAnnotations = useCallback(async (ids: string[]) => {
+    await requireClient().sendAnnotationRemove(ids);
+  }, [requireClient]);
+  const clearAnnotations = useCallback(async (source?: string) => {
+    await requireClient().sendAnnotationClear(source);
+  }, [requireClient]);
+  const updatePresence = useCallback(async (p: PresenceState) => {
+    await requireClient().sendPresence(p);
+  }, [requireClient]);
+  const deleteRoom = useCallback(async () => {
+    await requireClient().deleteRoom();
+  }, [requireClient]);
+
+  // Key-gate the returned state. If the hook's props have changed this render
+  // but the state was written against the previous key, return DISCONNECTED.
+  // Also gate the client escape hatch against the same key.
+  const stateForRender = stateKey === currentKey ? state : DISCONNECTED_STATE;
+  const clientForRender = clientKeyRef.current === currentKey ? clientRef.current : null;
+
+  return {
+    connectionStatus: stateForRender.connectionStatus,
+    roomUnavailable: stateForRender.roomUnavailable,
+    planMarkdown: stateForRender.planMarkdown,
+    annotations: stateForRender.annotations,
+    seq: stateForRender.seq,
+    remotePresence: stateForRender.remotePresence,
+    hasAdminCapability: stateForRender.hasAdminCapability,
+    lastError: stateForRender.lastError,
+    lastErrorId: stateForRender.lastErrorId,
+    addAnnotations,
+    updateAnnotation,
+    removeAnnotations,
+    clearAnnotations,
+    updatePresence,
+    deleteRoom,
+    client: clientForRender,
+  };
+}
diff --git a/packages/ui/hooks/collab/useCollabRoomSession.test.tsx b/packages/ui/hooks/collab/useCollabRoomSession.test.tsx
new file mode 100644
index 000000000..6057bbd3c
--- /dev/null
+++ b/packages/ui/hooks/collab/useCollabRoomSession.test.tsx
@@ -0,0 +1,59 @@
+import { describe, expect, test } from 'bun:test';
+import { renderHook } from '@testing-library/react';
+import { useCollabRoomSession } from './useCollabRoomSession';
+import type { CollabRoomUser } from '@plannotator/shared/collab/client';
+
+const USER: CollabRoomUser = { id: 'u1', name: 'alice', color: '#f00' };
+
+/**
+ * Join-only wrapper sanity. Full WebSocket lifecycle is covered by
+ * packages/shared/collab/client-runtime tests; here we check URL
+ * parsing and the share-link rebuild path.
+ */
+describe('useCollabRoomSession — join intent', () => {
+  test('starts in "ready" phase immediately (no HTTP)', () => {
+    // enabled:false to keep this shape-only — we're not exercising the
+    // WebSocket lifecycle here, just the wrapper's return shape. Leaving
+    // it enabled would open a real ws against localhost in the test env
+    // and surface an unhandled ws error between tests.
+    const { result } = renderHook(() =>
+      useCollabRoomSession({
+        intent: 'join',
+        url: 'http://localhost/c/room123#key=' + 'A'.repeat(43),
+        user: USER,
+        enabled: false,
+      }),
+    );
+    expect(result.current.phase).toBe('ready');
+    // room is present (useCollabRoom-returned object) even if connection is disabled.
+    expect(result.current.room).toBeDefined();
+    expect(result.current.joinUrl).toContain('/c/room123');
+  });
+
+  test('does not connect when disabled=false', async () => {
+    const { result } = renderHook(() =>
+      useCollabRoomSession({
+        intent: 'join',
+        url: 'http://localhost/c/room123#key=' + 'A'.repeat(43),
+        user: USER,
+        enabled: false,
+      }),
+    );
+    expect(result.current.phase).toBe('ready');
+    // useCollabRoom returns DISCONNECTED_STATE under enabled=false.
+    expect(result.current.room?.connectionStatus).toBe('disconnected');
+  });
+
+  test('surfaces "error" phase for an unparseable URL', () => {
+    const { result } = renderHook(() =>
+      useCollabRoomSession({
+        intent: 'join',
+        url: 'not-a-room-url',
+        user: USER,
+        enabled: false,
+      }),
+    );
+    expect(result.current.phase).toBe('error');
+    expect(result.current.error?.code).toBe('invalid_room_url');
+  });
+});
diff --git a/packages/ui/hooks/collab/useCollabRoomSession.ts b/packages/ui/hooks/collab/useCollabRoomSession.ts
new file mode 100644
index 000000000..dbb6ca520
--- /dev/null
+++ b/packages/ui/hooks/collab/useCollabRoomSession.ts
@@ -0,0 +1,154 @@
+/**
+ * useCollabRoomSession — join-intent wrapper around useCollabRoom.
+ *
+ * useCollabRoom supports the WebSocket join flow (parse URL →
+ * authenticate → subscribe). This wrapper adds URL parsing + admin URL
+ * reconstruction on top so RoomApp can render the participant/admin
+ * share links without re-implementing that logic.
+ *
+ * The create flow (createRoom → persist adminSecret → redirect) is NOT
+ * hosted here. It lives inline in `packages/editor/App.tsx`'s
+ * `handleConfirmStartRoom` because the browser requires
+ * `window.open('', '_blank')` to run synchronously inside the click
+ * handler's user-activation window; wrapping that in a hook would add
+ * an unavoidable React render boundary between click and open, which
+ * most browsers classify as untrusted and block. If the create flow
+ * ever needs to live elsewhere, it needs its own plan for the popup
+ * timing — do not move it back here as-is.
+ *
+ * Phases:
+ *   'ready'    — client constructed; useCollabRoom mounted. Not
+ *                necessarily authenticated yet — consumers watch
+ *                `room.connectionStatus`.
+ *   'error'    — URL failed to parse; `error` populated.
+ *
+ * Admin recovery: the caller may pass `adminSecretOverride` (base64url,
+ * typically read from sessionStorage via `loadAdminSecret`) when the
+ * URL fragment no longer carries `&admin=`. This lets a tab refresh
+ * re-enter as admin without re-including the admin secret in the
+ * address bar.
+ */
+
+import { useMemo } from 'react';
+import { useCollabRoom, type UseCollabRoomReturn } from './useCollabRoom';
+import {
+  parseRoomUrl,
+  buildRoomJoinUrl,
+  buildAdminRoomUrl,
+  type CollabRoomUser,
+} from '@plannotator/shared/collab/client';
+import { base64urlToBytes, ADMIN_SECRET_LENGTH_BYTES } from '@plannotator/shared/collab';
+
+export type CollabRoomSessionPhase = 'ready' | 'error';
+
+export interface UseCollabRoomSessionOptions {
+  intent: 'join';
+  url: string;
+  user: CollabRoomUser;
+  /** Default true. */
+  enabled?: boolean;
+  /** base64url; passed through to useCollabRoom if not already in the URL fragment. */
+  adminSecretOverride?: string;
+}
+
+export interface UseCollabRoomSessionReturn {
+  phase: CollabRoomSessionPhase;
+  room?: UseCollabRoomReturn;
+  /** Participant URL, rebuilt without any admin fragment. Safe to share. */
+  joinUrl?: string;
+  /** Present when the caller holds admin capability (URL or override). */
+  adminUrl?: string;
+  /** Resolved roomId. */
+  roomId?: string;
+  /**
+   * The room identity the caller passed in — mirrored here so the editor
+   * can stamp annotation `author` from the joined room display name
+   * instead of the local `getIdentity()` cookie, which may be stale or
+   * unset on room.plannotator.ai.
+   */
+  user?: CollabRoomUser;
+  /** Populated when phase === 'error'. */
+  error?: { code: string; message: string };
+}
+
+export function useCollabRoomSession(
+  options: UseCollabRoomSessionOptions,
+): UseCollabRoomSessionReturn {
+  const enabled = options.enabled ?? true;
+
+  const room = useCollabRoom({
+    url: options.url,
+    adminSecret: options.adminSecretOverride,
+    user: options.user,
+    enabled,
+  });
+
+  return useMemo<UseCollabRoomSessionReturn>(() => {
+    // `joinUrl` MUST be a participant-only URL — never the raw input URL,
+    // which may include `&admin=...`. We rebuild from the parsed roomId +
+    // roomSecret. When the parsed URL also carries an admin secret (the
+    // creator arrived via their admin URL), we rebuild the admin URL too
+    // so the RoomPanel's "Show admin recovery link" disclosure has
+    // something concrete to copy. Participants without admin capability
+    // see `adminUrl: undefined`.
+    //
+    // If parsing fails we surface the error phase rather than leak
+    // whatever the user pasted.
+    const parsed = parseRoomUrl(options.url);
+    if (!parsed) {
+      return { phase: 'error', error: { code: 'invalid_room_url', message: 'Invalid room URL' } };
+    }
+    const origin = safeOrigin(options.url);
+    const participantUrl = buildRoomJoinUrl(parsed.roomId, parsed.roomSecret, origin);
+    // Rebuild the admin URL from whichever source carries the admin
+    // secret: the URL fragment (creator's first visit) OR the
+    // adminSecretOverride prop (sessionStorage recovery on refresh).
+    // Without this fallback, a recovered admin can delete but the
+    // "Show admin recovery link" disclosure has nothing to copy —
+    // confusing because the admin controls work fine.
+    let adminSecretBytes: Uint8Array | undefined = parsed.adminSecret;
+    if (!adminSecretBytes && options.adminSecretOverride) {
+      try {
+        const decoded = base64urlToBytes(options.adminSecretOverride);
+        if (decoded.length === ADMIN_SECRET_LENGTH_BYTES) adminSecretBytes = decoded;
+      } catch { /* invalid override — ignore, admin URL stays undefined */ }
+    }
+    const adminUrl = adminSecretBytes
+      ? buildAdminRoomUrl(parsed.roomId, parsed.roomSecret, adminSecretBytes, origin)
+      : undefined;
+    return {
+      phase: 'ready',
+      room,
+      joinUrl: participantUrl,
+      adminUrl,
+      roomId: parsed.roomId,
+      user: options.user,
+    };
+  // Deps use stable individual values — NOT `options` (unstable object
+  // identity from inline JSX). Without this, cursor presence updates
+  // (~20Hz) would re-render RoomApp → fresh options → useMemo churn →
+  // new roomSession prop into App → full editor tree reconciliation.
+  // eslint-disable-next-line react-hooks/exhaustive-deps
+  }, [
+    room,
+    options.url,
+    options.adminSecretOverride ?? '',
+    // Track user name/color changes so the `user` field we expose
+    // on the return reflects mid-session rename (unlikely but cheap).
+    options.user.id, options.user.name, options.user.color, enabled,
+  ]);
+}
+
+/**
+ * Extract `origin` (scheme + host + port) from a URL without throwing.
+ * Used so `buildRoomJoinUrl` produces a URL on the same host the user
+ * is currently on, not the default `https://room.plannotator.ai` hardcoded
+ * in `DEFAULT_BASE_URL`.
+ */
+function safeOrigin(url: string): string | undefined {
+  try {
+    return new URL(url).origin;
+  } catch {
+    return undefined;
+  }
+}
diff --git a/packages/ui/hooks/collab/useLandingCreateRoom.ts b/packages/ui/hooks/collab/useLandingCreateRoom.ts
new file mode 100644
index 000000000..f21e28b73
--- /dev/null
+++ b/packages/ui/hooks/collab/useLandingCreateRoom.ts
@@ -0,0 +1,94 @@
+import { useCallback, useRef, useState } from 'react';
+
+export interface LandingCreateRoomSubmit {
+  displayName: string;
+  color: string;
+  expiresInDays: 0 | 1 | 7 | 30;
+}
+
+export interface UseLandingCreateRoomOptions {
+  markdown: string;
+}
+
+export interface UseLandingCreateRoomReturn {
+  inFlight: boolean;
+  error: string;
+  handleCreate: (submit: LandingCreateRoomSubmit) => Promise<void>;
+  handleCancel: () => void;
+}
+
+export function useLandingCreateRoom({
+  markdown,
+}: UseLandingCreateRoomOptions): UseLandingCreateRoomReturn {
+  const [inFlight, setInFlight] = useState(false);
+  const [error, setError] = useState('');
+  const abortRef = useRef<AbortController | null>(null);
+
+  const handleCancel = useCallback(() => {
+    abortRef.current?.abort();
+    abortRef.current = null;
+    setInFlight(false);
+  }, []);
+
+  const handleCreate = useCallback(async (submit: LandingCreateRoomSubmit) => {
+    setInFlight(true);
+    setError('');
+
+    const ctrl = new AbortController();
+    abortRef.current = ctrl;
+
+    try {
+      const { createRoom } = await import('@plannotator/shared/collab/client');
+      const { bytesToBase64url } = await import('@plannotator/shared/collab');
+      const { storeAdminSecret } = await import('@plannotator/ui/utils/adminSecretStorage');
+
+      const baseUrl = window.location.origin;
+
+      const result = await createRoom({
+        baseUrl,
+        expiresInDays: submit.expiresInDays,
+        signal: ctrl.signal,
+        initialSnapshot: {
+          versionId: 'v1',
+          planMarkdown: markdown,
+          annotations: [],
+        },
+        user: {
+          id: crypto.randomUUID(),
+          name: submit.displayName,
+          color: submit.color,
+        },
+      });
+
+      if (ctrl.signal.aborted) return;
+
+      storeAdminSecret(result.roomId, bytesToBase64url(result.adminSecret));
+
+      try {
+        await navigator.clipboard.writeText(result.joinUrl);
+      } catch { /* best-effort */ }
+
+      const appendFragment = (url: string, param: string): string =>
+        `${url}${url.includes('#') ? '&' : '#'}${param}`;
+      let safeUrl = result.joinUrl;
+      if (submit.displayName) {
+        safeUrl = appendFragment(safeUrl, `name=${encodeURIComponent(submit.displayName)}`);
+      }
+      if (submit.color) {
+        safeUrl = appendFragment(safeUrl, `color=${encodeURIComponent(submit.color)}`);
+      }
+
+      window.location.replace(safeUrl);
+    } catch (err) {
+      if (ctrl.signal.aborted) return;
+      const { redactRoomSecrets } = await import('@plannotator/shared/collab');
+      const msg = err instanceof Error ? err.message : String(err);
+      setError(redactRoomSecrets(msg) || 'Failed to create room');
+      setInFlight(false);
+    } finally {
+      if (abortRef.current === ctrl) abortRef.current = null;
+    }
+  }, [markdown]);
+
+  return { inFlight, error, handleCreate, handleCancel };
+}
diff --git a/packages/ui/hooks/collab/usePresenceThrottle.test.tsx b/packages/ui/hooks/collab/usePresenceThrottle.test.tsx
new file mode 100644
index 000000000..29169175c
--- /dev/null
+++ b/packages/ui/hooks/collab/usePresenceThrottle.test.tsx
@@ -0,0 +1,115 @@
+import { describe, expect, test, mock } from 'bun:test';
+import { renderHook } from '@testing-library/react';
+import { usePresenceThrottle } from './usePresenceThrottle';
+
+const TICK = 60;  // buffer above the 50ms throttle window for test timing
+
+function sleep(ms: number) {
+  return new Promise<void>(r => setTimeout(r, ms));
+}
+
+describe('usePresenceThrottle', () => {
+  test('sends the first non-null state (after trailing delay)', async () => {
+    const send = mock((_v: string) => {});
+    const { rerender } = renderHook(
+      ({ state }: { state: string | null }) => usePresenceThrottle(state, send, 50),
+      { initialProps: { state: 'a' as string | null } },
+    );
+    await sleep(TICK);
+    expect(send).toHaveBeenCalledTimes(1);
+    expect(send.mock.calls[0][0]).toBe('a');
+    rerender({ state: 'a' });
+  });
+
+  test('collapses a rapid burst to a single trailing send carrying the latest value', async () => {
+    const send = mock((_v: number) => {});
+    const { rerender } = renderHook(
+      ({ state }: { state: number | null }) => usePresenceThrottle(state, send, 50),
+      { initialProps: { state: 1 as number | null } },
+    );
+
+    // Immediately bump the state several times within the throttle window.
+    rerender({ state: 2 });
+    rerender({ state: 3 });
+    rerender({ state: 4 });
+
+    await sleep(TICK);
+    // Single send with the last value in the burst.
+    expect(send).toHaveBeenCalledTimes(1);
+    expect(send.mock.calls[0][0]).toBe(4);
+  });
+
+  test('allows a second send after the throttle window elapses', async () => {
+    const send = mock((_v: string) => {});
+    const { rerender } = renderHook(
+      ({ state }: { state: string | null }) => usePresenceThrottle(state, send, 50),
+      { initialProps: { state: 'a' as string | null } },
+    );
+    await sleep(TICK);
+    expect(send).toHaveBeenCalledTimes(1);
+
+    rerender({ state: 'b' });
+    await sleep(TICK);
+    expect(send).toHaveBeenCalledTimes(2);
+    expect(send.mock.calls[1][0]).toBe('b');
+  });
+
+  test('null cancels any pending send', async () => {
+    const send = mock((_v: string) => {});
+    const { rerender } = renderHook(
+      ({ state }: { state: string | null }) => usePresenceThrottle(state, send, 50),
+      { initialProps: { state: 'a' as string | null } },
+    );
+    // Before the trailing timer fires, transition to null.
+    rerender({ state: null });
+    await sleep(TICK);
+    expect(send).not.toHaveBeenCalled();
+  });
+
+  test('no-op when send is undefined', async () => {
+    let sendCalls = 0;
+    const _fn = () => { sendCalls++; };
+    const { rerender } = renderHook(
+      ({ state, send }: { state: string | null; send: ((v: string) => void) | undefined }) =>
+        usePresenceThrottle(state, send, 50),
+      { initialProps: { state: 'a' as string | null, send: undefined as ((v: string) => void) | undefined } },
+    );
+    await sleep(TICK);
+    expect(sendCalls).toBe(0);
+
+    // Attach send later; next state change should send.
+    rerender({ state: 'b', send: _fn });
+    await sleep(TICK);
+    expect(sendCalls).toBe(1);
+  });
+
+  test('cancels pending timer on unmount', async () => {
+    const send = mock((_v: string) => {});
+    const { rerender, unmount } = renderHook(
+      ({ state }: { state: string | null }) => usePresenceThrottle(state, send, 50),
+      { initialProps: { state: 'a' as string | null } },
+    );
+    rerender({ state: 'b' });  // schedule a send
+    unmount();
+    await sleep(TICK);
+    expect(send).not.toHaveBeenCalled();
+  });
+
+  test('swallows throwing send so the throttle does not wedge', async () => {
+    let callCount = 0;
+    const send = (_: string) => {
+      callCount++;
+      if (callCount === 1) throw new Error('boom');
+    };
+    const { rerender } = renderHook(
+      ({ state }: { state: string | null }) => usePresenceThrottle(state, send, 50),
+      { initialProps: { state: 'a' as string | null } },
+    );
+    await sleep(TICK);
+    expect(callCount).toBe(1);
+
+    rerender({ state: 'b' });
+    await sleep(TICK);
+    expect(callCount).toBe(2);
+  });
+});
diff --git a/packages/ui/hooks/collab/usePresenceThrottle.ts b/packages/ui/hooks/collab/usePresenceThrottle.ts
new file mode 100644
index 000000000..aaa8aaba5
--- /dev/null
+++ b/packages/ui/hooks/collab/usePresenceThrottle.ts
@@ -0,0 +1,83 @@
+/**
+ * Trailing-throttle presence updates to a send function.
+ *
+ * Motivation: remote cursor presence is produced by pointermove/selection
+ * events that fire far faster than we should transmit. Policy is a
+ * 50ms trailing throttle (≈20Hz). Presence is lossy — the runtime swallows
+ * disconnect errors inside `sendPresence`, so latest-cursor-wins is fine.
+ *
+ * Contract:
+ * - When `state` changes, schedule `send(state)`.
+ *   - If the last send was > `ms` ago, schedule it for next tick (so the
+ *     trailing debouncer collapses rapid bursts to at most one send per
+ *     `ms` window).
+ *   - Otherwise push out the trailing timer so the eventual send carries
+ *     the freshest state.
+ * - `state: null` cancels any pending send without emitting.
+ * - `send: undefined` is a no-op (not yet connected; wait for reconnect).
+ * - On unmount / dep change, cancel any pending timer — no leaked sends.
+ */
+
+import { useEffect, useRef } from 'react';
+
+export function usePresenceThrottle<T>(
+  state: T | null,
+  send: ((value: T) => unknown) | undefined,
+  ms: number = 50,
+): void {
+  const lastSentAtRef = useRef<number>(0);
+  const timerRef = useRef<ReturnType<typeof setTimeout> | null>(null);
+  const latestRef = useRef<T | null>(null);
+  const sendRef = useRef(send);
+
+  // Keep sendRef current so the trailing timer uses the latest send fn
+  // without resetting the throttle window when the callback identity changes
+  // (parents often pass inline lambdas).
+  sendRef.current = send;
+
+  useEffect(() => {
+    latestRef.current = state;
+
+    if (state === null) {
+      if (timerRef.current !== null) {
+        clearTimeout(timerRef.current);
+        timerRef.current = null;
+      }
+      return;
+    }
+
+    if (!sendRef.current) return;
+
+    const now = Date.now();
+    const elapsed = now - lastSentAtRef.current;
+    const delay = elapsed >= ms ? 0 : ms - elapsed;
+
+    if (timerRef.current !== null) {
+      clearTimeout(timerRef.current);
+    }
+    timerRef.current = setTimeout(() => {
+      timerRef.current = null;
+      const value = latestRef.current;
+      const fn = sendRef.current;
+      if (value === null || !fn) return;
+      lastSentAtRef.current = Date.now();
+      try {
+        fn(value);
+      } catch {
+        // Sends are lossy by contract; swallow errors so a throwing send
+        // doesn't wedge the throttle.
+      }
+    }, delay);
+  }, [state, ms]);
+
+  // Cleanup on unmount: cancel any pending timer so an already-scheduled
+  // send cannot fire against a detached component.
+  useEffect(() => {
+    return () => {
+      if (timerRef.current !== null) {
+        clearTimeout(timerRef.current);
+        timerRef.current = null;
+      }
+    };
+  }, []);
+}
diff --git a/packages/ui/hooks/collab/useRoomAdminActions.ts b/packages/ui/hooks/collab/useRoomAdminActions.ts
new file mode 100644
index 000000000..50e294f8d
--- /dev/null
+++ b/packages/ui/hooks/collab/useRoomAdminActions.ts
@@ -0,0 +1,58 @@
+/**
+ * Owns the UI-facing state around the delete command: the in-flight
+ * action (for button disabling + "…ing" labels) and the most recent
+ * failure (for the toast surface).
+ *
+ * State is single-slot by design: one pending action at a time, one
+ * "last error" slot cleared on the next attempt or manual dismiss.
+ * Admin commands are rare and user-initiated; a history queue would
+ * be overengineering for V1.
+ */
+
+import { useCallback, useState } from 'react';
+import type { UseCollabRoomReturn } from './useCollabRoom';
+
+/**
+ * Discriminant for in-flight admin commands. Consumed by the menu,
+ * the pending-state chrome, and the error toast so each surface can
+ * label itself consistently. V1 has a single admin action (delete);
+ * the discriminant is preserved so a future action can slot in without
+ * reshaping every surface that rendered "Failed to delete" etc.
+ */
+export type AdminAction = 'delete';
+
+export interface UseRoomAdminActionsReturn {
+  /** Action currently in flight, if any. Drives button disabled + label. */
+  pending: AdminAction | undefined;
+  /** Most recent failure; null when clear. */
+  error: { action: AdminAction; message: string } | null;
+  /** Dispatch an admin command. No-op when `room` is undefined. */
+  run(action: AdminAction): Promise<void>;
+  /** Clear the current error manually (user dismiss from toast). */
+  dismissError(): void;
+}
+
+export function useRoomAdminActions(
+  room: UseCollabRoomReturn | undefined,
+): UseRoomAdminActionsReturn {
+  const [pending, setPending] = useState<AdminAction | undefined>();
+  const [error, setError] = useState<{ action: AdminAction; message: string } | null>(null);
+
+  const run = useCallback(async (action: AdminAction) => {
+    if (!room) return;
+    setPending(action);
+    setError(null);
+    try {
+      if (action === 'delete') await room.deleteRoom();
+    } catch (err) {
+      const message = err instanceof Error ? err.message : String(err);
+      setError({ action, message });
+    } finally {
+      setPending(undefined);
+    }
+  }, [room]);
+
+  const dismissError = useCallback(() => setError(null), []);
+
+  return { pending, error, run, dismissError };
+}
diff --git a/packages/ui/hooks/collab/useRoomMode.test.tsx b/packages/ui/hooks/collab/useRoomMode.test.tsx
new file mode 100644
index 000000000..517613fa2
--- /dev/null
+++ b/packages/ui/hooks/collab/useRoomMode.test.tsx
@@ -0,0 +1,111 @@
+import { afterEach, beforeEach, describe, expect, test } from 'bun:test';
+import { renderHook } from '@testing-library/react';
+import { useRoomMode } from './useRoomMode';
+import { generateRoomSecret, generateAdminSecret } from '@plannotator/shared/collab';
+import { buildRoomJoinUrl, buildAdminRoomUrl } from '@plannotator/shared/collab/client';
+
+// happy-dom exposes the History API via window.location.href assignment and
+// history.replaceState. We use the latter so the roomId in the path is valid
+// without forcing a full navigation.
+function setLocation(url: string) {
+  window.history.replaceState(null, '', url);
+}
+
+// Note: parseRoomUrl accepts any non-empty pathname segment as a room ID.
+// The server's stricter 22-char base64url check (isRoomId in validation.ts)
+// runs at WebSocket upgrade time; the client parser is intentionally lenient
+// so parse failures surface as 'invalid-room' (missing key/fragment) rather
+// than roomId-shape errors.
+const ROOM_ID = 'ROOM123';
+
+describe('useRoomMode', () => {
+  const originalHref = 'http://localhost/';
+
+  beforeEach(() => {
+    setLocation(originalHref);
+  });
+
+  afterEach(() => {
+    setLocation(originalHref);
+  });
+
+  test('returns local mode on plain "/" with no fragment', () => {
+    setLocation('http://localhost/');
+    const { result } = renderHook(() => useRoomMode());
+    expect(result.current).toEqual({ mode: 'local' });
+  });
+
+  test('returns room mode for a well-formed /c/:roomId#key= URL', () => {
+    const secret = generateRoomSecret();
+    const url = buildRoomJoinUrl(ROOM_ID, secret, 'http://localhost');
+    setLocation(url);
+
+    const { result } = renderHook(() => useRoomMode());
+    expect(result.current.mode).toBe('room');
+    if (result.current.mode === 'room') {
+      expect(result.current.roomId).toBe(ROOM_ID);
+      expect(result.current.url).toBe(url);
+    }
+  });
+
+  test('returns room mode for a URL with both key and admin', () => {
+    const secret = generateRoomSecret();
+    const admin = generateAdminSecret();
+    const url = buildAdminRoomUrl(ROOM_ID, secret, admin, 'http://localhost');
+    setLocation(url);
+
+    const { result } = renderHook(() => useRoomMode());
+    expect(result.current.mode).toBe('room');
+    if (result.current.mode === 'room') {
+      expect(result.current.roomId).toBe(ROOM_ID);
+    }
+  });
+
+  test('returns invalid-room on /c/:roomId with no fragment (not local)', () => {
+    setLocation('http://localhost/c/ROOM123');
+    const { result } = renderHook(() => useRoomMode());
+    expect(result.current.mode).toBe('invalid-room');
+  });
+
+  test('returns invalid-room on /c/:roomId with malformed key (too short)', () => {
+    setLocation('http://localhost/c/ROOM123#key=AAAA');
+    const { result } = renderHook(() => useRoomMode());
+    expect(result.current.mode).toBe('invalid-room');
+  });
+
+  test('returns invalid-room when key is not valid base64url', () => {
+    setLocation('http://localhost/c/ROOM123#key=!!!invalid!!!');
+    const { result } = renderHook(() => useRoomMode());
+    expect(result.current.mode).toBe('invalid-room');
+  });
+
+  test('returns invalid-room when admin param is malformed', () => {
+    const secret = generateRoomSecret();
+    const keyParam = buildRoomJoinUrl(ROOM_ID, secret, 'http://localhost').split('#key=')[1];
+    setLocation(`http://localhost/c/${ROOM_ID}#key=${keyParam}&admin=short`);
+    const { result } = renderHook(() => useRoomMode());
+    expect(result.current.mode).toBe('invalid-room');
+  });
+
+  test('returns local mode for non-/c/ paths with a key fragment', () => {
+    const secret = generateRoomSecret();
+    const keyParam = buildRoomJoinUrl(ROOM_ID, secret, 'http://localhost').split('#key=')[1];
+    setLocation(`http://localhost/other/path#key=${keyParam}`);
+    const { result } = renderHook(() => useRoomMode());
+    expect(result.current).toEqual({ mode: 'local' });
+  });
+
+  test('ignores hashchange after initial mount (value is cached)', () => {
+    const secret = generateRoomSecret();
+    const url = buildRoomJoinUrl(ROOM_ID, secret, 'http://localhost');
+    setLocation(url);
+    const { result, rerender } = renderHook(() => useRoomMode());
+    expect(result.current.mode).toBe('room');
+
+    // Navigate away AFTER mount — the hook holds its initial read and does
+    // not re-subscribe. Slice 5 contract: mode changes require a full reload.
+    setLocation('http://localhost/');
+    rerender();
+    expect(result.current.mode).toBe('room');
+  });
+});
diff --git a/packages/ui/hooks/collab/useRoomMode.ts b/packages/ui/hooks/collab/useRoomMode.ts
new file mode 100644
index 000000000..d3f5d12f1
--- /dev/null
+++ b/packages/ui/hooks/collab/useRoomMode.ts
@@ -0,0 +1,68 @@
+/**
+ * Detect whether the editor is running in live-room mode, local mode, or
+ * a broken-room-link state that must NOT fall through to local mode.
+ *
+ * Three-way return:
+ *   - `{ mode: 'room', roomId, url }`: the URL is `/c/<roomId>` AND
+ *     parseRoomUrl succeeds (valid 32-byte roomSecret in the fragment).
+ *   - `{ mode: 'invalid-room', reason }`: the URL is a room-shaped path
+ *     (`/c/...` or any `/c/*` variant) but parseRoomUrl fails — missing
+ *     fragment, malformed key, invalid base64url encoding, or extra path
+ *     segments. Note: parseRoomUrl does NOT enforce the server's 22-char
+ *     base64url roomId contract (see validation.ts `isRoomId`); the
+ *     server rejects invalid roomIds at the WebSocket upgrade step
+ *     before the client even authenticates. AppRoot renders a terminal
+ *     error instead of booting
+ *     the local editor. This closes the "public room origin boots local
+ *     app on a broken link" loophole — a user landing on
+ *     room.plannotator.ai/c/<foo> with no #key should see "this link
+ *     looks broken", not the full local editor with no plan.
+ *   - `{ mode: 'local' }`: everything else (bare `/`, `/about`, etc.).
+ *     Callers that are sure the origin is room-only (i.e., Cloudflare
+ *     deployment) can ignore this branch; AppRoot still renders it for
+ *     dev/test scenarios where the room bundle gets loaded at `/`.
+ *
+ * Parses once on mount. Mode transitions require a full reload — the
+ * two shells own substantially different state machines.
+ *
+ * SSR-safe: returns local mode if `window` is undefined.
+ */
+
+import { useState } from 'react';
+import { parseRoomUrl } from '@plannotator/shared/collab/client';
+
+export type RoomMode =
+  | { mode: 'local' }
+  | { mode: 'room'; roomId: string; url: string }
+  | { mode: 'invalid-room'; reason: string };
+
+const ROOM_PATH_RE = /^\/c(\/|$)/;
+
+export function useRoomMode(): RoomMode {
+  const [value] = useState<RoomMode>(() => {
+    if (typeof window === 'undefined') return { mode: 'local' };
+
+    const href = window.location.href;
+    const pathname = window.location.pathname;
+
+    // Path doesn't look room-shaped at all → local mode.
+    if (!ROOM_PATH_RE.test(pathname)) {
+      return { mode: 'local' };
+    }
+
+    // Path starts with /c/ — it's claiming to be a room URL. From here
+    // every failure is an 'invalid-room' (NOT a silent fallthrough to
+    // local), so a public room origin never renders the full local
+    // editor for malformed inputs.
+    const parsed = parseRoomUrl(href);
+    if (!parsed) {
+      return {
+        mode: 'invalid-room',
+        reason:
+          'This room link is missing or malformed. Check that the URL includes a valid #key= fragment.',
+      };
+    }
+    return { mode: 'room', roomId: parsed.roomId, url: href };
+  });
+  return value;
+}
diff --git a/packages/ui/hooks/useAnnotationController.room.test.tsx b/packages/ui/hooks/useAnnotationController.room.test.tsx
new file mode 100644
index 000000000..01aec6447
--- /dev/null
+++ b/packages/ui/hooks/useAnnotationController.room.test.tsx
@@ -0,0 +1,465 @@
+import { act } from 'react';
+import { describe, expect, test } from 'bun:test';
+import { renderHook } from '@testing-library/react';
+import { useRoomAnnotationController } from './useAnnotationController';
+import { AnnotationType, type Annotation } from '../types';
+import type { UseCollabRoomReturn } from './collab/useCollabRoom';
+import type { RoomAnnotation } from '@plannotator/shared/collab';
+
+function makeAnn(id: string, overrides: Partial<Annotation> = {}): Annotation {
+  return {
+    id,
+    blockId: 'b1',
+    startOffset: 0,
+    endOffset: 5,
+    type: AnnotationType.COMMENT,
+    text: `text ${id}`,
+    originalText: 'hello',
+    createdA: Date.now(),
+    ...overrides,
+  };
+}
+
+/**
+ * Build a UseCollabRoomReturn stub. Tests control `annotations` and `seq`
+ * via mutator functions, then rerender with the same room reference — the
+ * controller reads via getters so mutations land in the next render
+ * without rebuilding the stub.
+ */
+function mockRoom(initial: {
+  annotations?: RoomAnnotation[];
+  seq?: number;
+}): {
+  room: UseCollabRoomReturn;
+  setAnnotations(next: RoomAnnotation[]): void;
+  setSeq(next: number): void;
+  /** Advance room state: new annotations + new seq in one mutation. */
+  advance(next: RoomAnnotation[], seqDelta?: number): void;
+  /** Raise a new server-side error (simulates room.error wire message). */
+  emitError(
+    code: string,
+    message: string,
+    scope?: 'mutation' | 'admin' | 'event' | 'presence' | 'snapshot' | 'join',
+  ): void;
+  calls: { method: string; args: unknown[] }[];
+  makeSendFail(shouldFail: boolean): void;
+} {
+  let annotations = initial.annotations ?? [];
+  let seq = initial.seq ?? 0;
+  let lastError: { code: string; message: string; scope: 'mutation' | 'admin' | 'event' | 'presence' | 'snapshot' | 'join' } | null = null;
+  let lastErrorId = 0;
+  let shouldFail = false;
+  const calls: { method: string; args: unknown[] }[] = [];
+
+  const record = (method: string, args: unknown[]) => {
+    calls.push({ method, args });
+  };
+  const maybeFail = async (method: string, args: unknown[]) => {
+    record(method, args);
+    if (shouldFail) throw new Error(`simulated failure for ${method}`);
+  };
+
+  const makeReturn = (): UseCollabRoomReturn => ({
+    connectionStatus: 'authenticated',
+    roomUnavailable: false,
+    planMarkdown: '',
+    get annotations() { return annotations; },
+    get seq() { return seq; },
+    remotePresence: {},
+    hasAdminCapability: false,
+    get lastError() { return lastError; },
+    get lastErrorId() { return lastErrorId; },
+    addAnnotations: async (a) => maybeFail('addAnnotations', [a]),
+    updateAnnotation: async (id, patch) => maybeFail('updateAnnotation', [id, patch]),
+    removeAnnotations: async (ids) => maybeFail('removeAnnotations', [ids]),
+    clearAnnotations: async (src) => maybeFail('clearAnnotations', [src]),
+    updatePresence: async () => {},
+    deleteRoom: async () => {},
+    client: null,
+  });
+
+  return {
+    room: makeReturn(),
+    setAnnotations: (next) => { annotations = next; },
+    setSeq: (next) => { seq = next; },
+    advance: (next, delta = 1) => { annotations = next; seq += delta; },
+    emitError: (code, message, scope = 'mutation') => {
+      lastError = { code, message, scope };
+      lastErrorId++;
+    },
+    calls,
+    makeSendFail: (v) => { shouldFail = v; },
+  };
+}
+
+describe('useRoomAnnotationController', () => {
+  test('mode is "room"', () => {
+    const m = mockRoom({});
+    const { result } = renderHook(
+      ({ room }) => useRoomAnnotationController(room),
+      { initialProps: { room: m.room } },
+    );
+    expect(result.current.mode).toBe('room');
+  });
+
+  test('add() marks pending + populates pendingAdditions; NOT annotations, NOT echoed yet', async () => {
+    const m = mockRoom({ seq: 0 });
+    const { result, rerender } = renderHook(
+      ({ room }) => useRoomAnnotationController(room),
+      { initialProps: { room: m.room } },
+    );
+
+    const ann = makeAnn('a1');
+    await act(async () => {
+      result.current.add(ann);
+    });
+    // Canonical annotations stay server-only — V1 server-authoritative.
+    expect(result.current.annotations.some(a => a.id === 'a1')).toBe(false);
+    // Optimistic row is surfaced via pendingAdditions for panel rendering.
+    expect(result.current.pendingAdditions.has('a1')).toBe(true);
+    expect(result.current.pending.get('a1')?.kind).toBe('add');
+    expect(m.calls.some(c => c.method === 'addAnnotations')).toBe(true);
+
+    // Server applies — seq advances and id appears in room.annotations.
+    m.advance([toRoomAnnotation(ann)]);
+    await act(async () => { rerender({ room: m.room }); });
+    expect(result.current.pending.has('a1')).toBe(false);
+    // Optimistic buffer dropped; canonical list now holds the echo.
+    expect(result.current.annotations.filter(a => a.id === 'a1').length).toBe(1);
+    expect(result.current.pendingAdditions.has('a1')).toBe(false);
+  });
+
+  test('add pending does NOT clear on an unrelated seq advance', async () => {
+    // An unrelated peer's op advances seq while our add is still in flight.
+    // Canonical annotations get a different id from the peer; our id still
+    // hasn't echoed. Pending MUST stay set so the optimistic row keeps its
+    // "Sending…" chrome instead of silently demoting to a normal row.
+    const m = mockRoom({ seq: 5 });
+    const { result, rerender } = renderHook(
+      ({ room }) => useRoomAnnotationController(room),
+      { initialProps: { room: m.room } },
+    );
+
+    const mine = makeAnn('mine');
+    await act(async () => { result.current.add(mine); });
+    expect(result.current.pending.has('mine')).toBe(true);
+
+    // Peer's op bumps seq and adds their annotation — our id is absent.
+    const theirs = makeAnn('theirs');
+    m.advance([toRoomAnnotation(theirs)]);
+    await act(async () => { rerender({ room: m.room }); });
+
+    expect(result.current.pending.get('mine')?.kind).toBe('add');
+    expect(result.current.pendingAdditions.has('mine')).toBe(true);
+  });
+
+  test('server-side rejection (room.error) moves in-flight pending to failed', async () => {
+    // Transport promise resolves on SEND, so sendOp doesn't reject when
+    // the server later rejects the op. The controller must observe
+    // room.lastError to transition pending → failed, otherwise the row
+    // would sit as "Sending…" forever.
+    const m = mockRoom({ seq: 1 });
+    const { result, rerender } = renderHook(
+      ({ room }) => useRoomAnnotationController(room),
+      { initialProps: { room: m.room } },
+    );
+
+    await act(async () => { result.current.add(makeAnn('failed-add')); });
+    expect(result.current.pending.has('failed-add')).toBe(true);
+
+    m.emitError('validation_error', 'Malformed annotation payload');
+    await act(async () => { rerender({ room: m.room }); });
+
+    expect(result.current.pending.has('failed-add')).toBe(false);
+    const failure = result.current.failed.get('failed-add');
+    expect(failure?.kind).toBe('add');
+    expect(failure?.error).toContain('validation_error');
+    // Row remains in pendingAdditions so Retry/Discard can render.
+    expect(result.current.pendingAdditions.has('failed-add')).toBe(true);
+  });
+
+  test('server-side rejection also catches update and remove', async () => {
+    const a = makeAnn('u-edit', { text: 'before' });
+    const b = makeAnn('u-rm');
+    const m = mockRoom({
+      annotations: [toRoomAnnotation(a), toRoomAnnotation(b)],
+      seq: 2,
+    });
+    const { result, rerender } = renderHook(
+      ({ room }) => useRoomAnnotationController(room),
+      { initialProps: { room: m.room } },
+    );
+
+    await act(async () => {
+      result.current.update('u-edit', { text: 'after' });
+      result.current.remove('u-rm');
+    });
+    expect(result.current.pending.size).toBe(2);
+
+    m.emitError('validation_error', 'bad payload');
+    await act(async () => { rerender({ room: m.room }); });
+
+    expect(result.current.pending.size).toBe(0);
+    expect(result.current.failed.has('u-edit')).toBe(true);
+    expect(result.current.failed.has('u-rm')).toBe(true);
+  });
+
+  test('non-mutation error scopes (presence/snapshot/event/join) do NOT fail pending ops', async () => {
+    // A peer's malformed presence frame or a local snapshot decode
+    // failure is not a rejection of OUR sends. Only server-sent
+    // 'mutation'-scoped errors must move pending → failed.
+    const m = mockRoom({ seq: 3 });
+    const { result, rerender } = renderHook(
+      ({ room }) => useRoomAnnotationController(room),
+      { initialProps: { room: m.room } },
+    );
+    await act(async () => { result.current.add(makeAnn('still-pending')); });
+    expect(result.current.pending.has('still-pending')).toBe(true);
+
+    m.emitError('presence_malformed', 'peer bad presence', 'presence');
+    await act(async () => { rerender({ room: m.room }); });
+    expect(result.current.pending.has('still-pending')).toBe(true);
+    expect(result.current.failed.has('still-pending')).toBe(false);
+
+    m.emitError('event_decrypt_failed', 'peer event failed', 'event');
+    await act(async () => { rerender({ room: m.room }); });
+    expect(result.current.pending.has('still-pending')).toBe(true);
+
+    m.emitError('snapshot_malformed', 'bad snapshot', 'snapshot');
+    await act(async () => { rerender({ room: m.room }); });
+    expect(result.current.pending.has('still-pending')).toBe(true);
+  });
+
+  test('admin-scoped errors do NOT trip mutation pending → failed', async () => {
+    // A failed admin-scope command (e.g. delete) must not mark racing
+    // annotation sends as failed. The controller filters by scope.
+    const m = mockRoom({ seq: 1 });
+    const { result, rerender } = renderHook(
+      ({ room }) => useRoomAnnotationController(room),
+      { initialProps: { room: m.room } },
+    );
+    await act(async () => { result.current.add(makeAnn('ann-safe')); });
+    expect(result.current.pending.has('ann-safe')).toBe(true);
+
+    m.emitError('delete_failed', 'admin delete rejected', 'admin');
+    await act(async () => { rerender({ room: m.room }); });
+
+    // Pending should STAY pending — admin error didn't reject the add.
+    expect(result.current.pending.has('ann-safe')).toBe(true);
+    expect(result.current.failed.has('ann-safe')).toBe(false);
+  });
+
+  test('a single error is processed exactly once (dedup by lastErrorId)', async () => {
+    // Simulate the CollabRoomClient re-emitting state with a cloned
+    // lastError object: the object identity changes every render but
+    // lastErrorId does not. The controller must not double-process.
+    const m = mockRoom({ seq: 2 });
+    const { result, rerender } = renderHook(
+      ({ room }) => useRoomAnnotationController(room),
+      { initialProps: { room: m.room } },
+    );
+
+    const first = makeAnn('first-add');
+    await act(async () => { result.current.add(first); });
+
+    m.emitError('validation_error', 'bad payload', 'mutation');
+    await act(async () => { rerender({ room: m.room }); });
+    expect(result.current.failed.has('first-add')).toBe(true);
+
+    // Another add races through AFTER the first rejection. The new one
+    // must not be swept into the same failed bucket just because
+    // lastError is still non-null.
+    await act(async () => { result.current.add(makeAnn('second-add')); });
+    // Simulate a state re-emission with the SAME error (clone, same id).
+    // `emitError` without a new call keeps lastErrorId stable; we just
+    // force a rerender.
+    await act(async () => { rerender({ room: m.room }); });
+
+    expect(result.current.pending.has('second-add')).toBe(true);
+    expect(result.current.failed.has('second-add')).toBe(false);
+  });
+
+  test('failed add keeps pendingAdditions row so Retry/Discard render', async () => {
+    const m = mockRoom({});
+    m.makeSendFail(true);
+    const { result } = renderHook(() => useRoomAnnotationController(m.room));
+
+    await act(async () => {
+      result.current.add(makeAnn('failed-add'));
+      await new Promise(r => setTimeout(r, 10));
+    });
+    expect(result.current.failed.has('failed-add')).toBe(true);
+    // Failed row lives in pendingAdditions (panel-only), NOT in annotations.
+    expect(result.current.annotations.some(a => a.id === 'failed-add')).toBe(false);
+    expect(result.current.pendingAdditions.has('failed-add')).toBe(true);
+
+    await act(async () => { result.current.discard!('failed-add'); });
+    expect(result.current.pendingAdditions.has('failed-add')).toBe(false);
+  });
+
+  test('update() pending clears once seq advances past send (regardless of patch match)', async () => {
+    // Reconciliation uses seq-advance as the sole clear trigger. Gating on
+    // "echo reflects our patch" would leave pending stuck forever when
+    // another user's concurrent write supersedes ours — not the UX we want.
+    const ann = makeAnn('u1', { text: 'before' });
+    const m = mockRoom({ annotations: [toRoomAnnotation(ann)], seq: 10 });
+    const { result, rerender } = renderHook(
+      ({ room }) => useRoomAnnotationController(room),
+      { initialProps: { room: m.room } },
+    );
+
+    await act(async () => {
+      result.current.update('u1', { text: 'after' });
+    });
+    expect(result.current.pending.get('u1')?.kind).toBe('update');
+
+    // Seq does not advance — pending stays.
+    await act(async () => { rerender({ room: m.room }); });
+    expect(result.current.pending.has('u1')).toBe(true);
+
+    // Seq advances with the post-patch value — pending clears.
+    m.advance([toRoomAnnotation({ ...ann, text: 'after' })]);
+    await act(async () => { rerender({ room: m.room }); });
+    expect(result.current.pending.has('u1')).toBe(false);
+  });
+
+  test('update() pending also clears when seq advances but value was superseded', async () => {
+    const ann = makeAnn('u2', { text: 'before' });
+    const m = mockRoom({ annotations: [toRoomAnnotation(ann)], seq: 10 });
+    const { result, rerender } = renderHook(
+      ({ room }) => useRoomAnnotationController(room),
+      { initialProps: { room: m.room } },
+    );
+
+    await act(async () => { result.current.update('u2', { text: 'mine' }); });
+
+    // Server admits another op (seq advances) whose echoed value is
+    // `theirs` — NOT our patch. Pending must still clear: the server has
+    // moved past our send and the UI correctly shows the winning value.
+    m.advance([toRoomAnnotation({ ...ann, text: 'theirs' })]);
+    await act(async () => { rerender({ room: m.room }); });
+    expect(result.current.pending.has('u2')).toBe(false);
+  });
+
+  test('remove() pending clears when seq advances and id is absent', async () => {
+    const ann = makeAnn('r1');
+    const m = mockRoom({ annotations: [toRoomAnnotation(ann)], seq: 5 });
+    const { result, rerender } = renderHook(
+      ({ room }) => useRoomAnnotationController(room),
+      { initialProps: { room: m.room } },
+    );
+
+    await act(async () => {
+      result.current.remove('r1');
+    });
+    expect(result.current.pending.get('r1')?.kind).toBe('remove');
+
+    // Server processes the remove — seq advances, id gone.
+    m.advance([]);
+    await act(async () => { rerender({ room: m.room }); });
+    expect(result.current.pending.has('r1')).toBe(false);
+  });
+
+  test('remove() pending stays when seq has NOT advanced even if id is absent', async () => {
+    // Edge case: removing an id that is already absent from the server snapshot.
+    const m = mockRoom({ annotations: [], seq: 3 });
+    const { result, rerender } = renderHook(
+      ({ room }) => useRoomAnnotationController(room),
+      { initialProps: { room: m.room } },
+    );
+
+    await act(async () => { result.current.remove('already-gone'); });
+    expect(result.current.pending.has('already-gone')).toBe(true);
+
+    // No seq advance yet → pending must not prematurely clear.
+    await act(async () => { rerender({ room: m.room }); });
+    expect(result.current.pending.has('already-gone')).toBe(true);
+
+    // Now seq advances. Even though id was never in the snapshot, we
+    // consider the server to have processed the remove (idempotent).
+    m.setSeq(4);
+    await act(async () => { rerender({ room: m.room }); });
+    expect(result.current.pending.has('already-gone')).toBe(false);
+  });
+
+  test('failed send moves id from pending to failed with kind + error', async () => {
+    const m = mockRoom({});
+    m.makeSendFail(true);
+    const { result } = renderHook(() => useRoomAnnotationController(m.room));
+
+    await act(async () => {
+      result.current.add(makeAnn('f1'));
+      await new Promise(r => setTimeout(r, 10));
+    });
+
+    expect(result.current.pending.has('f1')).toBe(false);
+    const fail = result.current.failed.get('f1');
+    expect(fail?.kind).toBe('add');
+    expect(fail?.error).toContain('simulated failure');
+  });
+
+  test('retry resends a previously-failed op', async () => {
+    const m = mockRoom({});
+    m.makeSendFail(true);
+    const { result } = renderHook(() => useRoomAnnotationController(m.room));
+
+    await act(async () => {
+      result.current.add(makeAnn('r2'));
+      await new Promise(r => setTimeout(r, 10));
+    });
+    expect(result.current.failed.has('r2')).toBe(true);
+
+    m.makeSendFail(false);
+    await act(async () => {
+      result.current.retry!('r2');
+      await new Promise(r => setTimeout(r, 10));
+    });
+    expect(result.current.failed.has('r2')).toBe(false);
+    expect(result.current.pending.has('r2')).toBe(true);
+    expect(m.calls.filter(c => c.method === 'addAnnotations').length).toBe(2);
+  });
+
+  test('discard drops a failed id without resending', async () => {
+    const m = mockRoom({});
+    m.makeSendFail(true);
+    const { result } = renderHook(() => useRoomAnnotationController(m.room));
+
+    await act(async () => {
+      result.current.add(makeAnn('d1'));
+      await new Promise(r => setTimeout(r, 10));
+    });
+    expect(result.current.failed.has('d1')).toBe(true);
+
+    await act(async () => result.current.discard!('d1'));
+    expect(result.current.failed.has('d1')).toBe(false);
+  });
+
+  test('setAll is undefined in room mode', () => {
+    const m = mockRoom({});
+    const { result } = renderHook(() => useRoomAnnotationController(m.room));
+    expect(result.current.setAll).toBeUndefined();
+  });
+
+  test('strips images field when sending', async () => {
+    const m = mockRoom({});
+    const { result } = renderHook(() => useRoomAnnotationController(m.room));
+
+    const annWithImages = makeAnn('img1', {
+      images: [{ path: '/tmp/x.png', name: 'x' }],
+    });
+    await act(async () => {
+      result.current.add(annWithImages);
+    });
+
+    const addCall = m.calls.find(c => c.method === 'addAnnotations');
+    expect(addCall).toBeDefined();
+    const [sent] = addCall!.args as [RoomAnnotation[]];
+    expect(sent[0].id).toBe('img1');
+    expect('images' in sent[0]).toBe(false);
+  });
+});
+
+function toRoomAnnotation(a: Annotation): RoomAnnotation {
+  const { images: _images, ...rest } = a;
+  return rest as RoomAnnotation;
+}
diff --git a/packages/ui/hooks/useAnnotationController.test.tsx b/packages/ui/hooks/useAnnotationController.test.tsx
new file mode 100644
index 000000000..77ee0f2e4
--- /dev/null
+++ b/packages/ui/hooks/useAnnotationController.test.tsx
@@ -0,0 +1,103 @@
+import { act } from 'react';
+import { describe, expect, test } from 'bun:test';
+import { renderHook } from '@testing-library/react';
+import { useAnnotationController } from './useAnnotationController';
+import { AnnotationType, type Annotation } from '../types';
+
+function makeAnn(id: string, overrides: Partial<Annotation> = {}): Annotation {
+  return {
+    id,
+    blockId: 'b1',
+    startOffset: 0,
+    endOffset: 5,
+    type: AnnotationType.COMMENT,
+    text: `text ${id}`,
+    originalText: 'hello',
+    createdA: Date.now(),
+    ...overrides,
+  };
+}
+
+describe('useAnnotationController — local mode', () => {
+  test('starts empty with no pending/failed/pendingAdditions', () => {
+    const { result } = renderHook(() => useAnnotationController({}));
+    expect(result.current.mode).toBe('local');
+    expect(result.current.annotations).toEqual([]);
+    expect(result.current.pending.size).toBe(0);
+    expect(result.current.failed.size).toBe(0);
+    expect(result.current.pendingAdditions.size).toBe(0);
+  });
+
+  test('add appends to the list', () => {
+    const { result } = renderHook(() => useAnnotationController({}));
+    act(() => result.current.add(makeAnn('a')));
+    expect(result.current.annotations).toHaveLength(1);
+    expect(result.current.annotations[0].id).toBe('a');
+  });
+
+  test('update patches a specific id', () => {
+    const { result } = renderHook(() => useAnnotationController({}));
+    act(() => result.current.add(makeAnn('a', { text: 'before' })));
+    act(() => result.current.update('a', { text: 'after' }));
+    expect(result.current.annotations[0].text).toBe('after');
+  });
+
+  test('update on unknown id is a no-op', () => {
+    const { result } = renderHook(() => useAnnotationController({}));
+    act(() => result.current.add(makeAnn('a')));
+    act(() => result.current.update('missing', { text: 'x' }));
+    expect(result.current.annotations).toHaveLength(1);
+    expect(result.current.annotations[0].text).toBe('text a');
+  });
+
+  test('remove drops the matching id', () => {
+    const { result } = renderHook(() => useAnnotationController({}));
+    act(() => {
+      result.current.add(makeAnn('a'));
+      result.current.add(makeAnn('b'));
+    });
+    act(() => result.current.remove('a'));
+    expect(result.current.annotations.map(a => a.id)).toEqual(['b']);
+  });
+
+  test('clear() without source removes all', () => {
+    const { result } = renderHook(() => useAnnotationController({}));
+    act(() => {
+      result.current.add(makeAnn('a'));
+      result.current.add(makeAnn('b'));
+    });
+    act(() => result.current.clear());
+    expect(result.current.annotations).toEqual([]);
+  });
+
+  test('clear(source) removes only matching source', () => {
+    const { result } = renderHook(() => useAnnotationController({}));
+    act(() => {
+      result.current.add(makeAnn('a', { source: 'eslint' }));
+      result.current.add(makeAnn('b', { source: 'prettier' }));
+      result.current.add(makeAnn('c'));  // no source
+    });
+    act(() => result.current.clear('eslint'));
+    expect(result.current.annotations.map(a => a.id).sort()).toEqual(['b', 'c']);
+  });
+
+  test('setAll performs atomic replace-all', () => {
+    const { result } = renderHook(() => useAnnotationController({}));
+    act(() => result.current.add(makeAnn('a')));
+    act(() => result.current.setAll!([makeAnn('x'), makeAnn('y')]));
+    expect(result.current.annotations.map(a => a.id)).toEqual(['x', 'y']);
+  });
+
+  test('respects initial annotations', () => {
+    const initial = [makeAnn('a'), makeAnn('b')];
+    const { result } = renderHook(() => useAnnotationController({ initial }));
+    expect(result.current.annotations).toHaveLength(2);
+  });
+
+  test('retry/discard are undefined in local mode', () => {
+    const { result } = renderHook(() => useAnnotationController({}));
+    expect(result.current.retry).toBeUndefined();
+    expect(result.current.discard).toBeUndefined();
+  });
+
+});
diff --git a/packages/ui/hooks/useAnnotationController.ts b/packages/ui/hooks/useAnnotationController.ts
new file mode 100644
index 000000000..b50a5314a
--- /dev/null
+++ b/packages/ui/hooks/useAnnotationController.ts
@@ -0,0 +1,511 @@
+/**
+ * useAnnotationController — returns an AnnotationController bound to either
+ * local state (useState<Annotation[]>) or a CollabRoom session.
+ *
+ * This hook is the single mode-awareness point in App.tsx. Before Slice 5
+ * every annotation mutation site called `setAnnotations(prev => ...)`
+ * directly; now those call sites invoke `controller.add/update/remove/clear`,
+ * which do the right thing for whichever mode is active.
+ *
+ * Room mode delegates to `useCollabRoom` with KIND-SPECIFIC pending
+ * reconciliation:
+ *
+ *   add    — pending clears ONLY when the id appears in
+ *            `room.annotations`. An unrelated peer's op advancing seq
+ *            must NOT clear an add pending, because the optimistic
+ *            row (exposed via `pendingAdditions`) would otherwise
+ *            linger as an ordinary-looking panel row with no
+ *            "Sending…" chrome and no Retry affordance. We need a real
+ *            echo-by-id, a transport-promise rejection (→ `failed`),
+ *            or explicit Discard to progress the row.
+ *
+ *   update — pending clears once `room.seq > sentAtSeq`. Concurrent-
+ *            write supersession is acceptable: the canonical list
+ *            shows the winning value, which is correct server state.
+ *            Gating on patch-match would leave pending stuck forever
+ *            when another user's write wins.
+ *
+ *   remove — pending clears once `room.seq > sentAtSeq`. Remove has no
+ *            optimistic row to strand, so a spurious clear is harmless
+ *            even for remove-of-already-absent (server no-op).
+ *
+ * Optimistic adds live in `pendingAdditions` (panel-only; NOT merged
+ * into the canonical `annotations` list). This preserves the V1
+ * server-authoritative contract — approve/deny/export never see
+ * un-echoed rows.
+ *
+ * `failed` entries carry kind + payload so retry() can re-send without
+ * the caller providing the op args again. Slice 5 is online-only:
+ * failed ops surface Retry/Discard UI; they do NOT auto-replay on
+ * reconnect.
+ */
+
+import { useCallback, useEffect, useMemo, useRef, useState } from 'react';
+import type {
+  AnnotationController,
+  PendingKind,
+  PendingOp,
+  FailedOp,
+} from '../types/annotationController';
+import type { Annotation } from '../types';
+import type { UseCollabRoomReturn } from './collab/useCollabRoom';
+import type { RoomAnnotation } from '@plannotator/shared/collab';
+import { toRoomAnnotation as sharedToRoomAnnotation } from '@plannotator/shared/collab';
+
+const EMPTY_PENDING_PUBLIC: ReadonlyMap<string, PendingOp> = new Map();
+const EMPTY_FAILED: ReadonlyMap<string, FailedOp> = new Map();
+const EMPTY_PENDING_ADDITIONS: ReadonlyMap<string, Annotation> = new Map();
+
+export function useLocalAnnotationController(
+  initial: Annotation[] = [],
+): AnnotationController {
+  const [annotations, setAnnotations] = useState<Annotation[]>(initial);
+
+  const add = useCallback((ann: Annotation) => {
+    setAnnotations(prev => [...prev, ann]);
+  }, []);
+
+  const update = useCallback((id: string, patch: Partial<Annotation>) => {
+    setAnnotations(prev => prev.map(a => (a.id === id ? { ...a, ...patch } : a)));
+  }, []);
+
+  const remove = useCallback((id: string) => {
+    setAnnotations(prev => prev.filter(a => a.id !== id));
+  }, []);
+
+  const clear = useCallback((source?: string) => {
+    if (source === undefined) {
+      setAnnotations([]);
+    } else {
+      setAnnotations(prev => prev.filter(a => a.source !== source));
+    }
+  }, []);
+
+  return {
+    mode: 'local',
+    annotations,
+    pendingAdditions: EMPTY_PENDING_ADDITIONS,
+    pending: EMPTY_PENDING_PUBLIC,
+    failed: EMPTY_FAILED,
+    add,
+    update,
+    remove,
+    clear,
+    setAll: setAnnotations,
+  };
+}
+
+/** Payload retained per-failed-op so retry() can reconstruct the send. */
+type RetryPayload =
+  | { kind: 'add'; value: RoomAnnotation }
+  | { kind: 'update'; value: { id: string; patch: Partial<RoomAnnotation> } }
+  | { kind: 'remove'; value: { id: string } };
+
+/**
+ * Room-mode pending entry. `sentAtSeq` is the server seq at send time,
+ * consulted by the kind-specific reconciliation effect below:
+ *
+ *   add    — NOT cleared by seq advance. Only cleared when the echoed
+ *            annotation appears in `room.annotations` (id match), or
+ *            by the server-rejection / transport-rejection paths.
+ *            Clearing on unrelated seq advance would leave the
+ *            optimistic row in `pendingAdditions` stranded as an
+ *            ordinary-looking panel row with no "Sending…" chrome.
+ *   update — cleared once `room.seq > sentAtSeq`. Concurrent-write
+ *            supersession is acceptable; the canonical list already
+ *            shows the winning value.
+ *   remove — cleared once `room.seq > sentAtSeq`. Has no optimistic row
+ *            to strand, so a spurious clear on remove-of-absent is
+ *            harmless.
+ *
+ * `expectedPatch` is snapshotted for update ops and consumed by retry()
+ * to rebuild the retry payload; the reconcile effect doesn't consult it.
+ */
+interface RoomPending extends PendingOp {
+  /** Server seq at the moment this op was sent. */
+  sentAtSeq: number;
+  /** For 'update' only — retained for retry()'s payload reconstruction. */
+  expectedPatch?: Partial<RoomAnnotation>;
+}
+
+export function useRoomAnnotationController(
+  room: UseCollabRoomReturn,
+): AnnotationController {
+  const [pending, setPending] = useState<ReadonlyMap<string, RoomPending>>(
+    () => new Map<string, RoomPending>(),
+  );
+  const [failed, setFailed] = useState<ReadonlyMap<string, FailedOp>>(EMPTY_FAILED);
+  /**
+   * Optimistic-add buffer surfaced via the `pendingAdditions` field —
+   * PANEL-ONLY. These entries are NOT merged into the canonical
+   * `annotations` list, so the Viewer (which renders off the canonical
+   * list) never sees them; only the annotation sidebar does, where it
+   * attaches "Sending…" / failed chrome around the row. Keeping them
+   * out of the canonical list preserves the V1 server-authoritative
+   * contract for approve/deny/export.
+   *
+   * Entries are removed:
+   *   - when the server echoes the id (it appears in room.annotations), OR
+   *   - on explicit Discard (failed row dismissed by the user).
+   *
+   * Failed adds keep their buffer entry so the sidebar still has a row
+   * on which to render the Retry/Discard affordances.
+   */
+  const [optimisticAdds, setOptimisticAdds] = useState<ReadonlyMap<string, Annotation>>(
+    () => new Map<string, Annotation>(),
+  );
+  // Buffer failed-op payloads keyed by id so retry() can re-send without
+  // requiring the caller to pass the annotation back in.
+  const failedPayloadsRef = useRef<Map<string, RetryPayload>>(new Map());
+
+  // Project room.annotations to a by-id Map. The reconcile effect below
+  // consults it for the 'add' kind (clear when id echoes), and takes it
+  // as a dep so any `room.annotations` update re-runs the reconciliation
+  // for update/remove seq-advance checks.
+  const echoedById = useMemo(() => {
+    const m = new Map<string, RoomAnnotation>();
+    for (const a of room.annotations) m.set(a.id, a);
+    return m;
+  }, [room.annotations]);
+
+  // Server-rejection reconciliation for MUTATION errors.
+  //
+  // V1 has no opId-correlated reject: a rejected mutation produces a
+  // `room.error` on the client, with no seq advance and no per-op
+  // correlation. Without an explicit clear path, a server-side
+  // rejection (e.g. a validation_error or event_persist_failed) would
+  // leave `add` pending forever (never echoed) and `update`/`remove`
+  // pending until some unrelated op bumped seq.
+  //
+  // Three correctness invariants enforced here:
+  //
+  //   1. Dedupe by `lastErrorId`, not object identity. CollabRoomClient
+  //      clones `lastError` on every state emit, so a stale error re-
+  //      emerges as a fresh object. Reacting to that would falsely mark
+  //      later successful sends as failed.
+  //
+  //   2. Filter by `scope === 'mutation'`. The client now classifies
+  //      errors into narrow scopes: only server-sent rejections of a
+  //      mutation this client sent use 'mutation'. Admin rejections,
+  //      peer inbound-event decode failures, presence decode failures,
+  //      snapshot decode failures, and join-phase failures all share
+  //      the `lastError` field but MUST NOT transition our pending ops.
+  //      Without this filter, a peer's malformed presence frame could
+  //      spuriously move our valid in-flight annotation add to failed.
+  //
+  //   3. Best-effort correlation within those constraints: on a new
+  //      mutation-scoped error, mark every currently-pending op as
+  //      failed. V1 has no opId-level correlation, so if two sends
+  //      raced and the server only rejected one, both get marked failed
+  //      and the user will Retry one unnecessarily — accepted tradeoff
+  //      over a silent stuck shimmer.
+  const lastErrorIdRef = useRef<number>(0);
+  useEffect(() => {
+    const id = room.lastErrorId;
+    if (id === lastErrorIdRef.current) return;
+    lastErrorIdRef.current = id;
+
+    const err = room.lastError;
+    if (!err || err.scope !== 'mutation') return;
+    if (pending.size === 0) return;
+
+    // Snapshot current pending → failed with the server's error message.
+    setPending(prev => (prev.size === 0 ? prev : new Map()));
+    setFailed(prev => {
+      const next = new Map(prev);
+      for (const [pid, op] of pending) {
+        next.set(pid, { id: pid, kind: op.kind, error: `${err.code}: ${err.message}` });
+        // Reconstruct a retry payload if we still have enough context.
+        // For 'add' we need the original RoomAnnotation — it lives in
+        // optimisticAdds. For update/remove the op carried its patch/id.
+        if (op.kind === 'add') {
+          const stashed = optimisticAdds.get(pid);
+          if (stashed) {
+            failedPayloadsRef.current.set(pid, {
+              kind: 'add',
+              value: toRoomAnnotation(stashed),
+            });
+          }
+        } else if (op.kind === 'update' && op.expectedPatch) {
+          failedPayloadsRef.current.set(pid, {
+            kind: 'update',
+            value: { id: pid, patch: op.expectedPatch },
+          });
+        } else if (op.kind === 'remove') {
+          failedPayloadsRef.current.set(pid, {
+            kind: 'remove',
+            value: { id: pid },
+          });
+        }
+      }
+      return next;
+    });
+  }, [room.lastErrorId, room.lastError, pending, optimisticAdds]);
+
+  // Reconciliation is KIND-SPECIFIC to avoid a leaky pending state when
+  // an unrelated op advances seq before our send echoes:
+  //
+  //   add     — clear only when the id appears in room.annotations. An
+  //             unrelated seq advance must NOT clear an add, because the
+  //             optimistic row (pendingAdditions) is still visible and we
+  //             need either a real echo or an explicit
+  //             reject-via-promise/Retry/Discard to progress it. Without
+  //             this, a concurrent peer's op could bump seq while our add
+  //             is in flight, the pending entry would drop, and the
+  //             optimistic row would linger as an ordinary-looking panel
+  //             row (no Sending… chrome, no Retry affordance) until the
+  //             eventual echo or manual dismissal.
+  //   update  — clear on seq advance past sentAtSeq. Concurrent-write
+  //             supersession is acceptable; the canonical annotation list
+  //             already shows the winning value.
+  //   remove  — same seq-based clear. Remove has no optimistic row to
+  //             strand, so a spurious clear is harmless.
+  useEffect(() => {
+    if (pending.size === 0) return;
+    let changed = false;
+    const next = new Map(pending);
+    for (const [id, op] of pending) {
+      if (op.kind === 'add') {
+        if (echoedById.has(id)) {
+          next.delete(id);
+          changed = true;
+        }
+        continue;
+      }
+      // KNOWN V1 EDGE CASE: if an unrelated peer op bumps seq past our
+      // sentAtSeq before the server processes our mutation, this clears
+      // the pending entry. If the server then REJECTS our mutation (via
+      // room.error), the error-driven path (below) finds nothing in
+      // `pending` to mark as failed. The user never sees the failure.
+      //
+      // This race requires: (a) we send an update/remove, (b) a peer's
+      // op is admitted and echoed before our op, (c) the server then
+      // rejects ours. Window is narrow (sub-RTT). Proper fix requires
+      // opId-correlated reject from the server (V2 protocol work).
+      // Accepted for Slice 5 over stuck-shimmer on every concurrent-
+      // edit scenario.
+      if (room.seq > op.sentAtSeq) {
+        next.delete(id);
+        changed = true;
+      }
+    }
+    if (changed) setPending(next);
+  }, [echoedById, pending, room.seq]);
+
+  const markPending = useCallback((op: RoomPending) => {
+    setPending(prev => {
+      const next = new Map(prev);
+      next.set(op.id, op);
+      return next;
+    });
+  }, []);
+
+  const markFailed = useCallback((
+    id: string,
+    kind: PendingKind,
+    payload: RetryPayload,
+    err: unknown,
+  ) => {
+    setPending(prev => {
+      if (!prev.has(id)) return prev;
+      const next = new Map(prev);
+      next.delete(id);
+      return next;
+    });
+    const message = err instanceof Error ? err.message : String(err);
+    setFailed(prev => {
+      const next = new Map(prev);
+      next.set(id, { id, kind, error: message });
+      return next;
+    });
+    failedPayloadsRef.current.set(id, payload);
+  }, []);
+
+  const clearFailedFor = useCallback((id: string) => {
+    failedPayloadsRef.current.delete(id);
+    setFailed(prev => {
+      if (!prev.has(id)) return prev;
+      const next = new Map(prev);
+      next.delete(id);
+      return next;
+    });
+  }, []);
+
+  const addOptimistic = useCallback((ann: Annotation) => {
+    setOptimisticAdds(prev => {
+      const next = new Map(prev);
+      next.set(ann.id, ann);
+      return next;
+    });
+  }, []);
+
+  const clearOptimisticAdd = useCallback((id: string) => {
+    setOptimisticAdds(prev => {
+      if (!prev.has(id)) return prev;
+      const next = new Map(prev);
+      next.delete(id);
+      return next;
+    });
+  }, []);
+
+  const add = useCallback((ann: Annotation) => {
+    const roomAnn = toRoomAnnotation(ann);
+    addOptimistic(ann);
+    markPending({ id: ann.id, kind: 'add', sentAtSeq: room.seq });
+    void room.addAnnotations([roomAnn]).catch(err => {
+      markFailed(ann.id, 'add', { kind: 'add', value: roomAnn }, err);
+    });
+  }, [room, addOptimistic, markPending, markFailed]);
+
+  const update = useCallback((id: string, patch: Partial<Annotation>) => {
+    const roomPatch = toRoomAnnotationPatch(patch);
+    markPending({ id, kind: 'update', sentAtSeq: room.seq, expectedPatch: roomPatch });
+    void room.updateAnnotation(id, roomPatch).catch(err => {
+      markFailed(id, 'update', { kind: 'update', value: { id, patch: roomPatch } }, err);
+    });
+  }, [room, markPending, markFailed]);
+
+  const remove = useCallback((id: string) => {
+    markPending({ id, kind: 'remove', sentAtSeq: room.seq });
+    void room.removeAnnotations([id]).catch(err => {
+      markFailed(id, 'remove', { kind: 'remove', value: { id } }, err);
+    });
+  }, [room, markPending, markFailed]);
+
+  const clear = useCallback((source?: string) => {
+    void room.clearAnnotations(source).catch(() => {
+      // clear has no single-id identity — failure surfaces via room.lastError
+      // and the UI disables further writes while disconnected.
+    });
+  }, [room]);
+
+  const retry = useCallback((id: string) => {
+    const p = failedPayloadsRef.current.get(id);
+    if (!p) return;
+    clearFailedFor(id);
+    switch (p.kind) {
+      case 'add':
+        markPending({ id, kind: 'add', sentAtSeq: room.seq });
+        void room.addAnnotations([p.value]).catch(err => {
+          markFailed(id, 'add', p, err);
+        });
+        break;
+      case 'update':
+        markPending({ id, kind: 'update', sentAtSeq: room.seq, expectedPatch: p.value.patch });
+        void room.updateAnnotation(p.value.id, p.value.patch).catch(err => {
+          markFailed(id, 'update', p, err);
+        });
+        break;
+      case 'remove':
+        markPending({ id, kind: 'remove', sentAtSeq: room.seq });
+        void room.removeAnnotations([p.value.id]).catch(err => {
+          markFailed(id, 'remove', p, err);
+        });
+        break;
+    }
+  }, [room, clearFailedFor, markPending, markFailed]);
+
+  const discard = useCallback((id: string) => {
+    clearFailedFor(id);
+    clearOptimisticAdd(id);  // failed-add row goes away on Discard
+  }, [clearFailedFor, clearOptimisticAdd]);
+
+  // Drop optimistic entries for ids that have arrived via echo. We run
+  // this as an effect so the UI doesn't double-render a row from both the
+  // buffer and room.annotations.
+  useEffect(() => {
+    if (optimisticAdds.size === 0) return;
+    let changed = false;
+    const next = new Map(optimisticAdds);
+    for (const a of room.annotations) {
+      if (next.delete(a.id)) changed = true;
+    }
+    if (changed) setOptimisticAdds(next);
+  }, [optimisticAdds, room.annotations]);
+
+  // `annotations` is strictly the server-echoed state — V1 is
+  // server-authoritative, so pending/failed adds must NOT appear here.
+  // Rendering them in the panel is the UI's job via `pendingAdditions`.
+  const annotations = useMemo<Annotation[]>(
+    () => room.annotations.map(toEditorAnnotation),
+    [room.annotations],
+  );
+
+  // Expose optimistic adds separately so the annotation panel can draw
+  // "Sending…"/failed rows without contaminating the canonical list.
+  const pendingAdditions = optimisticAdds;
+
+  return {
+    mode: 'room',
+    annotations,
+    pendingAdditions,
+    pending,
+    failed,
+    add,
+    update,
+    remove,
+    clear,
+    retry,
+    discard,
+  };
+}
+
+/** Public selector. Pass `room` to enter room mode, otherwise returns local. */
+export function useAnnotationController(options: {
+  initial?: Annotation[];
+  room?: UseCollabRoomReturn;
+}): AnnotationController {
+  // Hooks must be called unconditionally in the same order per render, so
+  // both impls run. We only consume the relevant one based on `room`.
+  // This costs one extra useState in the unused branch — acceptable for the
+  // simpler call-site contract.
+  const local = useLocalAnnotationController(options.initial);
+  const roomController = useRoomAnnotationControllerOptional(options.room);
+  return options.room ? roomController : local;
+}
+
+function useRoomAnnotationControllerOptional(
+  room: UseCollabRoomReturn | undefined,
+): AnnotationController {
+  // Always call the hook; pass a dummy placeholder when room is undefined
+  // so we don't violate the rules-of-hooks. The returned controller is
+  // discarded unless the caller passed a real room.
+  const placeholder = usePlaceholderRoom();
+  return useRoomAnnotationController(room ?? placeholder);
+}
+
+function usePlaceholderRoom(): UseCollabRoomReturn {
+  return useMemo<UseCollabRoomReturn>(() => ({
+    connectionStatus: 'disconnected',
+    roomUnavailable: false,
+    planMarkdown: '',
+    annotations: [],
+    seq: 0,
+    remotePresence: {},
+    hasAdminCapability: false,
+    lastError: null,
+    lastErrorId: 0,
+    addAnnotations: async () => {},
+    updateAnnotation: async () => {},
+    removeAnnotations: async () => {},
+    clearAnnotations: async () => {},
+    updatePresence: async () => {},
+    deleteRoom: async () => {},
+    client: null,
+  }), []);
+}
+
+/** Narrow the shared helper's generic return to Annotation-compatible shape. */
+function toRoomAnnotation(a: Annotation): RoomAnnotation {
+  return sharedToRoomAnnotation(a) as RoomAnnotation;
+}
+
+function toRoomAnnotationPatch(p: Partial<Annotation>): Partial<RoomAnnotation> {
+  return sharedToRoomAnnotation(p) as Partial<RoomAnnotation>;
+}
+
+function toEditorAnnotation(a: RoomAnnotation): Annotation {
+  // RoomAnnotation has no images; Annotation's images is optional, so the
+  // shape is already compatible without images.
+  return a as Annotation;
+}
diff --git a/packages/ui/hooks/useAnnotationHighlightReconciler.test.tsx b/packages/ui/hooks/useAnnotationHighlightReconciler.test.tsx
new file mode 100644
index 000000000..9b1c4bb0a
--- /dev/null
+++ b/packages/ui/hooks/useAnnotationHighlightReconciler.test.tsx
@@ -0,0 +1,155 @@
+import { describe, expect, test } from 'bun:test';
+import { renderHook, waitFor } from '@testing-library/react';
+import { useRef } from 'react';
+import { useAnnotationHighlightReconciler } from './useAnnotationHighlightReconciler';
+import type { ViewerHandle } from '../components/Viewer';
+import type { Annotation } from '../types';
+import { AnnotationType } from '../types';
+
+/**
+ * The reconciler was extracted from two duplicate implementations (external
+ * SSE + room mode). The `surfaceGeneration` dep is the key invariant: when
+ * the Viewer's highlight surface is reset (highlighter reinit,
+ * `clearAllHighlights`), the applied map must clear so eligible annotations
+ * repaint against the fresh DOM.
+ */
+describe('useAnnotationHighlightReconciler', () => {
+  function makeMockViewer() {
+    const applied: Annotation[] = [];
+    const removed: string[] = [];
+    const handle: ViewerHandle = {
+      removeHighlight: (id: string) => { removed.push(id); },
+      clearAllHighlights: () => {},
+      applySharedAnnotations: (anns: Annotation[]) => { applied.push(...anns); },
+    };
+    return { handle, applied, removed };
+  }
+
+  const ANN_A: Annotation = {
+    id: 'a1',
+    blockId: 'b1',
+    startOffset: 0,
+    endOffset: 3,
+    type: AnnotationType.COMMENT,
+    originalText: 'foo',
+    createdA: 0,
+    text: 'nit',
+  };
+  const ANN_B: Annotation = {
+    id: 'b2',
+    blockId: 'b2',
+    startOffset: 0,
+    endOffset: 3,
+    type: AnnotationType.COMMENT,
+    originalText: 'bar',
+    createdA: 0,
+    text: 'here',
+  };
+
+  test('applies eligible annotations once', async () => {
+    const { handle, applied } = makeMockViewer();
+    renderHook(() => {
+      const ref = useRef<ViewerHandle>(handle);
+      return useAnnotationHighlightReconciler({
+        viewerRef: ref,
+        annotations: [ANN_A, ANN_B],
+        enabled: true,
+        planKey: 'plan-1',
+        surfaceGeneration: 1,
+        eligibleFilter: a => !!a.originalText,
+        paintDelayMs: 0,
+      });
+    });
+
+    await waitFor(() => {
+      expect(applied.length).toBe(2);
+    });
+    expect(applied.map(a => a.id).sort()).toEqual(['a1', 'b2']);
+  });
+
+  test('bumping surfaceGeneration clears the applied map and repaints', async () => {
+    const { handle, applied } = makeMockViewer();
+
+    let generation = 1;
+    const { rerender } = renderHook(() => {
+      const ref = useRef<ViewerHandle>(handle);
+      return useAnnotationHighlightReconciler({
+        viewerRef: ref,
+        annotations: [ANN_A],
+        enabled: true,
+        planKey: 'plan-1',
+        surfaceGeneration: generation,
+        eligibleFilter: a => !!a.originalText,
+        paintDelayMs: 0,
+      });
+    });
+
+    await waitFor(() => {
+      expect(applied.length).toBe(1);
+    });
+
+    // Simulate the Viewer resetting its highlight surface — in App.tsx this
+    // happens when `Viewer.clearAllHighlights()` fires `onHighlightSurfaceReset`,
+    // and the parent bumps the generation counter in response.
+    generation = 2;
+    rerender();
+
+    await waitFor(() => {
+      expect(applied.length).toBe(2);
+    });
+    // Same annotation id should have been reapplied the second time.
+    expect(applied.filter(a => a.id === 'a1').length).toBe(2);
+  });
+
+  test('fingerprint change triggers remove+reapply', async () => {
+    const { handle, applied, removed } = makeMockViewer();
+
+    let annotation: Annotation = { ...ANN_A, text: 'nit' };
+    const { rerender } = renderHook(() => {
+      const ref = useRef<ViewerHandle>(handle);
+      return useAnnotationHighlightReconciler<Annotation>({
+        viewerRef: ref,
+        annotations: [annotation],
+        enabled: true,
+        planKey: 'plan-1',
+        surfaceGeneration: 1,
+        fingerprint: a => `${a.type}\u0000${a.originalText}\u0000${a.text ?? ''}`,
+        paintDelayMs: 0,
+      });
+    });
+
+    await waitFor(() => {
+      expect(applied.length).toBe(1);
+    });
+
+    // Peer updated the comment text; fingerprint changes → remove + reapply.
+    annotation = { ...annotation, text: 'actually blocking' };
+    rerender();
+
+    await waitFor(() => {
+      expect(removed).toContain('a1');
+      expect(applied.length).toBe(2);
+    });
+  });
+
+  test('disabled does not apply', async () => {
+    const { handle, applied } = makeMockViewer();
+
+    renderHook(() => {
+      const ref = useRef<ViewerHandle>(handle);
+      return useAnnotationHighlightReconciler({
+        viewerRef: ref,
+        annotations: [ANN_A],
+        enabled: false,
+        planKey: 'plan-1',
+        surfaceGeneration: 1,
+        paintDelayMs: 0,
+      });
+    });
+
+    // Wait a tick — without `enabled`, the effect should no-op and nothing
+    // should land in `applied`.
+    await new Promise(r => setTimeout(r, 30));
+    expect(applied.length).toBe(0);
+  });
+});
diff --git a/packages/ui/hooks/useAnnotationHighlightReconciler.ts b/packages/ui/hooks/useAnnotationHighlightReconciler.ts
new file mode 100644
index 000000000..1bdd60080
--- /dev/null
+++ b/packages/ui/hooks/useAnnotationHighlightReconciler.ts
@@ -0,0 +1,150 @@
+/**
+ * Generic annotation → DOM highlight reconciler.
+ *
+ * Two callers:
+ *   - `useExternalAnnotationHighlights` — SSE-delivered external annotations.
+ *   - `App.tsx` (room-mode) — server-authoritative room annotations.
+ *
+ * Both need identical bookkeeping: "which annotation IDs are currently
+ * materialized as DOM highlights, and with which fingerprint," so that
+ *   (a) removals are dropped from the DOM,
+ *   (b) updates trigger remove+reapply,
+ *   (c) adds get applied after a paint tick (the Viewer's DOM may not be
+ *       mounted yet on initial snapshot load).
+ *
+ * The applied-map is cleared on two signals:
+ *   - `planKey` change — plan markdown changed; the Viewer re-parsed
+ *     blocks and wiped marks, so any "already applied" tracking is stale.
+ *   - `surfaceGeneration` change — the Viewer's underlying highlighter
+ *     was reinitialized or explicitly cleared (e.g. `clearAllHighlights`
+ *     during a share-import). Same invariant: DOM marks are gone, tracking
+ *     must reset so every eligible annotation repaints.
+ *
+ * The `reset()` escape hatch exists for callers that can't observe a
+ * surface generation bump but know their surface was reset out-of-band.
+ * New callers should prefer wiring `surfaceGeneration` instead.
+ */
+
+import { useCallback, useEffect, useRef, useState } from 'react';
+import type { Annotation } from '../types';
+import type { ViewerHandle } from '../components/Viewer';
+
+export interface UseAnnotationHighlightReconcilerOptions<A extends { id: string }> {
+  viewerRef: React.RefObject<ViewerHandle | null>;
+  annotations: A[];
+  enabled: boolean;
+  /** Bump to force a full re-apply when plan content changes. */
+  planKey: string;
+  /**
+   * Monotonic counter from `Viewer` that increments whenever the
+   * underlying highlight surface is (re)initialized or cleared.
+   * Starts at 0 before Viewer has emitted; first Viewer-side bump is 1.
+   */
+  surfaceGeneration: number;
+  /**
+   * Decide which annotations take part. Default: all.
+   * Ineligible annotations are never added to the applied map and
+   * are proactively removed if present.
+   */
+  eligibleFilter?: (annotation: A) => boolean;
+  /**
+   * Fingerprint an annotation. Fingerprint changes trigger
+   * remove+reapply. Default: identity (`id`), meaning updates never
+   * repaint — most callers override this.
+   */
+  fingerprint?: (annotation: A) => string;
+  /**
+   * How long to wait before walking the DOM to apply marks. Default 100ms
+   * to match the historical paint-delay used across drafts/shares.
+   */
+  paintDelayMs?: number;
+}
+
+export interface UseAnnotationHighlightReconcilerReturn {
+  /**
+   * Force a full re-apply on the next tick. Most callers should prefer
+   * bumping `surfaceGeneration` from the Viewer side instead; this exists
+   * for paths that don't own the surface (e.g. legacy share-import).
+   */
+  reset: () => void;
+}
+
+export function useAnnotationHighlightReconciler<A extends { id: string }>(
+  params: UseAnnotationHighlightReconcilerOptions<A> & {
+    // Generic `A`-shaped applySharedAnnotations payload — the Viewer
+    // handle types it as `Annotation[]`. Internal narrow.
+    _applyAs?: (annotation: A) => Annotation;
+  },
+): UseAnnotationHighlightReconcilerReturn {
+  const {
+    viewerRef,
+    annotations,
+    enabled,
+    planKey,
+    surfaceGeneration,
+    eligibleFilter,
+    fingerprint,
+    paintDelayMs = 100,
+  } = params;
+
+  const appliedRef = useRef<Map<string, string>>(new Map());
+  const [resetCount, setResetCount] = useState(0);
+
+  // Clear tracking on surface-identity changes. `planKey` covers markdown
+  // reparses; `surfaceGeneration` covers Viewer-internal resets (highlighter
+  // reinit, `clearAllHighlights`).
+  useEffect(() => {
+    appliedRef.current.clear();
+  }, [planKey, surfaceGeneration]);
+
+  useEffect(() => {
+    if (!enabled) return;
+    const viewer = viewerRef.current;
+    if (!viewer) return;
+
+    const filter = eligibleFilter ?? (() => true);
+    const fp = fingerprint ?? ((a: A) => a.id);
+
+    const eligible = annotations.filter(filter);
+    const eligibleById = new Map(eligible.map(a => [a.id, a]));
+    const applied = appliedRef.current;
+
+    // 1. Remove: applied IDs no longer eligible, or whose fingerprint drifted.
+    for (const [id, storedFp] of applied) {
+      const ann = eligibleById.get(id);
+      if (!ann || fp(ann) !== storedFp) {
+        viewer.removeHighlight(id);
+        applied.delete(id);
+      }
+    }
+
+    // 2. Apply: eligible IDs not yet recorded.
+    const toApply = eligible.filter(a => !applied.has(a.id));
+    if (toApply.length === 0) return;
+
+    const timer = setTimeout(() => {
+      const v = viewerRef.current;
+      if (!v) return;
+      // Viewer's imperative API takes the UI `Annotation` shape. Callers
+      // supply annotation objects that either ARE that shape (external)
+      // or are assignment-compatible at runtime (room — `RoomAnnotation`
+      // has the required fields minus `images`). The viewer's apply path
+      // reads only `id`/`type`/`originalText`, so the cast is safe.
+      v.applySharedAnnotations(toApply as unknown as Annotation[]);
+      for (const a of toApply) {
+        applied.set(a.id, fp(a));
+      }
+    }, paintDelayMs);
+
+    return () => clearTimeout(timer);
+    // viewerRef is a stable ref object; intentionally omitted.
+    // eslint-disable-next-line react-hooks/exhaustive-deps
+  }, [annotations, enabled, planKey, surfaceGeneration, resetCount, paintDelayMs]);
+
+  const reset = useCallback(() => {
+    appliedRef.current.clear();
+    setResetCount(c => c + 1);
+  }, []);
+
+  return { reset };
+}
diff --git a/packages/ui/hooks/useAnnotationHighlighter.matrix.test.tsx b/packages/ui/hooks/useAnnotationHighlighter.matrix.test.tsx
new file mode 100644
index 000000000..7c163c3e1
--- /dev/null
+++ b/packages/ui/hooks/useAnnotationHighlighter.matrix.test.tsx
@@ -0,0 +1,260 @@
+/**
+ * Selection-accuracy characterization matrix.
+ *
+ * This is NOT a test that enforces desired behavior. It's a
+ * characterization of what the CURRENT `findTextInDOM` matcher in
+ * `useAnnotationHighlighter.ts` does — producing a
+ * pass/fail-per-category count that a future fix effort starts
+ * from. Reviewers reading the test output learn exactly which
+ * agent-shipped text shapes land on the wrong anchor, which fail
+ * entirely, and which work.
+ *
+ * If you change the matcher, update this test's expectations to
+ * describe the NEW behavior. Don't delete failing cases to make
+ * it green; the whole point is recording reality.
+ *
+ * The matcher logic is vendored verbatim from
+ * useAnnotationHighlighter.ts:173-236 (findTextInDOM closure).
+ * Any drift in the original needs a corresponding update here.
+ *
+ * See `specs/v1-selection-accuracy.md` for the write-up that
+ * explains which rows are bugs, which are acceptable, and the
+ * sketch of a fix.
+ */
+
+import { describe, expect, test } from 'bun:test';
+import { render } from '@testing-library/react';
+import React from 'react';
+
+// Vendored verbatim from useAnnotationHighlighter.ts:173-236.
+// Keep in sync if the source closure changes.
+function findTextInDOM(container: HTMLElement, searchText: string): Range | null {
+  const walker = document.createTreeWalker(container, NodeFilter.SHOW_TEXT, null);
+
+  let node: Text | null;
+  while ((node = walker.nextNode() as Text | null)) {
+    const text = node.textContent || '';
+    const index = text.indexOf(searchText);
+    if (index !== -1) {
+      const range = document.createRange();
+      range.setStart(node, index);
+      range.setEnd(node, index + searchText.length);
+      return range;
+    }
+  }
+
+  // Try across multiple text nodes for multi-line content
+  const fullText = container.textContent || '';
+  const searchIndex = fullText.indexOf(searchText);
+  if (searchIndex === -1) return null;
+
+  const walker2 = document.createTreeWalker(container, NodeFilter.SHOW_TEXT, null);
+
+  let charCount = 0;
+  let startNode: Text | null = null;
+  let startOffset = 0;
+  let endNode: Text | null = null;
+  let endOffset = 0;
+
+  while ((node = walker2.nextNode() as Text | null)) {
+    const nodeLength = node.textContent?.length || 0;
+
+    if (!startNode && charCount + nodeLength > searchIndex) {
+      startNode = node;
+      startOffset = searchIndex - charCount;
+    }
+
+    if (startNode && charCount + nodeLength >= searchIndex + searchText.length) {
+      endNode = node;
+      endOffset = searchIndex + searchText.length - charCount;
+      break;
+    }
+
+    charCount += nodeLength;
+  }
+
+  if (startNode && endNode) {
+    const range = document.createRange();
+    range.setStart(startNode, startOffset);
+    range.setEnd(endNode, endOffset);
+    return range;
+  }
+
+  return null;
+}
+
+interface MatrixCase {
+  n: number;
+  label: string;
+  /** DOM content for the container. Renderer-equivalent markup. */
+  dom: React.ReactElement;
+  /** What the agent would ship as `originalText`. */
+  agentShips: string;
+  /**
+   * What the CURRENT matcher does:
+   *   "found"  — returns a non-null range with text === agentShips
+   *   "missed" — returns null (annotation silently drops)
+   *
+   * Note that "found" does NOT imply "correct" for the agent's
+   * intent. A case where the same substring appears multiple times
+   * in the block still returns "found" (first occurrence), even
+   * though the agent may have meant a different occurrence. Such
+   * cases are classified as `found` here but carry an
+   * `ambiguous: true` flag so the spec note can single them out.
+   */
+  currentBehavior: 'found' | 'missed';
+  /** True when "found" but on potentially-wrong text without more context. */
+  ambiguous?: boolean;
+  /** Short commentary for the write-up. */
+  note: string;
+}
+
+const CASES: MatrixCase[] = [
+  {
+    n: 1,
+    label: 'exact match, plain text',
+    dom: <p>The quick brown fox</p>,
+    agentShips: 'quick brown fox',
+    currentBehavior: 'found',
+    note: 'Happy path; indexOf hits.',
+  },
+  {
+    n: 2,
+    label: 'trailing whitespace on agent side',
+    dom: <p>The quick brown fox</p>,
+    agentShips: 'quick brown fox ', // trailing space
+    currentBehavior: 'missed',
+    note: 'indexOf requires exact match; trailing whitespace not tolerated.',
+  },
+  {
+    n: 3,
+    label: 'leading whitespace on agent side',
+    dom: <p>The quick brown fox</p>,
+    agentShips: ' quick brown fox',
+    currentBehavior: 'found',
+    note: 'indexOf finds " quick brown fox" starting at the space BETWEEN "The" and "quick" — match succeeds because the DOM happens to contain the leading-space variant as a substring. Brittle: works only when the preceding character is a space; different formatting would flip this to miss.',
+  },
+  {
+    n: 4,
+    label: 'extra space between words (agent shipped double-space)',
+    dom: <p>The quick brown fox</p>,
+    agentShips: 'quick  brown fox', // two spaces
+    currentBehavior: 'missed',
+    note: 'Whitespace normalization not applied; double-space != single-space.',
+  },
+  {
+    n: 5,
+    label: 'tab vs spaces (agent shipped tab)',
+    dom: <p>The quick brown fox</p>,
+    agentShips: 'quick\tbrown fox',
+    currentBehavior: 'missed',
+    note: 'Tab treated as literal; no tab→space normalization.',
+  },
+  {
+    n: 6,
+    label: 'non-breaking space vs regular space',
+    dom: <p>{'The quick\u00A0brown fox'}</p>, // DOM has NBSP
+    agentShips: 'quick brown fox', // agent ships regular space
+    currentBehavior: 'missed',
+    note: 'NBSP (U+00A0) != space (U+0020); agents that copy from rendered HTML may ship one and see the other.',
+  },
+  {
+    n: 7,
+    label: 'agent ships **markdown** when DOM renders bolded text',
+    dom: (
+      <p>
+        The <strong>quick</strong> brown fox
+      </p>
+    ),
+    agentShips: 'the **quick** brown fox',
+    currentBehavior: 'missed',
+    note: 'Rendered DOM has "The quick brown fox"; agent ships markdown source. No markdown-stripping.',
+  },
+  {
+    n: 8,
+    label: 'agent ships _italic_ when DOM renders italicized text',
+    dom: (
+      <p>
+        The <em>quick</em> brown fox
+      </p>
+    ),
+    agentShips: 'the _quick_ brown fox',
+    currentBehavior: 'missed',
+    note: 'Same family as case 7. DOM has no underscores.',
+  },
+  {
+    n: 9,
+    label: 'agent ships text spanning two blocks',
+    dom: (
+      <div>
+        <p>first block ends here.</p>
+        <p>second block starts there.</p>
+      </div>
+    ),
+    agentShips: 'ends here.\nsecond block starts there.',
+    currentBehavior: 'missed',
+    note: 'Single-node pass looks at one text node at a time; multi-node pass uses container.textContent which concatenates WITHOUT inserting the newline the agent shipped.',
+  },
+  {
+    n: 10,
+    label: 'text appears twice in block; agent wants the second occurrence',
+    dom: <p>fox jumps. fox sleeps.</p>,
+    agentShips: 'fox',
+    currentBehavior: 'found',
+    ambiguous: true,
+    note: 'Matcher returns the FIRST occurrence. Agent has no way to request the second without shipping more surrounding context. Silent anchor mismatch to the agent\'s intent.',
+  },
+  {
+    n: 11,
+    label: 'agent ships the exact whole-block content',
+    dom: <p>A complete thought in one paragraph.</p>,
+    agentShips: 'A complete thought in one paragraph.',
+    currentBehavior: 'found',
+    note: 'Block-level targeting is robust. The collab-agent CLI uses this pattern exclusively in V1.',
+  },
+  {
+    n: 12,
+    label: 'smart quote (U+201C/U+201D) vs straight quote',
+    dom: <p>{'She said \u201Chello\u201D quietly.'}</p>,
+    agentShips: '"hello"', // straight ASCII quotes
+    currentBehavior: 'missed',
+    note: 'Markdown renderers often convert " → U+201C / U+201D. Agents copying from source see straight; DOM has curly.',
+  },
+];
+
+/**
+ * Render the case's DOM and return the container element.
+ */
+function renderCase(c: MatrixCase): HTMLElement {
+  const { container } = render(<div data-testid="root">{c.dom}</div>);
+  return container.querySelector('[data-testid="root"]') as HTMLElement;
+}
+
+describe('selection-accuracy matrix (findTextInDOM characterization)', () => {
+  for (const c of CASES) {
+    test(`${String(c.n).padStart(2, '0')}: ${c.label}`, () => {
+      const container = renderCase(c);
+      const range = findTextInDOM(container, c.agentShips);
+
+      if (c.currentBehavior === 'missed') {
+        expect(range).toBeNull();
+      } else {
+        expect(range).not.toBeNull();
+        expect(range!.toString()).toBe(c.agentShips);
+      }
+    });
+  }
+
+  test('summary: category counts', () => {
+    const found = CASES.filter(c => c.currentBehavior === 'found');
+    const missed = CASES.filter(c => c.currentBehavior === 'missed');
+    const ambiguous = CASES.filter(c => c.ambiguous);
+    console.log(
+      `\n[selection-accuracy matrix] ` +
+        `found=${found.length} missed=${missed.length} ambiguous=${ambiguous.length} ` +
+        `(of ${CASES.length} cases). ` +
+        `"ambiguous" = matcher returns a range but not necessarily on the agent's intended text.`,
+    );
+    expect(found.length + missed.length).toBe(CASES.length);
+  });
+});
diff --git a/packages/ui/hooks/useAnnotationHighlighter.ts b/packages/ui/hooks/useAnnotationHighlighter.ts
index 63ab2dcab..94452184b 100644
--- a/packages/ui/hooks/useAnnotationHighlighter.ts
+++ b/packages/ui/hooks/useAnnotationHighlighter.ts
@@ -44,6 +44,29 @@ export interface UseAnnotationHighlighterOptions {
   selectedAnnotationId: string | null;
   mode: EditorMode;
   enabled?: boolean;
+  /**
+   * Override the `author` field stamped on newly-created annotations.
+   * When unset, falls back to `getIdentity()` (configStore displayName,
+   * the cookie-backed Tater name). Passed from App when in room mode so
+   * annotations carry the identity the participant typed into the
+   * JoinRoomGate instead of a stale/missing per-origin cookie —
+   * participants on room.plannotator.ai don't have the creator's
+   * local-origin Tater cookie and would otherwise get generated names
+   * that don't match the cursor label peers see.
+   */
+  authorOverride?: string;
+  /**
+   * Invoked whenever the underlying highlight surface is (re)initialized
+   * or explicitly cleared via `clearAllHighlights()`. Consumers (the
+   * Viewer) translate this into a monotonically-bumped generation that
+   * downstream reconcilers use to clear their applied-highlight caches.
+   *
+   * Fires AFTER the surface change is in effect — on init, after the
+   * highlighter is constructed and `highlighterRef.current` is set; on
+   * clear, after the DOM marks are removed. Same-tick re-entry is safe
+   * because React effects run after commit.
+   */
+  onSurfaceReset?: () => void;
 }
 
 export interface UseAnnotationHighlighterReturn {
@@ -75,7 +98,18 @@ export function useAnnotationHighlighter({
   selectedAnnotationId,
   mode,
   enabled = true,
+  authorOverride,
+  onSurfaceReset,
 }: UseAnnotationHighlighterOptions): UseAnnotationHighlighterReturn {
+  // Ref so the annotation-creation closure sees the latest override
+  // without re-binding event handlers on every change.
+  const authorOverrideRef = useRef(authorOverride);
+  useEffect(() => { authorOverrideRef.current = authorOverride; }, [authorOverride]);
+  // Ref for the surface-reset callback so the init effect can call the
+  // latest version without re-binding (and dropping) the highlighter on
+  // every parent re-render.
+  const onSurfaceResetRef = useRef(onSurfaceReset);
+  useEffect(() => { onSurfaceResetRef.current = onSurfaceReset; }, [onSurfaceReset]);
   const highlighterRef = useRef<Highlighter | null>(null);
   const modeRef = useRef<EditorMode>(mode);
   const onAddAnnotationRef = useRef(onAddAnnotation);
@@ -222,7 +256,7 @@ export function useAnnotationHighlighter({
       text,
       originalText: source.text,
       createdA: Date.now(),
-      author: getIdentity(),
+      author: authorOverrideRef.current ?? getIdentity(),
       startMeta: source.startMeta,
       endMeta: source.endMeta,
       images,
@@ -370,6 +404,10 @@ export function useAnnotationHighlighter({
       }
       el.remove();
     });
+
+    // DOM marks are gone; any reconciler that was tracking "already
+    // applied" needs to know so it can repaint from scratch.
+    onSurfaceResetRef.current?.();
   }, []);
 
   // --- Effects ---
@@ -386,6 +424,10 @@ export function useAnnotationHighlighter({
     });
 
     highlighterRef.current = highlighter;
+    // Surface exists and is empty — let reconcilers (external SSE,
+    // room annotations) know so they clear any stale applied maps
+    // inherited from before the surface was (re)created.
+    onSurfaceResetRef.current?.();
 
     highlighter.on(Highlighter.event.CREATE, ({ sources }: { sources: any[] }) => {
       if (sources.length > 0) {
@@ -436,7 +478,9 @@ export function useAnnotationHighlighter({
 
     highlighter.run();
 
-    // Mobile bridge
+    // Mobile bridge — on touch devices, forward selectionchange events
+    // into the highlighter via a debounced fromRange() call so
+    // tap-and-hold selections surface the annotation toolbar.
     const isTouchPrimary = window.matchMedia('(pointer: coarse)').matches;
     let selectionTimer: ReturnType<typeof setTimeout>;
     const handleSelectionChange = isTouchPrimary
diff --git a/packages/ui/hooks/useDismissOnOutsideAndEscape.ts b/packages/ui/hooks/useDismissOnOutsideAndEscape.ts
index d0df6ed08..1e2d9dd66 100644
--- a/packages/ui/hooks/useDismissOnOutsideAndEscape.ts
+++ b/packages/ui/hooks/useDismissOnOutsideAndEscape.ts
@@ -6,7 +6,10 @@ export function useDismissOnOutsideAndEscape({
   onDismiss,
 }: {
   enabled: boolean;
-  ref: React.RefObject<HTMLElement>;
+  // React 18→19 migration: `useRef<HTMLElement>(null)` returns
+  // `RefObject<HTMLElement | null>` now, so callers can't pass a
+  // non-null-typed ref here. Accept the nullable form.
+  ref: React.RefObject<HTMLElement | null>;
   onDismiss: () => void;
 }) {
   useEffect(() => {
diff --git a/packages/ui/hooks/useExternalAnnotationHighlights.ts b/packages/ui/hooks/useExternalAnnotationHighlights.ts
index 2d5cdf021..88b216d3e 100644
--- a/packages/ui/hooks/useExternalAnnotationHighlights.ts
+++ b/packages/ui/hooks/useExternalAnnotationHighlights.ts
@@ -1,28 +1,33 @@
-import { useCallback, useEffect, useRef, useState } from 'react';
-import type { Annotation } from '../types';
-import { AnnotationType } from '../types';
+import { AnnotationType, type Annotation } from '../types';
 import type { ViewerHandle } from '../components/Viewer';
+import {
+  useAnnotationHighlightReconciler,
+  type UseAnnotationHighlightReconcilerReturn,
+} from './useAnnotationHighlightReconciler';
 
 /**
  * Bridges SSE-delivered external annotations into the Viewer's imperative
  * highlight API so tools can POST annotations with `originalText` and have
  * them highlight real spans of the rendered plan.
  *
- * The Viewer's `applySharedAnnotations` already searches the DOM for
- * `originalText` and dedupes against already-applied marks, so this hook
- * just needs to drive it when the external list changes.
+ * This is a thin wrapper around `useAnnotationHighlightReconciler` that
+ * pins the external-specific eligibility filter and fingerprint. The
+ * reconciler is also used by room mode in `App.tsx`; keeping a named
+ * external-facing hook preserves existing call sites and keeps the
+ * external fingerprint (which deliberately excludes comment `text`)
+ * distinct from the room fingerprint.
  *
  * - Annotations without `originalText` (or `GLOBAL_COMMENT`) stay sidebar-only.
  * - Annotations with `diffContext` are skipped (diff view owns those).
- * - On plan markdown change the applied set is cleared so re-rendered blocks
- *   get re-highlighted.
- * - Callers can invoke the returned `reset()` to force a full re-apply — used
- *   by the share-import path in App.tsx after it calls `clearAllHighlights()`,
- *   which would otherwise leave our bookkeeping stale against a wiped DOM.
- * - Disabled state no-ops WITHOUT clearing the applied set. This preserves the
- *   bookkeeping while the Viewer DOM is hidden (diff view / linked doc) so that
- *   any SSE removals that arrive while hidden are correctly reconciled when the
- *   hook re-enables.
+ * - The Viewer's `onHighlightSurfaceReset` event bumps the parent-owned
+ *   generation counter; callers thread that counter in via
+ *   `surfaceGeneration` so reconcilers automatically repaint when the
+ *   highlighter surface is reset (e.g. `clearAllHighlights` during share
+ *   import, or a Viewer remount). The `reset()` escape hatch remains for
+ *   paths that can't wire a generation signal.
+ * - Disabled state no-ops WITHOUT clearing the applied set. This preserves
+ *   the bookkeeping while the Viewer DOM is hidden (diff view / linked doc)
+ *   so any SSE removals that arrive while hidden reconcile on re-enable.
  */
 export function useExternalAnnotationHighlights(params: {
   viewerRef: React.RefObject<ViewerHandle | null>;
@@ -30,76 +35,30 @@ export function useExternalAnnotationHighlights(params: {
   enabled: boolean;
   /** Bump to force a full re-apply (e.g. plan markdown changed and blocks re-rendered). */
   planKey: string;
-}): { reset: () => void } {
-  const { viewerRef, externalAnnotations, enabled, planKey } = params;
+  /** Monotonic counter from Viewer; clears tracking on highlighter reset. Default 0. */
+  surfaceGeneration?: number;
+}): UseAnnotationHighlightReconcilerReturn {
+  const { viewerRef, externalAnnotations, enabled, planKey, surfaceGeneration = 0 } = params;
 
-  // Tracks annotation IDs currently materialized as DOM highlights, along
-  // with a fingerprint so updates trigger remove+reapply.
-  const appliedRef = useRef<Map<string, string>>(new Map());
-
-  // Bumped to force the main effect to treat every current external as a
-  // fresh application target — used by `reset()` below.
-  const [resetCount, setResetCount] = useState(0);
-
-  // Clear tracking when plan content changes — the Viewer re-parses blocks
-  // and wipes marks, so our bookkeeping is stale.
-  useEffect(() => {
-    appliedRef.current.clear();
-  }, [planKey]);
-
-  useEffect(() => {
-    if (!enabled) return;
-
-    const viewer = viewerRef.current;
-    if (!viewer) return;
-
-    const eligible = externalAnnotations.filter(
-      a => a.type !== AnnotationType.GLOBAL_COMMENT && !a.diffContext && a.originalText,
-    );
-    const applied = appliedRef.current;
-
-    // Removals: previously applied but no longer present, or fingerprint changed.
-    const toRemove: string[] = [];
-    for (const [id, fp] of applied) {
-      const match = eligible.find(a => a.id === id);
-      if (!match || fingerprint(match) !== fp) {
-        toRemove.push(id);
-      }
-    }
-    toRemove.forEach(id => {
-      viewer.removeHighlight(id);
-      applied.delete(id);
-    });
-
-    // Additions: eligible but not yet applied (includes re-adds from updates).
-    const toAdd = eligible.filter(a => !applied.has(a.id));
-    if (toAdd.length === 0) return;
-
-    // Paint delay matches the existing draft/share restore pattern —
-    // ensures blocks are mounted before we walk the DOM.
-    const timer = setTimeout(() => {
-      const v = viewerRef.current;
-      if (!v) return;
-      v.applySharedAnnotations(toAdd);
-      toAdd.forEach(a => applied.set(a.id, fingerprint(a)));
-    }, 100);
-
-    return () => clearTimeout(timer);
-    // viewerRef is a stable ref object and intentionally omitted from deps.
-  }, [externalAnnotations, enabled, planKey, resetCount]);
-
-  // Forget everything we've tracked and force a full re-apply on the next
-  // effect run. Callers invoke this after an external action has wiped the
-  // Viewer DOM out from under us (e.g. `clearAllHighlights()` during share
-  // import) so live externals get repainted.
-  const reset = useCallback(() => {
-    appliedRef.current.clear();
-    setResetCount(c => c + 1);
-  }, []);
+  return useAnnotationHighlightReconciler<Annotation>({
+    viewerRef,
+    annotations: externalAnnotations,
+    enabled,
+    planKey,
+    surfaceGeneration,
+    eligibleFilter: externalEligible,
+    fingerprint: externalFingerprint,
+  });
+}
 
-  return { reset };
+function externalEligible(a: Annotation): boolean {
+  return a.type !== AnnotationType.GLOBAL_COMMENT && !a.diffContext && !!a.originalText;
 }
 
-function fingerprint(a: Annotation): string {
+// External annotations can be updated by tools via PATCH, but the apply
+// path keys off `originalText`; comment `text` changes do not require
+// repainting the mark. Keep the external fingerprint focused on the
+// fields the DOM surface actually depends on.
+function externalFingerprint(a: Annotation): string {
   return `${a.type}\u0000${a.originalText}`;
 }
diff --git a/packages/ui/hooks/useSharing.ts b/packages/ui/hooks/useSharing.ts
index 7d5bb9846..614509a2b 100644
--- a/packages/ui/hooks/useSharing.ts
+++ b/packages/ui/hooks/useSharing.ts
@@ -99,6 +99,7 @@ export function useSharing(
   onSharedLoad?: () => void,
   shareBaseUrl?: string,
   pasteApiUrl?: string,
+  disabled?: boolean,
   rawHtml?: string,
   setRawHtml?: (h: string) => void,
   setRenderAs?: (m: 'markdown' | 'html') => void,
@@ -238,13 +239,30 @@ export function useSharing(
     }
   }, [setMarkdown, setAnnotations, setGlobalAttachments, onSharedLoad, pasteApiUrl, setRawHtml, setRenderAs]);
 
-  // Load from hash on mount
+  // Load from hash on mount. Captured from the FIRST render and never
+  // re-evaluated: in room mode the URL fragment is `#key=<roomSecret>`
+  // and must never be parsed as a static-share payload, even if some
+  // future code path flips `disabled` from true to false (e.g. a mode
+  // transition). Keying this effect on `disabled` would re-parse the
+  // room fragment and surface a spurious "Failed to load shared plan"
+  // error. The initial capture is the single source of truth for
+  // "is this a share-eligible mount?".
+  const initiallyDisabledRef = useRef(disabled);
   useEffect(() => {
+    if (initiallyDisabledRef.current) {
+      setIsLoadingShared(false);
+      return;
+    }
     loadFromHash().finally(() => setIsLoadingShared(false));
-  }, []); // Only run on mount
+    // Intentionally mount-only. `loadFromHash` identity changes on
+    // prop updates and MUST NOT retrigger this effect.
+    // eslint-disable-next-line react-hooks/exhaustive-deps
+  }, []);
 
-  // Listen for hash changes (when user pastes a new share URL)
+  // Listen for hash changes (when user pastes a new share URL). Also skipped
+  // when disabled so hashchange events inside a live room are ignored.
   useEffect(() => {
+    if (disabled) return;
     const handleHashChange = () => {
       if (!looksLikeSharePayload(window.location.hash)) return;
       loadFromHash();
@@ -252,7 +270,7 @@ export function useSharing(
 
     window.addEventListener('hashchange', handleHashChange);
     return () => window.removeEventListener('hashchange', handleHashChange);
-  }, [loadFromHash]);
+  }, [loadFromHash, disabled]);
 
   // Generate share URL when markdown or annotations change
   const refreshShareUrl = useCallback(async () => {
@@ -267,10 +285,12 @@ export function useSharing(
     }
   }, [markdown, annotations, globalAttachments, shareBaseUrl, rawHtml]);
 
-  // Auto-refresh share URL when dependencies change
+  // Auto-refresh share URL when dependencies change. Skipped in room mode:
+  // static share URLs are not produced for live-room sessions.
   useEffect(() => {
+    if (disabled) return;
     refreshShareUrl();
-  }, [refreshShareUrl]);
+  }, [refreshShareUrl, disabled]);
 
   // Clear stale short URL when content changes (does NOT auto-regenerate —
   // the user must explicitly click "Create short link" again).
@@ -351,7 +371,10 @@ export function useSharing(
         payload = (await decompress(hash)) as SharePayload;
       }
 
-      // Extract plan title from embedded plan text (or HTML <title>)
+      if (!payload) {
+        return { success: false, count: 0, planTitle: '', error: 'Invalid share URL: no payload decoded' };
+      }
+
       let planTitle = 'Unknown Plan';
       if (payload.p) {
         const titleLine = payload.p.trim().split('\n').find(l => l.startsWith('#'));
diff --git a/packages/ui/package.json b/packages/ui/package.json
index 14d6dce97..8b7e9fb90 100644
--- a/packages/ui/package.json
+++ b/packages/ui/package.json
@@ -35,10 +35,13 @@
     "unique-username-generator": "^1.5.1"
   },
   "devDependencies": {
+    "@happy-dom/global-registrator": "^20.8.9",
+    "@testing-library/react": "^16.3.2",
     "@types/bun": "^1.2.0",
     "@types/dompurify": "^3.0.5",
     "@types/react": "^19.2.0",
     "@types/react-dom": "^19.2.0",
+    "happy-dom": "^20.8.9",
     "typescript": "~5.8.2"
   },
   "scripts": {
diff --git a/packages/ui/test-setup.ts b/packages/ui/test-setup.ts
new file mode 100644
index 000000000..26412e61a
--- /dev/null
+++ b/packages/ui/test-setup.ts
@@ -0,0 +1,25 @@
+/**
+ * Bun-test happy-dom bootstrap for DOM-dependent tests in @plannotator/ui and
+ * @plannotator/editor.
+ *
+ * Registered via `preload = ["./test-setup.ts"]` in `packages/ui/bunfig.toml`
+ * (scoped to this package) so other packages' tests don't pay the DOM cost.
+ *
+ * Installing the DOM globally means `document`, `window`, `Node`, etc. are
+ * available in every test in this scope, matching how React Testing Library
+ * expects to run.
+ */
+
+import { GlobalRegistrator } from '@happy-dom/global-registrator';
+
+if (!GlobalRegistrator.isRegistered) {
+  GlobalRegistrator.register({
+    url: 'http://localhost/',
+    width: 1024,
+    height: 768,
+  });
+}
+
+// Tell React that we're in an act-aware test environment so warnings don't
+// appear for every state update wrapped in renderHook/act.
+(globalThis as unknown as { IS_REACT_ACT_ENVIRONMENT?: boolean }).IS_REACT_ACT_ENVIRONMENT = true;
diff --git a/packages/ui/tsconfig.slice5.json b/packages/ui/tsconfig.slice5.json
new file mode 100644
index 000000000..66bd0b537
--- /dev/null
+++ b/packages/ui/tsconfig.slice5.json
@@ -0,0 +1,79 @@
+// Slice-5 scoped typecheck — lists the UI files we actively curate
+// for Live Rooms correctness.
+//
+// Explicit curation (the `include` list):
+//   - hooks added for room mode (useCollabRoom, useCollabRoomSession,
+//     useAnnotationController, useRoomMode, usePresenceThrottle)
+//   - hooks whose types changed for Slice 5 (useAnnotationHighlighter
+//     for authorOverride)
+//   - components/collab/** (all new)
+//   - components whose public API changed for Slice 5 (AnnotationPanel
+//     for authorOverride, Viewer for same)
+//   - utils added for Slice 5 (adminSecretStorage, blockTargeting)
+//
+// Transitive reality: the included files pull in siblings via normal
+// imports, and those files ARE type-checked. Errors anywhere in that
+// import closure block `bun run typecheck`. That's the point — this
+// config exists to catch the kind of bug that the old single-file
+// `tsconfig.collab.json` missed (the AnnotationPanel `isMe` scope
+// bug went unflagged for multiple review rounds because the narrower
+// config only loaded `useCollabRoom.ts`).
+//
+// What's intentionally NOT here: the rest of packages/ui. It has
+// pre-existing strict-mode drift unrelated to Live Rooms. A
+// package-wide typecheck is deferred to a later cleanup pass; this
+// config should not grow into one by accident.
+//
+// Replaces the previous `tsconfig.collab.json` (Slice 4, one file).
+// Root `bun run typecheck` references THIS file.
+{
+  "compilerOptions": {
+    "target": "ES2022",
+    "experimentalDecorators": true,
+    "useDefineForClassFields": false,
+    "module": "ESNext",
+    "lib": [
+      "ES2022",
+      "DOM",
+      "DOM.Iterable"
+    ],
+    "skipLibCheck": true,
+    "types": [
+      "node"
+    ],
+    "moduleResolution": "bundler",
+    "isolatedModules": true,
+    "moduleDetection": "force",
+    "allowJs": true,
+    "jsx": "react-jsx",
+    "paths": {
+      "@plannotator/ui/*": ["./*"],
+      "@plannotator/shared": ["../shared/index.ts"],
+      "@plannotator/shared/*": ["../shared/*"]
+    },
+    "allowImportingTsExtensions": true,
+    "noEmit": true
+  },
+  "include": [
+    "components/types.d.ts",
+    "hooks/collab/useCollabRoom.ts",
+    "hooks/collab/useCollabRoomSession.ts",
+    "hooks/useAnnotationController.ts",
+    "hooks/useAnnotationHighlighter.ts",
+    "hooks/collab/useRoomMode.ts",
+    "hooks/collab/usePresenceThrottle.ts",
+    "components/collab/**/*.tsx",
+    "components/collab/**/*.ts",
+    "components/AnnotationPanel.tsx",
+    "components/Viewer.tsx",
+    "utils/adminSecretStorage.ts",
+    "utils/blockTargeting.ts"
+  ],
+  "exclude": [
+    // Tests are run through `bun test` with the packages/ui bunfig
+    // preload; pulling them into typecheck brings in `bun:test` types
+    // that aren't part of this scoped config.
+    "**/*.test.ts",
+    "**/*.test.tsx"
+  ]
+}
diff --git a/packages/ui/types/annotationController.ts b/packages/ui/types/annotationController.ts
new file mode 100644
index 000000000..51c5102cf
--- /dev/null
+++ b/packages/ui/types/annotationController.ts
@@ -0,0 +1,82 @@
+/**
+ * AnnotationController — uniform mutation surface for the editor across
+ * local-only and live-room modes.
+ *
+ * App.tsx calls `controller.add/update/remove/clear` without caring whether
+ * state is owned by `useState` (local mode) or by `useCollabRoom` (room mode).
+ * Previously every mutation site in App.tsx called `setAnnotations(prev => ...)`
+ * directly; that pattern does not compose with the server-authoritative
+ * write model of live rooms.
+ *
+ * One field is implementation-specific and optional:
+ *   - `setAll` — local mode only. Exposed for `useSharing` (shared-URL
+ *     import) and draft-restore paths that need to REPLACE the entire list
+ *     atomically. Room mode cannot express "replace all" as a single
+ *     protocol op; callers must branch on `controller.setAll`.
+ *
+ * `pending` holds operations that have been sent but whose echo hasn't
+ * arrived yet. Keyed by id with the op kind attached. The room-mode
+ * reconciliation is kind-specific:
+ *   - add:    clears only when the id appears in room.annotations;
+ *             unrelated seq advances must NOT clear, or the optimistic
+ *             row in `pendingAdditions` would lose its "Sending…" chrome.
+ *   - update: clears once room.seq > sentAtSeq (concurrent supersession
+ *             is fine — canonical list shows the winning value).
+ *   - remove: clears once room.seq > sentAtSeq (no optimistic row to
+ *             strand; spurious clear on remove-of-absent is harmless).
+ * See `useAnnotationController.ts` for the full rationale.
+ *
+ * `failed` holds entries whose last send attempt rejected. Each carries
+ * kind + payload so the UI can offer per-op Retry/Discard without the
+ * caller holding onto the original Annotation reference. Slice 5 is
+ * online-only — failed ops do NOT auto-replay on reconnect.
+ */
+
+import type { Annotation } from '../types';
+
+export type PendingKind = 'add' | 'update' | 'remove';
+
+export interface PendingOp {
+  id: string;
+  kind: PendingKind;
+}
+
+export interface FailedOp {
+  id: string;
+  kind: PendingKind;
+  /** Human-readable error summary suitable for a tooltip/toast. */
+  error: string;
+}
+
+export interface AnnotationController {
+  mode: 'local' | 'room';
+  /**
+   * Canonical annotation list. In room mode this is ONLY the
+   * server-echoed state — pending adds do NOT appear here, so
+   * consumers that feed approve/deny/export never include un-confirmed
+   * ops (V1 contract: server-authoritative, no optimistic apply).
+   */
+  annotations: Annotation[];
+  /**
+   * Optimistic rows for sends that haven't been echoed yet. UI-only —
+   * render these in the annotation panel for "Sending…" feedback, but
+   * NEVER merge into approve/deny/export payloads. Always empty in
+   * local mode.
+   */
+  pendingAdditions: ReadonlyMap<string, Annotation>;
+  pending: ReadonlyMap<string, PendingOp>;
+  failed: ReadonlyMap<string, FailedOp>;
+
+  add(annotation: Annotation): void;
+  update(id: string, patch: Partial<Annotation>): void;
+  remove(id: string): void;
+  clear(source?: string): void;
+
+  /** Retry a previously-failed send. No-op in local mode. */
+  retry?(id: string): void;
+  /** Drop a failed pending record without retrying. No-op in local mode. */
+  discard?(id: string): void;
+
+  /** Local mode only. Atomic replace-all; undefined in room mode. */
+  setAll?: React.Dispatch<React.SetStateAction<Annotation[]>>;
+}
diff --git a/packages/ui/utils/adminSecretStorage.test.ts b/packages/ui/utils/adminSecretStorage.test.ts
new file mode 100644
index 000000000..249ac07ca
--- /dev/null
+++ b/packages/ui/utils/adminSecretStorage.test.ts
@@ -0,0 +1,72 @@
+import { afterEach, beforeEach, describe, expect, test } from 'bun:test';
+import { storeAdminSecret, loadAdminSecret, clearAdminSecret } from './adminSecretStorage';
+
+// 43-char base64url values for 32 random bytes — matches the on-wire admin
+// secret shape validated by `isBase64Url32ByteString`.
+const VALID_A = 'A'.repeat(43);
+const VALID_B = 'B'.repeat(43);
+const VALID_C = 'C'.repeat(43);
+
+describe('adminSecretStorage', () => {
+  beforeEach(() => {
+    sessionStorage.clear();
+  });
+  afterEach(() => {
+    sessionStorage.clear();
+  });
+
+  test('store/load round-trip', () => {
+    storeAdminSecret('room-a', VALID_A);
+    expect(loadAdminSecret('room-a')).toBe(VALID_A);
+  });
+
+  test('load returns null for unknown roomId', () => {
+    expect(loadAdminSecret('nonexistent')).toBeNull();
+  });
+
+  test('entries are scoped per roomId — storing one does not affect another', () => {
+    storeAdminSecret('room-a', VALID_A);
+    storeAdminSecret('room-b', VALID_B);
+    expect(loadAdminSecret('room-a')).toBe(VALID_A);
+    expect(loadAdminSecret('room-b')).toBe(VALID_B);
+  });
+
+  test('clear removes only the targeted room', () => {
+    storeAdminSecret('room-a', VALID_A);
+    storeAdminSecret('room-b', VALID_B);
+    clearAdminSecret('room-a');
+    expect(loadAdminSecret('room-a')).toBeNull();
+    expect(loadAdminSecret('room-b')).toBe(VALID_B);
+  });
+
+  test('clear on unknown roomId is a no-op', () => {
+    expect(() => clearAdminSecret('nonexistent')).not.toThrow();
+  });
+
+  test('overwriting an existing secret replaces the old value', () => {
+    storeAdminSecret('room-a', VALID_A);
+    storeAdminSecret('room-a', VALID_C);
+    expect(loadAdminSecret('room-a')).toBe(VALID_C);
+  });
+
+  test('uses the documented key prefix so storage inspection is predictable', () => {
+    storeAdminSecret('room-xyz', VALID_A);
+    expect(sessionStorage.getItem('plannotator.room.admin.room-xyz')).toBe(VALID_A);
+  });
+
+  test('load rejects and evicts a malformed stored value', () => {
+    // Simulate a corrupted sessionStorage entry — shape validation catches
+    // pre-validation values from older builds or external tampering.
+    sessionStorage.setItem('plannotator.room.admin.room-a', 'not-a-valid-secret');
+    expect(loadAdminSecret('room-a')).toBeNull();
+    // Evicted so subsequent reads don't keep rejecting the same garbage.
+    expect(sessionStorage.getItem('plannotator.room.admin.room-a')).toBeNull();
+  });
+
+  test('load rejects a stored value of the wrong length even if base64url-safe', () => {
+    // 42 chars — one short of a 32-byte base64url string.
+    sessionStorage.setItem('plannotator.room.admin.room-a', 'A'.repeat(42));
+    expect(loadAdminSecret('room-a')).toBeNull();
+    expect(sessionStorage.getItem('plannotator.room.admin.room-a')).toBeNull();
+  });
+});
diff --git a/packages/ui/utils/adminSecretStorage.ts b/packages/ui/utils/adminSecretStorage.ts
new file mode 100644
index 000000000..42186843d
--- /dev/null
+++ b/packages/ui/utils/adminSecretStorage.ts
@@ -0,0 +1,81 @@
+/**
+ * Admin secret persistence for room creators.
+ *
+ * Scope: sessionStorage, keyed per roomId (`plannotator.room.admin.<roomId>`).
+ * Survives tab refresh, dies on tab close. Deliberately NOT localStorage —
+ * the adminSecret is a URL-fragment-grade credential; long-term persistence
+ * would outlive the user's intent. Deliberately NOT in-memory only — the
+ * creator must be able to refresh their tab without losing admin capability.
+ *
+ * Threat model: anything that can read sessionStorage in this origin already
+ * controls the tab. The adminSecret grants delete on one specific room;
+ * leaking it out of sessionStorage would only happen via XSS in the same
+ * origin, at which point the attacker already has full control.
+ *
+ * Values are stored as base64url strings so a caller consuming
+ * `loadAdminSecret()` decodes the same format `parseRoomUrl()` produces from
+ * the fragment. The read path validates the shape on load and evicts
+ * malformed entries so downstream admin-join paths never see garbage.
+ */
+
+import { isBase64Url32ByteString } from '@plannotator/shared/collab/validation';
+
+const KEY_PREFIX = 'plannotator.room.admin.';
+
+function storageKey(roomId: string): string {
+  return `${KEY_PREFIX}${roomId}`;
+}
+
+/** Best-effort sessionStorage access — returns null if unavailable (SSR, sandboxed iframe). */
+function getStorage(): Storage | null {
+  try {
+    if (typeof sessionStorage === 'undefined') return null;
+    // Probe for quota / disabled storage without throwing.
+    const probeKey = `${KEY_PREFIX}__probe__`;
+    sessionStorage.setItem(probeKey, '1');
+    sessionStorage.removeItem(probeKey);
+    return sessionStorage;
+  } catch {
+    return null;
+  }
+}
+
+export function storeAdminSecret(roomId: string, adminSecretBase64url: string): void {
+  const s = getStorage();
+  if (!s) return;
+  try {
+    s.setItem(storageKey(roomId), adminSecretBase64url);
+  } catch {
+    // Quota / disabled — silently give up. The caller should degrade to
+    // "admin capability will be lost on refresh" rather than failing.
+  }
+}
+
+export function loadAdminSecret(roomId: string): string | null {
+  const s = getStorage();
+  if (!s) return null;
+  try {
+    const raw = s.getItem(storageKey(roomId));
+    if (raw === null) return null;
+    if (!isBase64Url32ByteString(raw)) {
+      // Evict so a bad value doesn't live on across reloads and so callers
+      // that key off "has stored secret?" don't attempt to recover admin
+      // capability from garbage.
+      try { s.removeItem(storageKey(roomId)); } catch { /* ignore */ }
+      return null;
+    }
+    return raw;
+  } catch {
+    return null;
+  }
+}
+
+export function clearAdminSecret(roomId: string): void {
+  const s = getStorage();
+  if (!s) return;
+  try {
+    s.removeItem(storageKey(roomId));
+  } catch {
+    // ignore
+  }
+}
diff --git a/packages/ui/utils/agentIdentity.test.ts b/packages/ui/utils/agentIdentity.test.ts
new file mode 100644
index 000000000..645ae092d
--- /dev/null
+++ b/packages/ui/utils/agentIdentity.test.ts
@@ -0,0 +1,156 @@
+import { describe, expect, test } from 'bun:test';
+import {
+  AGENT_TYPES,
+  constructAgentIdentity,
+  getAgentType,
+  InvalidAgentIdentityError,
+  isAgentIdentity,
+  toAgentUserSlug,
+} from './agentIdentity';
+
+describe('isAgentIdentity', () => {
+  test('true for canonical forms', () => {
+    expect(isAgentIdentity('alice-agent-claude')).toBe(true);
+    expect(isAgentIdentity('swift-falcon-tater-agent-codex')).toBe(true);
+    expect(isAgentIdentity('user123-agent-opencode')).toBe(true);
+    expect(isAgentIdentity('multi-dash-user-agent-junie')).toBe(true);
+    expect(isAgentIdentity('something-agent-other')).toBe(true);
+  });
+
+  test('false for plain human identities', () => {
+    expect(isAgentIdentity('alice')).toBe(false);
+    expect(isAgentIdentity('swift-falcon-tater')).toBe(false);
+    expect(isAgentIdentity('Free Agent')).toBe(false);
+    expect(isAgentIdentity('agent-of-chaos')).toBe(false);
+  });
+
+  test('false for unknown suffix types', () => {
+    expect(isAgentIdentity('alice-agent-gpt')).toBe(false);
+    expect(isAgentIdentity('bob-agent-')).toBe(false);
+  });
+
+  test('false for empty / null / non-string', () => {
+    expect(isAgentIdentity('')).toBe(false);
+    expect(isAgentIdentity(null)).toBe(false);
+    expect(isAgentIdentity(undefined)).toBe(false);
+    expect(isAgentIdentity(42 as unknown as string)).toBe(false);
+  });
+
+  test('case-sensitive: uppercase suffix does not match', () => {
+    // Rationale: identities round-trip through constructAgentIdentity
+    // which lowercases. A human whose name contains "Agent" shouldn't
+    // accidentally false-positive.
+    expect(isAgentIdentity('alice-agent-Claude')).toBe(false);
+    expect(isAgentIdentity('alice-AGENT-claude')).toBe(false);
+  });
+});
+
+describe('getAgentType', () => {
+  test('returns the type for valid identities', () => {
+    expect(getAgentType('alice-agent-claude')).toBe('claude');
+    expect(getAgentType('bob-agent-codex')).toBe('codex');
+    expect(getAgentType('x-agent-other')).toBe('other');
+  });
+
+  test('returns undefined for non-agents', () => {
+    expect(getAgentType('alice')).toBeUndefined();
+    expect(getAgentType('alice-agent-gpt')).toBeUndefined();
+    expect(getAgentType('')).toBeUndefined();
+  });
+});
+
+describe('constructAgentIdentity', () => {
+  test('basic construction', () => {
+    expect(constructAgentIdentity({ user: 'alice', type: 'claude' })).toBe('alice-agent-claude');
+    expect(
+      constructAgentIdentity({ user: 'swift-falcon-tater', type: 'codex' }),
+    ).toBe('swift-falcon-tater-agent-codex');
+  });
+
+  test('normalizes user to lowercase + trims', () => {
+    expect(constructAgentIdentity({ user: '  Alice  ', type: 'claude' })).toBe('alice-agent-claude');
+    expect(constructAgentIdentity({ user: 'BOB', type: 'junie' })).toBe('bob-agent-junie');
+  });
+
+  test('rejects users with invalid characters', () => {
+    expect(() => constructAgentIdentity({ user: 'alice.smith', type: 'claude' })).toThrow(InvalidAgentIdentityError);
+    expect(() => constructAgentIdentity({ user: 'alice_smith', type: 'claude' })).toThrow(InvalidAgentIdentityError);
+    expect(() => constructAgentIdentity({ user: 'alice smith', type: 'claude' })).toThrow(InvalidAgentIdentityError);
+    expect(() => constructAgentIdentity({ user: '-alice', type: 'claude' })).toThrow(InvalidAgentIdentityError);
+    expect(() => constructAgentIdentity({ user: '', type: 'claude' })).toThrow(InvalidAgentIdentityError);
+  });
+
+  test('rejects unknown types', () => {
+    expect(() =>
+      constructAgentIdentity({ user: 'alice', type: 'gpt' as never }),
+    ).toThrow(InvalidAgentIdentityError);
+  });
+
+  test('constructed identities round-trip through isAgentIdentity', () => {
+    for (const type of AGENT_TYPES) {
+      const id = constructAgentIdentity({ user: 'test-user', type });
+      expect(isAgentIdentity(id)).toBe(true);
+      expect(getAgentType(id)).toBe(type);
+    }
+  });
+});
+
+describe('toAgentUserSlug', () => {
+  test('space-separated display names become dash-separated slugs', () => {
+    expect(toAgentUserSlug('Michael Ramos')).toBe('michael-ramos');
+    expect(toAgentUserSlug('Ada Lovelace')).toBe('ada-lovelace');
+  });
+
+  test('already-slug inputs pass through unchanged', () => {
+    expect(toAgentUserSlug('alice')).toBe('alice');
+    expect(toAgentUserSlug('swift-falcon-tater')).toBe('swift-falcon-tater');
+    expect(toAgentUserSlug('user123')).toBe('user123');
+  });
+
+  test('trims outer whitespace', () => {
+    expect(toAgentUserSlug('  Bob  ')).toBe('bob');
+    expect(toAgentUserSlug('\tAlice\n')).toBe('alice');
+  });
+
+  test('lowercases uppercase letters', () => {
+    expect(toAgentUserSlug('ALICE')).toBe('alice');
+    expect(toAgentUserSlug('MixedCase')).toBe('mixedcase');
+  });
+
+  test('replaces punctuation and symbols with dashes', () => {
+    expect(toAgentUserSlug('alice.smith')).toBe('alice-smith');
+    expect(toAgentUserSlug('alice_smith')).toBe('alice-smith');
+    expect(toAgentUserSlug('alice@work')).toBe('alice-work');
+    expect(toAgentUserSlug('MIXED case+SYMBOLS!!!')).toBe('mixed-case-symbols');
+  });
+
+  test('collapses runs of dashes into a single dash', () => {
+    expect(toAgentUserSlug('a   b')).toBe('a-b');
+    expect(toAgentUserSlug('a...b')).toBe('a-b');
+    expect(toAgentUserSlug('a--b')).toBe('a-b');
+  });
+
+  test('strips leading and trailing dashes', () => {
+    expect(toAgentUserSlug('-alice-')).toBe('alice');
+    expect(toAgentUserSlug('...alice...')).toBe('alice');
+  });
+
+  test('falls back when slugification produces empty string', () => {
+    expect(toAgentUserSlug('')).toBe('participant');
+    expect(toAgentUserSlug('   ')).toBe('participant');
+    expect(toAgentUserSlug('!!!')).toBe('participant');
+    expect(toAgentUserSlug('---')).toBe('participant');
+  });
+
+  test('accepts a custom fallback', () => {
+    expect(toAgentUserSlug('', 'user')).toBe('user');
+    expect(toAgentUserSlug('!!!', 'guest')).toBe('guest');
+  });
+
+  test('slugs round-trip through constructAgentIdentity', () => {
+    const slug = toAgentUserSlug('Michael Ramos');
+    const identity = constructAgentIdentity({ user: slug, type: 'claude' });
+    expect(identity).toBe('michael-ramos-agent-claude');
+    expect(isAgentIdentity(identity)).toBe(true);
+  });
+});
diff --git a/packages/ui/utils/agentIdentity.ts b/packages/ui/utils/agentIdentity.ts
new file mode 100644
index 000000000..8a12e28a0
--- /dev/null
+++ b/packages/ui/utils/agentIdentity.ts
@@ -0,0 +1,136 @@
+/**
+ * Pure agent-identity helpers — shared between the `apps/collab-agent`
+ * CLI and the room-side UI components that mark agent cursors /
+ * avatars visually.
+ *
+ * Deliberately NOT placed alongside `identity.ts`. That file imports
+ * `../config` (ConfigStore: cookie + server-sync), which must NOT
+ * be pulled into the agent CLI's module graph. This file has zero
+ * imports so both the browser UI and a plain Bun script can use it
+ * without dragging browser storage or network code along.
+ *
+ * The identity convention is `<user>-agent-<type>`, where `<type>`
+ * is one of the agent kinds below. Receivers (UI) use
+ * `isAgentIdentity(name)` to decide whether to render the
+ * distinguishing marker; senders (CLI) use `constructAgentIdentity`
+ * to build the string from user + type inputs.
+ */
+
+/**
+ * Canonical agent kinds Plannotator recognises. `other` is the
+ * escape hatch — anything outside the known set still constructs a
+ * valid identity (`foo-agent-other`) and is detected by
+ * `isAgentIdentity`. New kinds get added here; detection expands
+ * automatically via `KNOWN_AGENT_TYPES`.
+ */
+export const AGENT_TYPES = [
+  'claude',
+  'codex',
+  'opencode',
+  'junie',
+  'other',
+] as const;
+
+export type AgentType = typeof AGENT_TYPES[number];
+
+const KNOWN_AGENT_TYPES: ReadonlySet<string> = new Set(AGENT_TYPES);
+
+/**
+ * True when the name ends in `-agent-<known-type>`. The match is
+ * case-sensitive: identities are lowercased by `constructAgentIdentity`
+ * so a mixed-case name in the wild indicates either manual
+ * construction (not through the CLI) or a human whose name happens
+ * to include "Agent" as a word — we treat the latter as a false
+ * positive worth avoiding.
+ */
+export function isAgentIdentity(name: string | undefined | null): boolean {
+  if (typeof name !== 'string' || name.length === 0) return false;
+  const lastDash = name.lastIndexOf('-agent-');
+  if (lastDash < 1) return false;
+  const suffix = name.slice(lastDash + '-agent-'.length);
+  return KNOWN_AGENT_TYPES.has(suffix);
+}
+
+/**
+ * Extract the trailing type from an agent identity. Returns
+ * undefined when the input isn't an agent identity — callers can
+ * gate UI (tooltip, icon choice) on this.
+ */
+export function getAgentType(name: string | undefined | null): AgentType | undefined {
+  if (typeof name !== 'string') return undefined;
+  const lastDash = name.lastIndexOf('-agent-');
+  if (lastDash < 1) return undefined;
+  const suffix = name.slice(lastDash + '-agent-'.length);
+  return KNOWN_AGENT_TYPES.has(suffix) ? (suffix as AgentType) : undefined;
+}
+
+export class InvalidAgentIdentityError extends Error {
+  constructor(message: string) {
+    super(message);
+    this.name = 'InvalidAgentIdentityError';
+  }
+}
+
+/**
+ * Normalize an arbitrary display name into a CLI-safe `--user` slug.
+ *
+ * `constructAgentIdentity` enforces a strict `/^[a-z0-9][a-z0-9-]*$/`
+ * charset on the user half of the identity, but human display names
+ * routinely carry spaces, uppercase, punctuation, and the occasional
+ * emoji. This function bridges the two — feeding raw names through
+ * slugification before they hit the agent CLI avoids either silent
+ * shell truncation (unquoted `--user Michael Ramos` splits on the
+ * space and drops "Ramos") or a thrown `InvalidAgentIdentityError`.
+ *
+ * Rules:
+ *  - trim surrounding whitespace
+ *  - lowercase
+ *  - replace any run of non-`[a-z0-9-]` with a single `-`
+ *  - collapse runs of `-`
+ *  - strip leading/trailing `-`
+ *  - if the result is empty (all-punctuation input), return `fallback`
+ *
+ * `fallback` exists so the slug is always a valid `--user` argument,
+ * even when the display name can't produce one. Default is
+ * `"participant"` to match the semantic level (a participant in a
+ * room) without guessing at the user's intent.
+ */
+export function toAgentUserSlug(name: string, fallback = 'participant'): string {
+  const slug = name
+    .trim()
+    .toLowerCase()
+    .replace(/[^a-z0-9-]+/g, '-')
+    .replace(/^-+|-+$/g, '')
+    .replace(/-{2,}/g, '-');
+  return slug.length > 0 ? slug : fallback;
+}
+
+/**
+ * Build `<user>-agent-<type>` from components. Normalizes to
+ * lowercase so downstream hashing (presence color) is stable
+ * across case variants. Rejects obviously malformed user inputs
+ * with a descriptive error so CLI argv validation happens in one
+ * place.
+ *
+ * `user` must match `/^[a-z0-9][a-z0-9-]*$/` (start with alnum,
+ * then alnum/dashes). This is a superset of the tater-name
+ * convention (`adjective-noun-tater`) so real agents identifying
+ * for real users still validate.
+ */
+export function constructAgentIdentity(opts: {
+  user: string;
+  type: AgentType;
+}): string {
+  const user = opts.user.trim().toLowerCase();
+  if (!/^[a-z0-9][a-z0-9-]*$/.test(user)) {
+    throw new InvalidAgentIdentityError(
+      `user must start with alnum and contain only lowercase alnum/dashes; got "${opts.user}"`,
+    );
+  }
+  if (!KNOWN_AGENT_TYPES.has(opts.type)) {
+    throw new InvalidAgentIdentityError(
+      `type must be one of ${AGENT_TYPES.join('|')}; got "${opts.type}"`,
+    );
+  }
+  return `${user}-agent-${opts.type}`;
+}
diff --git a/packages/ui/utils/identity.ts b/packages/ui/utils/identity.ts
index 8b73f7504..94ae05fa4 100644
--- a/packages/ui/utils/identity.ts
+++ b/packages/ui/utils/identity.ts
@@ -8,10 +8,16 @@
  * Resolution is delegated to ConfigStore (packages/ui/config/configStore.ts)
  * which handles: server config file > cookie > generated tater name.
  * This module provides the identity-specific API surface.
+ *
+ * Presence color (Live Rooms) is also stored here because it's part
+ * of the user's identity surface: Settings, StartRoomModal, and
+ * JoinRoomGate all read/write the same preference, and peer presence
+ * carries the self-declared color.
  */
 
 import { configStore } from '../config';
 import { generateIdentity } from './generateIdentity';
+import { hashNameToSwatch, normalizePresenceColor } from './presenceColor';
 
 /**
  * Get current identity from ConfigStore.
@@ -32,12 +38,23 @@ export function setCustomIdentity(name: string): string {
 }
 
 /**
- * Regenerate identity with a new random tater name.
- * Writes to cookie + queues server write-back via ConfigStore.
+ * Regenerate identity with a new random tater name AND a matching
+ * hash-derived presence color. Couples name and color on purpose:
+ * `presenceColor`'s default factory only runs on first-ever visit
+ * (cookie empty), so without this link, clicking "Regenerate" in
+ * Settings cycles the name but keeps the original color forever —
+ * users hit this as "my color never changes no matter what I try."
+ *
+ * The color stays deterministic per name (same tater = same swatch
+ * across sessions / machines, which helps teammates recognize each
+ * other). Users who want a specific color can still override via
+ * the Settings swatch row — that writes `presenceColor` directly
+ * and persists.
  */
 export function regenerateIdentity(): string {
   const identity = generateIdentity();
   configStore.set('displayName', identity);
+  configStore.set('presenceColor', hashNameToSwatch(identity));
   return identity;
 }
 
@@ -48,3 +65,18 @@ export function isCurrentUser(author: string | undefined): boolean {
   if (!author) return false;
   return author === configStore.get('displayName');
 }
+
+/** Get current presence color. */
+export function getPresenceColor(): string {
+  return configStore.get('presenceColor');
+}
+
+/**
+ * Persist a new presence color. Normalized to lowercase so "#FF0000"
+ * and "#ff0000" don't produce separate cookie values across surfaces.
+ */
+export function setPresenceColor(color: string): string {
+  const normalized = normalizePresenceColor(color);
+  configStore.set('presenceColor', normalized);
+  return normalized;
+}
diff --git a/packages/ui/utils/presenceColor.test.ts b/packages/ui/utils/presenceColor.test.ts
new file mode 100644
index 000000000..2a5e6fe7e
--- /dev/null
+++ b/packages/ui/utils/presenceColor.test.ts
@@ -0,0 +1,66 @@
+import { describe, expect, test } from 'bun:test';
+import {
+  PRESENCE_SWATCHES,
+  hashNameToSwatch,
+  isValidPresenceColor,
+  normalizePresenceColor,
+} from './presenceColor';
+
+describe('presenceColor — swatches', () => {
+  test('SWATCHES is non-empty and all values are #RRGGBB', () => {
+    expect(PRESENCE_SWATCHES.length).toBeGreaterThan(0);
+    for (const s of PRESENCE_SWATCHES) {
+      expect(s).toMatch(/^#[0-9a-f]{6}$/);
+    }
+  });
+});
+
+describe('presenceColor — hashNameToSwatch', () => {
+  test('returns a value from the palette', () => {
+    const out = hashNameToSwatch('alice');
+    expect(PRESENCE_SWATCHES).toContain(out);
+  });
+
+  test('is deterministic for the same input', () => {
+    const a = hashNameToSwatch('swift-falcon-tater');
+    const b = hashNameToSwatch('swift-falcon-tater');
+    expect(a).toBe(b);
+  });
+
+  test('empty name maps to a swatch (edge case: pre-identity boot)', () => {
+    // ConfigStore calls this during init when the displayName cookie
+    // hasn't been written yet; the function must not throw or return
+    // something outside the palette.
+    const out = hashNameToSwatch('');
+    expect(PRESENCE_SWATCHES).toContain(out);
+  });
+});
+
+describe('presenceColor — isValidPresenceColor', () => {
+  test('accepts #RRGGBB in lower, upper, mixed case', () => {
+    expect(isValidPresenceColor('#2563eb')).toBe(true);
+    expect(isValidPresenceColor('#2563EB')).toBe(true);
+    expect(isValidPresenceColor('#Ff00Aa')).toBe(true);
+  });
+
+  test('rejects shorthand, missing hash, length drift, and non-strings', () => {
+    expect(isValidPresenceColor('#abc')).toBe(false);        // 3-digit shorthand
+    expect(isValidPresenceColor('2563eb')).toBe(false);      // no #
+    expect(isValidPresenceColor('#2563eb0')).toBe(false);    // 7 chars after #
+    expect(isValidPresenceColor('#GGGGGG')).toBe(false);     // non-hex
+    expect(isValidPresenceColor('')).toBe(false);
+    expect(isValidPresenceColor(null)).toBe(false);
+    expect(isValidPresenceColor(undefined)).toBe(false);
+    expect(isValidPresenceColor(0xff0000)).toBe(false);
+  });
+});
+
+describe('presenceColor — normalizePresenceColor', () => {
+  test('lowercases', () => {
+    expect(normalizePresenceColor('#FF00AA')).toBe('#ff00aa');
+  });
+
+  test('lowercase input is unchanged', () => {
+    expect(normalizePresenceColor('#ff00aa')).toBe('#ff00aa');
+  });
+});
diff --git a/packages/ui/utils/presenceColor.ts b/packages/ui/utils/presenceColor.ts
new file mode 100644
index 000000000..b5d5c58f0
--- /dev/null
+++ b/packages/ui/utils/presenceColor.ts
@@ -0,0 +1,43 @@
+/**
+ * Pure presence-color helpers — SWATCHES palette, hash-to-swatch
+ * defaulter, and validation. No ConfigStore dependency, so this
+ * module is safe to import from `packages/ui/config/settings.ts`
+ * without creating an import cycle. Store-touching wrappers
+ * (getPresenceColor / setPresenceColor) live in `./identity.ts`
+ * because presence color is part of the user's identity surface
+ * in Live Rooms.
+ */
+
+export const PRESENCE_SWATCHES = [
+  '#2563eb', '#f97316', '#10b981', '#ef4444',
+  '#8b5cf6', '#eab308', '#06b6d4', '#ec4899',
+] as const;
+
+export type PresenceSwatch = typeof PRESENCE_SWATCHES[number];
+
+/**
+ * Deterministic swatch pick for a given name. First-time users get a
+ * distinct default without needing to open the color picker, and two
+ * runs of the same identity produce the same color so the creator's
+ * self-view matches what peers see.
+ */
+export function hashNameToSwatch(name: string): string {
+  let h = 0;
+  for (let i = 0; i < name.length; i++) {
+    h = (h * 31 + name.charCodeAt(i)) | 0;
+  }
+  const idx = Math.abs(h) % PRESENCE_SWATCHES.length;
+  return PRESENCE_SWATCHES[idx];
+}
+
+const HEX_RE = /^#[0-9a-fA-F]{6}$/;
+
+/** `#RRGGBB` shape check — narrow enough to catch garbage fragment input. */
+export function isValidPresenceColor(value: unknown): value is string {
+  return typeof value === 'string' && HEX_RE.test(value);
+}
+
+/** Lowercase-normalize so "#FF0000" and "#ff0000" don't fragment the cookie. */
+export function normalizePresenceColor(value: string): string {
+  return value.toLowerCase();
+}
diff --git a/packages/ui/utils/roomAgentInstructions.ts b/packages/ui/utils/roomAgentInstructions.ts
new file mode 100644
index 000000000..f083c59b9
--- /dev/null
+++ b/packages/ui/utils/roomAgentInstructions.ts
@@ -0,0 +1,170 @@
+/**
+ * Builds the clipboard payload that teaches an external agent (Claude
+ * Code, Codex, OpenCode, Junie, etc.) how to join THIS specific
+ * Plannotator Live Room as a first-class peer via the
+ * `@plannotator/collab-agent` CLI.
+ *
+ * Parallel to `planAgentInstructions.ts` — same shape, same purpose
+ * (a markdown payload the user copies from the room menu and pastes
+ * into their agent's prompt), but targets the direct-room path
+ * (WebSocket, encrypted) rather than the local /api/external-annotations
+ * path (local HTTP, unencrypted).
+ *
+ * The dynamic values are interpolated at click time:
+ *  - `joinUrl` — the full participant URL including the
+ *    `#key=<secret>` fragment. This is what the CLI's `--url` flag
+ *    takes. Admin URLs work too — the CLI strips `#admin=` before
+ *    connecting — but passing the participant URL is cleaner.
+ *  - `userIdentity` — the current user's display name. It's
+ *    slugified via `toAgentUserSlug` before templating so the
+ *    rendered `--user` value is always a valid CLI argument even
+ *    when the display name contains spaces, uppercase, or
+ *    punctuation (e.g. "Michael Ramos" → "michael-ramos"). Without
+ *    this pass, an unquoted `--user Michael Ramos` would truncate
+ *    to `Michael` in the shell and agents would silently join
+ *    under the wrong identity.
+ *
+ * Intentionally short. Agents don't read manuals; this is
+ * "top-to-bottom in 30 seconds and they can start posting."
+ */
+
+import { toAgentUserSlug } from './agentIdentity';
+
+export interface RoomAgentInstructionsInput {
+  /** Participant URL — must include `#key=<secret>` fragment. */
+  joinUrl: string;
+  /** Current user's display name (may contain spaces / caps / punctuation). */
+  userIdentity: string;
+}
+
+export function buildRoomAgentInstructions(input: RoomAgentInstructionsInput): string {
+  const { joinUrl, userIdentity } = input;
+  // Escape any characters that would break the markdown's inline-quoted
+  // argument values. The CLI itself doesn't care, but the markdown
+  // should paste cleanly into any reasonable editor.
+  const urlArg = joinUrl.replaceAll('"', '\\"');
+  // Slugify before templating so the rendered `--user` value is
+  // always shell-safe and CLI-valid. See the module docstring for
+  // why this matters (unquoted shell splitting / constructAgentIdentity
+  // charset).
+  const userArg = toAgentUserSlug(userIdentity);
+  return `# Plannotator Live Room — Agent Join Instructions
+
+You're being invited to join a live, encrypted review session hosted by a Plannotator user. You participate as a first-class peer — read the plan, read annotations, post comments, and remain visible on participants' screens via a distinguished agent marker.
+
+## Your identity
+
+The user has already chosen an identity for you. Pass it exactly as the \`--user\` value on every CLI invocation:
+
+- \`--user ${userArg}\`
+- \`--type <your kind>\` — one of: \`claude\`, \`codex\`, \`opencode\`, \`junie\`, \`other\`. Pick whichever describes you. Use \`other\` if none apply.
+
+The CLI assembles your full room identity as \`${userArg}-agent-<type>\`. That's what the user sees in their avatar row and above your cursor, with a \`⚙\` marker indicating agent.
+
+## Joining this room
+
+Every subcommand takes \`--url\`, \`--user\`, \`--type\`. This is the URL for THIS session:
+
+\`\`\`
+${joinUrl}
+\`\`\`
+
+## What to do right now
+
+**Don't wait for the user to give you a specific task.** The room is being shared in front of an audience and they expect to see agent activity within seconds of the link landing. Your default first action is to run \`demo\`:
+
+\`\`\`sh
+bun run agent:run demo \\
+  --url "${urlArg}" \\
+  --user ${userArg} --type claude \\
+  --duration 120
+\`\`\`
+
+\`demo\` walks your cursor through every heading in document order, anchors at each heading with a randomized horizontal offset (so parallel agents don't stack on the same pixel), pauses 3–6 s, and posts a block-level comment at each stop. Takes about two minutes and produces immediately-visible activity for the audience. The \`⚙\` marker next to your name makes it obvious you're an agent, not a human peer.
+
+After \`demo\` finishes (or in parallel if you can manage it), follow up with **one or two thoughtful observations** about substantive blocks — real comments on performance targets, design tradeoffs, concrete claims, anything where you have an opinion worth stating. Use \`comment\` for those. Templated "[demo] reviewing X" text is enough to prove you're there; a genuine observation is what proves you actually read the plan.
+
+If the user has given you a specific task instead (e.g. "review the infrastructure section for holes"), drop this default and follow their direction.
+
+## Reference — reading the plan and peers
+
+From the Plannotator repo root (the CLI is a workspace package under \`apps/collab-agent/\`):
+
+\`\`\`sh
+# Read the plan with block ids (you need the block ids to comment)
+bun run agent:run read-plan --with-block-ids \\
+  --url "${urlArg}" \\
+  --user ${userArg} --type claude
+
+# See existing annotations
+bun run agent:run read-annotations \\
+  --url "${urlArg}" \\
+  --user ${userArg} --type claude
+
+# See peers who've emitted presence recently
+bun run agent:run read-presence \\
+  --url "${urlArg}" \\
+  --user ${userArg} --type claude
+\`\`\`
+
+\`read-presence\` is "recent emitters," not a participant roster — connected-but-idle peers won't appear.
+
+## Posting a comment
+
+Block-level only in V1. You target an entire block; the comment attaches to that block's content. Inline text-range targeting is not supported here (use prose inside your \`--text\` to reference specific wording).
+
+\`\`\`sh
+bun run agent:run comment \\
+  --url "${urlArg}" \\
+  --user ${userArg} --type claude \\
+  --block <blockId> \\
+  --text "Your comment text."
+\`\`\`
+
+Need to see the blocks without running \`read-plan\`?
+
+\`\`\`sh
+bun run agent:run comment --list-blocks \\
+  --url "${urlArg}" \\
+  --user ${userArg} --type claude
+\`\`\`
+
+\`comment\` waits for the server echo before exiting. Exit 0 = the comment appeared in everyone's view. Exit 1 = timeout or server rejection (e.g. the room was deleted). Exit 2 = argv error.
+
+## Staying visible while you work
+
+\`read-*\` and \`comment\` are one-shots — you flash into the avatar row during the call and disappear. To be continuously visible (recommended when doing multi-step work so the user sees you "thinking"):
+
+\`\`\`sh
+bun run agent:run join \\
+  --url "${urlArg}" \\
+  --user ${userArg} --type claude
+\`\`\`
+
+Runs until SIGINT. Heartbeats presence every 10s so you stay in the avatar row. Streams room events to stdout as NDJSON — you can tail it while running other subcommands in other shells.
+
+## Demo mode — flags reference
+
+\`demo\` is covered above under "What to do right now" — this section is the flag reference.
+
+- \`--duration <sec>\` — total wall time across all headings (default 120). Per-heading pause is clamped to 3–6 s regardless.
+- \`--comment-template <str>\` — body for each posted comment. \`{heading}\` and \`{level}\` are substituted. Default: \`"[demo] reviewing {heading}"\`.
+- \`--dry-run\` — walk the cursor without posting comments. Use this if the user explicitly wants a quiet cursor-only showcase.
+
+Demo confirms each comment's echo per heading and exits non-zero if any comment failed to land (e.g. room deleted mid-tour). Streams \`demo.start\`, \`demo.visit\`, \`demo.comment\`, \`demo.comment.failed\`, and \`demo.end\` events as NDJSON so an invoking script can track progress.
+
+## Rules and limits
+
+- **No admin actions.** You cannot delete the room. If the URL contained \`#admin=\`, the CLI strips it and warns; you join as a regular participant.
+- **No image attachments.** V1 room annotations are text only.
+- **Server-authoritative.** Your post is not final until the server echoes it back. \`comment\` waits; \`demo\` tracks per-heading success. Don't assume local intent landed.
+- **Block-level only.** Do NOT attempt to select a sub-range of text for annotation anchoring. That path has known selection-accuracy issues. Quote specific wording inside your comment body if it matters.
+
+## Troubleshooting
+
+- \`Missing --url\` / \`Missing --user\` / \`Missing --type\` — add the flag.
+- \`Timed out waiting for snapshot\` — the URL parsed but the room service is unreachable. Check you can open the URL in a browser.
+- \`unknown --block\` — that block id isn't in the current plan. Run \`comment --list-blocks\` to see the valid set.
+- \`<code>: <message>\` on a comment — the server rejected the op. The message names the reason (e.g. \`validation_error\` for a malformed payload). Wait and retry, or move on.
+`;
+}
diff --git a/packages/ui/utils/roomIdentityConfirmed.ts b/packages/ui/utils/roomIdentityConfirmed.ts
new file mode 100644
index 000000000..ee36c15f3
--- /dev/null
+++ b/packages/ui/utils/roomIdentityConfirmed.ts
@@ -0,0 +1,52 @@
+/**
+ * Per-room "identity was confirmed in this tab" flag.
+ *
+ * Lives in sessionStorage (dies on tab close, survives reload) and is
+ * keyed per roomId. Two writers:
+ *   - `AppRoot` after consuming a creator identity handoff from the URL
+ *     fragment (creator already confirmed locally before navigating).
+ *   - `RoomApp.handleJoin` after the participant submits the gate.
+ *
+ * Consumer: `RoomApp` reads this on mount to decide whether to skip
+ * `JoinRoomGate`. A set flag for the current roomId means "we already
+ * have a confirmed identity for this specific room in this tab" —
+ * reload preserves it; opening a different room URL does not, so the
+ * user gets a prefilled gate again for the new room (per-room scoping
+ * matches the agreed UX: confirm once per room, reuse on reload).
+ */
+
+const KEY_PREFIX = 'plannotator.room.identity-confirmed.';
+
+function storageKey(roomId: string): string {
+  return `${KEY_PREFIX}${roomId}`;
+}
+
+function getStorage(): Storage | null {
+  try {
+    if (typeof sessionStorage === 'undefined') return null;
+    return sessionStorage;
+  } catch {
+    return null;
+  }
+}
+
+export function markRoomIdentityConfirmed(roomId: string): void {
+  const s = getStorage();
+  if (!s) return;
+  try {
+    s.setItem(storageKey(roomId), '1');
+  } catch {
+    // Quota / disabled — the worst case is the user sees the gate again
+    // on reload. Not worth bubbling.
+  }
+}
+
+export function isRoomIdentityConfirmed(roomId: string): boolean {
+  const s = getStorage();
+  if (!s) return false;
+  try {
+    return s.getItem(storageKey(roomId)) !== null;
+  } catch {
+    return false;
+  }
+}
diff --git a/packages/ui/utils/sharing.ts b/packages/ui/utils/sharing.ts
index 3be5ab26e..f102bcd76 100644
--- a/packages/ui/utils/sharing.ts
+++ b/packages/ui/utils/sharing.ts
@@ -195,6 +195,11 @@ export async function parseShareHash(): Promise<SharePayload | null> {
   }
 
   try {
+    // `decompress` returns `unknown` by design (it's a generic
+    // utility); the caller is responsible for shape-validating the
+    // result. We keep the historical cast and accept that malformed
+    // share hashes will surface downstream. Full runtime validation
+    // is tracked as follow-up cleanup.
     return (await decompress(hash)) as SharePayload;
   } catch (e) {
     console.warn('Failed to parse share hash:', e);
diff --git a/packages/ui/utils/storage.ts b/packages/ui/utils/storage.ts
index d8f1e3bad..1ff646828 100644
--- a/packages/ui/utils/storage.ts
+++ b/packages/ui/utils/storage.ts
@@ -9,6 +9,13 @@
 
 const ONE_YEAR_SECONDS = 60 * 60 * 24 * 365;
 
+function getCookieDomain(): string {
+  if (typeof document === 'undefined') return '';
+  const host = document.location.hostname;
+  if (host.endsWith('.plannotator.ai')) return '; domain=.plannotator.ai';
+  return '';
+}
+
 /**
  * Get a value from cookie storage
  */
@@ -27,7 +34,7 @@ export function getItem(key: string): string | null {
 export function setItem(key: string, value: string): void {
   try {
     const encoded = encodeURIComponent(value);
-    document.cookie = `${key}=${encoded}; path=/; max-age=${ONE_YEAR_SECONDS}; SameSite=Lax`;
+    document.cookie = `${key}=${encoded}${getCookieDomain()}; path=/; max-age=${ONE_YEAR_SECONDS}; SameSite=Lax`;
   } catch (e) {
     // Cookie not available
   }
@@ -38,7 +45,7 @@ export function setItem(key: string, value: string): void {
  */
 export function removeItem(key: string): void {
   try {
-    document.cookie = `${key}=; path=/; max-age=0`;
+    document.cookie = `${key}=${getCookieDomain()}; path=/; max-age=0`;
   } catch (e) {
     // Cookie not available
   }
diff --git a/scripts/dev-live-room-local.sh b/scripts/dev-live-room-local.sh
new file mode 100755
index 000000000..3fb54e90f
--- /dev/null
+++ b/scripts/dev-live-room-local.sh
@@ -0,0 +1,90 @@
+#!/usr/bin/env bash
+# Local manual E2E runner for Plannotator Live Rooms.
+#
+# Starts two long-running processes:
+#   - apps/room-service via `bun run dev:room` (wrangler dev on :8787).
+#   - apps/hook via `bun run dev:hook` (Vite on :3000) with
+#     VITE_ROOM_BASE_URL pointing at whichever room service the user
+#     wants the editor's `createRoom()` to target.
+#
+# Default target: http://localhost:8787 (the local wrangler dev above).
+# Tunnel / staging: pass ROOM_BASE_URL=<url> — generated participant
+# and admin links then carry that URL instead of localhost, so a
+# second machine can actually reach the room.
+#
+#   ROOM_BASE_URL=https://your-tunnel.trycloudflare.com bun run dev:live-room
+#
+# Traps Ctrl-C / exit and tears down both child processes so a second
+# run doesn't collide with orphaned wrangler or Vite instances.
+#
+# Iteration scope:
+#   - Creator tab at :3000 uses Vite HMR — changes to App.tsx land live.
+#   - Room tab served by the room service runs the built shell, so
+#     changes to RoomApp / collab components need a manual
+#     `bun run --cwd apps/room-service build:shell` + browser refresh.
+#     Not auto-watched here on purpose.
+#
+# Bash 3.2 compatible (macOS system Bash). `wait -n` is Bash 4.3+ and
+# is NOT available on macOS, so this script polls both child PIDs in
+# a loop with `kill -0` instead.
+set -euo pipefail
+
+REPO_ROOT="$(cd "$(dirname "$0")/.." && pwd)"
+cd "$REPO_ROOT"
+
+ROOM_BASE_URL="${ROOM_BASE_URL:-http://localhost:8787}"
+
+# Child PIDs populated as services start; cleaned up on signal.
+ROOM_PID=""
+HOOK_PID=""
+
+cleanup() {
+  # `|| true` on each kill so a missing/already-exited child doesn't
+  # mask the cleanup of the other.
+  if [[ -n "$ROOM_PID" ]]; then
+    kill "$ROOM_PID" 2>/dev/null || true
+  fi
+  if [[ -n "$HOOK_PID" ]]; then
+    kill "$HOOK_PID" 2>/dev/null || true
+  fi
+  # Give children a beat to flush and exit cleanly before returning.
+  wait 2>/dev/null || true
+}
+
+trap cleanup EXIT INT TERM
+
+printf '\n'
+printf 'Plannotator editor: http://localhost:3000\n'
+printf 'Room service:       http://localhost:8787  (wrangler dev)\n'
+printf 'Editor targets:     %s\n' "$ROOM_BASE_URL"
+printf '\n'
+printf 'Open the editor, click Start live room.\n'
+printf 'The room tab should open at %s/c/...\n' "$ROOM_BASE_URL"
+printf 'Copy the participant link into an incognito window or another browser profile.\n'
+printf 'Participants do not need to run Plannotator.\n'
+printf '\n'
+printf 'Ctrl-C to stop both services.\n'
+printf '\n'
+
+bun run dev:room &
+ROOM_PID=$!
+
+VITE_ROOM_BASE_URL="$ROOM_BASE_URL" bun run dev:hook &
+HOOK_PID=$!
+
+# Poll both PIDs; exit if either child dies so a crashed service
+# doesn't leave the other orphaned. `wait -n` would do this in one
+# line on Bash 4.3+, but macOS ships Bash 3.2 where that flag is
+# invalid ("bash: wait: -n: invalid option") — use `kill -0` as a
+# liveness probe instead.
+while true; do
+  if [[ -n "$ROOM_PID" ]] && ! kill -0 "$ROOM_PID" 2>/dev/null; then
+    wait "$ROOM_PID" 2>/dev/null || true
+    exit 1
+  fi
+  if [[ -n "$HOOK_PID" ]] && ! kill -0 "$HOOK_PID" 2>/dev/null; then
+    wait "$HOOK_PID" 2>/dev/null || true
+    exit 1
+  fi
+  sleep 1
+done
diff --git a/tests/parity/vendor-parity.test.ts b/tests/parity/vendor-parity.test.ts
index e0c84bca9..0e1f21eeb 100644
--- a/tests/parity/vendor-parity.test.ts
+++ b/tests/parity/vendor-parity.test.ts
@@ -57,6 +57,8 @@ function extractVendoredModules(): Set<string> {
       prefix = "ai/providers/";
     } else if (srcPath.includes("packages/ai/")) {
       prefix = "ai/";
+    } else if (srcPath.includes("packages/shared/collab/")) {
+      prefix = "collab/";
     }
     for (const name of names) {
       all.add(prefix + name);