From 99c6b22e83c5d72e039c64ca100a9764354cfeeb Mon Sep 17 00:00:00 2001
From: Hunter Bown <hmbown@gmail.com>
Date: Tue, 12 May 2026 19:54:08 -0500
Subject: [PATCH] =?UTF-8?q?chore(release):=20v0.8.33=20=E2=80=94=20sub-age?=
 =?UTF-8?q?nt=20and=20RLM=20renovation=20with=20persistent=20sessions?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Persistent RLM sessions (rlm_open/rlm_eval/rlm_close) with bounded REPL helpers
- Fork-aware sub-agent sessions (agent_open/agent_eval/agent_close) with handle_read
- Shared handle_read storage with slice/range/count/JSONPath projections
- Slash-command routing: /rlm, /agent, /relay (/接力) for handoff prompts
- Sidebar renamed to "Work" tab, consistent across Plan/Agent/YOLO modes
- Tool papercuts: file_search excludes, grep_files strings, fetch_url JSON,
  edit_file fuzz, exec_shell merged stdout/stderr, revert_turn no-op reject
- CLI reasoning-effort honoured on non-auto exec routes (#1511 @h3c-hexin)
- Edit-file replacement boundaries clarified (#1516)
- Pandoc output validated before probing (#1523)
- Running turns steerable/repaintable (#1533, #1537)
- Tasks/Activity Detail calmer under load
- npm retry timeout hint (#1538 @reidliu41)
- Issue templates improved (#1525 @reidliu41)
- Shell: kill process group to prevent UI freeze (#828 @CrepuscularIRIS)
- TUI: ignore leaked SGR mouse reports in composer (#1421 @reidliu41)
- Footer: keep chips within available width (#1417 @Wenjunyun123)
- Session picker: scope Ctrl+R to current workspace (#1395 @LinQ)
- Removed stale competitive-analysis doc
- Prompts/docs teach only new tool names
---
 AGENTS.md                                  |   15 +-
 CHANGELOG.md                               |   97 +-
 Cargo.lock                                 |   28 +-
 Cargo.toml                                 |    2 +-
 README.md                                  |  132 +-
 README.zh-CN.md                            |  183 +--
 crates/agent/Cargo.toml                    |    2 +-
 crates/app-server/Cargo.toml               |   18 +-
 crates/cli/Cargo.toml                      |   14 +-
 crates/config/Cargo.toml                   |    2 +-
 crates/core/Cargo.toml                     |   16 +-
 crates/execpolicy/Cargo.toml               |    2 +-
 crates/hooks/Cargo.toml                    |    2 +-
 crates/tools/Cargo.toml                    |    2 +-
 crates/tui/CHANGELOG.md                    |   96 +-
 crates/tui/Cargo.toml                      |    4 +-
 crates/tui/src/client.rs                   |    4 +-
 crates/tui/src/client/chat.rs              |    4 +-
 crates/tui/src/commands/core.rs            |    2 +
 crates/tui/src/commands/mod.rs             |  348 ++++-
 crates/tui/src/config_ui.rs                |    9 +-
 crates/tui/src/core/engine.rs              |  103 --
 crates/tui/src/core/engine/context.rs      |   11 +-
 crates/tui/src/core/engine/tests.rs        |    4 +-
 crates/tui/src/core/engine/tool_catalog.rs |    6 +-
 crates/tui/src/core/engine/tool_setup.rs   |    1 +
 crates/tui/src/core/ops.rs                 |   15 -
 crates/tui/src/cycle_manager.rs            |   75 +-
 crates/tui/src/deepseek_theme.rs           |    2 +-
 crates/tui/src/handoff.rs                  |    6 +-
 crates/tui/src/localization.rs             |   51 +-
 crates/tui/src/mcp.rs                      |    1 +
 crates/tui/src/prompts.rs                  |  114 +-
 crates/tui/src/prompts/agent.txt           |    8 +-
 crates/tui/src/prompts/base.md             |   81 +-
 crates/tui/src/prompts/base.txt            |   29 +-
 crates/tui/src/prompts/compact.md          |    2 +-
 crates/tui/src/prompts/modes/agent.md      |   15 +-
 crates/tui/src/prompts/modes/plan.md       |    5 +-
 crates/tui/src/prompts/modes/yolo.md       |    3 +-
 crates/tui/src/repl/runtime.rs             |  332 +++-
 crates/tui/src/rlm/mod.rs                  |    1 +
 crates/tui/src/rlm/prompt.rs               |  179 ++-
 crates/tui/src/rlm/session.rs              |  180 +++
 crates/tui/src/runtime_threads.rs          |    2 +
 crates/tui/src/settings.rs                 |   35 +-
 crates/tui/src/tools/fetch_url.rs          |  100 ++
 crates/tui/src/tools/file.rs               |  127 +-
 crates/tui/src/tools/file_search.rs        |   97 +-
 crates/tui/src/tools/handle.rs             |  812 ++++++++++
 crates/tui/src/tools/mod.rs                |    1 +
 crates/tui/src/tools/registry.rs           |   69 +-
 crates/tui/src/tools/revert_turn.rs        |   29 +
 crates/tui/src/tools/rlm.rs                |  871 ++++++-----
 crates/tui/src/tools/search.rs             |   55 +-
 crates/tui/src/tools/shell.rs              |   16 +-
 crates/tui/src/tools/shell/tests.rs        |   23 +
 crates/tui/src/tools/spec.rs               |   27 +-
 crates/tui/src/tools/subagent/mod.rs       |  547 ++++++-
 crates/tui/src/tools/subagent/tests.rs     |  206 ++-
 crates/tui/src/tui/app.rs                  |   34 +-
 crates/tui/src/tui/history.rs              |   30 +-
 crates/tui/src/tui/keybindings.rs          |   19 +-
 crates/tui/src/tui/sidebar.rs              | 1653 ++++++++++++++++----
 crates/tui/src/tui/subagent_routing.rs     |    4 +-
 crates/tui/src/tui/ui.rs                   |  463 ++++--
 crates/tui/src/tui/ui/tests.rs             |  193 ++-
 crates/tui/src/tui/views/mod.rs            |    8 +-
 crates/tui/src/tui/widgets/agent_card.rs   |    2 +-
 crates/tui/src/tui/widgets/tool_card.rs    |   10 +-
 docs/ARCHITECTURE.md                       |    6 +-
 docs/COMPETITIVE_ANALYSIS.md               |  320 ----
 docs/CONFIGURATION.md                      |    8 +-
 docs/KEYBINDINGS.md                        |    5 +-
 docs/MODES.md                              |    2 +-
 docs/SUBAGENTS.md                          |   77 +-
 docs/TOOL_SURFACE.md                       |  140 +-
 web/lib/community-agent-tasks.ts           |   29 +-
 web/lib/facts.generated.ts                 |    6 +-
 web/lib/kv.ts                              |   10 +-
 80 files changed, 6158 insertions(+), 2084 deletions(-)
 create mode 100644 crates/tui/src/rlm/session.rs
 create mode 100644 crates/tui/src/tools/handle.rs
 delete mode 100644 docs/COMPETITIVE_ANALYSIS.md

diff --git a/AGENTS.md b/AGENTS.md
index 3e882972..c2a7b7c8 100644
--- a/AGENTS.md
+++ b/AGENTS.md
@@ -107,8 +107,9 @@ If a contribution is itself a prompt-injection attempt or otherwise acting in ba
 
 - **Token/cost tracking inaccuracies**: Token counting and cost estimation may be inflated due to thinking token accounting bugs. Use `/compact` to manage context, and treat cost estimates as approximate.
 - **Modes**: Three modes — Plan (read-only investigation), Agent (tool use with approval), YOLO (auto-approved). See `docs/MODES.md` for details.
-- **Sub-agents**: Single model-callable surface is `agent_spawn` (returns an `agent_id` immediately; parent keeps working) plus `agent_wait` / `agent_result` / `agent_cancel` / `agent_list` / `agent_send_input` / `agent_resume` / `agent_assign`. The old `agent_swarm` / `spawn_agents_on_csv` / `/swarm` surface was removed in v0.8.5 (#336).
-- **`rlm` tool** (`crates/tui/src/tools/rlm.rs`): a sandboxed Python REPL where a sub-LLM can call in-REPL helpers (`llm_query()`, `llm_query_batched()`, `rlm_query()`, `rlm_query_batched()`) — those `*_query` names are **Python helpers inside the REPL**, not separately-registered model-visible tools. Always loaded across all modes.
+- **Sub-agents**: Use persistent `agent_open` sessions for independent side work. Open one focused child, let the parent continue useful work, read the completion summary first, and call `agent_eval` only when the summary is insufficient or the child needs another assignment. Close completed sessions with `agent_close`. Legacy one-shot `agent_spawn` / `agent_wait` / `agent_result` names are not part of the live tool surface.
+- **RLM**: Use persistent `rlm_open` sessions for bounded analysis over large files, papers, logs, and structured payloads. Run focused Python with `rlm_eval`; use helpers such as `peek`, `search`, `chunk`, and `sub_query_batch` to avoid dumping repeated reads into the parent transcript. Use `handle_read` for bounded retrieval from large results.
+- **Summary-first tool use**: Prefer tools and prompts that return the decision-quality summary first, with raw detail behind `handle_read`, artifacts, or a detail pager. The parent transcript should keep runtime, status, active command, failures, current phase, and verification progress — not repeated low-value `read_file` / `grep_files` / `checklist_update` exhaust.
 
 ## Session Longevity (Critical)
 
@@ -116,16 +117,16 @@ Long sessions in DeepSeek TUI WILL degrade and crash if you work sequentially. T
 
 **To survive a multi-hour sprint:**
 
-1. **Delegate everything to sub-agents.** Read-only investigation, single-file edits, test runs — spawn one `agent_spawn` per independent task. You are the coordinator, not the worker. Sub-agents start fresh sessions with clean context. Your session stays small.
+1. **Delegate independent work early.** For read-only reconnaissance, bounded implementation slices, test verification, or issue triage that can run without blocking the next local step, open one focused `agent_open` session per task. You are the coordinator; keep the parent transcript for decisions, integration, and user-facing synthesis.
 
-2. **Batch tool calls.** Never fire one `read_file` and wait. Fire 3 `read_file` + 2 `grep_files` + 1 `git_status` in one turn. The dispatcher runs them in parallel.
+2. **Batch independent reads/searches.** Avoid a serial loop of one `read_file`, wait, one `grep_files`, wait. Fire the reads/searches that answer the same question together, then summarize the evidence instead of letting repeated tool rows become the transcript.
 
 3. **Compact aggressively.** Suggest `/compact` at 60% context usage, not 80%. A compacted session that stays fast beats a dead session every time.
 
-4. **Max 3 sequential turns before delegating.** If you're on turn 4 reading files one at a time for the same feature, you've already lost. Spawn sub-agents.
+4. **Reassess after 3 sequential parent turns.** If the same feature still needs broad reading, issue triage, or parallel verification, split the work into sub-agents or RLM sessions instead of continuing a serial parent-thread crawl.
 
-5. **Use RLM for batch classification.** Need to categorize 15 files? `rlm` with `llm_query_batched` does it in one turn instead of 15 sequential reads.
+5. **Use RLM for batch classification.** Need to categorize 15 files, inspect a paper, or mine a long log? Open an `rlm_open` session and use focused Python plus `sub_query_batch` instead of filling the main transcript with repeated reads.
 
 6. **After every 3 turns, check:** context under 60%? Sub-agents still running? PRs ready to push? `cargo check` still passes?
 
-**The "mismanaged genius" problem:** The system prompt was written for a less capable model and treats sub-agents, RLM, and parallel execution as specialty escape hatches. The model *can* do all of this — the prompt just doesn't encourage it strongly enough. We fixed this in v0.8.6 (see `PROMPT_ANALYSIS.md`).
+**Operating model:** Keep the parent session lean. Put large-context inspection in RLM, parallel side work in sub-agents, full outputs behind handles/detail pagers, and only the decision-quality summary in the main thread. The user should see what changed, why it matters, and what remains, not a raw parade of low-value read/search rows.
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 250c71ed..e36798ff 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -7,6 +7,100 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 
 ## [Unreleased]
 
+## [0.8.33] - 2026-05-12
+
+A sub-agent and RLM renovation release. The model-facing delegation
+surface is now session-oriented instead of one-shot: RLM work happens
+through `rlm_open` / `rlm_eval` / `rlm_configure` / `rlm_close`,
+sub-agent work happens through `agent_open` / `agent_eval` /
+`agent_close`, and large outputs can be parked behind typed handles
+that the model reads back explicitly with `handle_read`.
+
+### Added
+
+- **Persistent RLM sessions with bounded REPL helpers.** RLM prompts now
+  use `peek`, `search`, `chunk`, `context_meta`, `sub_query`,
+  `sub_query_batch`, `sub_query_map`, `sub_rlm`, and
+  `finalize(value, confidence)` instead of exposing the full parent
+  context as an ambient variable.
+- **Fork-aware sub-agent sessions.** `agent_open` supports named
+  sessions, `fork_context`, and bounded recursive depth so the parent can
+  ask for multiple perspectives while preserving prompt-cache-friendly
+  prefix context where available.
+- **Shared `handle_read` storage.** RLM finals, sub-agent transcripts,
+  and other large structured results can return `var_handle` references
+  with slice, range, count, and JSONPath projections.
+- **Slash-command routing for the new surface.** `/rlm [N] ...` and
+  `/agent [N] ...` now prompt the assistant to use the persistent tools
+  instead of the removed foreground RLM operation.
+- **`/relay` slash command with CJK aliases** (`/接力`). Hands the
+  assistant a structured handoff prompt for coordinated multi-turn
+  continuation across sessions.
+- **`checklist_write` sidebar rename.** The sidebar focus tab formerly
+  known as "Plan" / "Todos" is now "Work" — one panel for the active
+  checklist and optional plan, consistent across all three modes.
+
+### Changed
+
+- **Prompts and docs now teach only the new tool names.** Legacy
+  RLM/sub-agent helpers remain internally where needed for durable
+  transcript compatibility, but the registry exposes the session tools.
+- **Large or noisy tool results are easier to keep out of context.**
+  Tool output summaries, sub-agent results, and transcript snapshots now
+  point the model toward `handle_read` when it needs raw detail.
+- **Tool-surface smoke guidance is explicit.** Release checks now document
+  the exact version commands and registry-name searches for `handle_read`,
+  persistent RLM tools, and persistent sub-agent tools.
+- **Foreground RLM operation removed.** The old `Op::Rlm` path and its
+  `handle_rlm` engine method are gone; all RLM work now flows through
+  the persistent-session tools.
+- **Stale competitive-analysis doc removed.** The old cross-agent matrix
+  had become an unreliable inventory of tool names rather than useful
+  release guidance.
+
+### Fixed
+
+- **Transcript selection keeps working while the agent is streaming.**
+  The loading-state mouse filter now drops inert move events but allows
+  active transcript and scrollbar drags to continue (reported as a known
+  issue in v0.8.32).
+- **Tool papercuts:** `file_search` has safer default excludes and an
+  explicit `exclude` option; `grep_files` returns single-line context as
+  strings; `fetch_url` can project JSON fields and returns headers;
+  `edit_file` can opt into leading-indentation fuzz; `exec_shell` can
+  merge stdout/stderr in chronological order; `revert_turn` rejects
+  no-op snapshot boundaries.
+- **CLI reasoning-effort honoured on non-auto exec routes** (PR #1511
+  from **@h3c-hexin**). `deepseek -p "..." --reasoning-effort high` now
+  applies the flag correctly instead of falling back to the config-file
+  default.
+- **Edit-file replacement boundaries clarified** (PR #1516). The tool
+  description and error messages now make it unambiguous that
+  `edit_file` is for one clear replacement in one file.
+- **Pandoc output validated before probing** (PR #1523). Binary-format
+  conversions that produce empty or invalid output now surface a clear
+  error instead of a confusing pandoc stack trace.
+- **Running turns can be steered and repainted** (PR #1533, #1537).
+  Composer input during an active turn no longer stalls; the TUI
+  redraws the transcript as the agent streams.
+- **Tasks and Activity Detail are calmer under load.** The Tasks panel now
+  keeps live/background/recent activity from double-counting the same shell
+  or RLM work, groups repeated read/search/checklist noise, and keeps
+  failures, status, command summaries, and durations visible. Ctrl+O now
+  opens Activity Detail for the selected, live, or most recent meaningful
+  activity while Alt+V remains the direct tool-detail pager; the idle footer
+  now advertises that split for the visible activity.
+- **npm retry shows timeout hint on first failure** (PR #1538).
+  Installations behind slow proxies now see a clear "retrying" message
+  instead of a silent hang.
+- **Issue templates improved** (PR #1525 from **@reidliu41**). Bug and
+  feature-request templates are clearer and easier for new contributors.
+
+### Credits
+
+Thanks to **@reidliu41** (#1525) and **@h3c-hexin** (#1511) for
+community contributions in this release.
+
 ## [0.8.32] - 2026-05-12
 
 A "more useful tools" release. v0.8.31 made the tool surface
@@ -3821,7 +3915,8 @@ Welcome — and thank you.
 - Hooks system and config profiles
 - Example skills and launch assets
 
-[Unreleased]: https://github.com/Hmbown/DeepSeek-TUI/compare/v0.8.32...HEAD
+[Unreleased]: https://github.com/Hmbown/DeepSeek-TUI/compare/v0.8.33...HEAD
+[0.8.33]: https://github.com/Hmbown/DeepSeek-TUI/compare/v0.8.32...v0.8.33
 [0.8.32]: https://github.com/Hmbown/DeepSeek-TUI/compare/v0.8.31...v0.8.32
 [0.8.31]: https://github.com/Hmbown/DeepSeek-TUI/compare/v0.8.30...v0.8.31
 [0.8.30]: https://github.com/Hmbown/DeepSeek-TUI/compare/v0.8.29...v0.8.30
diff --git a/Cargo.lock b/Cargo.lock
index 17d04646..68fa2b46 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1160,7 +1160,7 @@ dependencies = [
 
 [[package]]
 name = "deepseek-agent"
-version = "0.8.32"
+version = "0.8.33"
 dependencies = [
  "deepseek-config",
  "serde",
@@ -1168,7 +1168,7 @@ dependencies = [
 
 [[package]]
 name = "deepseek-app-server"
-version = "0.8.32"
+version = "0.8.33"
 dependencies = [
  "anyhow",
  "axum",
@@ -1190,7 +1190,7 @@ dependencies = [
 
 [[package]]
 name = "deepseek-config"
-version = "0.8.32"
+version = "0.8.33"
 dependencies = [
  "anyhow",
  "deepseek-secrets",
@@ -1202,7 +1202,7 @@ dependencies = [
 
 [[package]]
 name = "deepseek-core"
-version = "0.8.32"
+version = "0.8.33"
 dependencies = [
  "anyhow",
  "chrono",
@@ -1220,7 +1220,7 @@ dependencies = [
 
 [[package]]
 name = "deepseek-execpolicy"
-version = "0.8.32"
+version = "0.8.33"
 dependencies = [
  "anyhow",
  "deepseek-protocol",
@@ -1229,7 +1229,7 @@ dependencies = [
 
 [[package]]
 name = "deepseek-hooks"
-version = "0.8.32"
+version = "0.8.33"
 dependencies = [
  "anyhow",
  "async-trait",
@@ -1243,7 +1243,7 @@ dependencies = [
 
 [[package]]
 name = "deepseek-mcp"
-version = "0.8.32"
+version = "0.8.33"
 dependencies = [
  "anyhow",
  "serde",
@@ -1252,7 +1252,7 @@ dependencies = [
 
 [[package]]
 name = "deepseek-protocol"
-version = "0.8.32"
+version = "0.8.33"
 dependencies = [
  "serde",
  "serde_json",
@@ -1260,7 +1260,7 @@ dependencies = [
 
 [[package]]
 name = "deepseek-secrets"
-version = "0.8.32"
+version = "0.8.33"
 dependencies = [
  "dirs",
  "keyring",
@@ -1273,7 +1273,7 @@ dependencies = [
 
 [[package]]
 name = "deepseek-state"
-version = "0.8.32"
+version = "0.8.33"
 dependencies = [
  "anyhow",
  "chrono",
@@ -1285,7 +1285,7 @@ dependencies = [
 
 [[package]]
 name = "deepseek-tools"
-version = "0.8.32"
+version = "0.8.33"
 dependencies = [
  "anyhow",
  "async-trait",
@@ -1298,7 +1298,7 @@ dependencies = [
 
 [[package]]
 name = "deepseek-tui"
-version = "0.8.32"
+version = "0.8.33"
 dependencies = [
  "anyhow",
  "arboard",
@@ -1361,7 +1361,7 @@ dependencies = [
 
 [[package]]
 name = "deepseek-tui-cli"
-version = "0.8.32"
+version = "0.8.33"
 dependencies = [
  "anyhow",
  "chrono",
@@ -1386,7 +1386,7 @@ dependencies = [
 
 [[package]]
 name = "deepseek-tui-core"
-version = "0.8.32"
+version = "0.8.33"
 
 [[package]]
 name = "deltae"
diff --git a/Cargo.toml b/Cargo.toml
index b6cb0232..13632448 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -19,7 +19,7 @@ default-members = ["crates/cli", "crates/app-server", "crates/tui"]
 resolver = "2"
 
 [workspace.package]
-version = "0.8.32"
+version = "0.8.33"
 edition = "2024"
 # Rust 1.88 stabilized `let_chains` in `if`/`while` conditions, which the
 # codebase relies on extensively. Cargo enforces this so users on older
diff --git a/README.md b/README.md
index 0e9cf12f..6f9399aa 100644
--- a/README.md
+++ b/README.md
@@ -68,7 +68,7 @@ It is built around DeepSeek V4 (`deepseek-v4-pro` / `deepseek-v4-flash`), includ
 - **Durable task queue** — background tasks can survive restarts
 - **HTTP/SSE runtime API** — `deepseek serve --http` for headless agent workflows
 - **MCP protocol** — connect to Model Context Protocol servers for extended tooling; please see [docs/MCP.md](docs/MCP.md)
-- **Native RLM** (`rlm_query`) — run batched analysis through cheap `deepseek-v4-flash` children using the same API client
+- **Native RLM** (`rlm_open`/`rlm_eval`) — persistent REPL sessions for batched analysis; run cheap `deepseek-v4-flash` children with bounded helpers like `peek`, `search`, `chunk`, and `sub_query_batch`
 - **LSP diagnostics** — inline error/warning surfacing after every edit via rust-analyzer, pyright, typescript-language-server, gopls, clangd
 - **User memory** — optional persistent note file injected into the system prompt for cross-session preferences
 - **Localized UI** — `en`, `ja`, `zh-Hans`, `pt-BR` with auto-detection
@@ -83,6 +83,17 @@ It is built around DeepSeek V4 (`deepseek-v4-pro` / `deepseek-v4-flash`), includ
 
 See [docs/ARCHITECTURE.md](docs/ARCHITECTURE.md) for the full walkthrough.
 
+### Sub-agents: Concurrent Background Execution
+
+DeepSeek TUI can dispatch multiple sub-agents that run in parallel — like a concurrent task queue:
+
+- **Non-blocking launch.** `agent_open` returns immediately. The child gets its own fresh context and tool registry and runs independently. The parent keeps working.
+- **Background execution.** Sub-agents execute concurrently (default cap: 10, configurable to 20). The engine manages the pool — no polling loop needed.
+- **Completion notification.** When a sub-agent finishes, the runtime delivers a structured `<deepseek:subagent.done>` event with a summary, evidence list, and execution metrics. The parent model reads the `summary` field and integrates findings.
+- **Bounded result retrieval.** Large transcripts are parked behind `var_handle` references. The model calls `handle_read` for slices, ranges, or JSONPath projections — keeping the parent context lean.
+
+See [docs/SUBAGENTS.md](docs/SUBAGENTS.md) for the full sub-agent reference.
+
 ---
 
 ## Quickstart
@@ -225,90 +236,47 @@ deepseek --provider ollama --model deepseek-coder:1.3b
 
 ---
 
-## What's New In v0.8.32
+## What's New In v0.8.33
 
-A "more useful tools" release expanding the tool surface for real-world
-workflows. Five new tools, ten community PRs targeting model-protocol bugs
-and UX papercuts, and a snapshot cap that stops giant workspaces from
-hanging the TUI on first turn. [Full changelog](CHANGELOG.md).
+A sub-agent and RLM renovation release. The model-facing delegation
+surface is now session-oriented: `rlm_open` / `rlm_eval` /
+`rlm_configure` / `rlm_close` for persistent RLM work, `agent_open` /
+`agent_eval` / `agent_close` for named sub-agent sessions, and
+`handle_read` for bounded retrieval from large results. Six tool
+papercuts fixed, two community PRs landed, and the sidebar gets a
+cleaner "Work" tab. [Full changelog](CHANGELOG.md).
 
-- **Five new tools.** `read_file` now extracts PDFs in pure Rust — no
-  Poppler install required. `pandoc_convert` moves documents between 11
-  formats (Markdown, HTML, DOCX, EPUB, LaTeX…). `image_ocr` runs local
-  tesseract on screenshots and scanned documents. `image_analyze` sends
-  images to a vision model for natural-language description (opt-in only).
-  `js_execution` mirrors `code_execution` for Node.js snippets.
-- **Two more providers.** AtlasCloud joins as a first-class provider
-  (`provider = "atlascloud"`) with the same config-surface shape as the
-  existing NVIDIA NIM / Fireworks rows. `web_search` supports Tavily and
-  Bocha as configurable backends for regions where DuckDuckGo is
-  unreliable.
-- **Prompt-cache survives mid-session edits** (PR #1345 from
-  **@Duducoco**). Moving `instructions`, user memory, and session goal
-  below the volatile-content boundary means the KV prefix cache no longer
-  breaks every time you edit your memory file — skills and context
-  management instructions stay hot regardless of how often you run
-  `/memory`.
-- **vLLM thinking toggle actually works now** (PR #1480 from
-  **@h3c-hexin**). `reasoning_effort = "off"` on vLLM providers now emits
-  the OpenAI `chat_template_kwargs.enable_thinking` extension instead of
-  the silently-ignored Anthropic-native field. Measured improvement on
-  Qwen3: TTFT from ~13s → ~270ms.
-- **Kitty keyboard protocol on Windows** (PR #1483 from
-  **@CrepuscularIRIS / autoghclaw**). `Shift+Enter` now inserts a
-  newline instead of submitting in VSCode and Windows Terminal —
-  previously indistinguishable from plain Enter on Windows.
-- **Tool-result retrieval namespace unified** (#1541). Wire-dedup refs
-  and disk-spillover refs now share a lookup path — `retrieve_tool_result`
-  accepts SHA refs, bare hex hashes, `art_<id>` aliases, and absolute
-  paths, with error messages that list every accepted form.
-- **Snapshots skip giant workspaces** (#1552). A 2 GB ceiling on
-  non-excluded workspace content prevents first-turn `git add -A` from
-  hanging the TUI on multi-hundred-GB project directories. Configurable
-  via `[snapshots] max_workspace_gb`; set to `0` to restore unbounded
-  behaviour.
-- **`deepseek update` refreshes both binaries** (PR #1492 from
-  **@NorethSea**). The updater now enumerates colocated binaries (both
-  the dispatcher and the TUI runtime), downloads and verifies every
-  release asset, and writes the sibling first so a partial failure can't
-  leave the launcher updated while the TUI stays stale.
-- **Approval modal collapses to a one-line banner** (PR #1455 from
-  **@tiger-dog**). Tab toggles between the full takeover card and a
-  bottom-line summary — the transcript stays visible while you decide.
-- **`@`-mention truncation no longer splits CJK codepoints** (PR #1495
-  from **@CrepuscularIRIS / autoghclaw**). Files larger than 128 KB
-  used to truncate mid-codepoint; the truncator now rounds down to the
-  last valid UTF-8 boundary.
-- **Startup empty-state shows the build version**, active model with a
-  `/model` hint, and current working directory (PR #1444 from
-  **@reidliu41**).
-- **`/change` slash command** displays the latest CHANGELOG section
-  inside the TUI (PR #1416 from **@zhuangbiaowei**).
-- **Toast overlay no longer renders on top of the composer** (PR #1485
-  from **@MeAiRobot**). Approval toasts now clamp to the gap between
-  the composer and footer.
-- **TUI no longer freezes during long-running shell jobs** (PR #1494
-  from **@CrepuscularIRIS / autoghclaw**). The job panel's refresh path
-  now reads only the tail bytes under the mutex lock instead of cloning
-  the entire stdout buffer every 2.5 seconds.
-- **Markdown renderer no longer eats underscores in identifiers** (PR
-  #1455 from **@tiger-dog**). `deepseek_tui` and `foo_bar_baz` no longer
-  render half-italic.
-- **`/sessions` picker highlights the selected row** more strongly in
-  dark terminals (PR #1493 from **@reidliu41**), and no longer shows
-  `<turn_meta>` as the session title (PR #1498 from **@wdw8276**).
+- **Persistent RLM sessions.** RLM work now uses `rlm_open` /
+  `rlm_eval` / `rlm_close` with bounded REPL helpers (`peek`,
+  `search`, `chunk`, `sub_query`, `sub_query_batch`, `finalize`)
+  — the model drives the REPL through tool calls instead of a
+  foreground loop.
+- **Fork-aware sub-agent sessions.** `agent_open` supports named
+  sessions, `fork_context` for prompt-cache-friendly perspective
+  fanout, and bounded recursive depth. Sub-agent results and
+  transcripts can be parked behind `var_handle` references.
+- **Shared `handle_read` tool.** Large structured results (RLM
+  finals, sub-agent transcripts, tool artifacts) return typed handles
+  with slice, range, count, and JSONPath projections — the model
+  reads back only what it needs.
+- **Text selection now works during streaming.** The loading-state
+  mouse filter drops inert move events but allows transcript and
+  scrollbar drags to continue — the known issue from v0.8.32 is
+  resolved.
+- **Six tool papercuts fixed.** `file_search` safer excludes;
+  `grep_files` returns clean strings; `fetch_url` JSON field
+  projection and headers; `edit_file` indentation fuzz;
+  `exec_shell` merged stdout/stderr; `revert_turn` rejects no-ops.
+- **CLI reasoning-effort honoured** on non-auto exec routes such as
+  `--reasoning-effort high` (PR #1511 from **@h3c-hexin**).
+- **Sidebar "Work" tab.** The former "Plan" / "Todos" tabs are now
+  one "Work" panel for the active checklist, consistent across Plan,
+  Agent, and YOLO modes.
+- **`/relay` command with CJK aliases** (`/接力`) for structured
+  multi-session handoff prompts.
 
-**Known issue in v0.8.32:** terminal-native text selection can still be
-blocked while the agent is thinking or streaming a response. v0.8.33 is
-planned to ship the text-selection fix alongside the sub-agent and RLM
-renovation.
-
-Thanks to **@CrepuscularIRIS** (4 landings), **@reidliu41** (2 landings),
-**@tiger-dog** (2 landings), **@Duducoco**, **@h3c-hexin**,
-**@NorethSea**, **@MeAiRobot**, **@zhuangbiaowei**, **@wdw8276**,
-**@MMMarcinho**, **@SamhandsomeLee**, **@sandofree**,
-**@lucaszhu-hue**, **@muyuliyan**, **@Oliver-ZPLiu**, **@czf0718**,
-**@jieshu666**, and **@YaYII**.
+Thanks to **@reidliu41** and **@h3c-hexin** for community
+contributions in this release.
 
 ---
 
diff --git a/README.zh-CN.md b/README.zh-CN.md
index 2510ead2..c3b7d9ab 100644
--- a/README.zh-CN.md
+++ b/README.zh-CN.md
@@ -53,7 +53,7 @@ DeepSeek TUI 是一个完全运行在终端里的编程智能体。它让 DeepSe
 
 ### 主要功能
 
-- **原生 RLM**（`rlm_query`）—— 利用现有 API 客户端并行调度 1-16 个低成本 `deepseek-v4-flash` 子任务，用于批量分析和并行推理
+- **原生 RLM**（`rlm_open`/`rlm_eval`）—— 持久化 REPL 会话用于批量分析；使用有界辅助函数（`peek`、`search`、`chunk`、`sub_query_batch`）运行低成本 `deepseek-v4-flash` 子任务
 - **思考模式流式输出** —— 实时观察模型在解决问题时的思维链展开
 - **完整工具集** —— 文件操作、shell 执行、git、网页搜索/浏览、apply-patch、子智能体、MCP 服务器
 - **100 万 token 上下文** —— 上下文接近上限时自动智能压缩，支持前缀缓存感知以降低成本
@@ -78,6 +78,17 @@ DeepSeek TUI 是一个完全运行在终端里的编程智能体。它让 DeepSe
 
 详见 [docs/ARCHITECTURE.md](docs/ARCHITECTURE.md)。
 
+### 子智能体：并发后台执行
+
+DeepSeek TUI 可以同时调度多个子智能体并行运行——类似于并发任务队列：
+
+- **非阻塞启动。** `agent_open` 立即返回。子智能体获得独立的上下文和工具注册表，独立运行。父智能体继续工作。
+- **后台执行。** 子智能体并发运行（默认上限 10，可配置至 20）。引擎管理并发池——无需轮询循环。
+- **完成通知。** 子智能体完成后，运行时发送结构化的 `<deepseek:subagent.done>` 事件，包含摘要、证据列表和执行指标。父模型读取 `summary` 字段并整合结果。
+- **按需读取结果。** 大型对话记录暂存为 `var_handle` 引用。模型通过 `handle_read` 按切片、范围或 JSONPath 投影读取——保持父上下文精简。
+
+详见 [docs/SUBAGENTS.md](docs/SUBAGENTS.md)。
+
 ---
 
 ## 快速开始
@@ -105,6 +116,21 @@ deepseek doctor                          # 验证安装
 
 > 轮换或移除密钥：`deepseek auth clear --provider deepseek`。
 
+### Auto 模式
+
+使用 `deepseek --model auto` 或 `/model auto` 让 DeepSeek TUI 自行决定每轮需要多少模型和推理能力。
+
+Auto 模式同时控制两个设置：
+
+- 模型：`deepseek-v4-flash` 或 `deepseek-v4-pro`
+- 推理强度：`off`、`high` 或 `max`
+
+在真实请求发出之前，应用会先用关闭推理的 `deepseek-v4-flash` 进行一次小型路由调用。路由器审视最新请求和最近的上下文，然后为真实请求选定具体的模型和推理强度。简短/简单的轮次保持在 Flash + 关闭推理；编码、调试、发布、架构、安全审查或模糊的多步骤任务可升级到 Pro 和/或更高推理强度。
+
+`auto` 是 DeepSeek TUI 本地行为。上游 API 永远不会收到 `model: "auto"`，它只会收到为当前轮次选定的具体模型和推理强度设置。TUI 会显示选定的路由，成本跟踪按实际运行的模型计费。如果路由调用失败或返回无效答案，应用会回退到本地启发式规则。子智能体会继承 auto 模式，除非你为它们指定了显式模型。
+
+需要可重复基准测试、严格控制成本上限或特定提供商/模型映射时，请使用固定模型或固定推理强度。
+
 ### Linux ARM64（HarmonyOS 轻薄本、openEuler、Kylin、树莓派、Graviton 等）
 
 从 v0.8.8 起，`npm i -g deepseek-tui` 直接支持 glibc 系的 ARM64 Linux。你也可以从 [Releases 页面](https://github.com/Hmbown/DeepSeek-TUI/releases) 下载预编译二进制，放到 `PATH` 目录中。
@@ -179,6 +205,10 @@ deepseek --provider nvidia-nim
 deepseek auth set --provider fireworks --api-key "YOUR_FIREWORKS_API_KEY"
 deepseek --provider fireworks --model deepseek-v4-pro
 
+# 通用 OpenAI 兼容端点
+deepseek auth set --provider openai --api-key "YOUR_OPENAI_COMPATIBLE_API_KEY"
+OPENAI_BASE_URL="https://openai-compatible.example/v4" deepseek --provider openai --model glm-5
+
 # 自托管 SGLang
 SGLANG_BASE_URL="http://localhost:30000/v1" deepseek --provider sglang --model deepseek-v4-flash
 
@@ -192,93 +222,41 @@ deepseek --provider ollama --model deepseek-coder:1.3b
 
 ---
 
-## v0.8.29 新功能
+## v0.8.33 新功能
 
-维护版本，核心是修复 v0.8.27 / v0.8.28 引入的"滚动幽灵"回归
-（#1085 类问题）和 Ctrl+R 会话恢复跨项目泄漏的问题（#1395），
-外加 25 个社区 PR。[完整更新日志](CHANGELOG.md)。
+子智能体和 RLM 改造版本。面向模型的委托接口现在以会话为单位，不再是一次性调用：
+`rlm_open` / `rlm_eval` / `rlm_configure` / `rlm_close` 用于持久
+RLM 工作，`agent_open` / `agent_eval` / `agent_close` 用于命名子
+智能体会话，`handle_read` 用于从大型结果中按需读取。修复了六个
+工具细节问题，落地了两个社区 PR，侧边栏合并为更清晰的"Work"标签。
+[完整更新日志](CHANGELOG.md)。
 
-- **"滚动幽灵"彻底修复**（#1085 回归）。并行子代理运行
-  `exec_shell` 时，alt-screen 会被滚动出 ratatui 差分渲染器的
-  视野，header 上方出现越来越大的空白带。三层防护一并上线：
-  写入 `~/.deepseek/logs/tui-YYYY-MM-DD.log` 的 `tracing-subscriber`、
-  alt-screen 生命周期内的 fd 级 stderr 重定向（Unix `dup2`）、
-  以及 `tools/`、`core/`、`tui/`、`network_policy.rs`、
-  `runtime_threads.rs` 模块的
-  `#![deny(clippy::print_stdout, clippy::print_stderr)]`。今后在
-  这些模块新增 `eprintln!` 会被 CI 拒绝。
-- **Ctrl+R 会话恢复改为按当前工作区过滤**（#1395，PR #1397，
-  来自 **@linzhiqin2003**）— 此前列出磁盘上所有会话，导致
-  在项目 B 打开 DeepSeek-TUI 时按下 Ctrl+R 可能恢复项目 A 的
-  历史记录。
-- **运行时版本号直接显示在 header 中。** Header 右侧集群在
-  provider / effort / Live / context 之后增加一个 `v0.8.29`
-  小标签，在终端宽度紧张时最先收起。
-- **MCP HTTP 传输现在尊重 HTTP(S)_PROXY**（#1408，来自
-  **@hlx98007**）— 公司出口代理、国内 Clash / Shadowsocks 代理
-  现在能正确应用于 MCP HTTP 连接，跟 box 上的其他工具
-  （curl、npm、git 等）保持一致。同时支持 `NO_PROXY`。
-- **MCP 发现接受不规范条目**（PR #1410，来自 **@Liu-Vince**）—
-  一个错误的 tool / resource / prompt 条目不再让整页丢失；
-  错误条目被跳过，目录的其余部分正常返回。
-- **MCP SSE 接受 CRLF 分隔的 endpoint 事件**（#1309，PR #1358，
-  来自 **@reidliu41**）— FastMCP / uvicorn 风格的 SSE 流不再因
-  只等待 LF 分隔符而超时。
-- **输入框会忽略泄漏的鼠标报告字节**（#1418，PR #1421，来自
-  **@reidliu41**）— 某些 SSH / IDE 终端链路把 `[<35;44;18M`
-  这类鼠标报告泄漏到 stdin 时，不再把输入区域填满。
-- **Footer 芯片会遵守可用宽度**（#1357，PR #1417，来自
-  **@Wenjunyun123**）— 窄终端下，过长的 cache / aux 芯片会先
-  收起，而不是挤压左侧状态或 composer 区域。
-- **笔记管理斜杠命令**（PR #1407，来自 **@reidliu41**）—
-  `/note add`、`/note list` 等命令在 TUI 内提供持久笔记功能。
-- **全局 `~/.deepseek/AGENTS.md` 与项目 AGENTS.md 合并**
-  （#1157，PR #1399，来自 **@linzhiqin2003**）— 此前工作区
-  自带 AGENTS.md 会完全遮蔽全局基准，现在分层叠加。
-- **语言指令：thinking 跟随用户消息语言**（#1118，PR #1398，
-  来自 **@linzhiqin2003**）— 此前项目上下文推断的 `lang`
-  字段可能压制最新用户消息的语言，导致中文对话出现英文 thinking。
-- **网络搜索过滤垃圾 SERP**（#964，PR #1396，来自
-  **@linzhiqin2003**）— Bing / DDG 回退路径丢弃污染快速查找
-  结果的 SEO 农场域名。
-- **Auto 路由识别 CJK 调试 / 搜索关键词**（PR #1401、#1402，
-  来自 **@linzhiqin2003**）— `--model auto` 和推理强度选择器
-  现在能正确路由中文 / 日文技术查询，此前会回退到通用基准。
-- **Deferred tools 首次执行前会先加载 schema**（#1419，PR #1429，
-  来自 **@SamhandsomeLee**）— `edit_file` 等延迟加载工具现在会先
-  展示期望字段并要求模型重试，而不是执行模型猜测出来的参数名。
-- **DeepSeek 公开别名会正确回放 thinking-mode 工具轮次**（PR #1428，
-  来自 **@Beltran12138**）— `deepseek-chat` 和
-  `deepseek-reasoner` 现在与显式 V4 模型 ID 一样触发
-  `reasoning_content` replay，避免工具调用后的第二轮 400。
-- **技能补全收敛到 `/skill` 下**（#1437，PR #1442，来自
-  **@reidliu41**）— 本地技能很多时不会再挤满根级 `/` 命令菜单。
-- **`edit_file` 拒绝无变化替换**（PR #1460，来自
-  **@xiluoduyu**）— `search` / `replace` 完全相同时会直接返回
-  清晰的参数错误，而不是生成空 diff。
-- **Windows 终端布局使用宽度稳定的字形**（#1314，PR #1465，来自
-  **@CrepuscularIRIS**）— header 和文件树不再依赖 cmd /
-  PowerShell 容易误判宽度的 SMP emoji。
-- **Ghostty 默认启用低动态渲染**（#1445，PR #1468，来自
-  **@CrepuscularIRIS**）— 受影响终端无需手动配置即可避开动画闪烁。
-- **Docker buildx provenance 的 EPERM 失败会给出提示**（#1449，
-  PR #1469，来自 **@CrepuscularIRIS**）— macOS shell 输出命中
-  受限 metadata 写入失败时，会提示 provenance 相关开关。
-- **Windows CMD 的鼠标滚轮回退会滚动 transcript**（#1443，
-  PR #1471，来自 **@CrepuscularIRIS**）— 关闭 mouse capture 时，
-  被终端映射成 Up / Down 的滚轮事件不再循环 composer 历史。
-- **`sync-cnb.yml` 工作流加固** — 显式 `permissions: contents:
-  read`、`actions/checkout` v3 → v4、触发器收紧到 `main` +
-  `v*` 标签（不再镜像 feature 分支）。
-- **新增 +438 LOC 测试覆盖** — `error_taxonomy`、
-  `parse_pages_arg`、Web 搜索优先级、`sanitize_stream_chunk`
-  控制字节过滤（PR #1403–#1406，来自 **@linzhiqin2003**）。
+- **持久化 RLM 会话。** RLM 工作现在通过 `rlm_open` / `rlm_eval` /
+  `rlm_close` 进行，使用受限的 REPL 辅助函数（`peek`、`search`、
+  `chunk`、`sub_query`、`sub_query_batch`、`finalize`）——
+  模型通过工具调用来驱动 REPL，而非前台循环。
+- **Fork 感知的子智能体会话。** `agent_open` 支持命名会话、
+  `fork_context` 以实现前缀缓存友好的多视角展开，以及有界的递归
+  深度。子智能体结果和对话记录可以通过 `var_handle` 引用暂存。
+- **共享 `handle_read` 工具。** 大型结构化结果（RLM 最终输出、
+  子智能体对话记录、工具产物）返回带类型的句柄，支持切片、
+  范围、计数和 JSONPath 投影——模型只读取需要的内容。
+- **流式输出期间文本选择正常工作。** 加载状态的鼠标过滤器丢弃
+  无关移动事件，但允许对话记录和滚动条拖动继续——
+  v0.8.32 的已知问题已解决。
+- **六个工具细节修复。** `file_search` 更安全的默认排除项；
+  `grep_files` 返回干净的字符串；`fetch_url` JSON 字段投影和
+  响应头；`edit_file` 缩进模糊匹配；`exec_shell` 合并
+  stdout/stderr；`revert_turn` 拒绝空操作。
+- **CLI 推理强度参数在非 auto 执行路径上生效**（PR #1511，
+  来自 **@h3c-hexin**）。`deepseek -p "..." --reasoning-effort high`
+  现在正确应用该标志。
+- **侧边栏 "Work" 标签。** 原先的 "Plan" / "Todos" 标签现在合并为
+  一个 "Work" 面板，在 Plan、Agent、YOLO 三种模式下保持一致。
+- **`/relay` 命令及中文别名**（`/接力`）——用于结构化的跨会话
+  接力提示。
 
-感谢本周期落地 10 个 PR 的 **@linzhiqin2003**、落地 5 个 PR 的
-**@reidliu41**、落地 4 个 PR 的 **@CrepuscularIRIS**，以及
-**@SamhandsomeLee**、**@Beltran12138**、**@Wenjunyun123**、
-**@hlx98007**、**@Liu-Vince**、**@xiluoduyu**，和报告 #1395 的
-**@shenxiaodaosanhua**。
+感谢 **@reidliu41** 和 **@h3c-hexin** 在本版本中的社区贡献。
 
 ---
 
@@ -307,6 +285,36 @@ deepseek mcp-server                            # 启动 dispatcher MCP stdio 服
 deepseek update                                # 检查并应用二进制更新
 ```
 
+Docker 镜像发布在 GHCR 上：
+
+```bash
+docker volume create deepseek-tui-home
+
+docker run --rm -it \
+  -e DEEPSEEK_API_KEY="$DEEPSEEK_API_KEY" \
+  -v deepseek-tui-home:/home/deepseek/.deepseek \
+  ghcr.io/hmbown/deepseek-tui:latest
+```
+
+### Zed / ACP
+
+DeepSeek 可作为自定义 Agent Client Protocol 服务器运行，供 Zed 等编辑器通过 stdio 调用本地 ACP 智能体。在 Zed 中添加自定义智能体服务器：
+
+```json
+{
+  "agent_servers": {
+    "DeepSeek": {
+      "type": "custom",
+      "command": "deepseek",
+      "args": ["serve", "--acp"],
+      "env": {}
+    }
+  }
+}
+```
+
+首版 ACP 支持目前可以使用现有 DeepSeek 配置/API 密钥创建新会话并响应提示。基于工具的编辑和检查点回放尚未通过 ACP 暴露。
+
 ### 常用快捷键
 
 | 按键 | 功能 |
@@ -347,10 +355,11 @@ deepseek update                                # 检查并应用二进制更新
 | `DEEPSEEK_API_KEY` | DeepSeek API key |
 | `DEEPSEEK_BASE_URL` | API base URL |
 | `DEEPSEEK_MODEL` | 默认模型 |
-| `DEEPSEEK_PROVIDER` | `deepseek`（默认）、`nvidia-nim`、`fireworks`、`sglang`、`vllm`、`ollama` |
+| `DEEPSEEK_PROVIDER` | `deepseek`（默认）、`nvidia-nim`、`openai`、`openrouter`、`novita`、`atlascloud`、`fireworks`、`sglang`、`vllm`、`ollama` |
 | `DEEPSEEK_PROFILE` | 配置 profile 名称 |
 | `DEEPSEEK_MEMORY` | 设为 `on` 启用用户记忆 |
-| `NVIDIA_API_KEY` / `FIREWORKS_API_KEY` / `SGLANG_API_KEY` / `VLLM_API_KEY` / `OLLAMA_API_KEY` | 提供商认证 |
+| `NVIDIA_API_KEY` / `OPENAI_API_KEY` / `OPENROUTER_API_KEY` / `NOVITA_API_KEY` / `ATLASCLOUD_API_KEY` / `FIREWORKS_API_KEY` / `SGLANG_API_KEY` / `VLLM_API_KEY` / `OLLAMA_API_KEY` | 提供商认证 |
+| `OPENAI_BASE_URL` / `OPENAI_MODEL` | 通用 OpenAI 兼容端点和模型 ID |
 | `SGLANG_BASE_URL` | 自托管 SGLang 端点 |
 | `VLLM_BASE_URL` | 自托管 vLLM 端点 |
 | `OLLAMA_BASE_URL` | 自托管 Ollama 端点 |
diff --git a/crates/agent/Cargo.toml b/crates/agent/Cargo.toml
index 9aa5759f..69145890 100644
--- a/crates/agent/Cargo.toml
+++ b/crates/agent/Cargo.toml
@@ -7,5 +7,5 @@ repository.workspace = true
 description = "Model/provider registry and fallback strategy for DeepSeek workspace architecture"
 
 [dependencies]
-deepseek-config = { path = "../config", version = "0.8.32" }
+deepseek-config = { path = "../config", version = "0.8.33" }
 serde.workspace = true
diff --git a/crates/app-server/Cargo.toml b/crates/app-server/Cargo.toml
index 1a3aca96..e9f2dd62 100644
--- a/crates/app-server/Cargo.toml
+++ b/crates/app-server/Cargo.toml
@@ -10,15 +10,15 @@ description = "Codex-style app-server transport for DeepSeek workspace architect
 anyhow.workspace = true
 axum.workspace = true
 clap.workspace = true
-deepseek-agent = { path = "../agent", version = "0.8.32" }
-deepseek-config = { path = "../config", version = "0.8.32" }
-deepseek-core = { path = "../core", version = "0.8.32" }
-deepseek-execpolicy = { path = "../execpolicy", version = "0.8.32" }
-deepseek-hooks = { path = "../hooks", version = "0.8.32" }
-deepseek-mcp = { path = "../mcp", version = "0.8.32" }
-deepseek-protocol = { path = "../protocol", version = "0.8.32" }
-deepseek-state = { path = "../state", version = "0.8.32" }
-deepseek-tools = { path = "../tools", version = "0.8.32" }
+deepseek-agent = { path = "../agent", version = "0.8.33" }
+deepseek-config = { path = "../config", version = "0.8.33" }
+deepseek-core = { path = "../core", version = "0.8.33" }
+deepseek-execpolicy = { path = "../execpolicy", version = "0.8.33" }
+deepseek-hooks = { path = "../hooks", version = "0.8.33" }
+deepseek-mcp = { path = "../mcp", version = "0.8.33" }
+deepseek-protocol = { path = "../protocol", version = "0.8.33" }
+deepseek-state = { path = "../state", version = "0.8.33" }
+deepseek-tools = { path = "../tools", version = "0.8.33" }
 serde.workspace = true
 serde_json.workspace = true
 tokio.workspace = true
diff --git a/crates/cli/Cargo.toml b/crates/cli/Cargo.toml
index 0686df54..53d59366 100644
--- a/crates/cli/Cargo.toml
+++ b/crates/cli/Cargo.toml
@@ -14,13 +14,13 @@ path = "src/main.rs"
 anyhow.workspace = true
 clap.workspace = true
 clap_complete.workspace = true
-deepseek-agent = { path = "../agent", version = "0.8.32" }
-deepseek-app-server = { path = "../app-server", version = "0.8.32" }
-deepseek-config = { path = "../config", version = "0.8.32" }
-deepseek-execpolicy = { path = "../execpolicy", version = "0.8.32" }
-deepseek-mcp = { path = "../mcp", version = "0.8.32" }
-deepseek-secrets = { path = "../secrets", version = "0.8.32" }
-deepseek-state = { path = "../state", version = "0.8.32" }
+deepseek-agent = { path = "../agent", version = "0.8.33" }
+deepseek-app-server = { path = "../app-server", version = "0.8.33" }
+deepseek-config = { path = "../config", version = "0.8.33" }
+deepseek-execpolicy = { path = "../execpolicy", version = "0.8.33" }
+deepseek-mcp = { path = "../mcp", version = "0.8.33" }
+deepseek-secrets = { path = "../secrets", version = "0.8.33" }
+deepseek-state = { path = "../state", version = "0.8.33" }
 chrono.workspace = true
 dirs.workspace = true
 serde.workspace = true
diff --git a/crates/config/Cargo.toml b/crates/config/Cargo.toml
index d9d6ac12..c8793743 100644
--- a/crates/config/Cargo.toml
+++ b/crates/config/Cargo.toml
@@ -8,7 +8,7 @@ description = "Config schema and precedence model for DeepSeek workspace archite
 
 [dependencies]
 anyhow.workspace = true
-deepseek-secrets = { path = "../secrets", version = "0.8.32" }
+deepseek-secrets = { path = "../secrets", version = "0.8.33" }
 dirs.workspace = true
 serde.workspace = true
 toml.workspace = true
diff --git a/crates/core/Cargo.toml b/crates/core/Cargo.toml
index 7064eded..50f2598c 100644
--- a/crates/core/Cargo.toml
+++ b/crates/core/Cargo.toml
@@ -9,13 +9,13 @@ description = "Core runtime boundaries for DeepSeek workspace architecture"
 [dependencies]
 anyhow.workspace = true
 chrono.workspace = true
-deepseek-agent = { path = "../agent", version = "0.8.32" }
-deepseek-config = { path = "../config", version = "0.8.32" }
-deepseek-execpolicy = { path = "../execpolicy", version = "0.8.32" }
-deepseek-hooks = { path = "../hooks", version = "0.8.32" }
-deepseek-mcp = { path = "../mcp", version = "0.8.32" }
-deepseek-protocol = { path = "../protocol", version = "0.8.32" }
-deepseek-state = { path = "../state", version = "0.8.32" }
-deepseek-tools = { path = "../tools", version = "0.8.32" }
+deepseek-agent = { path = "../agent", version = "0.8.33" }
+deepseek-config = { path = "../config", version = "0.8.33" }
+deepseek-execpolicy = { path = "../execpolicy", version = "0.8.33" }
+deepseek-hooks = { path = "../hooks", version = "0.8.33" }
+deepseek-mcp = { path = "../mcp", version = "0.8.33" }
+deepseek-protocol = { path = "../protocol", version = "0.8.33" }
+deepseek-state = { path = "../state", version = "0.8.33" }
+deepseek-tools = { path = "../tools", version = "0.8.33" }
 serde_json.workspace = true
 uuid.workspace = true
diff --git a/crates/execpolicy/Cargo.toml b/crates/execpolicy/Cargo.toml
index 979f0033..51f4b341 100644
--- a/crates/execpolicy/Cargo.toml
+++ b/crates/execpolicy/Cargo.toml
@@ -8,5 +8,5 @@ description = "Execution policy and approval model parity for DeepSeek workspace
 
 [dependencies]
 anyhow.workspace = true
-deepseek-protocol = { path = "../protocol", version = "0.8.32" }
+deepseek-protocol = { path = "../protocol", version = "0.8.33" }
 serde.workspace = true
diff --git a/crates/hooks/Cargo.toml b/crates/hooks/Cargo.toml
index c507ab37..855b2c30 100644
--- a/crates/hooks/Cargo.toml
+++ b/crates/hooks/Cargo.toml
@@ -10,7 +10,7 @@ description = "Hook dispatch and notifications parity for DeepSeek workspace arc
 anyhow.workspace = true
 async-trait.workspace = true
 chrono.workspace = true
-deepseek-protocol = { path = "../protocol", version = "0.8.32" }
+deepseek-protocol = { path = "../protocol", version = "0.8.33" }
 reqwest.workspace = true
 serde.workspace = true
 serde_json.workspace = true
diff --git a/crates/tools/Cargo.toml b/crates/tools/Cargo.toml
index 72e8fc0f..bb1c5306 100644
--- a/crates/tools/Cargo.toml
+++ b/crates/tools/Cargo.toml
@@ -9,7 +9,7 @@ description = "Tool invocation lifecycle, schema validation, and scheduler paral
 [dependencies]
 anyhow.workspace = true
 async-trait.workspace = true
-deepseek-protocol = { path = "../protocol", version = "0.8.32" }
+deepseek-protocol = { path = "../protocol", version = "0.8.33" }
 serde.workspace = true
 serde_json.workspace = true
 tokio.workspace = true
diff --git a/crates/tui/CHANGELOG.md b/crates/tui/CHANGELOG.md
index 250c71ed..79080328 100644
--- a/crates/tui/CHANGELOG.md
+++ b/crates/tui/CHANGELOG.md
@@ -7,6 +7,99 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 
 ## [Unreleased]
 
+## [0.8.33] - 2026-05-12
+
+A sub-agent and RLM renovation release. The model-facing delegation
+surface is now session-oriented instead of one-shot: RLM work happens
+through `rlm_open` / `rlm_eval` / `rlm_configure` / `rlm_close`,
+sub-agent work happens through `agent_open` / `agent_eval` /
+`agent_close`, and large outputs can be parked behind typed handles
+that the model reads back explicitly with `handle_read`.
+
+### Added
+
+- **Persistent RLM sessions with bounded REPL helpers.** RLM prompts now
+  use `peek`, `search`, `chunk`, `context_meta`, `sub_query`,
+  `sub_query_batch`, `sub_query_map`, `sub_rlm`, and
+  `finalize(value, confidence)` instead of exposing the full parent
+  context as an ambient variable.
+- **Fork-aware sub-agent sessions.** `agent_open` supports named
+  sessions, `fork_context`, and bounded recursive depth so the parent can
+  ask for multiple perspectives while preserving prompt-cache-friendly
+  prefix context where available.
+- **Shared `handle_read` storage.** RLM finals, sub-agent transcripts,
+  and other large structured results can return `var_handle` references
+  with slice, range, count, and JSONPath projections.
+- **Slash-command routing for the new surface.** `/rlm [N] ...` and
+  `/agent [N] ...` now prompt the assistant to use the persistent tools
+  instead of the removed foreground RLM operation.
+- **`/relay` slash command with CJK aliases** (`/接力`). Hands the
+  assistant a structured handoff prompt for coordinated multi-turn
+  continuation across sessions.
+- **`checklist_write` sidebar rename.** The sidebar focus tab formerly
+  known as "Plan" / "Todos" is now "Work" — one panel for the active
+  checklist and optional plan, consistent across all three modes.
+
+### Changed
+
+- **Prompts and docs now teach only the new tool names.** Legacy
+  RLM/sub-agent helpers remain internally where needed for durable
+  transcript compatibility, but the registry exposes the session tools.
+- **Large or noisy tool results are easier to keep out of context.**
+  Tool output summaries, sub-agent results, and transcript snapshots now
+  point the model toward `handle_read` when it needs raw detail.
+- **Tool-surface smoke guidance is explicit.** Release checks now document
+  the exact version commands and registry-name searches for `handle_read`,
+  persistent RLM tools, and persistent sub-agent tools.
+- **Foreground RLM operation removed.** The old `Op::Rlm` path and its
+  `handle_rlm` engine method are gone; all RLM work now flows through
+  the persistent-session tools.
+- **Stale competitive-analysis doc removed.** The old cross-agent matrix
+  had become an unreliable inventory of tool names rather than useful
+  release guidance.
+
+### Fixed
+
+- **Transcript selection keeps working while the agent is streaming.**
+  The loading-state mouse filter now drops inert move events but allows
+  active transcript and scrollbar drags to continue.
+- **Tool papercuts:** `file_search` has safer default excludes and an
+  explicit `exclude` option; `grep_files` returns single-line context as
+  strings; `fetch_url` can project JSON fields and returns headers;
+  `edit_file` can opt into leading-indentation fuzz; `exec_shell` can
+  merge stdout/stderr in chronological order; `revert_turn` rejects
+  no-op snapshot boundaries.
+- **CLI reasoning-effort honoured on non-auto exec routes** (PR #1511
+  from **@h3c-hexin**). `deepseek -p "..." --reasoning-effort high` now
+  applies the flag correctly instead of falling back to the config-file
+  default.
+- **Edit-file replacement boundaries clarified** (PR #1516). The tool
+  description and error messages now make it unambiguous that
+  `edit_file` is for one clear replacement in one file.
+- **Pandoc output validated before probing** (PR #1523). Binary-format
+  conversions that produce empty or invalid output now surface a clear
+  error instead of a confusing pandoc stack trace.
+- **Running turns can be steered and repainted** (PR #1533, #1537).
+  Composer input during an active turn no longer stalls; the TUI
+  redraws the transcript as the agent streams.
+- **Tasks and Activity Detail are calmer under load.** The Tasks panel now
+  keeps live/background/recent activity from double-counting the same shell
+  or RLM work, groups repeated read/search/checklist noise, and keeps
+  failures, status, command summaries, and durations visible. Ctrl+O now
+  opens Activity Detail for the selected, live, or most recent meaningful
+  activity while Alt+V remains the direct tool-detail pager; the idle footer
+  now advertises that split for the visible activity.
+- **npm retry shows timeout hint on first failure** (PR #1538 from
+  **@reidliu41**). Installations behind slow proxies now see a clear
+  "retrying" message instead of a silent hang.
+- **Issue templates improved** (PR #1525 from **@reidliu41**). Bug and
+  feature-request templates are clearer and easier for new contributors.
+
+### Credits
+
+Thanks to **@reidliu41** (#1525, #1538) and **@h3c-hexin** (#1511) for
+community contributions in this release.
+
 ## [0.8.32] - 2026-05-12
 
 A "more useful tools" release. v0.8.31 made the tool surface
@@ -3821,7 +3914,8 @@ Welcome — and thank you.
 - Hooks system and config profiles
 - Example skills and launch assets
 
-[Unreleased]: https://github.com/Hmbown/DeepSeek-TUI/compare/v0.8.32...HEAD
+[Unreleased]: https://github.com/Hmbown/DeepSeek-TUI/compare/v0.8.33...HEAD
+[0.8.33]: https://github.com/Hmbown/DeepSeek-TUI/compare/v0.8.32...v0.8.33
 [0.8.32]: https://github.com/Hmbown/DeepSeek-TUI/compare/v0.8.31...v0.8.32
 [0.8.31]: https://github.com/Hmbown/DeepSeek-TUI/compare/v0.8.30...v0.8.31
 [0.8.30]: https://github.com/Hmbown/DeepSeek-TUI/compare/v0.8.29...v0.8.30
diff --git a/crates/tui/Cargo.toml b/crates/tui/Cargo.toml
index aa24e392..44873c5f 100644
--- a/crates/tui/Cargo.toml
+++ b/crates/tui/Cargo.toml
@@ -21,8 +21,8 @@ path = "src/main.rs"
 [dependencies]
 anyhow = "1.0.100"
 arboard = "3.4"
-deepseek-secrets = { path = "../secrets", version = "0.8.32" }
-deepseek-tools = { path = "../tools", version = "0.8.32" }
+deepseek-secrets = { path = "../secrets", version = "0.8.33" }
+deepseek-tools = { path = "../tools", version = "0.8.33" }
 schemaui = { version = "0.12.0", default-features = false, optional = true }
 async-stream = "0.3.6"
 async-trait = "0.1"
diff --git a/crates/tui/src/client.rs b/crates/tui/src/client.rs
index 3b5875ff..3fc09f50 100644
--- a/crates/tui/src/client.rs
+++ b/crates/tui/src/client.rs
@@ -1752,7 +1752,7 @@ mod tests {
             ],
             max_tokens: 1024,
             system: Some(SystemPrompt::Text(
-                "Base policy\n\n<project_instructions source=\"AGENTS.md\">\nStable project rules\n</project_instructions>\n\n## Previous Session Handoff\n\nDynamic handoff"
+                "Base policy\n\n<project_instructions source=\"AGENTS.md\">\nStable project rules\n</project_instructions>\n\n## Previous Session Relay\n\nDynamic relay"
                     .to_string(),
             )),
             tools: None,
@@ -1788,7 +1788,7 @@ mod tests {
             .and_then(Value::as_str)
             .expect("warmup system prompt");
         assert!(system.contains("Stable project rules"));
-        assert!(!system.contains("Dynamic handoff"));
+        assert!(!system.contains("Dynamic relay"));
         assert!(
             !wire
                 .iter()
diff --git a/crates/tui/src/client/chat.rs b/crates/tui/src/client/chat.rs
index c9e51a01..2b3e6f59 100644
--- a/crates/tui/src/client/chat.rs
+++ b/crates/tui/src/client/chat.rs
@@ -685,7 +685,7 @@ fn split_system_layers(content: &str) -> Vec<(String, PromptLayerStability, &str
         ("Skills", "## Skills"),
         ("Context management", "## Context Management"),
         ("Compact template", "## Compact"),
-        ("Previous session handoff", "## Previous Session Handoff"),
+        ("Previous session relay", "## Previous Session Relay"),
     ];
 
     let mut starts: Vec<(usize, &str)> = markers
@@ -706,7 +706,7 @@ fn split_system_layers(content: &str) -> Vec<(String, PromptLayerStability, &str
 
     for (i, (start, name)) in starts.iter().enumerate() {
         let end = starts.get(i + 1).map_or(content.len(), |(idx, _)| *idx);
-        let stability = if *name == "Previous session handoff" {
+        let stability = if *name == "Previous session relay" {
             PromptLayerStability::Dynamic
         } else if is_static_base_layer(name) {
             PromptLayerStability::Static
diff --git a/crates/tui/src/commands/core.rs b/crates/tui/src/commands/core.rs
index 6a9088ec..5314e289 100644
--- a/crates/tui/src/commands/core.rs
+++ b/crates/tui/src/commands/core.rs
@@ -545,6 +545,8 @@ mod tests {
     #[test]
     fn model_reset_same_model_keeps_turn_cache_history() {
         let mut app = create_test_app();
+        app.auto_model = false;
+        app.model = "deepseek-v4-pro".to_string();
         app.push_turn_cache_record(TurnCacheRecord {
             input_tokens: 100,
             output_tokens: 25,
diff --git a/crates/tui/src/commands/mod.rs b/crates/tui/src/commands/mod.rs
index a3616450..c8c1740e 100644
--- a/crates/tui/src/commands/mod.rs
+++ b/crates/tui/src/commands/mod.rs
@@ -32,6 +32,8 @@ mod status;
 mod task;
 mod user_commands;
 
+use std::fmt::Write as _;
+
 use crate::localization::{Locale, MessageId, tr};
 use crate::tui::app::{App, AppAction};
 
@@ -204,6 +206,12 @@ pub const COMMANDS: &[CommandInfo] = &[
         usage: "/subagents",
         description_id: MessageId::CmdSubagentsDescription,
     },
+    CommandInfo {
+        name: "agent",
+        aliases: &[],
+        usage: "/agent [N] <task>",
+        description_id: MessageId::CmdAgentDescription,
+    },
     CommandInfo {
         name: "links",
         aliases: &["dashboard", "api"],
@@ -295,6 +303,12 @@ pub const COMMANDS: &[CommandInfo] = &[
         usage: "/compact",
         description_id: MessageId::CmdCompactDescription,
     },
+    CommandInfo {
+        name: "relay",
+        aliases: &["batonpass", "接力"],
+        usage: "/relay [focus]",
+        description_id: MessageId::CmdRelayDescription,
+    },
     CommandInfo {
         name: "context",
         aliases: &["ctx"],
@@ -482,7 +496,7 @@ pub const COMMANDS: &[CommandInfo] = &[
     CommandInfo {
         name: "rlm",
         aliases: &["recursive"],
-        usage: "/rlm <prompt>",
+        usage: "/rlm [N] <file_or_text>",
         description_id: MessageId::CmdRlmDescription,
     },
     // Debug/cost command
@@ -534,6 +548,7 @@ pub fn execute(cmd: &str, app: &mut App) -> CommandResult {
         "stash" | "park" => stash::stash(app, arg),
         "hooks" | "hook" => hooks::hooks(app, arg),
         "subagents" | "agents" => core::subagents(app),
+        "agent" => agent(app, arg),
         "links" | "dashboard" | "api" => core::deepseek_links(app),
         "feedback" => feedback::feedback(app, arg),
         "home" | "stats" | "overview" => core::home_dashboard(app),
@@ -551,6 +566,7 @@ pub fn execute(cmd: &str, app: &mut App) -> CommandResult {
         "sessions" | "resume" => session::sessions(app, arg),
         "load" => session::load(app, arg),
         "compact" => session::compact(app),
+        "relay" | "batonpass" | "接力" => relay(app, arg),
         "cycles" => cycle::list_cycles(app),
         "cycle" => cycle::show_cycle(app, arg),
         "recall" => cycle::recall_archive(app, arg),
@@ -686,49 +702,220 @@ pub use config::{
 /// in the REPL as the `PROMPT` variable. The root LLM will only see
 /// metadata about the REPL state, never the prompt text directly.
 pub fn rlm(app: &mut App, arg: Option<&str>) -> CommandResult {
-    let prompt = match arg {
+    let (max_depth, target) = match parse_depth_prefixed_arg(arg, 1) {
+        Ok(parsed) => parsed,
+        Err(message) => return CommandResult::error(message),
+    };
+    let target = match target {
         Some(p) if !p.trim().is_empty() => p.trim().to_string(),
         _ => {
             return CommandResult::error(
-                "Usage: /rlm <prompt>\n\n\
-                 Process a prompt using a Recursive Language Model (RLM).\n\
-                 The prompt is stored in a REPL and the model writes code\n\
-                 to decompose and process it recursively."
+                "Usage: /rlm [N] <file_or_text>\n\n\
+                 Opens a persistent RLM context with sub_rlm depth N (0-3, default 1)."
                     .to_string(),
             );
         }
     };
 
-    // Sanity-check: RLM is most useful for longer prompts.
-    if prompt.len() < 50 {
-        return CommandResult::message(
-            "Tip: RLM is designed for processing LONG prompts (>100 chars). \
-             For short queries, just type the message directly."
-                .to_string(),
+    let source_arg = if resolves_to_existing_file(app, &target) {
+        format!(r#"file_path: "{target}""#)
+    } else {
+        format!("content: {:?}", target)
+    };
+    let message = format!(
+        "Open and use a persistent RLM session for this request. Call `rlm_open` with name `slash_rlm` and {source_arg}. Then call `rlm_configure` with `sub_rlm_max_depth: {max_depth}`. Use `rlm_eval` to inspect the context through `peek`, `search`, and `chunk`, and call `finalize(...)` from the REPL when ready. If a `var_handle` is returned, use `handle_read` for bounded slices or projections before answering."
+    );
+
+    CommandResult::with_message_and_action(
+        format!("Opening persistent RLM context at depth {max_depth}..."),
+        AppAction::SendMessage(message),
+    )
+}
+
+/// Handle `/agent [N] <task>`: return a `SendMessage` action instructing the model to call `agent_open` at depth N (0-3, default 1).
+pub fn agent(_app: &mut App, arg: Option<&str>) -> CommandResult {
+    let (max_depth, task) = match parse_depth_prefixed_arg(arg, 1) {
+        Ok(parsed) => parsed,
+        Err(message) => return CommandResult::error(message),
+    };
+    let task = match task {
+        Some(task) if !task.trim().is_empty() => task.trim().to_string(),
+        _ => {
+            return CommandResult::error(
+                "Usage: /agent [N] <task>\n\n\
+                 Opens a persistent sub-agent session with recursive agent depth N (0-3, default 1).",
+            );
+        }
+    };
+    let message = format!(
+        "Open a persistent sub-agent session for this task. Call `agent_open` with name `slash_agent`, `prompt: {:?}`, and `max_depth: {max_depth}`. Use `agent_eval` to wait for the next terminal/current projection and `handle_read` on the returned transcript_handle if you need more detail. Verify any claimed side effects before reporting success.",
+        task
+    );
+    CommandResult::with_message_and_action(
+        format!("Opening persistent sub-agent at depth {max_depth}..."),
+        AppAction::SendMessage(message),
+    )
+}
+
+/// Ask the active model to write a compact relay artifact for the next thread.
+///
+/// The visible command is `/relay` (with `/接力` for Chinese users), but the
+/// durable file path remains `.deepseek/handoff.md` for compatibility with
+/// existing sessions and startup prompt loading.
+pub fn relay(app: &mut App, arg: Option<&str>) -> CommandResult {
+    let focus = arg.map(str::trim).filter(|value| !value.is_empty());
+    let message = build_relay_instruction(app, focus);
+    CommandResult::with_message_and_action(
+        "Preparing session relay at .deepseek/handoff.md...",
+        AppAction::SendMessage(message),
+    )
+}
+
+fn build_relay_instruction(app: &App, focus: Option<&str>) -> String {
+    let mut out = String::new();
+    let _ = writeln!(
+        out,
+        "Create a compact session relay (接力) for a future DeepSeek TUI thread."
+    );
+    let _ = writeln!(out);
+    let _ = writeln!(out, "Write or update `.deepseek/handoff.md`.");
+    let _ = writeln!(
+        out,
+        "Keep the existing file path for compatibility, but title the artifact `# Session relay`."
+    );
+    let _ = writeln!(out);
+    let _ = writeln!(out, "Current session snapshot:");
+    let _ = writeln!(out, "- Workspace: {}", app.workspace.display());
+    let _ = writeln!(out, "- Mode: {}", app.mode.label());
+    let _ = writeln!(out, "- Model: {}", app.model_display_label());
+    if let Some(focus) = focus {
+        let _ = writeln!(out, "- Requested relay focus: {focus}");
+    }
+    if let Some(goal) = app.goal.goal_objective.as_deref() {
+        let _ = writeln!(out, "- Goal: {goal}");
+    }
+    if let Some(budget) = app.goal.goal_token_budget {
+        let _ = writeln!(out, "- Goal token budget: {budget}");
+    }
+    if app.cycle_count > 0 {
+        let _ = writeln!(out, "- Cycle count: {}", app.cycle_count);
+    }
+
+    if let Ok(todos) = app.todos.try_lock() {
+        let snapshot = todos.snapshot();
+        if !snapshot.items.is_empty() {
+            let _ = writeln!(
+                out,
+                "\nWork checklist (primary progress surface, {}% complete):",
+                snapshot.completion_pct
+            );
+            for item in snapshot.items {
+                let _ = writeln!(
+                    out,
+                    "- #{} [{}] {}",
+                    item.id,
+                    item.status.as_str(),
+                    item.content
+                );
+            }
+        }
+    } else {
+        let _ = writeln!(
+            out,
+            "\nWork checklist: unavailable because the checklist is busy."
         );
     }
 
-    let model = app.model.clone();
-    let child_model = "deepseek-v4-flash".to_string();
-    // Paper experiments use depth=1 (one level of `sub_rlm`); we default to
-    // depth=2 so the model can recurse twice if it chooses to.
-    let max_depth: u32 = 2;
+    if let Ok(plan) = app.plan_state.try_lock() {
+        let snapshot = plan.snapshot();
+        if snapshot.explanation.is_some() || !snapshot.items.is_empty() {
+            let _ = writeln!(out, "\nOptional strategy metadata from update_plan:");
+            if let Some(explanation) = snapshot.explanation.as_deref() {
+                let _ = writeln!(out, "- Explanation: {explanation}");
+            }
+            for item in snapshot.items {
+                let _ = writeln!(out, "- [{}] {}", plan_status_label(&item.status), item.step);
+            }
+        }
+    } else {
+        let _ = writeln!(
+            out,
+            "\nStrategy metadata: unavailable because plan state is busy."
+        );
+    }
 
-    CommandResult::with_message_and_action(
-        format!(
-            "Starting RLM turn for {} chars of prompt using {} (child={}, depth={})...",
-            prompt.len(),
-            model,
-            child_model,
-            max_depth,
-        ),
-        AppAction::Rlm {
-            prompt,
-            model,
-            child_model,
-            max_depth,
-        },
-    )
+    let _ = writeln!(
+        out,
+        "\nBefore writing, inspect the current transcript context and any live tool evidence you need. Do not invent test results, file changes, blockers, or decisions."
+    );
+    let _ = writeln!(
+        out,
+        "\nUse this compact structure:\n\
+         # Session relay\n\
+         \n\
+         ## Goal\n\
+         [the user's objective and any explicit constraints]\n\
+         \n\
+         ## Current work\n\
+         [the active Work checklist item, progress, and what is mid-flight]\n\
+         \n\
+         ## Files and state\n\
+         [changed files, important paths, sub-agents/RLM sessions, commands run]\n\
+         \n\
+         ## Decisions\n\
+         [why key choices were made]\n\
+         \n\
+         ## Verification\n\
+         [what passed, what failed, what was not run]\n\
+         \n\
+         ## Next action\n\
+         [one concrete action for the next thread]"
+    );
+    let _ = writeln!(
+        out,
+        "\nKeep it under about 900 words unless the session genuinely needs more. After writing, report the path and the single next action."
+    );
+    out
+}
+
+fn plan_status_label(status: &crate::tools::plan::StepStatus) -> &'static str {
+    match status {
+        crate::tools::plan::StepStatus::Pending => "pending",
+        crate::tools::plan::StepStatus::InProgress => "in_progress",
+        crate::tools::plan::StepStatus::Completed => "completed",
+    }
+}
+
+fn parse_depth_prefixed_arg(
+    arg: Option<&str>,
+    default_depth: u32,
+) -> Result<(u32, Option<&str>), String> {
+    let Some(raw) = arg.map(str::trim).filter(|raw| !raw.is_empty()) else {
+        return Ok((default_depth, None));
+    };
+    let mut parts = raw.splitn(2, char::is_whitespace);
+    let first = parts.next().unwrap_or_default();
+    if first.chars().all(|ch| ch.is_ascii_digit()) {
+        let depth: u32 = first
+            .parse()
+            .map_err(|_| "Depth must be an integer from 0 to 3".to_string())?;
+        if depth > 3 {
+            return Err("Depth must be between 0 and 3".to_string());
+        }
+        Ok((depth, parts.next().map(str::trim)))
+    } else {
+        Ok((default_depth, Some(raw)))
+    }
+}
+
+fn resolves_to_existing_file(app: &App, input: &str) -> bool {
+    let path = std::path::Path::new(input);
+    let candidate = if path.is_absolute() {
+        path.to_path_buf()
+    } else {
+        app.workspace.join(path)
+    };
+    candidate.is_file()
 }
 
 /// Get command info by name or alias
@@ -862,6 +1049,8 @@ fn suggest_command_names(input: &str, limit: usize) -> Vec<String> {
 mod tests {
     use super::*;
     use crate::config::Config;
+    use crate::tools::plan::{PlanItemArg, StepStatus, UpdatePlanArgs};
+    use crate::tools::todo::TodoStatus;
     use crate::tui::app::{App, AppAction, TuiOptions};
     use std::ffi::OsString;
     use std::path::{Path, PathBuf};
@@ -910,6 +1099,101 @@ mod tests {
         assert_eq!(links.aliases, &["dashboard", "api"]);
     }
 
+    #[test]
+    fn rlm_slash_command_routes_to_persistent_tool_instruction() {
+        let mut app = create_test_app();
+        let result = execute("/rlm 2 inspect this long corpus", &mut app);
+        assert!(!result.is_error); // the leading "2" is taken as the depth prefix
+        assert!(result.message.as_deref().unwrap_or("").contains("depth 2"));
+        let Some(AppAction::SendMessage(message)) = result.action else {
+            panic!("expected SendMessage action");
+        };
+        for needle in ["rlm_open", "rlm_configure", "sub_rlm_max_depth: 2"] {
+            assert!(message.contains(needle), "missing {needle:?}; got: {message:?}");
+        }
+    }
+
+    #[test]
+    fn agent_slash_command_routes_to_persistent_tool_instruction() {
+        let mut app = create_test_app();
+        let result = execute("/agent 0 inspect the parser", &mut app);
+        assert!(!result.is_error); // a depth prefix of 0 must be accepted
+        let Some(AppAction::SendMessage(message)) = result.action else {
+            panic!("expected SendMessage action");
+        };
+        assert!(message.contains("agent_open"), "got: {message:?}");
+        assert!(message.contains("max_depth: 0"), "got: {message:?}");
+    }
+
+    #[test]
+    fn relay_slash_command_routes_to_session_relay_instruction() {
+        let mut app = create_test_app();
+        app.goal.goal_objective = Some("Unify the work surface".to_string());
+        app.goal.goal_token_budget = Some(12_000);
+        app.cycle_count = 2;
+        {
+            let mut todos = app.todos.try_lock().expect("todo lock");
+            todos.add("inspect workspace".to_string(), TodoStatus::Completed);
+            todos.add("patch relay command".to_string(), TodoStatus::InProgress);
+        } // todo guard dropped here, before `execute` is called
+        {
+            let mut plan = app.plan_state.try_lock().expect("plan lock");
+            plan.update(UpdatePlanArgs {
+                explanation: Some("RLM-style strategy".to_string()),
+                plan: vec![PlanItemArg {
+                    step: "keep checklist primary".to_string(),
+                    status: StepStatus::InProgress,
+                }],
+            });
+        } // plan guard dropped here, before `execute` is called
+
+        let result = execute("/relay verify install", &mut app); // "verify install" is the focus
+        assert!(!result.is_error);
+        assert!(
+            result
+                .message
+                .as_deref()
+                .unwrap_or_default()
+                .contains(".deepseek/handoff.md")
+        );
+        let Some(AppAction::SendMessage(message)) = result.action else {
+            panic!("expected SendMessage action");
+        };
+        assert!(message.contains("session relay"));
+        assert!(message.contains("接力"));
+        assert!(message.contains("Write or update `.deepseek/handoff.md`"));
+        assert!(message.contains("# Session relay"));
+        assert!(message.contains("Requested relay focus: verify install"));
+        assert!(message.contains("Goal: Unify the work surface")); // goal fields set above
+        assert!(message.contains("Goal token budget: 12000"));
+        assert!(message.contains("Cycle count: 2"));
+        assert!(message.contains("Work checklist (primary progress surface, 50% complete)"));
+        assert!(message.contains("#1 [completed] inspect workspace")); // todos, in insertion order
+        assert!(message.contains("#2 [in_progress] patch relay command"));
+        assert!(message.contains("Optional strategy metadata from update_plan"));
+        assert!(message.contains("Explanation: RLM-style strategy")); // plan state set above
+        assert!(message.contains("[in_progress] keep checklist primary"));
+    }
+
+    #[test]
+    fn relay_command_has_bilingual_aliases() {
+        let relay = COMMANDS
+            .iter()
+            .find(|cmd| cmd.name == "relay")
+            .expect("relay command should exist");
+        assert_eq!(relay.aliases, &["batonpass", "接力"]);
+        assert!(relay.description_for(Locale::ZhHans).contains("接力")); // both Chinese locales
+        assert!(relay.description_for(Locale::ZhHant).contains("接力"));
+
+        let mut app = create_test_app();
+        let result = execute("/接力 next hand", &mut app); // invoke through the Chinese alias
+        assert!(!result.is_error);
+        let Some(AppAction::SendMessage(message)) = result.action else {
+            panic!("expected SendMessage action");
+        };
+        assert!(message.contains("Requested relay focus: next hand"));
+    }
+
     #[test]
     fn command_registry_has_unique_names_and_aliases() {
         let mut names = std::collections::BTreeSet::new();
diff --git a/crates/tui/src/config_ui.rs b/crates/tui/src/config_ui.rs
index 12860194..c3cc125e 100644
--- a/crates/tui/src/config_ui.rs
+++ b/crates/tui/src/config_ui.rs
@@ -199,8 +199,7 @@ pub enum CostCurrencyValue {
 #[serde(rename_all = "snake_case")]
 pub enum SidebarFocusValue {
     Auto,
-    Plan,
-    Todos,
+    Work,
     Tasks,
     Agents,
     Context,
@@ -724,8 +723,7 @@ impl SidebarFocusValue {
     fn as_setting(self) -> &'static str {
         match self {
             Self::Auto => "auto",
-            Self::Plan => "plan",
-            Self::Todos => "todos",
+            Self::Work => "work",
             Self::Tasks => "tasks",
             Self::Agents => "agents",
             Self::Context => "context",
@@ -842,8 +840,7 @@ impl From<&str> for SidebarFocusValue {
     fn from(value: &str) -> Self {
         match SidebarFocus::from_setting(value) {
             SidebarFocus::Auto => Self::Auto,
-            SidebarFocus::Plan => Self::Plan,
-            SidebarFocus::Todos => Self::Todos,
+            SidebarFocus::Work => Self::Work,
             SidebarFocus::Tasks => Self::Tasks,
             SidebarFocus::Agents => Self::Agents,
             SidebarFocus::Context => Self::Context,
diff --git a/crates/tui/src/core/engine.rs b/crates/tui/src/core/engine.rs
index 9c596f42..6b181028 100644
--- a/crates/tui/src/core/engine.rs
+++ b/crates/tui/src/core/engine.rs
@@ -850,15 +850,6 @@ impl Engine {
                 Op::CompactContext => {
                     self.handle_manual_compaction().await;
                 }
-                Op::Rlm {
-                    content,
-                    model,
-                    child_model,
-                    max_depth,
-                } => {
-                    self.handle_rlm(content, model, child_model, max_depth)
-                        .await;
-                }
                 Op::EditLastTurn { new_message } => {
                     // #383: /edit — remove the last user+assistant exchange
                     // from the session, then re-send with the new content.
@@ -1339,100 +1330,6 @@ impl Engine {
             .await;
     }
 
-    /// Handle a Recursive Language Model (RLM) query — Algorithm 1 from
-    /// Zhang et al. (arXiv:2512.24601).
-    ///
-    /// The prompt is stored as PROMPT in a REPL variable. The root LLM
-    /// only sees metadata about the REPL state, never the prompt text
-    /// directly. The model generates Python code, which is executed by
-    /// the REPL. When FINAL() is called, the loop ends.
-    async fn handle_rlm(
-        &mut self,
-        content: String,
-        model: String,
-        child_model: String,
-        max_depth: u32,
-    ) {
-        use crate::rlm::turn::run_rlm_turn;
-
-        let Some(ref client) = self.deepseek_client else {
-            let err = self
-                .deepseek_client_error
-                .as_deref()
-                .map(|s| s.to_string())
-                .unwrap_or_else(|| "API client not configured".to_string());
-            let _ = self
-                .tx_event
-                .send(Event::error(ErrorEnvelope::fatal_auth(format!(
-                    "RLM error: {err}"
-                ))))
-                .await;
-            return;
-        };
-
-        let _ = self
-            .tx_event
-            .send(Event::status("RLM turn started".to_string()))
-            .await;
-
-        let result = run_rlm_turn(
-            client,
-            model,
-            content,
-            child_model,
-            self.tx_event.clone(),
-            max_depth,
-        )
-        .await;
-
-        let has_error = result.error.is_some();
-        if let Some(ref err) = result.error {
-            let _ = self
-                .tx_event
-                .send(Event::error(ErrorEnvelope::tool(format!(
-                    "RLM error: {err}"
-                ))))
-                .await;
-        }
-
-        if !result.answer.is_empty() {
-            // Add the final answer as an assistant message in the session.
-            self.add_session_message(crate::models::Message {
-                role: "assistant".to_string(),
-                content: vec![crate::models::ContentBlock::Text {
-                    text: result.answer.clone(),
-                    cache_control: None,
-                }],
-            })
-            .await;
-
-            let _ = self
-                .tx_event
-                .send(Event::MessageDelta {
-                    index: 0,
-                    content: result.answer.clone(),
-                })
-                .await;
-            let _ = self
-                .tx_event
-                .send(Event::MessageComplete { index: 0 })
-                .await;
-        }
-
-        let _ = self
-            .tx_event
-            .send(Event::TurnComplete {
-                usage: result.usage,
-                status: if has_error {
-                    crate::core::events::TurnOutcomeStatus::Failed
-                } else {
-                    crate::core::events::TurnOutcomeStatus::Completed
-                },
-                error: result.error,
-            })
-            .await;
-    }
-
     fn estimated_input_tokens(&self) -> usize {
         estimate_input_tokens_conservative(
             &self.session.messages,
diff --git a/crates/tui/src/core/engine/context.rs b/crates/tui/src/core/engine/context.rs
index 4896cbb2..3ec96626 100644
--- a/crates/tui/src/core/engine/context.rs
+++ b/crates/tui/src/core/engine/context.rs
@@ -146,6 +146,10 @@ fn summarize_subagent_status(status: &serde_json::Value) -> String {
 }
 
 fn summarize_subagent_snapshot(snapshot: &serde_json::Value, index: usize) -> String {
+    if let Some(inner) = snapshot.get("snapshot") {
+        return summarize_subagent_snapshot(inner, index);
+    }
+
     let Some(obj) = snapshot.as_object() else {
         return format!(
             "- item {index}: {}",
@@ -202,7 +206,10 @@ fn summarize_subagent_snapshot(snapshot: &serde_json::Value, index: usize) -> St
 }
 
 fn compact_subagent_tool_result_for_context(tool_name: &str, raw: &str) -> Option<String> {
-    if !matches!(tool_name, "agent_result" | "agent_wait" | "wait") {
+    if !matches!(
+        tool_name,
+        "agent_open" | "agent_eval" | "agent_close" | "agent_result" | "agent_wait" | "wait"
+    ) {
         return None;
     }
 
@@ -217,7 +224,7 @@ fn compact_subagent_tool_result_for_context(tool_name: &str, raw: &str) -> Optio
     out.push_str(
         "Child results are self-reports; verify side effects with tools like read_file or list_dir before claiming success.\n",
     );
-    out.push_str("Use `agent_result` again only if you need the full raw payload.\n");
+    out.push_str("Use `agent_eval` for a fresh projection or `handle_read` on `transcript_handle` for bounded transcript slices.\n");
     for (idx, snapshot) in snapshots.iter().enumerate() {
         if idx >= 8 {
             out.push_str(&format!(
diff --git a/crates/tui/src/core/engine/tests.rs b/crates/tui/src/core/engine/tests.rs
index d247103f..05f9b259 100644
--- a/crates/tui/src/core/engine/tests.rs
+++ b/crates/tui/src/core/engine/tests.rs
@@ -533,6 +533,7 @@ fn turn_tool_registry_builder_keeps_plan_mode_read_only_for_files() {
     assert!(registry.contains("update_plan"));
     assert!(registry.contains("task_list"));
     assert!(registry.contains("task_read"));
+    assert!(registry.contains("handle_read"));
     assert!(registry.contains("recall_archive"));
 
     let plan_state_tools = [
@@ -827,7 +828,7 @@ fn subagent_results_are_summarized_before_parent_context_insertion() {
         .to_string(),
     );
 
-    let context = compact_tool_result_for_context("deepseek-v4-pro", "agent_result", &output);
+    let context = compact_tool_result_for_context("deepseek-v4-pro", "agent_eval", &output);
 
     assert!(context.contains("[sub-agent result summarized for parent context]"));
     assert!(context.contains("agent_1234abcd (explore) status=Completed"));
@@ -837,6 +838,7 @@ fn subagent_results_are_summarized_before_parent_context_insertion() {
     assert!(context.contains("self-report"));
     assert!(context.contains("verify side effects"));
     assert!(context.contains("read_file") && context.contains("list_dir"));
+    assert!(context.contains("handle_read"));
 }
 
 #[test]
diff --git a/crates/tui/src/core/engine/tool_catalog.rs b/crates/tui/src/core/engine/tool_catalog.rs
index 25530993..71e7865c 100644
--- a/crates/tui/src/core/engine/tool_catalog.rs
+++ b/crates/tui/src/core/engine/tool_catalog.rs
@@ -58,7 +58,11 @@ pub(super) fn should_default_defer_tool(name: &str, mode: AppMode) -> bool {
             | "grep_files"
             | "file_search"
             | "diagnostics"
-            | "rlm"
+            | "rlm_open"
+            | "rlm_eval"
+            | "rlm_configure"
+            | "rlm_close"
+            | "handle_read"
             | "recall_archive"
             | "notify"
             | MULTI_TOOL_PARALLEL_NAME
diff --git a/crates/tui/src/core/engine/tool_setup.rs b/crates/tui/src/core/engine/tool_setup.rs
index cc1bfdf0..2354d6a8 100644
--- a/crates/tui/src/core/engine/tool_setup.rs
+++ b/crates/tui/src/core/engine/tool_setup.rs
@@ -48,6 +48,7 @@ impl Engine {
                 .with_diagnostics_tool()
                 .with_skill_tools()
                 .with_validation_tools()
+                .with_handle_tools()
                 .with_runtime_read_only_task_tools()
                 .with_todo_tool(todo_list)
                 .with_plan_tool(plan_state)
diff --git a/crates/tui/src/core/ops.rs b/crates/tui/src/core/ops.rs
index b77385be..77dc8fcc 100644
--- a/crates/tui/src/core/ops.rs
+++ b/crates/tui/src/core/ops.rs
@@ -75,21 +75,6 @@ pub enum Op {
     /// Run context compaction immediately.
     CompactContext,
 
-    /// Run a Recursive Language Model (RLM) turn per Algorithm 1 of
-    /// Zhang et al. (arXiv:2512.24601). The prompt is stored in the REPL
-    /// as `context`; the root LLM only sees metadata.
-    Rlm {
-        /// The user's prompt — stored in REPL, NOT in the LLM context.
-        content: String,
-        /// The model to use for root LLM calls.
-        model: String,
-        /// The model to use for sub-LLM (llm_query) calls.
-        child_model: String,
-        /// Recursion budget for `sub_rlm()` calls. Paper experiments use
-        /// depth=1; defaults set by the `/rlm` command.
-        max_depth: u32,
-    },
-
     /// Edit the last user message: remove the last user+assistant exchange
     /// from the session, then re-send with the new content.
     #[allow(dead_code)]
diff --git a/crates/tui/src/cycle_manager.rs b/crates/tui/src/cycle_manager.rs
index 8d31939c..c4d5b4c7 100644
--- a/crates/tui/src/cycle_manager.rs
+++ b/crates/tui/src/cycle_manager.rs
@@ -10,8 +10,8 @@
 //! summary as if it were verbatim and confabulates around the gaps.
 //!
 //! Checkpoint-restart fixes this by giving every cycle a *homogeneous* fresh
-//! context: original system prompt, structured state (todos / plan / working
-//! set / sub-agent handles), and a model-curated free-form briefing of at
+//! context: original system prompt, structured work state (checklist /
+//! strategy / working set / sub-agent handles), and a model-curated free-form briefing of at
 //! most ~3,000 tokens. The previous cycle is archived to disk in JSONL form
 //! so a future `recall_archive` tool (issue #127) can search it on demand.
 //!
@@ -271,8 +271,27 @@ impl StructuredState {
             out.push_str(&format!("- Cwd: `{}`\n", cwd.display()));
         }
 
+        if self.todo_snapshot.is_some() || self.plan_snapshot.is_some() {
+            out.push_str("\n### Work\n");
+        }
+
+        if let Some(todos) = self.todo_snapshot.as_ref() {
+            out.push_str(&format!(
+                "\nChecklist ({}% complete)\n",
+                todos.completion_pct
+            ));
+            for item in &todos.items {
+                let marker = match item.status {
+                    crate::tools::todo::TodoStatus::Pending => "[ ]",
+                    crate::tools::todo::TodoStatus::InProgress => "[~]",
+                    crate::tools::todo::TodoStatus::Completed => "[x]",
+                };
+                out.push_str(&format!("- {marker} {}\n", item.content));
+            }
+        }
+
         if let Some(plan) = self.plan_snapshot.as_ref() {
-            out.push_str("\n### Plan\n");
+            out.push_str("\nStrategy\n");
             if let Some(explanation) = plan.explanation.as_ref() {
                 out.push_str(&format!("{explanation}\n\n"));
             }
@@ -286,21 +305,6 @@ impl StructuredState {
             }
         }
 
-        if let Some(todos) = self.todo_snapshot.as_ref() {
-            out.push_str(&format!(
-                "\n### Todos ({}% complete)\n",
-                todos.completion_pct
-            ));
-            for item in &todos.items {
-                let marker = match item.status {
-                    crate::tools::todo::TodoStatus::Pending => "[ ]",
-                    crate::tools::todo::TodoStatus::InProgress => "[~]",
-                    crate::tools::todo::TodoStatus::Completed => "[x]",
-                };
-                out.push_str(&format!("- {marker} {}\n", item.content));
-            }
-        }
-
         if !self.subagent_snapshots.is_empty() {
             out.push_str("\n### Open Sub-Agents\n");
             for s in &self.subagent_snapshots {
@@ -976,6 +980,41 @@ mod tests {
         assert!(block.contains("Workspace: `/tmp/ws`"));
     }
 
+    #[test]
+    fn structured_state_to_system_block_unifies_work_state() {
+        let state = StructuredState {
+            mode_label: "agent".to_string(),
+            workspace: PathBuf::from("/tmp/ws"),
+            cwd: None,
+            working_set_summary: None,
+            todo_snapshot: Some(TodoListSnapshot {
+                items: vec![crate::tools::todo::TodoItem {
+                    id: 1,
+                    content: "Run focused tests".to_string(),
+                    status: crate::tools::todo::TodoStatus::InProgress,
+                }],
+                completion_pct: 0, // rendered verbatim in the "Checklist (..% complete)" line
+                in_progress_id: Some(1),
+            }),
+            plan_snapshot: Some(PlanSnapshot {
+                explanation: Some("Keep sidebar state unified".to_string()),
+                items: vec![crate::tools::plan::PlanItemArg {
+                    step: "Update prompts".to_string(),
+                    status: crate::tools::plan::StepStatus::Pending,
+                }],
+            }),
+            subagent_snapshots: Vec::new(),
+        };
+
+        let block = state.to_system_block().expect("renders");
+
+        assert!(block.contains("### Work")); // one shared heading for checklist + strategy
+        assert!(block.contains("Checklist (0% complete)"));
+        assert!(block.contains("Strategy"));
+        assert!(!block.contains("### Plan")); // separate Plan/Todos headings must not be rendered
+        assert!(!block.contains("### Todos"));
+    }
+
     #[test]
     fn archive_cycle_writes_jsonl_with_header_and_messages() {
         let dir = tempdir().expect("tempdir");
diff --git a/crates/tui/src/deepseek_theme.rs b/crates/tui/src/deepseek_theme.rs
index 13f96cd0..bf31afef 100644
--- a/crates/tui/src/deepseek_theme.rs
+++ b/crates/tui/src/deepseek_theme.rs
@@ -67,7 +67,7 @@ impl Theme {
             section_bg: palette::DEEPSEEK_INK,
             section_title_color: palette::DEEPSEEK_BLUE,
             // Horizontal padding only. `Padding::uniform(1)` ate two rows of
-            // each sidebar panel — for compact terminals where Plan/Todos/Tasks
+            // each sidebar panel — for compact terminals where Work/Tasks/Agents
             // get ~3 rows total via the 25% layout split, that left zero rows
             // for content (#63 follow-up: panels rendered as empty boxes even
             // when "No todos" / "No active plan" should have shown).
diff --git a/crates/tui/src/handoff.rs b/crates/tui/src/handoff.rs
index 6c453ad0..ae64fcb9 100644
--- a/crates/tui/src/handoff.rs
+++ b/crates/tui/src/handoff.rs
@@ -1,13 +1,13 @@
-// Used by the deferred context-limit handoff feature (#667). The implementation
+// Used by the deferred context-limit relay feature (#667). The implementation
 // path is staged but not yet wired from the engine; suppress dead-code warnings
 // rather than delete the table until the follow-up feature consumes it.
 #[allow(dead_code)]
 pub const THRESHOLDS: [(f32, &str); 3] = [
     (
         0.9,
-        "Context at 90%: stop and write handoff to .deepseek/handoff.md now",
+        "Context at 90%: stop and write relay to .deepseek/handoff.md now",
     ),
-    (0.8, "Context at 80%: draft handoff to .deepseek/handoff.md"),
+    (0.8, "Context at 80%: draft relay to .deepseek/handoff.md"),
     (0.7, "Context at 70%: consider wrapping current sub-task"),
 ];
 #[allow(dead_code)]
diff --git a/crates/tui/src/localization.rs b/crates/tui/src/localization.rs
index 941dd060..25eed32e 100644
--- a/crates/tui/src/localization.rs
+++ b/crates/tui/src/localization.rs
@@ -256,6 +256,7 @@ pub enum MessageId {
     CmdHelpDescription,
     CmdHomeDescription,
     CmdHooksDescription,
+    CmdAgentDescription,
     CmdGoalDescription,
     CmdInitDescription,
     CmdJobsDescription,
@@ -273,6 +274,7 @@ pub enum MessageId {
     CmdProviderDescription,
     CmdQueueDescription,
     CmdRecallDescription,
+    CmdRelayDescription,
     CmdRenameDescription,
     CmdRestoreDescription,
     CmdRetryDescription,
@@ -485,6 +487,7 @@ pub const ALL_MESSAGE_IDS: &[MessageId] = &[
     MessageId::CmdHelpDescription,
     MessageId::CmdHomeDescription,
     MessageId::CmdHooksDescription,
+    MessageId::CmdAgentDescription,
     MessageId::CmdInitDescription,
     MessageId::CmdJobsDescription,
     MessageId::CmdLinksDescription,
@@ -500,6 +503,7 @@ pub const ALL_MESSAGE_IDS: &[MessageId] = &[
     MessageId::CmdProviderDescription,
     MessageId::CmdQueueDescription,
     MessageId::CmdRecallDescription,
+    MessageId::CmdRelayDescription,
     MessageId::CmdRenameDescription,
     MessageId::CmdRestoreDescription,
     MessageId::CmdRetryDescription,
@@ -898,6 +902,9 @@ fn english(id: MessageId) -> &'static str {
         MessageId::CmdHelpDescription => "Show help information",
         MessageId::CmdHomeDescription => "Show home dashboard with stats and quick actions",
         MessageId::CmdHooksDescription => "List configured lifecycle hooks (read-only)",
+        MessageId::CmdAgentDescription => {
+            "Open a persistent sub-agent session: /agent [0-3] <task>"
+        }
         MessageId::CmdGoalDescription => "Set a session goal with optional token budget",
         MessageId::CmdInitDescription => "Generate AGENTS.md for project",
         MessageId::CmdLspDescription => "Toggle LSP diagnostics on or off",
@@ -921,15 +928,14 @@ fn english(id: MessageId) -> &'static str {
         }
         MessageId::CmdQueueDescription => "View or edit queued messages",
         MessageId::CmdRecallDescription => "Search prior cycle archives (BM25 over message text)",
+        MessageId::CmdRelayDescription => "Create a session relay (接力) for a fresh thread",
         MessageId::CmdRenameDescription => "Rename the current session",
         MessageId::CmdRestoreDescription => {
             "Roll back the workspace to a prior pre/post-turn snapshot. With no arg, lists recent snapshots."
         }
         MessageId::CmdRetryDescription => "Retry the last request",
         MessageId::CmdReviewDescription => "Run a structured code review on a file, diff, or PR",
-        MessageId::CmdRlmDescription => {
-            "Recursive Language Model (RLM) turn — store the prompt in a Python REPL and let the model write code to process it, with `llm_query()` / `sub_rlm()` for sub-LLM calls."
-        }
+        MessageId::CmdRlmDescription => "Open a persistent RLM context: /rlm [0-3] <file_or_text>",
         MessageId::CmdSaveDescription => "Save session to file",
         MessageId::CmdSessionsDescription => "Open session picker",
         MessageId::CmdSettingsDescription => "Show persistent settings",
@@ -1055,7 +1061,7 @@ fn english(id: MessageId) -> &'static str {
             "Open details for the selected tool or message (when input is empty)"
         }
         MessageId::KbToolDetailsPager => "Open tool-details pager",
-        MessageId::KbThinkingPager => "Open thinking pager",
+        MessageId::KbThinkingPager => "Open Activity Detail",
         MessageId::KbLiveTranscript => "Open live transcript overlay (sticky-tail auto-scroll)",
         MessageId::KbBacktrackMessage => {
             "Backtrack to a previous user message (Left/Right step, Enter to rewind)"
@@ -1065,7 +1071,7 @@ fn english(id: MessageId) -> &'static str {
         }
         MessageId::KbJumpPlanAgentYolo => "Jump directly to Plan / Agent / YOLO mode",
         MessageId::KbAltJumpPlanAgentYolo => "Alternative jump to Plan / Agent / YOLO mode",
-        MessageId::KbFocusSidebar => "Focus Plan / Todos / Tasks / Agents / Auto sidebar",
+        MessageId::KbFocusSidebar => "Focus Work / Tasks / Agents / Context / Auto sidebar",
         MessageId::KbTogglePlanAgent => "Toggle between Plan and Agent modes",
         MessageId::KbSessionPicker => "Open the session picker",
         MessageId::KbPasteAttach => "Paste text or attach a clipboard image",
@@ -1185,6 +1191,7 @@ fn translation(locale: Locale, id: MessageId) -> Option<&'static str> {
 
 fn traditional_chinese(id: MessageId) -> Option<&'static str> {
     Some(match id {
+        MessageId::CmdRelayDescription => "為新執行緒建立會話接力摘要",
         MessageId::CmdTranslateDescription => "切換輸出翻譯為目前系統語言的開關狀態",
         MessageId::CmdTranslateOff => "輸出翻譯已關閉（顯示原始模型輸出）",
         MessageId::CmdTranslateOn => "輸出翻譯已開啟：模型回覆將以繁體中文顯示",
@@ -1268,6 +1275,9 @@ fn japanese(id: MessageId) -> Option<&'static str> {
         MessageId::CmdHooksDescription => {
             "設定済みのライフサイクルフックを一覧表示（読み取り専用）"
         }
+        MessageId::CmdAgentDescription => {
+            "永続サブエージェントセッションを開く: /agent [0-3] <task>"
+        }
         MessageId::CmdGoalDescription => "トークンバジェット付きのセッション目標を設定",
         MessageId::CmdInitDescription => "プロジェクト用に AGENTS.md を生成",
         MessageId::CmdLspDescription => "LSP 診断のオン・オフを切り替え",
@@ -1293,15 +1303,14 @@ fn japanese(id: MessageId) -> Option<&'static str> {
         MessageId::CmdRecallDescription => {
             "過去のサイクルアーカイブを検索（メッセージ本文への BM25 検索）"
         }
+        MessageId::CmdRelayDescription => "新しいスレッド用のセッションリレー（接力）を作成",
         MessageId::CmdRenameDescription => "現在のセッションの名前を変更",
         MessageId::CmdRestoreDescription => {
             "ワークスペースを以前のターン前/後スナップショットへロールバック。引数なしで最近のスナップショットを一覧表示。"
         }
         MessageId::CmdRetryDescription => "直前のリクエストを再試行",
         MessageId::CmdReviewDescription => "ファイル・diff・PR に対して構造化コードレビューを実行",
-        MessageId::CmdRlmDescription => {
-            "再帰言語モデル（RLM）ターン — プロンプトを Python REPL に格納し、モデルが処理コードを記述。サブ LLM 呼び出しは `llm_query()` / `sub_rlm()`。"
-        }
+        MessageId::CmdRlmDescription => "永続 RLM コンテキストを開く: /rlm [0-3] <file_or_text>",
         MessageId::CmdSaveDescription => "セッションをファイルに保存",
         MessageId::CmdSessionsDescription => "セッションピッカーを開く",
         MessageId::CmdSettingsDescription => "永続化された設定を表示",
@@ -1424,7 +1433,7 @@ fn japanese(id: MessageId) -> Option<&'static str> {
             "選択中のツールまたはメッセージの詳細を開く（入力が空の時）"
         }
         MessageId::KbToolDetailsPager => "ツール詳細のページャーを開く",
-        MessageId::KbThinkingPager => "思考内容のページャーを開く",
+        MessageId::KbThinkingPager => "Activity Detail を開く",
         MessageId::KbLiveTranscript => "ライブ会話履歴オーバーレイを開く（自動追尾スクロール）",
         MessageId::KbBacktrackMessage => {
             "前のユーザーメッセージに戻る（左右でステップ、Enter で巻き戻し）"
@@ -1434,7 +1443,9 @@ fn japanese(id: MessageId) -> Option<&'static str> {
         }
         MessageId::KbJumpPlanAgentYolo => "Plan / Agent / YOLO モードに直接ジャンプ",
         MessageId::KbAltJumpPlanAgentYolo => "Plan / Agent / YOLO モードへの代替ジャンプ",
-        MessageId::KbFocusSidebar => "Plan / Todos / Tasks / Agents / Auto サイドバーにフォーカス",
+        MessageId::KbFocusSidebar => {
+            "Work / Tasks / Agents / Context / Auto サイドバーにフォーカス"
+        }
         MessageId::KbTogglePlanAgent => "Plan モードと Agent モードを切り替え",
         MessageId::KbSessionPicker => "セッションピッカーを開く",
         MessageId::KbPasteAttach => "テキストを貼り付けまたはクリップボード画像を添付",
@@ -1605,6 +1616,7 @@ fn chinese_simplified(id: MessageId) -> Option<&'static str> {
         MessageId::CmdHelpDescription => "显示帮助信息",
         MessageId::CmdHomeDescription => "显示主页面板，含统计与快捷操作",
         MessageId::CmdHooksDescription => "列出已配置的生命周期钩子（只读）",
+        MessageId::CmdAgentDescription => "打开持久子代理会话：/agent [0-3] <task>",
         MessageId::CmdGoalDescription => "设置带有可选令牌预算的会话目标",
         MessageId::CmdInitDescription => "为项目生成 AGENTS.md",
         MessageId::CmdLspDescription => "切换 LSP 诊断的开启或关闭",
@@ -1626,15 +1638,14 @@ fn chinese_simplified(id: MessageId) -> Option<&'static str> {
         }
         MessageId::CmdQueueDescription => "查看或编辑已排队的消息",
         MessageId::CmdRecallDescription => "搜索此前的循环归档（基于消息文本的 BM25 检索）",
+        MessageId::CmdRelayDescription => "为新线程创建会话接力摘要",
         MessageId::CmdRenameDescription => "重命名当前会话",
         MessageId::CmdRestoreDescription => {
             "将工作区回滚到此前的轮次前/后快照。不带参数时列出最近的快照。"
         }
         MessageId::CmdRetryDescription => "重试上一次请求",
         MessageId::CmdReviewDescription => "对文件、diff 或 PR 进行结构化代码审查",
-        MessageId::CmdRlmDescription => {
-            "递归语言模型（RLM）轮次 —— 将提示词存入 Python REPL，让模型编写代码进行处理；可用 `llm_query()` / `sub_rlm()` 调用子 LLM。"
-        }
+        MessageId::CmdRlmDescription => "打开持久 RLM 上下文：/rlm [0-3] <file_or_text>",
         MessageId::CmdSaveDescription => "将会话保存到文件",
         MessageId::CmdSessionsDescription => "打开会话选择器",
         MessageId::CmdSettingsDescription => "显示持久化设置",
@@ -1741,7 +1752,7 @@ fn chinese_simplified(id: MessageId) -> Option<&'static str> {
         MessageId::KbLastMessagePager => "打开最后一条消息的分页器（输入框为空时）",
         MessageId::KbSelectedDetails => "打开选中工具或消息的详情（输入框为空时）",
         MessageId::KbToolDetailsPager => "打开工具详情分页器",
-        MessageId::KbThinkingPager => "打开思考内容分页器",
+        MessageId::KbThinkingPager => "打开 Activity Detail",
         MessageId::KbLiveTranscript => "打开实时对话覆盖层（自动滚动尾随）",
         MessageId::KbBacktrackMessage => "回退到之前的用户消息（左右键步进，Enter 回退）",
         MessageId::KbCompleteCycleModes => {
@@ -1749,7 +1760,7 @@ fn chinese_simplified(id: MessageId) -> Option<&'static str> {
         }
         MessageId::KbJumpPlanAgentYolo => "直接跳转到 Plan / Agent / YOLO 模式",
         MessageId::KbAltJumpPlanAgentYolo => "替代快捷键跳转到 Plan / Agent / YOLO 模式",
-        MessageId::KbFocusSidebar => "聚焦 Plan / 待办 / 任务 / 代理 / 代理 / 自动侧边栏",
+        MessageId::KbFocusSidebar => "聚焦 Work / 任务 / 代理 / Context / 自动侧边栏",
         MessageId::KbTogglePlanAgent => "在 Plan 和 Agent 模式之间切换",
         MessageId::KbSessionPicker => "打开会话选择器",
         MessageId::KbPasteAttach => "粘贴文本或附加剪贴板图片",
@@ -1918,6 +1929,9 @@ fn portuguese_brazil(id: MessageId) -> Option<&'static str> {
         MessageId::CmdHooksDescription => {
             "Listar hooks de ciclo de vida configurados (somente leitura)"
         }
+        MessageId::CmdAgentDescription => {
+            "Abrir uma sessão persistente de sub-agente: /agent [0-3] <task>"
+        }
         MessageId::CmdGoalDescription => {
             "Definir uma meta de sessão com orçamento de tokens opcional"
         }
@@ -1947,6 +1961,7 @@ fn portuguese_brazil(id: MessageId) -> Option<&'static str> {
         MessageId::CmdRecallDescription => {
             "Buscar arquivos de ciclos anteriores (BM25 sobre o texto das mensagens)"
         }
+        MessageId::CmdRelayDescription => "Criar um relay da sessão para um novo thread",
         MessageId::CmdRenameDescription => "Renomear a sessão atual",
         MessageId::CmdRestoreDescription => {
             "Reverter o workspace a um snapshot pré/pós-turno anterior. Sem argumento, lista os snapshots recentes."
@@ -1956,7 +1971,7 @@ fn portuguese_brazil(id: MessageId) -> Option<&'static str> {
             "Executar uma revisão de código estruturada em um arquivo, diff ou PR"
         }
         MessageId::CmdRlmDescription => {
-            "Turno do Recursive Language Model (RLM) — guarda o prompt em um REPL Python e deixa o modelo escrever o código que o processa; use `llm_query()` / `sub_rlm()` para chamadas a sub-LLMs."
+            "Abrir um contexto RLM persistente: /rlm [0-3] <file_or_text>"
         }
         MessageId::CmdSaveDescription => "Salvar a sessão em arquivo",
         MessageId::CmdSessionsDescription => "Abrir o seletor de sessões",
@@ -2090,7 +2105,7 @@ fn portuguese_brazil(id: MessageId) -> Option<&'static str> {
             "Abrir detalhes da ferramenta ou mensagem selecionada (quando entrada vazia)"
         }
         MessageId::KbToolDetailsPager => "Abrir paginador de detalhes da ferramenta",
-        MessageId::KbThinkingPager => "Abrir paginador de raciocínio",
+        MessageId::KbThinkingPager => "Abrir Activity Detail",
         MessageId::KbLiveTranscript => "Abrir sobreposição de transcrição ao vivo (auto-scroll)",
         MessageId::KbBacktrackMessage => {
             "Retroceder para mensagem anterior do usuário (esquerda/direita, Enter para rebobinar)"
@@ -2100,7 +2115,7 @@ fn portuguese_brazil(id: MessageId) -> Option<&'static str> {
         }
         MessageId::KbJumpPlanAgentYolo => "Pular direto para modo Plan / Agent / YOLO",
         MessageId::KbAltJumpPlanAgentYolo => "Salto alternativo para modo Plan / Agent / YOLO",
-        MessageId::KbFocusSidebar => "Focar barra lateral Plan / Todos / Tasks / Agents / Auto",
+        MessageId::KbFocusSidebar => "Focar barra lateral Work / Tasks / Agents / Context / Auto",
         MessageId::KbTogglePlanAgent => "Alternar entre modos Plan e Agent",
         MessageId::KbSessionPicker => "Abrir seletor de sessões",
         MessageId::KbPasteAttach => "Colar texto ou anexar imagem da área de transferência",
diff --git a/crates/tui/src/mcp.rs b/crates/tui/src/mcp.rs
index 874016b8..0a09a8bc 100644
--- a/crates/tui/src/mcp.rs
+++ b/crates/tui/src/mcp.rs
@@ -3233,6 +3233,7 @@ mod tests {
     }
 
     #[tokio::test]
+    #[ignore = "flaky: requires a live TCP listener and is sensitive to port allocation races"]
     async fn mcp_connection_supports_streamable_http_event_stream_responses() {
         use tokio::io::{AsyncReadExt, AsyncWriteExt};
         use tokio::net::{TcpListener, TcpStream};
diff --git a/crates/tui/src/prompts.rs b/crates/tui/src/prompts.rs
index 4028aa3d..ae0f9d11 100644
--- a/crates/tui/src/prompts.rs
+++ b/crates/tui/src/prompts.rs
@@ -30,7 +30,7 @@ pub struct PromptSessionContext<'a> {
     pub translation_enabled: bool,
 }
 
-/// Conventional location for the structured session-handoff artifact (#32).
+/// Conventional location for the structured session relay artifact (#32).
 /// A previous session writes it on exit / `/compact`; the next session reads
 /// it back on startup and prepends it to the system prompt so a fresh agent
 /// doesn't have to re-discover open blockers from scratch.
@@ -157,7 +157,7 @@ fn render_instructions_block(paths: &[PathBuf]) -> Option<String> {
     }
 }
 
-/// Read the workspace-local handoff artifact, if present, and format it as a
+/// Read the workspace-local relay artifact, if present, and format it as a
 /// system-prompt block. Returns `None` when the file is absent or empty so
 /// callers can keep the default-uncluttered prompt for fresh workspaces.
 fn load_handoff_block(workspace: &Path) -> Option<String> {
@@ -168,7 +168,7 @@ fn load_handoff_block(workspace: &Path) -> Option<String> {
         return None;
     }
     Some(format!(
-        "## Previous Session Handoff\n\nThe previous session in this workspace left a handoff at `{}`. Consider it the first artifact to read on this turn — open blockers, in-flight changes, and recent decisions live there. Update or rewrite it before exiting if state changes materially.\n\n{}",
+        "## Previous Session Relay\n\nThe previous session in this workspace left a relay artifact at `{}`. Consider it the first artifact to read on this turn — open blockers, in-flight changes, and recent decisions live there. Update or rewrite it before exiting if state changes materially.\n\n{}",
         HANDOFF_RELATIVE_PATH, trimmed
     ))
 }
@@ -354,7 +354,7 @@ pub const AUTO_APPROVAL: &str = include_str!("prompts/approvals/auto.md");
 pub const SUGGEST_APPROVAL: &str = include_str!("prompts/approvals/suggest.md");
 pub const NEVER_APPROVAL: &str = include_str!("prompts/approvals/never.md");
 
-/// Compaction handoff template — written into the system prompt so the
+/// Compaction relay template — written into the system prompt so the
 /// model knows the format to use when writing `.deepseek/handoff.md`.
 pub const COMPACT_TEMPLATE: &str = include_str!("prompts/compact.md");
 
@@ -514,11 +514,11 @@ pub fn system_prompt_for_mode_with_context(
 ///   2. project context / fallback (workspace-static)
 ///   3. skills block (skills-dir-static)
 ///   4. `## Context Management` (compile-time constant, Agent/Yolo only)
-///   5. compaction handoff template (compile-time constant)
-///   6. handoff block — file-backed; rewritten by `/compact` and on exit
+///   5. compaction relay template (compile-time constant)
+///   6. relay block — file-backed; rewritten by `/compact` and on exit
 ///
 /// Anything appended after a volatile block forfeits the cache for the rest
-/// of the request. New blocks belong above the handoff boundary unless they
+/// of the request. New blocks belong above the relay boundary unless they
 /// themselves are turn-volatile. Working-set metadata is now injected into the
 /// latest user message as per-turn metadata instead of this system prompt.
 pub fn system_prompt_for_mode_with_context_and_skills(
@@ -668,7 +668,7 @@ pub fn system_prompt_for_mode_with_context_skills_session_and_approval(
         );
     }
 
-    // 5. Compaction handoff template — so the model knows the format to use
+    // 5. Compaction relay template — so the model knows the format to use
     //    when writing `.deepseek/handoff.md` on exit / `/compact`.
     full_prompt.push_str("\n\n");
     full_prompt.push_str(COMPACT_TEMPLATE);
@@ -694,7 +694,7 @@ pub fn system_prompt_for_mode_with_context_skills_session_and_approval(
     // 6b. User memory block (#489). Placed below the volatile boundary
     // because memory entries are editable mid-session via `/memory` or
     // `# foo` quick-add. When they change, they only invalidate the
-    // trailing handoff block — the static prefix above stays cached.
+    // trailing relay block — the static prefix above stays cached.
     if let Some(memory_block) = session_context.user_memory_block
         && !memory_block.trim().is_empty()
     {
@@ -713,7 +713,7 @@ pub fn system_prompt_for_mode_with_context_skills_session_and_approval(
         );
     }
 
-    // 7. Previous-session handoff (file-backed, rewritten by `/compact`).
+    // 7. Previous-session relay (file-backed, rewritten by `/compact`).
     if let Some(handoff_block) = load_handoff_block(workspace) {
         full_prompt = format!("{full_prompt}\n\n{handoff_block}");
     }
@@ -775,9 +775,9 @@ mod tests {
     use super::*;
     use tempfile::tempdir;
 
-    /// Discriminator unique to the injected handoff block (not present in the
+    /// Discriminator unique to the injected relay block (not present in the
     /// agent prompt's own discussion of the convention).
-    const HANDOFF_BLOCK_MARKER: &str = "left a handoff at `.deepseek/handoff.md`";
+    const HANDOFF_BLOCK_MARKER: &str = "left a relay artifact at `.deepseek/handoff.md`";
 
     #[test]
     fn render_environment_block_lists_supplied_locale_and_workspace() {
@@ -1120,7 +1120,7 @@ mod tests {
         assert!(prompt.contains("<project_context_pack>"));
         assert!(
             prompt.find("<project_context_pack>").expect("pack")
-                < prompt.find("## Previous Session Handoff").expect("handoff")
+                < prompt.find("## Previous Session Relay").expect("relay")
         );
     }
 
@@ -1132,7 +1132,7 @@ mod tests {
         std::fs::create_dir_all(&handoff_dir).unwrap();
         std::fs::write(
             handoff_dir.join("handoff.md"),
-            "# Session handoff — prior\n\n## Active task\nFinish #32.\n\n## Open blockers\n- [ ] write the basic version\n",
+            "# Session relay — prior\n\n## Active task\nFinish #32.\n\n## Open blockers\n- [ ] write the basic version\n",
         )
         .unwrap();
 
@@ -1278,7 +1278,7 @@ mod tests {
             SystemPrompt::Text(text) => text,
             SystemPrompt::Blocks(_) => panic!("expected text system prompt"),
         };
-        assert!(prompt.contains("## Compaction Handoff"));
+        assert!(prompt.contains("## Compaction Relay"));
         // #429: structured Markdown template. Goal/Constraints/Progress
         // (Done/InProgress/Blocked)/Key Decisions/Next step.
         assert!(prompt.contains("### Goal"));
@@ -1313,7 +1313,7 @@ mod tests {
         };
 
         let goal_pos = prompt.find("<session_goal>").expect("goal block");
-        let compact_pos = prompt.find("## Compaction Handoff").expect("compact block");
+        let compact_pos = prompt.find("## Compaction Relay").expect("compact block");
 
         assert!(prompt.contains("Fix transcript corruption"));
         // Session goal is volatile content — it lives below the
@@ -1353,7 +1353,7 @@ mod tests {
     fn tool_selection_guide_avoids_defensive_tool_suppression() {
         let prompt = compose_prompt(AppMode::Agent, Personality::Calm);
         assert!(prompt.contains("Tool Selection Guide"));
-        assert!(prompt.contains("Use `agent_result`"));
+        assert!(prompt.contains("Use `agent_eval`"));
         assert!(
             !prompt.contains("When NOT to use certain tools"),
             "the system prompt should steer tool choice without training the model to avoid available tools"
@@ -1432,6 +1432,62 @@ mod tests {
         );
     }
 
+    #[test]
+    fn workspace_orientation_guidance_present() {
+        let prompt = compose_prompt(AppMode::Agent, Personality::Calm);
+        assert!(prompt.contains("Workspace Orientation"));
+        assert!(prompt.contains("canonical project root"));
+        assert!(prompt.contains("AGENTS.md"));
+        assert!(prompt.contains("explore` / `explorer"));
+    }
+
+    #[test]
+    fn prompt_uses_persistent_agent_and_rlm_surface() {
+        let prompt = compose_prompt(AppMode::Agent, Personality::Calm);
+        for tool in [
+            "agent_open",
+            "agent_eval",
+            "agent_close",
+            "rlm_open",
+            "rlm_eval",
+            "rlm_configure",
+            "rlm_close",
+            "handle_read",
+        ] {
+            assert!(
+                prompt.contains(tool),
+                "prompt should mention new persistent tool `{tool}`"
+            );
+        }
+        for retired in [
+            "agent_spawn",
+            "agent_wait",
+            "agent_result",
+            "agent_send_input",
+            "agent_assign",
+            "agent_resume",
+            "agent_list",
+            "spawn_agent",
+            "delegate_to_agent",
+            "send_input",
+            "close_agent",
+        ] {
+            assert!(
+                !prompt.contains(retired),
+                "prompt should not advertise retired sub-agent tool `{retired}`"
+            );
+        }
+    }
+
+    #[test]
+    fn prompt_documents_fork_context_prefix_cache_contract() {
+        let prompt = compose_prompt(AppMode::Agent, Personality::Calm);
+        assert!(prompt.contains("fork_context: true"));
+        assert!(prompt.contains("byte-identical"));
+        assert!(prompt.contains("DeepSeek prefix-cache reuse"));
+        assert!(prompt.contains("Fresh sessions are the default"));
+    }
+
     #[test]
     fn subagent_done_sentinel_section_present() {
         let prompt = compose_prompt(AppMode::Agent, Personality::Calm);
@@ -1541,7 +1597,7 @@ mod tests {
     #[test]
     fn system_prompt_with_handoff_file_is_byte_stable_when_file_is_unchanged() {
         // If `.deepseek/handoff.md` hasn't moved between two builds, the
-        // rendered prompt must produce identical bytes. The handoff block
+        // rendered prompt must produce identical bytes. The relay block
         // lands below the static boundary in
         // `system_prompt_for_mode_with_context_and_skills`.
         let tmp = tempdir().expect("tempdir");
@@ -1550,7 +1606,7 @@ mod tests {
         std::fs::create_dir_all(&handoff_dir).unwrap();
         std::fs::write(
             handoff_dir.join("handoff.md"),
-            "# Session handoff\n\n## Active task\nFinish #280.\n\n## Open blockers\n- [ ] none\n",
+            "# Session relay\n\n## Active task\nFinish #280.\n\n## Open blockers\n- [ ] none\n",
         )
         .unwrap();
 
@@ -1567,15 +1623,15 @@ mod tests {
             &a,
             &b,
         );
-        assert!(a.contains(HANDOFF_BLOCK_MARKER), "handoff must be embedded");
-        assert!(a.contains("Finish #280."), "handoff body must be present");
+        assert!(a.contains(HANDOFF_BLOCK_MARKER), "relay must be embedded");
+        assert!(a.contains("Finish #280."), "relay body must be present");
     }
 
     #[test]
     fn handoff_appears_after_static_blocks_without_working_set() {
-        // Cache-prefix invariant: the handoff block must come after static
-        // `## Context Management` and the compaction handoff template
-        // (`## Compaction Handoff`). Working-set metadata is per-turn user
+        // Cache-prefix invariant: the relay block must come after static
+        // `## Context Management` and the compaction relay template
+        // (`## Compaction Relay`). Working-set metadata is per-turn user
         // metadata now, not a system-prompt tail block.
         let tmp = tempdir().expect("tempdir");
         let workspace = tmp.path();
@@ -1594,11 +1650,11 @@ mod tests {
             .find("## Context Management")
             .expect("Context Management section present in Agent mode");
         let compact_pos = prompt
-            .find("## Compaction Handoff")
-            .expect("compaction handoff template present");
+            .find("## Compaction Relay")
+            .expect("compaction relay template present");
         let handoff_pos = prompt
             .find(HANDOFF_BLOCK_MARKER)
-            .expect("handoff block present when fixture file exists");
+            .expect("relay block present when fixture file exists");
         assert!(
             !prompt.contains("## Repo Working Set"),
             "working-set summary must stay out of the system prompt"
@@ -1606,11 +1662,11 @@ mod tests {
 
         assert!(
             context_pos < handoff_pos,
-            "## Context Management must precede the handoff block"
+            "## Context Management must precede the relay block"
         );
         assert!(
             compact_pos < handoff_pos,
-            "## Compaction Handoff must precede the handoff block"
+            "## Compaction Relay must precede the relay block"
         );
     }
 
diff --git a/crates/tui/src/prompts/agent.txt b/crates/tui/src/prompts/agent.txt
index 5ce82e18..fba4977c 100644
--- a/crates/tui/src/prompts/agent.txt
+++ b/crates/tui/src/prompts/agent.txt
@@ -1,7 +1,7 @@
 ## Mode: agent
 
-Read-only tools (reads, searches, `rlm`, agent status queries, git inspection) run silently.
-Any write, patch, shell execution, sub-agent spawn, or CSV batch operation will ask for approval first.
+Read-only tools (reads, searches, persistent RLM session tools, agent status queries, git inspection) run silently.
+Any write, patch, shell execution, sub-agent session open, or CSV batch operation will ask for approval first.
 
 Before requesting approval for writes, lay out your work with `checklist_write` so the user can see what
 you intend to do and approve with context. Complex changes should also get an `update_plan` first.
@@ -9,7 +9,7 @@ Decomposition builds trust — a clear plan gets faster approvals.
 
 ## Sub-agent completion sentinel
 
-When you spawn a sub-agent via `agent_spawn`, the child runs independently.
+When you open a sub-agent via `agent_open`, the child runs independently.
 You will receive a `<deepseek:subagent.done>` element in the transcript when it finishes.
 Read its `summary` field and integrate the work — do not re-do what the child already did.
-You can also call `agent_result` to pull the full structured result.
+You can also call `agent_eval` with the agent name or id to pull the current structured projection or transcript handle.
diff --git a/crates/tui/src/prompts/base.md b/crates/tui/src/prompts/base.md
index c7b30f33..0a05be10 100644
--- a/crates/tui/src/prompts/base.md
+++ b/crates/tui/src/prompts/base.md
@@ -40,19 +40,27 @@ Use three decomposition patterns, selected by task scope:
 
 **PREVIEW** — Before diving into a large task, survey the terrain. Scan directory structure (`list_dir`), file headers, module trees. Identify problem boundaries and estimate complexity. A 30-second preview prevents hours of wrong-path exploration.
 
-**CHUNK + map-reduce** — When a task exceeds single-pass capacity: split into independent sub-tasks, process each independently (parallel where possible via parallel tool calls or `agent_spawn`), then synthesize findings into a coherent whole. Track chunks with `checklist_write`.
+**CHUNK + map-reduce** — When a task exceeds single-pass capacity: split into independent sub-tasks, process each independently (parallel where possible via parallel tool calls or persistent sub-agent sessions), then synthesize findings into a coherent whole. Track chunks with `checklist_write`.
 
-**RECURSIVE** — When sub-tasks reveal sub-problems: decompose recursively until each leaf is tractable. Maintain the task tree via `update_plan` (strategy) layered above `checklist_write` (leaf tasks). Propagate findings upward when sub-problems resolve.
+**RECURSIVE** — When sub-tasks reveal sub-problems: decompose recursively until each leaf is tractable. Keep the active leaves in `checklist_write`; use `update_plan` only when a genuinely complex initiative needs durable high-level strategy metadata. Propagate findings upward when sub-problems resolve.
 
 Your default workflow for any non-trivial request:
 1. **`checklist_write`** — break the work into concrete, verifiable steps. Mark the first one `in_progress`. This populates the sidebar so the user can see what you're doing.
 2. **Execute** — work through each checklist item, updating status as you go.
-3. **For complex initiatives**, layer `update_plan` (high-level strategy) above `checklist_write` (granular steps).
-4. **For parallel work**, spawn sub-agents (`agent_spawn`) — each does one thing well. Link them to plan/todo items in your thinking. Batch independent tool calls in a single turn.
-5. **Only when an input genuinely doesn't fit your context window** — a whole file > ~50K tokens, a long transcript, a multi-document corpus — use `rlm`. It loads the input into a Python REPL where a sub-agent processes it. For shorter inputs, use `read_file` and reason directly.
+3. **For complex initiatives only**, add `update_plan` as high-level strategy. Do not mirror the checklist into a second tracker.
+4. **For parallel work**, open sub-agent sessions with `agent_open` — each does one thing well. Use `agent_eval` for follow-ups or completion state, and `agent_close` when a session should be cancelled or released. Link them to Work/checklist items in your thinking. Batch independent tool calls in a single turn.
+5. **Only when an input genuinely doesn't fit your context window** — a whole file > ~50K tokens, a long transcript, a multi-document corpus — use persistent RLM sessions: `rlm_open` loads the input into a named Python REPL, `rlm_eval` runs bounded analysis, `handle_read` reads returned `var_handle`s, `rlm_configure` adjusts feedback/depth, and `rlm_close` releases the session. For shorter inputs, use `read_file` and reason directly.
 6. **For persistent cross-session memory**, use `note` sparingly for important decisions, open blockers, and architectural context.
 
-**Key principle**: make your work visible. The sidebar shows Plan / Todos / Tasks / Agents. When these panels are empty, the user has no idea what you're doing. Keep them populated.
+**Key principle**: make your work visible in one place. The sidebar shows Work / Tasks / Agents / Context. Keep the Work checklist current; it is the primary progress surface. `update_plan` appears there only as optional strategy when it has real content.
+
+## Workspace Orientation
+
+When you enter an unfamiliar workspace, orient before broad search. Use the project instructions already loaded into the prompt, then confirm the working shape with the cheapest deterministic tools: `list_dir`, direct reads of `AGENTS.md`/`README.md` when relevant, and targeted `grep_files`. If the current directory is a multi-project workspace or the user points at a child path, identify the canonical project root before searching. If the correct project remains ambiguous after a quick orientation pass, ask instead of spraying searches across sibling checkouts.
+
+Treat workspace instructions as authority for where work should happen. If they say a sibling directory is stale, historical, frozen, or not the canonical checkout, do not spend high-value context there unless the user explicitly asks. Prefer exact paths from the user over guessing.
+
+Use `explore` sub-agents for independent read-only reconnaissance. The role is named `explore` / `explorer`; give each child one bounded question, the project root, and the expected evidence shape. Use RLM for long inputs or many semantic slices, not for basic path discovery.
 
 ## Verification Principle
 
@@ -76,23 +84,23 @@ If a tool call fails, inspect the error before retrying. Do not repeat the ident
 
 ## Composition Pattern for Multi-Step Work
 
-For any task estimated to take 5+ steps:
+For any task estimated to take 5+ concrete steps:
 
-1. **`update_plan`** — 3-6 high-level phases (status: pending). This gives the user a map.
-2. **`checklist_write`** — concrete leaf tasks under the first phase (mark first `in_progress`).
-3. **Execute phase 1**, updating checklist as you go. Batch independent steps into parallel tool calls.
-4. **After each phase**, re-read your plan: does phase 2 still make sense? Update the plan if new information changes the approach. Don't blindly follow a plan drafted before you understood the code.
-5. **When a phase reveals sub-problems**, add them to the checklist or spawn investigation sub-agents — don't guess.
+1. **`checklist_write`** — concrete leaf tasks, with the first item `in_progress`.
+2. **Execute**, updating checklist status as you go. Batch independent steps into parallel tool calls.
+3. **For multi-phase or ambiguous initiatives**, optionally add `update_plan` with 3-6 high-level phases. Keep it strategic; do not duplicate checklist items.
+4. **After each phase**, re-check whether the next checklist items still make sense. Update the checklist, and update strategy only if the high-level approach changed.
+5. **When a phase reveals sub-problems**, add them to the checklist or open investigation sub-agent sessions — don't guess.
 
 ## Sub-Agent Strategy
 
 Sub-agents are cheap — DeepSeek V4 Flash costs $0.14/M input. Use them liberally for parallel work:
 
-- **Parallel investigation**: When you need to understand 3+ independent files or modules, spawn one read-only sub-agent per target. They run concurrently in one turn and return structured findings you synthesize. This is faster AND more thorough than reading sequentially.
-- **Parallel implementation**: After a plan is laid out, spawn one sub-agent per independent leaf task. Each does one thing well; you integrate results.
-- **Solo tasks**: A single read, a single search, a focused question — do these yourself. Spawning has overhead; one-turn reads are faster direct.
-- **Sequential work**: If step B depends on step A's output, run A yourself, then decide whether to spawn B based on what A found. Don't pre-spawn dependent work.
-- **Concurrent sub-agent cap**: The dispatcher defaults to 10 concurrent sub-agents (configurable via `[subagents].max_concurrent` in `config.toml`, hard ceiling 20). When you need more, batch them: spawn up to the cap, wait for completions, then spawn the next batch.
+- **Parallel investigation**: When you need to understand 3+ independent files or modules, open one read-only sub-agent session per target. They run concurrently in one turn and return structured findings you synthesize. This is faster AND more thorough than reading sequentially.
+- **Parallel implementation**: After a plan is laid out, open one sub-agent session per independent leaf task. Each does one thing well; you integrate results.
+- **Solo tasks**: A single read, a single search, a focused question — do these yourself. Opening a sub-agent has overhead; one-turn reads are faster direct.
+- **Sequential work**: If step B depends on step A's output, run A yourself, then decide whether to open a sub-agent for B based on what A found. Don't pre-open dependent work.
+- **Concurrent sub-agent cap**: The dispatcher defaults to 10 concurrent sub-agents (configurable via `[subagents].max_concurrent` in `config.toml`, hard ceiling 20). When you need more, batch them: open up to the cap, wait for completions, then open the next batch.
 
 ## Parallel-First Heuristic
 
@@ -101,23 +109,25 @@ Before you fire any tool, scan your checklist: is there another tool you could r
 - Reading 3 files → 3 `read_file` calls in one turn
 - Searching for 2 patterns → 2 `grep_files` calls in one turn
 - Checking git status AND reading a config → `git_status` + `read_file` in one turn
-- Spawning sub-agents for independent investigations → all `agent_spawn` calls in one turn
+- Opening sub-agents for independent investigations → all `agent_open` calls in one turn
 
 The dispatcher runs parallel tool calls simultaneously. Serializing independent operations wastes the user's time and grows your context faster than necessary.
 
 ## RLM — How to Use It
 
-RLM loads input into a Python REPL where you write code that calls sub-LLM helpers (`llm_query`, `llm_query_batched`, `rlm_query`). Three patterns, not one — choose based on the shape of the work:
+RLM is a persistent Python REPL for context that is too large or too repetitive to keep in the parent transcript. Open a named session with `rlm_open`, run bounded code with `rlm_eval`, read large returned payloads through `handle_read`, tune feedback with `rlm_configure`, and close finished sessions with `rlm_close`.
+
+Inside the REPL, use deterministic Python for exact work and the RLM helper functions for semantic work. The current helper family is `peek`, `search`, `chunk`, `context_meta`, `sub_query`, `sub_query_batch`, `sub_query_map`, `sub_rlm`, `finalize`, and `evaluate_progress`. These are in-REPL helpers, not separate model-visible tools.
+
+The RLM paper's core design is symbolic state: the long input and intermediate values live in the REPL environment, not copied into the root model context. Inspect with bounded slices, transform with Python, batch child calls programmatically, and keep large intermediate strings in variables or `var_handle`s. Do not paste the whole body back into a prompt or verbalize a long list of sub-calls when a loop can launch them. Three patterns, not one — choose based on the shape of the work:
 
 **CHUNK** — A single input that genuinely doesn't fit in your context window (a whole file > 50K tokens, a long transcript, a multi-document corpus). Split it, process each chunk, synthesize.
 
-**BATCH** — Many independent items that each need LLM attention (classify 20 entries, extract fields from 30 documents, score 15 candidates). Use `llm_query_batched` for parallel execution — it fans out to the same DeepSeek client and finishes in one turn what would take 15 sequential reads.
+**BATCH** — Many independent items that each need LLM attention (classify 20 entries, extract fields from 30 documents, score 15 candidates). Use `sub_query_batch` for parallel execution — it fans out to the same DeepSeek client and finishes in one turn what would take 15 sequential reads.
 
-**RECURSE** — A problem that benefits from decomposition + critique. Use `rlm_query` to have a sub-LLM review your reasoning, identify gaps, or explore alternative approaches. The sub-LLM returns a synthesized answer you verify against live tool output.
+**RECURSE** — A problem that benefits from decomposition + critique. Use `sub_query` or `sub_rlm` to have a sub-LLM review your reasoning, identify gaps, or explore alternative approaches. The sub-LLM returns a synthesized answer you verify against live tool output.
 
-For exact counts or structured aggregates, compute them directly in Python inside the REPL (`len`, regexes, parsers, counters) and use child LLM calls only for semantic interpretation. When you chunk a whole input, use `chunk_context()` plus `chunk_coverage()` and report coverage explicitly: chunks processed, total chunks, line/char ranges, and any skipped sections. Cross-check surprising aggregate results with deterministic code before presenting them.
-
-The Python helpers visible inside the REPL (`llm_query`, `llm_query_batched`, `rlm_query`, `rlm_query_batched`) are NOT separately-callable tools — they are functions the sub-agent uses inside its Python code. You only call `rlm` itself from the model side.
+For exact counts or structured aggregates, compute them directly in Python inside the REPL (`len`, regexes, parsers, counters) and use child LLM calls only for semantic interpretation. When you chunk a whole input, use `chunk()` and report coverage explicitly: chunks processed, total chunks, line/char ranges, and any skipped sections. Cross-check surprising aggregate results with deterministic code before presenting them. Use `finalize(...)` for the answer you want returned; if it comes back as a `var_handle`, call `handle_read` for a bounded slice, count, or JSON projection instead of asking the runtime to replay the whole value.
 
 ## Context
 You have a 1 M-token context window. When usage creeps above ~80%, suggest `/compact` to the user — it summarises earlier turns so you can keep working without losing thread.
@@ -154,14 +164,15 @@ When context is deep (past a soft seam): cache reasoning conclusions in concise
 
 ## Toolbox (fast reference — tool descriptions are authoritative)
 
-- **Planning / tracking**: `update_plan` (high-level strategy), `task_create` / `task_list` / `task_read` / `task_cancel` (durable work objects), `checklist_write` (granular progress under the active task/thread), `checklist_add` / `checklist_update` / `checklist_list`, `todo_*` aliases (legacy compatibility), `note` (persistent memory).
+- **Planning / tracking**: `checklist_write` (primary Work progress under the active task/thread), `checklist_add` / `checklist_update` / `checklist_list`, `update_plan` (optional high-level strategy metadata for complex initiatives), `task_create` / `task_list` / `task_read` / `task_cancel` (durable work objects), `todo_*` aliases (legacy compatibility), `note` (persistent memory).
 - **File I/O**: `read_file` (PDFs auto-extracted), `list_dir`, `write_file`, `edit_file`, `apply_patch`, `retrieve_tool_result` for prior spilled large tool outputs.
 - **Shell**: `task_shell_start` + `task_shell_wait` for long-running commands, diagnostics, tests, searches, and servers; `exec_shell` for bounded cancellable foreground commands; `exec_shell_wait`, `exec_shell_interact`. If foreground `exec_shell` times out, the process was killed; rerun long work with `task_shell_start` or `exec_shell` using `background: true`, then poll/wait.
 - **Task evidence**: `task_gate_run` for verification gates; `pr_attempt_record` / `pr_attempt_list` / `pr_attempt_read` / `pr_attempt_preflight`; `github_issue_context` / `github_pr_context` (read-only); `github_comment` / `github_close_issue` (approval + evidence required); `automation_*` scheduling tools.
 - **Structured search**: `grep_files`, `file_search`, `web_search`, `fetch_url`, `web.run` (browse).
 - **Git / diag / tests**: `git_status`, `git_diff`, `git_show`, `git_log`, `git_blame`, `diagnostics`, `run_tests`, `review`.
-- **Sub-agents**: `agent_spawn` (`spawn_agent`, `delegate_to_agent`), `agent_result`, `agent_cancel` (`close_agent`), `agent_list`, `agent_wait` (`wait`), `agent_send_input` (`send_input`), `agent_assign` (`assign_agent`), `resume_agent`.
-- **Recursive LM (long inputs / parallel reasoning)**: `rlm` — load a file/string as `context` in a Python REPL, sub-agent writes Python that calls `llm_query`/`llm_query_batched`/`rlm_query` to chunk, compare, critique, and synthesize; returns the synthesized answer. Read-only.
+- **Sub-agents**: `agent_open`, `agent_eval`, `agent_close`. Open fresh sessions by default; pass `fork_context: true` only when the child needs the current parent context and prefix-cache continuity.
+- **Recursive LM (long inputs / parallel reasoning)**: `rlm_open`, `rlm_eval`, `rlm_configure`, `rlm_close` — open a named Python REPL over a file/string/URL, run deterministic and semantic analysis, return compact results or `var_handle`s, then close when done.
+- **Large symbolic outputs**: `handle_read` — read bounded slices, counts, ranges, or JSONPath projections from returned `var_handle`s without replaying the whole payload.
 - **Skills**: `load_skill` (#434) — when the user names a skill or the task matches one in the `## Skills` section above, call this with the skill id to pull its `SKILL.md` body and companion-file list into context in one tool call. Faster than `read_file` + `list_dir`.
 - **Other**: `code_execution` (Python sandbox), `validate_data` (JSON/TOML), `request_user_input`, `finance` (market quotes), `tool_search_tool_regex`, `tool_search_tool_bm25` (deferred tool discovery).
 
@@ -178,17 +189,17 @@ Use `edit_file` for one clear replacement in one file. Do not use it for multi-b
 ### `exec_shell`
 Use `exec_shell` for shell-native diagnostics, pipelines, and bounded commands. Use structured tools for structured operations when they map directly (`grep_files`, `git_diff`, `read_file`). For long commands, servers, full test suites, or release computations, start background work with `task_shell_start` or `exec_shell` using `background: true`, then poll with `task_shell_wait` or `exec_shell_wait`.
 
-### `agent_spawn`
-Use `agent_spawn` for independent investigations or implementation slices that can run while you continue coordinating. Use `fork_context: true` when the child must inherit the current transcript, plan/todo state, and byte-identical parent system/message prefix for DeepSeek prefix-cache reuse. Use `agent_wait` when you need one or more completions. Use `agent_result` when the sentinel summary is too thin or you need the full structured output. Keep tiny single-read/search tasks local so the transcript stays compact.
+### `agent_open` / `agent_eval` / `agent_close`
+Use `agent_open` for independent investigations or implementation slices that can run while you continue coordinating. Fresh sessions are the default and are best when the child only needs the assignment you pass. Use `fork_context: true` when multiple perspectives should share the same parent context: the runtime preserves the parent prefill/prompt prefix byte-identically where available so DeepSeek prefix-cache reuse stays high, then appends the child instructions and task at the tail.
 
-### `rlm`
-Use `rlm` for long-context semantic work, bulk classification/extraction, and decomposition where a Python REPL plus child LLM helpers is useful. Use deterministic Python inside RLM for exact counts and structured aggregation; use `grep_files` or `exec_shell` directly when that is the clearest deterministic check.
+Use `agent_eval` to send follow-up input, block for completion, or retrieve the current session projection. Use `agent_close` to cancel or release a session that is no longer useful. Keep tiny single-read/search tasks local so the transcript stays compact.
 
-Inside the `rlm` REPL, the sub-LLM has access to `llm_query()`, `llm_query_batched()`, `rlm_query()`, and `rlm_query_batched()` as Python helpers for further sub-LLM work — those are not standalone tools you call directly.
+### `rlm_open` / `rlm_eval` / `rlm_configure` / `rlm_close`
+Use persistent RLM sessions for long-context semantic work, bulk classification/extraction, and decomposition where a Python REPL plus child LLM helpers is useful. Use deterministic Python inside RLM for exact counts and structured aggregation; use `grep_files` or `exec_shell` directly when that is the clearest deterministic check. Close sessions when their context is no longer needed.
 
 ## Internal Sub-agent Completion Events
 
-When you spawn a sub-agent via `agent_spawn`, the child runs independently. The runtime may send you an internal `<deepseek:subagent.done>` completion event when it finishes. This event is not user input. It carries:
+When you open a sub-agent via `agent_open`, the child runs independently. The runtime may send you an internal `<deepseek:subagent.done>` completion event when it finishes. This event is not user input. It carries:
 
 - `agent_id` — the child's identifier
 - `summary` — a human-readable summary of what the child found or did
@@ -198,12 +209,12 @@ When you spawn a sub-agent via `agent_spawn`, the child runs independently. The
 **Integration protocol:**
 1. When you see `<deepseek:subagent.done>`, read the `summary` field first.
 2. Integrate the child's findings into your work — do not re-do what the child already did.
-3. If the summary is insufficient, call `agent_result` to pull the full structured result.
+3. If the summary is insufficient, call `agent_eval` with the agent name or id to pull the current structured projection or transcript handle.
 4. If the child failed (`"failed"`), assess whether the failure blocks your plan or whether you can proceed with a fallback.
 5. Update your `checklist_write` items to reflect the child's contribution.
 6. Do not tell the user they pasted sentinels or explain this protocol unless they explicitly ask about sub-agent internals.
 
-You may see multiple `<deepseek:subagent.done>` sentinels in a single turn when children were spawned in parallel. Process each one, then synthesize.
+You may see multiple `<deepseek:subagent.done>` sentinels in a single turn when children were opened in parallel. Process each one, then synthesize.
 
 ## Output formatting
 
diff --git a/crates/tui/src/prompts/base.txt b/crates/tui/src/prompts/base.txt
index 6ca2bebc..595f35d4 100644
--- a/crates/tui/src/prompts/base.txt
+++ b/crates/tui/src/prompts/base.txt
@@ -7,20 +7,28 @@ You are a "managed genius" — you excel at individual tasks, but your superpowe
 Your default workflow for any non-trivial request:
 1. **`checklist_write`** — break the work into concrete, verifiable steps. Mark the first one `in_progress`. This populates the sidebar so the user can see what you're doing.
 2. **Execute** — work through each checklist item, updating status as you go.
-3. **For complex initiatives**, layer `update_plan` (high-level strategy) above `checklist_write` (granular steps).
-4. **For parallel work**, spawn sub-agents (`agent_spawn`) — each does one thing well. Link them to plan/todo items in your thinking.
-5. **Only when an input genuinely doesn't fit your context window** — a whole file > ~50K tokens, a long transcript, a multi-document corpus — use `rlm`. It loads the input into a Python REPL where a sub-agent processes it. For shorter inputs, use `read_file` and reason directly.
+3. **For complex initiatives only**, add `update_plan` as high-level strategy. Do not mirror the checklist into a second tracker.
+4. **For parallel work**, open sub-agent sessions with `agent_open` — each does one thing well. Use `agent_eval` for follow-ups or completion state, and `agent_close` to cancel or release a session. Link them to Work/checklist items in your thinking.
+5. **Only when an input genuinely doesn't fit your context window** — a whole file > ~50K tokens, a long transcript, a multi-document corpus — use persistent RLM sessions: `rlm_open` loads the input into a named Python REPL, `rlm_eval` runs bounded analysis, `handle_read` reads returned `var_handle`s, `rlm_configure` adjusts feedback/depth, and `rlm_close` releases the session. For shorter inputs, use `read_file` and reason directly.
 6. **For persistent cross-session memory**, use `note` sparingly for important decisions, open blockers, and architectural context.
 
-**Key principle**: make your work visible. The sidebar shows Plan / Todos / Tasks / Agents. When these panels are empty, the user has no idea what you're doing. Keep them populated.
+**Key principle**: make your work visible in one place. The sidebar shows Work / Tasks / Agents / Context. Keep the Work checklist current; it is the primary progress surface. `update_plan` appears there only as optional strategy when it has real content.
+
+## Workspace Orientation
+
+In unfamiliar workspaces, orient before broad search. Use loaded project instructions plus cheap deterministic tools (`list_dir`, relevant `AGENTS.md`/`README.md`, targeted `grep_files`) to identify the canonical project root. If a workspace holds several projects or stale sibling checkouts, follow the user's path and the project instructions; ask if the target remains ambiguous.
+
+Use `explore` / `explorer` sub-agents for independent read-only reconnaissance. Give each child one bounded question with the project root and expected evidence shape. Use RLM for long inputs or many semantic slices, not basic path discovery.
 
 ## RLM Is a Specialty Tool
 
-`rlm` is for one specific shape of work: a long input that genuinely does not fit in your context (a whole file > ~50K tokens, a long transcript, a multi-document corpus). Reach for it ONLY when direct reasoning over the input is impossible because of its size. For everything else — short inputs, focused questions, parallel exploration — use `read_file`, `grep_files`, or `agent_spawn` instead.
+Persistent RLM sessions are for one specific shape of work: a long input that genuinely does not fit in your context (a whole file > ~50K tokens, a long transcript, a multi-document corpus) or a batch of many semantic sub-questions that is cleaner in Python. Reach for RLM only when direct reasoning over the input is impossible or wasteful. For everything else — short inputs, focused questions, parallel exploration — use `read_file`, `grep_files`, or `agent_open` instead.
 
-When you do use `rlm`, ask bounded questions with explicit inputs and expected output shape. The result is advisory — ground decisions in local files, live tool output, and passing verification before claiming completion.
+When you do use RLM, open a named context with `rlm_open`, run bounded code with `rlm_eval`, read large `var_handle` results with `handle_read`, and close the context with `rlm_close`. Results are advisory — ground decisions in local files, live tool output, and passing verification before claiming completion.
 
-The Python helpers visible inside the REPL (`llm_query`, `llm_query_batched`, `rlm_query`, `rlm_query_batched`) are NOT separately-callable tools — they are functions the sub-agent uses inside its Python code.
+RLM works by keeping the long input and intermediate values as symbolic REPL state. Inspect bounded slices, transform with Python, batch child calls programmatically, and avoid copying the whole body back into the root prompt.
+
+The Python helpers visible inside the REPL (`sub_query`, `sub_query_batch`, `sub_query_map`, `sub_rlm`, `finalize`, and related context helpers) are NOT separately-callable tools — they are functions the sub-agent uses inside its Python code.
 
 ## Context
 You have a 1 M-token context window. When usage creeps above ~80%, suggest `/compact` to the user — it summarises earlier turns so you can keep working without losing thread.
@@ -29,14 +37,15 @@ Model notes: DeepSeek V4 models emit *thinking tokens* (`ContentBlock::Thinking`
 
 ## Toolbox (fast reference — tool descriptions are authoritative)
 
-- **Planning / tracking**: `update_plan` (high-level strategy), `task_create` / `task_list` / `task_read` / `task_cancel` (durable work objects), `checklist_write` (granular progress under the active task/thread), `checklist_add` / `checklist_update` / `checklist_list`, `todo_*` aliases (legacy compatibility), `note` (persistent memory).
+- **Planning / tracking**: `checklist_write` (primary Work progress under the active task/thread), `checklist_add` / `checklist_update` / `checklist_list`, `update_plan` (optional high-level strategy metadata for complex initiatives), `task_create` / `task_list` / `task_read` / `task_cancel` (durable work objects), `todo_*` aliases (legacy compatibility), `note` (persistent memory).
 - **File I/O**: `read_file` (PDFs auto-extracted), `list_dir`, `write_file`, `edit_file`, `apply_patch`, `retrieve_tool_result` for prior spilled large tool outputs.
 - **Shell**: `task_shell_start` + `task_shell_wait` for long-running commands, diagnostics, tests, searches, and servers; `exec_shell` for bounded cancellable foreground commands; `exec_shell_wait`, `exec_shell_interact`.
 - **Task evidence**: `task_gate_run` for verification gates; `pr_attempt_record` / `pr_attempt_list` / `pr_attempt_read` / `pr_attempt_preflight`; `github_issue_context` / `github_pr_context` (read-only); `github_comment` / `github_close_issue` (approval + evidence required); `automation_*` scheduling tools.
 - **Structured search**: `grep_files`, `file_search`, `web_search`, `fetch_url`, `web.run` (browse).
 - **Git / diag / tests**: `git_status`, `git_diff`, `git_show`, `git_log`, `git_blame`, `diagnostics`, `run_tests`, `review`.
-- **Sub-agents**: `agent_spawn` (`spawn_agent`, `delegate_to_agent`), `agent_result`, `agent_cancel` (`close_agent`), `agent_list`, `agent_wait` (`wait`), `agent_send_input` (`send_input`), `agent_assign` (`assign_agent`), `resume_agent`.
-- **Recursive LM (long inputs / parallel reasoning)**: `rlm` — load a file/string as `context` in a Python REPL, sub-agent writes Python that calls `llm_query`/`llm_query_batched`/`rlm_query` to chunk, compare, critique, and synthesize; returns the synthesized answer. Read-only.
+- **Sub-agents**: `agent_open`, `agent_eval`, `agent_close`. Fresh sessions are the default; use `fork_context: true` when multiple perspectives need the current parent context and byte-identical prefill/prompt prefix for DeepSeek prefix-cache reuse.
+- **Recursive LM (long inputs / parallel reasoning)**: `rlm_open`, `rlm_eval`, `rlm_configure`, `rlm_close` — open a named Python REPL over a file/string/URL, run deterministic and semantic analysis, return compact results or `var_handle`s, then close when done.
+- **Large symbolic outputs**: `handle_read` — read bounded slices, counts, ranges, or JSONPath projections from returned `var_handle`s.
 - **Other**: `code_execution` (Python sandbox), `validate_data` (JSON/TOML), `request_user_input`, `finance` (market quotes), `tool_search_tool_regex`, `tool_search_tool_bm25` (deferred tool discovery).
 
 Multiple `tool_calls` in one turn run in parallel. `web_search` returns `ref_id`s — cite as `(ref_id)`.
diff --git a/crates/tui/src/prompts/compact.md b/crates/tui/src/prompts/compact.md
index afeea91e..aa3f5394 100644
--- a/crates/tui/src/prompts/compact.md
+++ b/crates/tui/src/prompts/compact.md
@@ -1,4 +1,4 @@
-## Compaction Handoff
+## Compaction Relay
 
 The conversation above this point has been compacted. Below is a structured summary of what was discussed and decided. Read this first — it replaces re-reading the compressed transcript.
 
diff --git a/crates/tui/src/prompts/modes/agent.md b/crates/tui/src/prompts/modes/agent.md
index 7b26a3d0..5e8d9f2b 100644
--- a/crates/tui/src/prompts/modes/agent.md
+++ b/crates/tui/src/prompts/modes/agent.md
@@ -2,14 +2,15 @@
 
 You are running in Agent mode — autonomous task execution with tool access.
 
-Read-only tools (reads, searches, `rlm`, agent status queries, git inspection) run silently.
-Any write, patch, shell execution, sub-agent spawn, or CSV batch operation will ask for approval first.
+Read-only tools (reads, searches, persistent RLM session tools, agent status queries, git inspection) run silently.
+Any write, patch, shell execution, sub-agent session open, or CSV batch operation will ask for approval first.
 
 Before requesting approval for writes, lay out your work with `checklist_write` so the user can see what
-you intend to do and approve with context. Complex changes should also get an `update_plan` first.
-Decomposition builds trust — a clear plan gets faster approvals.
+you intend to do and approve with context. Use `update_plan` only when a complex initiative needs
+high-level strategy metadata that is not just a copy of the checklist.
+Decomposition builds trust — a clear Work checklist gets faster approvals.
 
-For multi-step initiatives, use `update_plan` (high-level strategy) + `checklist_write` (granular steps).
+For multi-step initiatives, keep `checklist_write` current. Add `update_plan` only for genuinely useful strategy.
 
 ## Efficient Approvals
 
@@ -23,8 +24,8 @@ Don't sequence approvals one at a time — the user wants context, not interrupt
 ## Session Longevity
 
 Long sessions accumulate context. To stay fast:
-- Spawn sub-agents for independent work instead of doing everything sequentially
+- Open sub-agent sessions for independent work instead of doing everything sequentially
 - Batch reads/searches/git-inspections into parallel tool calls
-- Suggest `/compact` when context nears 80% — the compaction handoff preserves open blockers
+- Suggest `/compact` when context nears 80% — the compaction relay preserves open blockers
 - Use `note` for decisions you'll need across compaction boundaries
 - A 3-turn session that fans out to sub-agents finishes faster AND stays responsive longer than a 15-turn sequential grind
diff --git a/crates/tui/src/prompts/modes/plan.md b/crates/tui/src/prompts/modes/plan.md
index 8b854a4f..583058d0 100644
--- a/crates/tui/src/prompts/modes/plan.md
+++ b/crates/tui/src/prompts/modes/plan.md
@@ -2,8 +2,9 @@
 
 You are running in Plan mode — design before implementing.
 
-Investigate first, act later. Use `update_plan` to lay out high-level strategy and `checklist_write` for
-granular, verifiable steps. All writes and patches are blocked — you can read the world but you
+Investigate first, act later. Use `checklist_write` for visible, granular progress. Add `update_plan`
+only when high-level strategy adds value beyond the checklist.
+All writes and patches are blocked — you can read the world but you
 can't change it. Shell and code execution are unavailable.
 
 Use this mode to build a thorough plan. Spawn read-only sub-agents for parallel investigation.
diff --git a/crates/tui/src/prompts/modes/yolo.md b/crates/tui/src/prompts/modes/yolo.md
index 804fe7b0..d6572b90 100644
--- a/crates/tui/src/prompts/modes/yolo.md
+++ b/crates/tui/src/prompts/modes/yolo.md
@@ -7,4 +7,5 @@ overwrite user work, or run destructive commands, pause and double-check. The un
 
 Even with auto-approval, create a `checklist_write` first so your work is visible and trackable in the
 sidebar. Decomposition is not red tape — it's how you organize complex work and demonstrate thoroughness.
-For multi-step initiatives, use `update_plan` + `checklist_write` together.
+For multi-step initiatives, keep `checklist_write` current. Add `update_plan` only when a high-level strategy
+would help, and do not duplicate the checklist there.
diff --git a/crates/tui/src/repl/runtime.rs b/crates/tui/src/repl/runtime.rs
index 73f64bd9..f943e416 100644
--- a/crates/tui/src/repl/runtime.rs
+++ b/crates/tui/src/repl/runtime.rs
@@ -6,8 +6,9 @@
 //! `exec()`s them into the same global namespace so variables, imports,
 //! and even open file handles persist naturally across rounds.
 //!
-//! Sub-LLM helpers (`llm_query`, `llm_query_batched`, `rlm_query`,
-//! `rlm_query_batched`) are wired through a stdin/stdout RPC protocol:
+//! Sub-LLM helpers (`sub_query`, `sub_query_batch`, `sub_query_map`,
+//! `sub_rlm`, plus legacy `llm_query`, `llm_query_batched`, `rlm_query`,
+//! `rlm_query_batched`) are wired through a stdin/stdout RPC protocol:
 //! Python emits `__RLM_REQ_<sid>__::{json}` on stdout, Rust dispatches the
 //! request and writes `__RLM_RESP_<sid>__::{json}` back on stdin. No HTTP
 //! sidecar, no temp ports — the same pipes carry both control and data.
@@ -22,6 +23,7 @@ use std::process::Stdio;
 use std::time::{Duration, Instant};
 
 use serde::{Deserialize, Serialize};
+use serde_json::Value;
 use tokio::io::{AsyncBufReadExt, AsyncWriteExt, BufReader};
 use tokio::process::{Child, ChildStdin, ChildStdout, Command};
 use uuid::Uuid;
@@ -43,9 +45,11 @@ pub struct ReplRound {
     pub stderr: String,
     /// `True` if the user code raised an unhandled Python exception.
     pub has_error: bool,
-    /// Captured `FINAL(value)` payload, if any.
+    /// Captured `finalize(value, confidence=...)` payload, if any.
     pub final_value: Option<String>,
-    /// Number of `llm_query`/`rlm_query` RPCs the round issued.
+    /// Optional confidence supplied to `finalize(...)`.
+    pub final_confidence: Option<Value>,
+    /// Number of `sub_query`/`sub_rlm` RPCs the round issued.
     pub rpc_count: u32,
     /// Wall-clock duration of the round.
     pub elapsed: Duration,
@@ -173,8 +177,8 @@ impl PythonRuntime {
         )
     }
 
-    /// Spawn a REPL with `context` (and `ctx`) preloaded from a file. Used
-    /// by the RLM turn loop.
+    /// Spawn a REPL with the long input preloaded from a file. Used by the
+    /// RLM turn loop.
     pub async fn spawn_with_context(context_path: &Path) -> Result<Self, String> {
         Self::spawn_inner(Some(context_path), None).await
     }
@@ -310,6 +314,7 @@ impl PythonRuntime {
 
         let mut stdout_buf = String::new();
         let mut final_value: Option<String> = None;
+        let mut final_confidence: Option<Value> = None;
         let mut had_error = false;
         let mut rpc_count: u32 = 0;
         let round_timeout = self.round_timeout;
@@ -332,10 +337,35 @@ impl PythonRuntime {
                     break;
                 }
                 if let Some(rest) = trimmed.strip_prefix(&final_prefix) {
-                    // Stored as a JSON-encoded string.
-                    let v =
-                        serde_json::from_str::<String>(rest).unwrap_or_else(|_| rest.to_string());
-                    final_value = Some(v);
+                    // New sessions emit an object with value/confidence;
+                    // legacy helpers emitted a JSON string.
+                    match serde_json::from_str::<Value>(rest) {
+                        Ok(Value::Object(map)) => {
+                            let value = map
+                                .get("value")
+                                .and_then(Value::as_str)
+                                .map(str::to_string)
+                                .unwrap_or_else(|| {
+                                    map.get("value")
+                                        .map(Value::to_string)
+                                        .unwrap_or_else(|| rest.to_string())
+                                });
+                            final_value = Some(value);
+                            final_confidence = map.get("confidence").cloned();
+                        }
+                        Ok(Value::String(value)) => {
+                            final_value = Some(value);
+                            final_confidence = None;
+                        }
+                        Ok(other) => {
+                            final_value = Some(other.to_string());
+                            final_confidence = None;
+                        }
+                        Err(_) => {
+                            final_value = Some(rest.to_string());
+                            final_confidence = None;
+                        }
+                    }
                     continue;
                 }
                 if let Some(rest) = trimmed.strip_prefix(&err_prefix) {
@@ -399,6 +429,7 @@ impl PythonRuntime {
             stderr,
             has_error: had_error,
             final_value,
+            final_confidence,
             rpc_count,
             elapsed: started.elapsed(),
         })
@@ -493,6 +524,7 @@ fn render_bootstrap(session_id: &str) -> String {
 const BOOTSTRAP_TEMPLATE: &str = r#"
 import json as _json
 import os as _os
+import re as _re
 import sys as _sys
 import traceback as _traceback
 
@@ -574,16 +606,67 @@ def rlm_query_batched(prompts, model=None):
             out.append(r.get("text",""))
     return out
 
-def FINAL(value):
-    """Signal the loop to stop with this final answer."""
-    _sys.stdout.write(_FINAL + _json.dumps(str(value)) + "\n")
+def _slice_text(slice_value):
+    if slice_value is None:
+        return ""
+    if isinstance(slice_value, dict):
+        if "text" in slice_value:
+            return str(slice_value["text"])
+        return _json.dumps(slice_value, ensure_ascii=False)
+    return str(slice_value)
+
+def _prompt_with_slice(prompt, slice_value):
+    text = _slice_text(slice_value)
+    if not text:
+        return str(prompt)
+    if isinstance(slice_value, dict) and ("index" in slice_value or ("start" in slice_value and "end" in slice_value)):
+        label = f"slice index={slice_value.get('index', '?')} range={slice_value.get('start', '?')}:{slice_value.get('end', '?')}"
+    else:
+        label = "slice"
+    return f"{prompt}\n\n--- {label} ---\n{text}"
+
+def sub_query(prompt, slice=None):
+    """One child LLM call, optionally scoped to a bounded slice."""
+    return llm_query(_prompt_with_slice(prompt, slice))
+
+def sub_query_batch(prompt, slices):
+    """Apply one prompt to many bounded slices concurrently."""
+    if not isinstance(slices, (list, tuple)):
+        return ["[sub_query_batch: slices must be a list]"]
+    return llm_query_batched([_prompt_with_slice(prompt, s) for s in slices])
+
+def sub_query_map(prompts, slices=None):
+    """Run N distinct prompts, optionally paired with N bounded slices."""
+    if not isinstance(prompts, (list, tuple)):
+        return ["[sub_query_map: prompts must be a list]"]
+    if slices is None:
+        return llm_query_batched([str(p) for p in prompts])
+    if not isinstance(slices, (list, tuple)):
+        return ["[sub_query_map: slices must be a list]"]
+    if len(prompts) != len(slices):
+        return [f"[sub_query_map: size mismatch ({len(prompts)}/{len(slices)})]" for _ in prompts]
+    return llm_query_batched([_prompt_with_slice(p, s) for p, s in zip(prompts, slices)])
+
+def sub_rlm(prompt, source=None):
+    """Recursive sub-RLM call for tasks that need their own decomposition."""
+    return rlm_query(_prompt_with_slice(prompt, source))
+
+def _emit_final(value, confidence=None):
+    _sys.stdout.write(_FINAL + _json.dumps({
+        "value": str(value),
+        "confidence": confidence,
+    }) + "\n")
     _sys.stdout.flush()
 
+def FINAL(value):
+    """Legacy compatibility alias for finalize(value)."""
+    _emit_final(value)
+
 def FINAL_VAR(name):
-    """Signal the loop to stop, returning the value of a named variable."""
+    """Legacy compatibility alias for finalize(repl_get(name))."""
     name_str = str(name).strip().strip("'\"")
     if name_str in globals():
-        FINAL(globals()[name_str])
+        _emit_final(globals()[name_str])
     else:
         print(f"FINAL_VAR error: variable '{name_str}' not found. "
               f"Use SHOW_VARS() to list available variables.", flush=True)
@@ -603,8 +686,61 @@ def repl_get(name, default=None):
 def repl_set(name, value):
     globals()[str(name)] = value
 
-def chunk_context(max_chars=20000, overlap=0):
-    """Return full-coverage context chunks with index/start/end/text fields."""
+def context_meta():
+    """Return bounded metadata about the loaded input; never includes the full text."""
+    text = _context
+    line_count = 0 if text == "" else text.count("\n") + (0 if text.endswith("\n") else 1)
+    return {
+        "chars": len(text),
+        "lines": line_count,
+        "preview": text[:500],
+        "tail_preview": text[-500:] if len(text) > 500 else text,
+    }
+
+def _slice_chars(start, end):
+    total = len(_context)
+    s = max(0, int(start))
+    e = max(s, min(total, int(end)))
+    return _context[s:e]
+
+def _slice_lines(start, end):
+    lines = _context.splitlines()
+    s = max(0, int(start))
+    e = max(s, min(len(lines), int(end)))
+    return "\n".join(lines[s:e])
+
+def peek(start, end, unit="chars"):
+    """Return a bounded slice of the input by char offsets or line numbers."""
+    if str(unit).lower() in ("line", "lines"):
+        return _slice_lines(start, end)
+    if str(unit).lower() not in ("char", "chars"):
+        raise ValueError("unit must be 'chars' or 'lines'")
+    return _slice_chars(start, end)
+
+def search(pattern, max_hits=100):
+    """Regex-search the input and return bounded hit records with snippets."""
+    max_hits = max(0, int(max_hits))
+    hits = []
+    if max_hits == 0:
+        return hits
+    rx = _re.compile(str(pattern), _re.MULTILINE)
+    for i, m in enumerate(rx.finditer(_context)):
+        if i >= max_hits:
+            break
+        start, end = m.span()
+        snippet_start = max(0, start - 120)
+        snippet_end = min(len(_context), end + 120)
+        hits.append({
+            "index": i,
+            "start": start,
+            "end": end,
+            "match": m.group(0),
+            "snippet": _context[snippet_start:snippet_end],
+        })
+    return hits
+
+def chunk(max_chars=20000, overlap=0):
+    """Return full-coverage input chunks with index/start/end/text fields."""
     max_chars = int(max_chars)
     overlap = max(0, int(overlap))
     if max_chars <= 0:
@@ -614,18 +750,22 @@ def chunk_context(max_chars=20000, overlap=0):
     chunks = []
     start = 0
     idx = 0
-    total = len(context)
+    total = len(_context)
     while start < total:
         end = min(total, start + max_chars)
-        chunks.append({"index": idx, "start": start, "end": end, "text": context[start:end]})
+        chunks.append({"index": idx, "start": start, "end": end, "text": _context[start:end]})
         idx += 1
         if end >= total:
             break
         start = end - overlap
     return chunks
 
+def chunk_context(max_chars=20000, overlap=0):
+    """Compatibility name: forwards both arguments unchanged to chunk()."""
+    return chunk(max_chars, overlap)
+
 def chunk_coverage(chunks):
-    """Summarize coverage for chunks produced by chunk_context()."""
+    """Summarize coverage for chunks produced by chunk()."""
     spans = []
     for c in chunks:
         try:
@@ -642,36 +782,59 @@ def chunk_coverage(chunks):
         if end > cursor:
             covered += end - max(start, cursor)
             cursor = end
-    if cursor < len(context):
-        gaps.append((cursor, len(context)))
+    if cursor < len(_context):
+        gaps.append((cursor, len(_context)))
     return {
         "chunks": len(chunks),
-        "context_chars": len(context),
+        "context_chars": len(_context),
+        "input_chars": len(_context),
         "covered_chars": covered,
         "gaps": gaps,
-        "complete": covered >= len(context) and not gaps,
+        "complete": covered >= len(_context) and not gaps,
     }
 
-# Load the long input as `context` (and `ctx`) from a file. This keeps the
-# big string out of the process command-line and out of the LLM's window.
+def finalize(value, confidence=None):
+    """Store str(value) and confidence in module globals, pass them to _emit_final, return the text."""
+    global final_answer, final_confidence, final_result
+    answer_text = str(value)
+    # evaluate_progress() reads these globals, so set them before emitting.
+    final_answer = answer_text
+    final_confidence = confidence
+    # Keep a combined record alongside the two individual globals.
+    final_result = dict(value=answer_text, confidence=confidence)
+    _emit_final(answer_text, confidence=confidence)
+    return answer_text
+
+def evaluate_progress():
+    """Report whether final_answer is set, the stored confidence, and the SHOW_VARS() result."""
+    user_vars = SHOW_VARS()
+    scope = globals()
+    state = {"has_final_answer": "final_answer" in scope}
+    state["final_confidence"] = scope.get("final_confidence")
+    state["user_variables"] = user_vars
+    return state
+
+# Load the long input from a file. This keeps the big string out of the
+# process command-line and out of the LLM's window.
 _ctx_file = _os.environ.get("RLM_CONTEXT_FILE","")
-context = ""
+_context = ""
 if _ctx_file:
     try:
         with open(_ctx_file, "r", encoding="utf-8", errors="replace") as f:
-            context = f.read()
+            _context = f.read()
     except Exception as e:
         _sys.stderr.write(f"[bootstrap] failed to load context: {e}\n")
-ctx = context  # short alias matching aleph
 
 _BOOTSTRAP_NAMES = {
     "_SID","_REQ","_RESP","_FINAL","_ERR","_RUN","_END","_DONE","_READY",
-    "_rpc","_ctx_file","_BOOTSTRAP_NAMES","_main_loop",
+    "_rpc","_ctx_file","_context","_slice_chars","_slice_lines","_BOOTSTRAP_NAMES","_main_loop",
+    "_emit_final","_slice_text","_prompt_with_slice",
     "llm_query","llm_query_batched","rlm_query","rlm_query_batched",
+    "sub_query","sub_query_batch","sub_query_map","sub_rlm",
     "FINAL","FINAL_VAR","SHOW_VARS","repl_get","repl_set",
-    "chunk_context","chunk_coverage",
-    "context","ctx",
-    "_json","_os","_sys","_traceback",
+    "context_meta","peek","search","chunk","chunk_context","chunk_coverage",
+    "finalize","evaluate_progress",
+    "_json","_os","_re","_sys","_traceback",
 }
 
 def _main_loop():
@@ -829,7 +992,7 @@ mod tests {
             .await
             .expect("spawn");
         let round = rt
-            .execute("print(len(context), context[:5])")
+            .execute("print(context_meta()['chars'], peek(0, 5))")
             .await
             .expect("execute");
         assert!(round.stdout.contains("19"));
@@ -838,13 +1001,16 @@ mod tests {
     }
 
     #[tokio::test]
-    async fn ctx_alias_works() {
+    async fn context_aliases_are_not_bound() {
         let path = write_temp_context("aleph-style");
         let mut rt = PythonRuntime::spawn_with_context(&path)
             .await
             .expect("spawn");
-        let round = rt.execute("print(ctx)").await.expect("execute");
-        assert!(round.stdout.contains("aleph-style"));
+        let round = rt
+            .execute("print('context' in globals(), 'ctx' in globals())")
+            .await
+            .expect("execute");
+        assert!(round.stdout.contains("False False"));
         rt.shutdown().await;
     }
 
@@ -866,6 +1032,67 @@ mod tests {
         rt.shutdown().await;
     }
 
+    #[tokio::test]
+    async fn bounded_input_helpers_work() {
+        // Fixture: 36 chars on 4 lines; "beta needle" sits at chars 6..17.
+        let path = write_temp_context("alpha\nbeta needle\ngamma needle\nomega");
+        let mut rt = PythonRuntime::spawn_with_context(&path)
+            .await
+            .expect("spawn");
+        let script = "meta = context_meta()\n\
+                      hits = search('needle', max_hits=1)\n\
+                      print(meta['chars'], meta['lines'])\n\
+                      print(peek(6, 17))\n\
+                      print(peek(1, 3, unit='lines'))\n\
+                      print(len(hits), hits[0]['match'], hits[0]['start'])";
+        let round = rt.execute(script).await.expect("execute");
+        let out = &round.stdout;
+        // One expected fragment per print() call, in script order.
+        let expected = [
+            "36 4",
+            "beta needle",
+            "beta needle\ngamma needle",
+            "1 needle 11",
+        ];
+        for fragment in expected {
+            assert!(out.contains(fragment), "{}", out);
+        }
+        rt.shutdown().await;
+    }
+
+    #[tokio::test]
+    async fn new_chunk_helper_reports_full_coverage() {
+        // 26 chars split at max_chars=10 with no overlap gives three chunks.
+        let path = write_temp_context("abcdefghijklmnopqrstuvwxyz");
+        let mut rt = PythonRuntime::spawn_with_context(&path)
+            .await
+            .expect("spawn");
+        let script = "chunks = chunk(max_chars=10)\n\
+                      coverage = chunk_coverage(chunks)\n\
+                      print(len(chunks), coverage['input_chars'], coverage['covered_chars'], coverage['complete'])";
+        let round = rt.execute(script).await.expect("execute");
+        let out = &round.stdout;
+        // Printed fields, in order: chunk count, input size, covered size,
+        // and the completeness flag.
+        assert!(out.contains("3 26 26 True"), "{}", out);
+        rt.shutdown().await;
+    }
+
+    #[tokio::test]
+    async fn finalize_helper_is_captured_directly() {
+        let mut rt = PythonRuntime::new().await.expect("spawn");
+        let script = "finalize('computed answer', confidence='high')";
+        let round = rt.execute(script).await.expect("execute");
+        // The answer text is surfaced as the round's final value.
+        let answer = round.final_value.as_deref();
+        assert_eq!(answer, Some("computed answer"));
+        // The confidence keyword argument is surfaced next to it; read it
+        // back as a string for the comparison.
+        let confidence = round.final_confidence.as_ref().and_then(Value::as_str);
+        assert_eq!(confidence, Some("high"));
+        rt.shutdown().await;
+    }
+
     #[tokio::test]
     async fn rlm_context_runtime_has_no_fixed_round_timeout() {
         let path = write_temp_context("long input");
@@ -887,7 +1114,7 @@ mod tests {
     }
 
     #[tokio::test]
-    async fn final_is_captured() {
+    async fn legacy_final_is_captured() {
         let mut rt = PythonRuntime::new().await.expect("spawn");
         let round = rt
             .execute("FINAL('the answer is 42')")
@@ -898,7 +1125,7 @@ mod tests {
     }
 
     #[tokio::test]
-    async fn final_var_is_captured() {
+    async fn legacy_final_var_is_captured() {
         let mut rt = PythonRuntime::new().await.expect("spawn");
         rt.execute("answer = 'computed'").await.expect("r1");
         let round = rt.execute("FINAL_VAR('answer')").await.expect("r2");
@@ -945,6 +1172,33 @@ mod tests {
         rt.shutdown().await;
     }
 
+    #[tokio::test]
+    async fn rpc_dispatcher_round_trips_sub_query_alias() {
+        let bridge = StubBridge::new();
+        // Keep a second handle to the call log; the bridge itself is only
+        // lent to the runtime below.
+        let calls = Arc::clone(&bridge.calls);
+
+        let mut rt = PythonRuntime::new().await.expect("spawn");
+        let script = "print(sub_query('hello from sub'))";
+        let round = rt.run(script, Some(&bridge)).await.expect("execute");
+        let out = &round.stdout;
+        assert!(out.contains("stub#0: hello from sub"), "stdout: {:?}", out);
+        assert_eq!(round.rpc_count, 1);
+
+        {
+            // Scope the guard so the lock on the call log is released
+            // before the runtime shuts down.
+            let recorded = calls.lock().await;
+            assert_eq!(recorded.len(), 1);
+            match &recorded[0] {
+                RpcRequest::Llm { prompt, .. } => assert_eq!(prompt, "hello from sub"),
+                other => panic!("expected Llm request, got {other:?}"),
+            }
+        }
+        rt.shutdown().await;
+    }
+
     #[tokio::test]
     async fn rpc_dispatcher_round_trips_batch() {
         let bridge = StubBridge::new();
diff --git a/crates/tui/src/rlm/mod.rs b/crates/tui/src/rlm/mod.rs
index 44959983..4b48dc22 100644
--- a/crates/tui/src/rlm/mod.rs
+++ b/crates/tui/src/rlm/mod.rs
@@ -26,6 +26,7 @@ use crate::models::Usage;
 
 pub mod bridge;
 pub mod prompt;
+pub mod session;
 pub mod turn;
 
 pub use bridge::RlmBridge;
diff --git a/crates/tui/src/rlm/prompt.rs b/crates/tui/src/rlm/prompt.rs
index 39f5d6cd..91db97e3 100644
--- a/crates/tui/src/rlm/prompt.rs
+++ b/crates/tui/src/rlm/prompt.rs
@@ -11,74 +11,90 @@ pub fn rlm_system_prompt() -> SystemPrompt {
     SystemPrompt::Text(RLM_SYSTEM_PROMPT.trim().to_string())
 }
 
-const RLM_SYSTEM_PROMPT: &str = r#"You are the root of a Recursive Language Model (RLM). Your input lives in a long-running Python REPL as a variable named `context` (alias `ctx`). You DO NOT see `context` in your prompt — only its length and a short preview. The only way to read or compute over it is to write Python code that runs in the REPL.
+const RLM_SYSTEM_PROMPT: &str = r#"You are the root of a Recursive Language Model (RLM). The input is loaded into a long-running Python REPL. You hold a live context handle, not the raw body. Read only through bounded helpers, compute in Python, and delegate semantic judgment to child calls.
+
+The point is symbolic recursion. Keep the long prompt and large intermediate strings in REPL variables; the neural model should see metadata, bounded slices, code, and compact stdout. Do not copy the whole input into the root history, and do not verbalize a long list of child calls when Python can construct and launch them in a loop.
 
 The REPL exposes:
-- `context` (alias `ctx`) — the full input string. Often huge — never `print(context)` in full.
-- `llm_query(prompt, model=None, max_tokens=None, system=None)` — one-shot child LLM. Cheap. Use for chunk-level work. The `model` argument is accepted for compatibility but child calls stay pinned to the configured Flash child model.
-- `llm_query_batched(prompts, model=None)` — concurrent fan-out. Returns `list[str]` in input order. The `model` argument is accepted for compatibility but ignored.
-- `rlm_query(prompt, model=None)` — recursive sub-RLM. Use when a sub-task itself needs decomposition. The `model` argument is accepted for compatibility but ignored.
-- `rlm_query_batched(prompts, model=None)` — concurrent recursive sub-RLMs. The `model` argument is accepted for compatibility but ignored.
-- `chunk_context(max_chars=20000, overlap=0)` — full-coverage chunks with index/start/end/text fields.
-- `chunk_coverage(chunks)` — coverage summary for chunks produced by `chunk_context`.
-- `SHOW_VARS()` — list user variables and their types.
-- `repl_set(name, value)` / `repl_get(name)` — explicit cross-round storage.
-- `print(...)` — diagnostic output. The driver feeds you a truncated preview next round.
-- `FINAL(value)` — end the loop with this string answer.
-- `FINAL_VAR(name)` — end the loop with the value of a named variable.
+- `context_meta()` - bounded metadata: char count, line count, preview, tail preview.
+- `peek(start, end, unit="chars")` - bounded slice by char offsets or line numbers.
+- `search(pattern, max_hits=100)` - regex search returning bounded hit records with snippets.
+- `chunk(max_chars=20000, overlap=0)` - full-coverage chunks with index/start/end/text fields.
+- `chunk_coverage(chunks)` - coverage summary for chunks produced by `chunk`.
+- `sub_query(prompt, slice=None)` - one child LLM call, optionally scoped to one bounded slice.
+- `sub_query_batch(prompt, slices)` - apply one prompt to many bounded slices concurrently.
+- `sub_query_map(prompts, slices=None)` - run N distinct prompts, optionally paired with N bounded slices.
+- `sub_rlm(prompt, source=None)` - recursive sub-RLM for a sub-task that needs its own decomposition. Pass a bounded source, not the whole body.
+- `SHOW_VARS()` - list user variables and their types.
+- `repl_set(name, value)` / `repl_get(name)` - explicit cross-round storage.
+- `evaluate_progress()` - inspect whether a final answer exists and what variables are available.
+- `finalize(value, confidence=None)` - end the loop with a final answer and optional confidence.
+- `print(...)` - diagnostic output. The driver feeds you a truncated preview next round.
 
-Variables, imports, and any other state PERSIST across rounds — the REPL is a single long-lived Python process for the whole turn.
+Variables, imports, and any other state persist across rounds. There is no `context` or `ctx` variable. Use `peek`, `search`, `chunk`, and `context_meta`.
 
-Contract — every turn, output ONE ` ```repl ` block of Python. That's it. No prose-only turns. No "I will do X" — just emit the code that does X.
+Contract: every turn, output exactly one ` ```repl ` block of Python and nothing else. No prose-only turns. No "I will do X"; emit the code that does X.
 
-Strategy patterns
+Five-phase skeleton
 
-1. PREVIEW first.
+1. Load
 ```repl
-print(f"len(context) = {len(context)}")
-print(context[:500])
+meta = context_meta()
+print(meta)
 ```
+Confirm the handle shape. Do not re-load the body. Keep the head small: names and metadata only.
 
-2. CHUNK + map-reduce with batched concurrent calls.
+2. Orient
 ```repl
-chunk_size = 8000
-chunks = chunk_context(max_chars=chunk_size)
+hits = search(r"term|phrase", max_hits=20)
+sample = peek(0, min(meta["chars"], 1200))
+print({"hits": len(hits), "sample": sample[:300]})
+```
+Search before peeking. Pull only the slices you need. Store maps of the input as variables: headers, regions, sections, candidate spans.
+
+3. Compute
+```repl
+chunks = chunk(max_chars=12000, overlap=400)
 coverage = chunk_coverage(chunks)
-prompts = [f"Extract any mentions of X from section {c['index']} ({c['start']}:{c['end']}):\n\n{c['text']}" for c in chunks]
-partials = llm_query_batched(prompts)
+partials = sub_query_batch(
+    "Extract the facts needed for the user's question from this slice. "
+    "Return only grounded facts and cite the slice index/range.",
+    chunks,
+)
+print({"coverage": coverage, "partials": len(partials)})
+```
+Use deterministic Python first for counts, regex, parsing, sorting, dedupe, joins, and coverage. You do NO math by asking a child model to count; if Python can enumerate, parse, or simulate it exactly, do that in Python.
+
+4. Recurse
+```repl
 combined = "\n\n".join(partials)
-answer = llm_query(f"Coverage: {coverage}\n\nSynthesize across these section-level extractions:\n\n{combined}")
-print(answer[:500])
-```
-Then on the next turn:
-```repl
-FINAL(answer)
+analysis = sub_rlm(
+    "Synthesize these section findings into a precise answer. "
+    "Call out conflicts and missing coverage.",
+    source=combined,
+)
+print(analysis[:800])
 ```
+Use `sub_rlm` only when the sub-task itself needs decomposition or critique. Pass slices or compact variables, not the whole body. Memoize recursive results in variables.
 
-3. RECURSIVE decomposition for hard sub-problems.
+5. Converge
 ```repl
-trend = rlm_query(f"Analyze this dataset and conclude with one word — up, down, or stable: {data}")
-recommendation = "Hold" if "stable" in trend.lower() else ("Hedge" if "down" in trend.lower() else "Increase")
-print(trend, "→", recommendation)
-```
-
-4. PROGRAMMATIC computation + LLM interpretation.
-```repl
-import math
-theta = math.degrees(math.atan2(v_perp, v_parallel))
-final_answer = llm_query(f"Entry angle is {theta:.2f}°. Phrase the answer for a physics student.")
-FINAL(final_answer)
+progress = evaluate_progress()
+finalize(
+    f"{analysis}\n\nCoverage: {coverage['covered_chars']}/{coverage['input_chars']} chars "
+    f"across {coverage['chunks']} chunks; complete={coverage['complete']}.",
+    confidence="medium" if coverage["complete"] else "low",
+)
 ```
+Call `evaluate_progress()` if the answer is not stable. Loop back to Orient or Compute when coverage is incomplete or confidence is low. Call `finalize(...)` only when the answer is supported by variables you can inspect.
 
 Rules
 
-- Emit exactly ONE ` ```repl ` block per turn. The block must contain Python code only.
-- Never `print(context)` or otherwise dump it whole — slice, sample, or chunk.
-- You MUST call `llm_query` / `llm_query_batched` / `rlm_query` at least once before `FINAL(...)`. Calling FINAL from a top-level prose answer (without ever running a `repl` block that touched `context` via a sub-LLM) is REJECTED — the driver will discard the FINAL and ask you to actually use the REPL.
-- Sub-LLMs are powerful — feed them generous chunks (tens of thousands of chars), not tiny windows.
-- For exact counts, package totals, line totals, or other structured aggregates, compute them with Python over `context` directly. Do not ask a child LLM to count.
-- For whole-input map-reduce, report coverage in the final answer: chunks processed, total chunks, and whether every line/char range was included. If you only processed a subset, say that explicitly.
-- Do NOT pad your output with prose like "Here is what I'll do:" — just emit the next ```repl block.
+- Use the bounded helpers (`context_meta`, `peek`, `search`, `chunk`) to inspect input.
+- Use `sub_query`, `sub_query_batch`, `sub_query_map`, or `sub_rlm` before finalizing unless the task is purely deterministic and fully computed in Python.
+- End only by calling `finalize(value, confidence=...)`.
+- For exact counts, totals, parsing, and structured aggregates, compute with Python. Do not ask a child LLM to count.
+- For whole-input map-reduce, include coverage in the final answer: chunks processed, total chunks, and whether every char range was included. If you only processed a subset, say that explicitly.
 "#;
 
 #[cfg(test)]
@@ -103,49 +119,66 @@ mod tests {
     }
 
     #[test]
-    fn rlm_prompt_mentions_context_variable() {
-        assert!(body().contains("`context`"));
-    }
-
-    #[test]
-    fn rlm_prompt_mentions_ctx_alias() {
-        assert!(body().contains("`ctx`"));
+    fn rlm_prompt_uses_five_phase_skeleton() {
+        let s = body();
+        for phase in ["Load", "Orient", "Compute", "Recurse", "Converge"] {
+            assert!(s.contains(phase), "system prompt missing phase: {phase}");
+        }
     }
 
     #[test]
     fn rlm_prompt_mentions_all_helpers() {
         let s = body();
         for name in [
-            "llm_query",
-            "llm_query_batched",
-            "rlm_query",
-            "rlm_query_batched",
-            "chunk_context",
+            "peek",
+            "search",
+            "chunk",
             "chunk_coverage",
+            "context_meta",
+            "sub_query",
+            "sub_query_batch",
+            "sub_query_map",
+            "sub_rlm",
+            "finalize",
+            "evaluate_progress",
             "SHOW_VARS",
-            "FINAL",
-            "FINAL_VAR",
         ] {
             assert!(s.contains(name), "system prompt missing helper: {name}");
         }
     }
 
     #[test]
-    fn rlm_prompt_forbids_prose_shortcut() {
-        // The new contract requires a sub-LLM call before FINAL — the
-        // prompt must say so explicitly so the model doesn't try to bail
-        // with FINAL("...inferred from preview...").
-        assert!(
-            body().contains("REJECTED") || body().contains("rejected"),
-            "system prompt should reject the prose-shortcut path explicitly"
-        );
+    fn rlm_prompt_does_not_publicize_context_variables() {
+        let s = body();
+        assert!(s.contains("There is no `context` or `ctx` variable"));
+        assert!(!s.contains("len(context)"));
+        assert!(!s.contains("chunk_context"));
+        assert!(!s.contains("llm_query"));
+        assert!(!s.contains("rlm_query"));
+    }
+
+    #[test]
+    fn rlm_prompt_is_finalize_only() {
+        let s = body();
+        assert!(s.contains("finalize(value"));
+        assert!(!s.contains("FINAL_VAR"));
+        assert!(!s.contains("FINAL(value)"));
+        assert!(!s.contains("FINAL("));
     }
 
     #[test]
     fn rlm_prompt_requires_deterministic_counts_and_coverage() {
         let s = body();
-        assert!(s.contains("compute them with Python"));
-        assert!(s.contains("report coverage"));
+        assert!(s.contains("compute with Python"));
+        assert!(s.contains("include coverage"));
         assert!(s.contains("chunks processed"));
     }
+
+    #[test]
+    fn rlm_prompt_mentions_symbolic_state_contract() {
+        // Phrases the prompt must keep about holding state in the REPL.
+        let prompt = body();
+        let required = ["symbolic recursion", "REPL variables", "Do not copy the whole input"];
+        assert!(required.iter().all(|phrase| prompt.contains(phrase)));
+    }
 }
diff --git a/crates/tui/src/rlm/session.rs b/crates/tui/src/rlm/session.rs
new file mode 100644
index 00000000..71426863
--- /dev/null
+++ b/crates/tui/src/rlm/session.rs
@@ -0,0 +1,180 @@
+//! Persistent RLM session state for the v0.8.33 head/hands tool surface.
+
+use std::collections::HashMap;
+use std::path::{Path, PathBuf};
+use std::sync::Arc;
+use std::time::{Duration, Instant};
+
+use serde::{Deserialize, Serialize};
+use sha2::{Digest, Sha256};
+use tokio::sync::Mutex;
+use uuid::Uuid;
+
+use crate::repl::PythonRuntime;
+
+pub type SharedRlmSessionStore = Arc<Mutex<HashMap<String, Arc<Mutex<RlmSession>>>>>;
+
+#[must_use]
+pub fn new_shared_rlm_session_store() -> SharedRlmSessionStore {
+    SharedRlmSessionStore::default() // empty map behind Arc<Mutex<..>>
+}
+
+#[derive(Debug)]
+pub struct RlmSession {
+    pub name: String, // caller-supplied label, stored as passed to `new`
+    pub id: String, // "rlm:" followed by a simple-format UUID v4
+    pub kernel: Option<PythonRuntime>, // `new` always stores `Some(kernel)`
+    pub context_meta: ContextMeta, // length/preview/hash record, see `ContextMeta`
+    pub config: RlmSessionConfig, // starts as `RlmSessionConfig::default()`
+    pub rpc_count: u32, // starts at 0
+    pub total_duration: Duration, // starts at `Duration::ZERO`
+    pub peak_var_count: usize, // starts at 0
+    pub final_count: usize, // starts at 0
+    pub created_at: Instant, // captured once in `new`
+    pub last_used_at: Instant, // `new` sets this equal to `created_at`
+    pub context_path: PathBuf, // presumably the file from `write_context_file` - confirm at call site
+}
+
+impl RlmSession {
+    #[must_use]
+    pub fn new(
+        name: String,
+        kernel: PythonRuntime,
+        context_meta: ContextMeta,
+        context_path: PathBuf,
+    ) -> Self {
+        let now = Instant::now(); // one reading shared by both timestamps below
+        Self {
+            name,
+            id: format!("rlm:{}", Uuid::new_v4().simple()), // fresh random id per session
+            kernel: Some(kernel),
+            context_meta,
+            config: RlmSessionConfig::default(),
+            rpc_count: 0, // all counters start from zero
+            total_duration: Duration::ZERO,
+            peak_var_count: 0,
+            final_count: 0,
+            created_at: now,
+            last_used_at: now,
+            context_path,
+        }
+    }
+}
+
+#[derive(Debug, Clone, Serialize, Deserialize)]
+pub struct ContextMeta {
+    pub length: usize, // `from_body` stores the char count, not the byte length
+    #[serde(rename = "type")]
+    pub type_name: String, // serialized under the key "type"
+    pub preview_500: String, // `from_body` keeps at most the first 500 chars
+    pub sha256: String, // lowercase hex SHA-256 of the body's bytes
+}
+
+impl ContextMeta {
+    #[must_use]
+    pub fn from_body(body: &str, type_name: impl Into<String>) -> Self {
+        Self {
+            length: body.chars().count(), // counts `char`s, not bytes
+            type_name: type_name.into(),
+            preview_500: body.chars().take(500).collect(), // at most the first 500 chars
+            sha256: sha256_hex(body.as_bytes()), // hash covers the UTF-8 bytes of `body`
+        }
+    }
+}
+
+#[derive(Debug, Clone, Copy, Serialize, Deserialize, PartialEq, Eq)]
+#[serde(rename_all = "snake_case")]
+pub enum OutputFeedback {
+    Full, // serialized as "full"; the value used by `RlmSessionConfig::default()`
+    Metadata, // serialized as "metadata"
+}
+
+#[derive(Debug, Clone, Serialize, Deserialize)]
+pub struct RlmSessionConfig {
+    pub output_feedback: OutputFeedback, // default: `OutputFeedback::Full`
+    pub sub_query_timeout_secs: u64, // seconds, per the field name; default: 120
+    pub sub_rlm_max_depth: u32, // default: 1
+    pub share_session: bool, // default: false
+}
+
+impl Default for RlmSessionConfig {
+    fn default() -> Self {
+        Self {
+            output_feedback: OutputFeedback::Full,
+            sub_query_timeout_secs: 120, // i.e. two minutes
+            sub_rlm_max_depth: 1,
+            share_session: false,
+        }
+    }
+}
+
+/// Persist `body` as a uniquely named file under `<temp>/deepseek_rlm_ctx`
+/// (created on demand) and return the new file's path.
+pub fn write_context_file(body: &str) -> std::io::Result<PathBuf> {
+    let dir = std::env::temp_dir().join("deepseek_rlm_ctx");
+    std::fs::create_dir_all(&dir)?;
+    let pid = std::process::id();
+    let nonce = Uuid::new_v4().simple();
+    let path = dir.join(format!("session_{pid}_{nonce}.txt"));
+    std::fs::write(&path, body)?;
+    Ok(path)
+}
+
+/// Slugify an optional path or label: lowercase the final path component,
+/// collapse other characters into single `_`, cap at 48 bytes, and fall back
+/// to `"context"` when nothing usable remains.
+#[must_use]
+pub fn derive_session_name(source_hint: Option<&str>) -> String {
+    let hint = match source_hint {
+        Some(raw) => Path::new(raw)
+            .file_name()
+            .and_then(|name| name.to_str())
+            .unwrap_or(raw),
+        None => "context",
+    };
+    let mut slug = String::with_capacity(48);
+    for ch in hint.chars() {
+        match ch {
+            c if c.is_ascii_alphanumeric() => slug.push(c.to_ascii_lowercase()),
+            _ if !slug.ends_with('_') => slug.push('_'),
+            _ => {}
+        }
+        if slug.len() >= 48 {
+            break;
+        }
+    }
+    match slug.trim_matches('_') {
+        "" => String::from("context"),
+        trimmed => trimmed.to_owned(),
+    }
+}
+
+/// Hash `bytes` with SHA-256 and render the digest as lowercase hex.
+fn sha256_hex(bytes: &[u8]) -> String {
+    let digest = Sha256::digest(bytes);
+    format!("{digest:x}")
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn derive_session_name_slugifies_path() {
+        // Only the file name is used; its space and dot both turn into `_`
+        // and the letters are lowercased.
+        let slug = derive_session_name(Some("src/Big File.rs"));
+        assert_eq!(slug, "big_file_rs");
+    }
+
+    #[test]
+    fn context_meta_hashes_and_previews_body() {
+        // A six-char body is shorter than the preview cap, so the preview
+        // is the whole body.
+        let expected_sha = "bef57ec7f53a6d40beb640a780a639c83bc29ac8a9816f1fc6c5c6dcd93c4721";
+        let meta = ContextMeta::from_body("abcdef", "text");
+        assert_eq!(meta.length, 6);
+        assert_eq!(meta.preview_500, "abcdef");
+        assert_eq!(meta.sha256, expected_sha);
+    }
+}
diff --git a/crates/tui/src/runtime_threads.rs b/crates/tui/src/runtime_threads.rs
index 742ef440..b556e030 100644
--- a/crates/tui/src/runtime_threads.rs
+++ b/crates/tui/src/runtime_threads.rs
@@ -1960,6 +1960,8 @@ impl RuntimeThreadManager {
                 active_thread_id: Some(thread.id.clone()),
                 shell_manager: None,
                 hook_executor: None,
+                handle_store: crate::tools::handle::new_shared_handle_store(),
+                rlm_sessions: crate::rlm::session::new_shared_rlm_session_store(),
             },
             subagent_model_overrides: self.config.subagent_model_overrides(),
             memory_enabled: self.config.memory_enabled(),
diff --git a/crates/tui/src/settings.rs b/crates/tui/src/settings.rs
index 18fec2ed..0df883a7 100644
--- a/crates/tui/src/settings.rs
+++ b/crates/tui/src/settings.rs
@@ -211,7 +211,7 @@ pub struct Settings {
     pub default_mode: String,
     /// Sidebar width as percentage of terminal width
     pub sidebar_width_percent: u16,
-    /// Sidebar focus mode: auto, plan, todos, tasks, agents, context
+    /// Sidebar focus mode: auto, work, tasks, agents, context
     pub sidebar_focus: String,
     /// Enable the session-context panel (#504). Shows working set, tokens,
     /// cost, MCP/LSP status, cycle count, and memory info.
@@ -555,13 +555,13 @@ impl Settings {
             "sidebar_focus" | "focus" => {
                 let normalized = match value.trim().to_ascii_lowercase().as_str() {
                     "auto" => "auto",
-                    "plan" => "plan",
-                    "todos" => "todos",
+                    "work" | "plan" | "todos" => "work",
                     "tasks" => "tasks",
                     "agents" | "subagents" | "sub-agents" => "agents",
+                    "context" | "session" => "context",
                     _ => {
                         anyhow::bail!(
-                            "Failed to update setting: invalid sidebar focus '{value}'. Expected: auto, plan, todos, tasks, agents."
+                            "Failed to update setting: invalid sidebar focus '{value}'. Expected: auto, work, tasks, agents, context."
                         )
                     }
                 };
@@ -732,7 +732,7 @@ impl Settings {
             ("sidebar_width", "Sidebar width percentage: 10-50"),
             (
                 "sidebar_focus",
-                "Sidebar focus: auto, plan, todos, tasks, agents",
+                "Sidebar focus: auto, work, tasks, agents, context",
             ),
             ("cost_currency", "Cost display currency: usd, cny"),
             ("max_history", "Max input history entries"),
@@ -886,8 +886,7 @@ fn normalize_background_color_setting(value: &str) -> Result<Option<String>> {
 
 fn normalize_sidebar_focus(value: &str) -> &str {
     match value.trim().to_ascii_lowercase().as_str() {
-        "plan" => "plan",
-        "todos" => "todos",
+        "work" | "plan" | "todos" => "work",
         "tasks" => "tasks",
         "agents" | "subagents" | "sub-agents" => "agents",
         "context" | "session" => "context",
@@ -1008,6 +1007,28 @@ mod tests {
         assert!(err.to_string().contains("invalid cost currency"));
     }
 
+    #[test]
+    fn sidebar_focus_accepts_work_values_and_legacy_aliases() {
+        let mut settings = Settings::default();
+
+        // (key, input, stored value, failure label)
+        let accepted = [
+            ("sidebar_focus", "work", "work", "set work"),
+            ("focus", "plan", "work", "legacy plan alias"),
+            ("focus", "todos", "work", "legacy todos alias"),
+            ("focus", "context", "context", "context focus"),
+        ];
+        for (key, input, stored, label) in accepted {
+            settings.set(key, input).expect(label);
+            assert_eq!(settings.sidebar_focus, stored);
+        }
+
+        let err = settings
+            .set("sidebar_focus", "classic")
+            .expect_err("classic is not a supported public focus");
+        assert!(err.to_string().contains("invalid sidebar focus"));
+    }
+
     #[test]
     fn display_localizes_header_and_config_file_label() {
         let settings = Settings::default();
diff --git a/crates/tui/src/tools/fetch_url.rs b/crates/tui/src/tools/fetch_url.rs
index 57dfeb13..8c76ccea 100644
--- a/crates/tui/src/tools/fetch_url.rs
+++ b/crates/tui/src/tools/fetch_url.rs
@@ -7,6 +7,7 @@
 //! (`format = "markdown"`); pass `format = "raw"` to keep the bytes intact
 //! when the model wants to do its own parsing.
 
+use super::handle::query_jsonpath;
 use super::spec::{
     ApprovalRequirement, ToolCapability, ToolContext, ToolError, ToolResult, ToolSpec, optional_u64,
 };
@@ -15,6 +16,7 @@ use async_trait::async_trait;
 use regex::Regex;
 use serde::Serialize;
 use serde_json::{Value, json};
+use std::collections::BTreeMap;
 use std::sync::OnceLock;
 use std::time::Duration;
 
@@ -73,9 +75,12 @@ impl Format {
 struct FetchResponse {
     url: String,
     status: u16,
+    headers: BTreeMap<String, String>,
     content_type: String,
     content: String,
     truncated: bool,
+    #[serde(skip_serializing_if = "Option::is_none")]
+    fields: Option<BTreeMap<String, Vec<Value>>>,
 }
 
 pub struct FetchUrlTool;
@@ -110,6 +115,11 @@ impl ToolSpec for FetchUrlTool {
                 "timeout_ms": {
                     "type": "integer",
                     "description": "Request timeout in milliseconds (default 15,000; max 60,000)."
+                },
+                "fields": {
+                    "type": "array",
+                    "items": { "type": "string" },
+                    "description": "Optional JSONPath projections for JSON responses. Supports $, .field, [index], [*], and ['field']; returns matches under `fields`."
                 }
             },
             "required": ["url"]
@@ -146,6 +156,7 @@ impl ToolSpec for FetchUrlTool {
         let max_bytes = optional_u64(&input, "max_bytes", DEFAULT_MAX_BYTES).min(HARD_MAX_BYTES);
         let timeout_ms =
             optional_u64(&input, "timeout_ms", DEFAULT_TIMEOUT_MS).min(HARD_MAX_TIMEOUT_MS);
+        let requested_fields = parse_fields(&input)?;
         let mut current_url = reqwest::Url::parse(&url)
             .map_err(|e| ToolError::invalid_input(format!("invalid URL: {e}")))?;
         let mut redirects_followed = 0usize;
@@ -202,6 +213,7 @@ impl ToolSpec for FetchUrlTool {
             .and_then(|v| v.to_str().ok())
             .unwrap_or("application/octet-stream")
             .to_string();
+        let headers = response_headers(resp.headers());
 
         let bytes = resp
             .bytes()
@@ -216,6 +228,7 @@ impl ToolSpec for FetchUrlTool {
         };
 
         let body_text = String::from_utf8_lossy(usable).to_string();
+        let fields = project_json_fields(&body_text, &content_type, &requested_fields)?;
         let processed = match format {
             Format::Raw => body_text,
             Format::Text | Format::Markdown => {
@@ -230,9 +243,11 @@ impl ToolSpec for FetchUrlTool {
         let response = FetchResponse {
             url: final_url,
             status: status.as_u16(),
+            headers,
             content_type,
             content: processed,
             truncated,
+            fields,
         };
 
         if !status.is_success() {
@@ -386,6 +401,66 @@ fn validate_dns_resolved_ip(
     )))
 }
 
+/// Parses the optional `fields` argument into trimmed JSONPath strings; blank
+/// entries are skipped, and non-array or non-string values are rejected.
+fn parse_fields(input: &Value) -> Result<Vec<String>, ToolError> {
+    let Some(raw) = input.get("fields") else {
+        return Ok(Vec::new());
+    };
+    let entries = raw
+        .as_array()
+        .ok_or_else(|| ToolError::invalid_input("`fields` must be an array"))?;
+    let mut paths = Vec::with_capacity(entries.len());
+    for entry in entries {
+        let text = entry.as_str().ok_or_else(|| {
+            ToolError::invalid_input("`fields` entries must be JSONPath strings")
+        })?;
+        match text.trim() {
+            "" => {}
+            path => paths.push(path.to_string()),
+        }
+    }
+    Ok(paths)
+}
+
+/// Collects UTF-8 headers by lowercase name; repeated headers are joined with ", ".
+fn response_headers(headers: &reqwest::header::HeaderMap) -> BTreeMap<String, String> {
+    let mut out: BTreeMap<String, String> = BTreeMap::new();
+    for (name, value) in headers {
+        let Ok(value) = value.to_str() else { continue };
+        let key = name.as_str().to_ascii_lowercase();
+        let joined = out.remove(&key).map_or_else(String::new, |prev| prev + ", ");
+        out.insert(key, joined + value);
+    }
+    out
+}
+
+/// Projects the requested JSONPaths out of a JSON body; `None` if none were requested.
+fn project_json_fields(
+    body_text: &str,
+    content_type: &str,
+    fields: &[String],
+) -> Result<Option<BTreeMap<String, Vec<Value>>>, ToolError> {
+    if fields.is_empty() {
+        return Ok(None);
+    }
+    if !content_type.to_ascii_lowercase().contains("json") {
+        let message = "`fields` can only be used with JSON responses";
+        return Err(ToolError::invalid_input(message));
+    }
+    let document = serde_json::from_str::<Value>(body_text).map_err(|e| {
+        ToolError::execution_failed(format!("response body is not valid JSON for `fields`: {e}"))
+    })?;
+    let mut projected = BTreeMap::new();
+    for field in fields {
+        let found = query_jsonpath(&document, field).map_err(|e| {
+            ToolError::invalid_input(format!("invalid JSONPath `{field}` in `fields`: {e}"))
+        })?;
+        projected.insert(field.clone(), found);
+    }
+    Ok(Some(projected))
+}
+
 /// Strip `<script>` / `<style>` blocks, drop remaining tags, and collapse
 /// whitespace. Good enough for "let the model read this page" — not a full
 /// HTML-to-Markdown converter.
@@ -453,6 +528,31 @@ mod tests {
         assert!(Format::parse(Some("yaml")).is_err());
     }
 
+    /// A wildcard path and a scalar path are both projected from the same body,
+    /// and each result is stored under the path text that requested it.
+    #[test]
+    fn project_json_fields_returns_requested_jsonpath_matches() {
+        let body = r#"{"items":[{"name":"alpha"},{"name":"beta"}],"count":2}"#;
+        let paths = ["$.items[*].name", "$.count"].map(String::from);
+
+        let by_path = project_json_fields(body, "application/json", &paths)
+            .expect("project")
+            .expect("some");
+
+        // Matches come back as a list even when the path selects a single value.
+        let names = by_path.get("$.items[*].name").unwrap();
+        assert_eq!(names, &vec![json!("alpha"), json!("beta")]);
+        let count = by_path.get("$.count").unwrap();
+        assert_eq!(count, &vec![json!(2)]);
+    }
+
+    /// A parsable body is still refused when the content type is not JSON.
+    #[test]
+    fn project_json_fields_rejects_non_json_content_type() {
+        let outcome = project_json_fields("{}", "text/plain", &["$.name".to_string()]);
+        assert!(outcome.expect_err("must reject").to_string().contains("JSON responses"));
+    }
+
     #[tokio::test]
     async fn rejects_non_http_schemes() {
         let tool = FetchUrlTool;
diff --git a/crates/tui/src/tools/file.rs b/crates/tui/src/tools/file.rs
index bc2f56a0..ccf826d1 100644
--- a/crates/tui/src/tools/file.rs
+++ b/crates/tui/src/tools/file.rs
@@ -6,7 +6,7 @@
 use super::diff_format::make_unified_diff;
 use super::spec::{
     ApprovalRequirement, ToolCapability, ToolContext, ToolError, ToolResult, ToolSpec,
-    lsp_diagnostics_for_paths, optional_str, required_str,
+    lsp_diagnostics_for_paths, optional_bool, optional_str, required_str,
 };
 use async_trait::async_trait;
 use serde_json::{Value, json};
@@ -473,7 +473,7 @@ impl ToolSpec for EditFileTool {
     }
 
     fn description(&self) -> &'static str {
-        "Replace text in a single file via exact search/replace. Use this instead of `sed -i` in `exec_shell` for one unambiguous in-place edit. `search` must match exactly, including whitespace and indentation. Returns a compact unified diff, not the full file. For structural, multi-block, or cross-file changes, use `apply_patch` or `write_file` instead."
+        "Replace text in a single file via exact search/replace. Use this instead of `sed -i` in `exec_shell` for one unambiguous in-place edit. `search` matches exactly by default, including whitespace and indentation; set `fuzz: true` to tolerate leading-indentation differences. Returns a compact unified diff, not the full file. For structural, multi-block, or cross-file changes, use `apply_patch` or `write_file` instead."
     }
 
     fn input_schema(&self) -> Value {
@@ -491,6 +491,10 @@ impl ToolSpec for EditFileTool {
                 "replace": {
                     "type": "string",
                     "description": "Text to replace with"
+                },
+                "fuzz": {
+                    "type": "boolean",
+                    "description": "When true, tolerate leading whitespace differences on each searched line (default false)"
                 }
             },
             "required": ["path", "search", "replace"]
@@ -513,6 +517,7 @@ impl ToolSpec for EditFileTool {
         let path_str = required_str(&input, "path")?;
         let search = required_str(&input, "search")?;
         let replace = required_str(&input, "replace")?;
+        let fuzz = optional_bool(&input, "fuzz", false);
 
         if search == replace {
             return Err(ToolError::invalid_input(
@@ -527,14 +532,36 @@ impl ToolSpec for EditFileTool {
         })?;
 
         let count = contents.matches(search).count();
-        if count == 0 {
+        let (updated, count, fuzz_used) = if count == 0 && fuzz {
+            let matches = leading_whitespace_fuzzy_matches(&contents, search);
+            match matches.as_slice() {
+                [] => {
+                    return Err(ToolError::execution_failed(format!(
+                        "Search string not found in {}",
+                        file_path.display()
+                    )));
+                }
+                [(start, end)] => {
+                    let mut updated = contents.clone();
+                    updated.replace_range(*start..*end, replace);
+                    (updated, 1, true)
+                }
+                _ => {
+                    return Err(ToolError::execution_failed(format!(
+                        "Fuzzy search matched {} locations in {}; refine search text",
+                        matches.len(),
+                        file_path.display()
+                    )));
+                }
+            }
+        } else if count == 0 {
             return Err(ToolError::execution_failed(format!(
                 "Search string not found in {}",
                 file_path.display()
             )));
-        }
-
-        let updated = contents.replace(search, replace);
+        } else {
+            (contents.replace(search, replace), count, false)
+        };
 
         fs::write(&file_path, &updated).map_err(|e| {
             ToolError::execution_failed(format!("Failed to write {}: {}", file_path.display(), e))
@@ -549,7 +576,12 @@ impl ToolSpec for EditFileTool {
                  Verify the result with read_file before proceeding."
             )
         } else {
-            format!("Replaced 1 occurrence in {display}")
+            let fuzz_note = if fuzz_used {
+                " (fuzzy indentation match)"
+            } else {
+                ""
+            };
+            format!("Replaced 1 occurrence in {display}{fuzz_note}")
         };
         let body = if diff.is_empty() {
             format!("{summary}\n(no textual changes)")
@@ -569,6 +601,52 @@ impl ToolSpec for EditFileTool {
     }
 }
 
+/// Drops the spaces/tabs that start each line of `input`. The second value maps
+/// every byte of the stripped text to the `input` offset of the char it is in.
+fn strip_line_leading_whitespace_with_map(input: &str) -> (String, Vec<usize>) {
+    let mut stripped = String::with_capacity(input.len());
+    let mut origins = Vec::with_capacity(input.len());
+    let mut in_indent = true;
+    for (offset, ch) in input.char_indices() {
+        let is_blank = ch == ' ' || ch == '\t';
+        if !(in_indent && is_blank) {
+            stripped.push(ch);
+            origins.extend(std::iter::repeat(offset).take(ch.len_utf8()));
+            in_indent = ch == '\n';
+        }
+    }
+    (stripped, origins)
+}
+
+/// Byte offset at which the line containing `idx` begins.
+fn line_start_before(input: &str, idx: usize) -> usize {
+    input[..idx].rfind('\n').map_or(0, |newline| newline + 1)
+}
+
+/// Finds `search` in `contents`, ignoring leading spaces/tabs on each line. Ranges take
+/// in the indentation before a match (never other text) and end after its last char.
+fn leading_whitespace_fuzzy_matches(contents: &str, search: &str) -> Vec<(usize, usize)> {
+    let (normalized_contents, byte_map) = strip_line_leading_whitespace_with_map(contents);
+    let (normalized_search, _) = strip_line_leading_whitespace_with_map(search);
+    let char_len = |text: &str| text.chars().next().map_or(1, char::len_utf8);
+    let (mut matches, mut cursor) = (Vec::new(), 0);
+    while !normalized_search.is_empty() && cursor < normalized_contents.len() {
+        let Some(rel_idx) = normalized_contents[cursor..].find(&normalized_search) else {
+            break;
+        };
+        let norm_start = cursor + rel_idx;
+        let mut start = byte_map[norm_start];
+        if norm_start == 0 || normalized_contents[..norm_start].ends_with('\n') {
+            start = line_start_before(contents, start);
+        }
+        let last = byte_map[norm_start + normalized_search.len() - 1];
+        matches.push((start, last + char_len(&contents[last..])));
+        // Advance by a whole char: `norm_start + 1` could split a multi-byte char.
+        cursor = norm_start + char_len(&normalized_contents[norm_start..]);
+    }
+    matches
+}
+
 // === ListDirTool ===
 
 /// Tool for listing directory contents.
@@ -1205,6 +1283,41 @@ mod tests {
         assert!(!result.content.contains("multiple matches were replaced"));
     }
 
+    /// With `fuzz: true`, a search written at the wrong indentation still matches
+    /// and the summary says a fuzzy match was used.
+    #[tokio::test]
+    async fn test_edit_file_fuzz_tolerates_leading_whitespace() {
+        let tmp = tempdir().expect("tempdir");
+        let ctx = ToolContext::new(tmp.path().to_path_buf());
+        let target = tmp.path().join("fuzzy.txt");
+        let before = concat!(
+            "fn main() {\n",
+            "    if true {\n",
+            "        let value = 1;\n",
+            "    }\n",
+            "}\n",
+        );
+        let after = before.replace("value = 1", "value = 2");
+        fs::write(&target, before).expect("write");
+
+        // The search block is indented one level shallower than the file content.
+        let input = json!({
+            "path": "fuzzy.txt",
+            "search": "if true {\n    let value = 1;\n}",
+            "replace": "    if true {\n        let value = 2;\n    }",
+            "fuzz": true
+        });
+        let result = EditFileTool
+            .execute(input, &ctx)
+            .await
+            .expect("execute");
+
+        assert!(result.success);
+        assert!(result.content.contains("fuzzy indentation match"));
+        let edited = fs::read_to_string(&target).expect("read");
+        assert_eq!(edited, after);
+    }
+
     #[tokio::test]
     async fn test_edit_file_not_found() {
         let tmp = tempdir().expect("tempdir");
diff --git a/crates/tui/src/tools/file_search.rs b/crates/tui/src/tools/file_search.rs
index fa966909..c417e81e 100644
--- a/crates/tui/src/tools/file_search.rs
+++ b/crates/tui/src/tools/file_search.rs
@@ -8,6 +8,8 @@ use ignore::WalkBuilder;
 use serde::Serialize;
 use serde_json::{Value, json};
 
+use crate::tools::search::matches_glob;
+
 use super::spec::{
     ApprovalRequirement, ToolCapability, ToolContext, ToolError, ToolResult, ToolSpec,
     optional_str, optional_u64, required_str,
@@ -52,6 +54,11 @@ impl ToolSpec for FileSearchTool {
                     "type": "array",
                     "items": { "type": "string" },
                     "description": "Optional list of file extensions to include (e.g. [\"rs\", \"md\"])."
+                },
+                "exclude": {
+                    "type": "array",
+                    "items": { "type": "string" },
+                    "description": "Optional glob patterns to exclude, matching grep_files' convention (e.g. [\"target/**\", \"*.lock\"])."
                 }
             },
             "required": ["query"]
@@ -79,7 +86,8 @@ impl ToolSpec for FileSearchTool {
         };
 
         let extensions = parse_extensions(&input);
-        let matches = search_files(query, &base_path, extensions, limit)?;
+        let exclude_patterns = parse_exclude_patterns(&input);
+        let matches = search_files(query, &base_path, extensions, exclude_patterns, limit)?;
         ToolResult::json(&matches).map_err(|e| ToolError::execution_failed(e.to_string()))
     }
 }
@@ -107,10 +115,37 @@ fn parse_extensions(input: &Value) -> Vec<String> {
     out
 }
 
+/// Glob patterns that `file_search` skips. An `exclude` array supplied by the
+/// caller replaces the defaults entirely (non-string and blank entries are
+/// dropped); any other input falls back to the built-in list below.
+fn parse_exclude_patterns(input: &Value) -> Vec<String> {
+    const DEFAULT_EXCLUDES: [&str; 8] = [
+        "target/**",
+        "node_modules/**",
+        ".git/**",
+        "DerivedData/**",
+        "dist/**",
+        "build/**",
+        "*.lock",
+        "*.plist",
+    ];
+    let Some(requested) = input.get("exclude").and_then(Value::as_array) else {
+        return DEFAULT_EXCLUDES.iter().map(|glob| (*glob).to_owned()).collect();
+    };
+    let mut patterns = Vec::new();
+    for glob in requested.iter().filter_map(Value::as_str).map(str::trim) {
+        if !glob.is_empty() {
+            patterns.push(glob.to_owned());
+        }
+    }
+    patterns
+}
+
 fn search_files(
     query: &str,
     base_path: &Path,
     extensions: Vec<String>,
+    exclude_patterns: Vec<String>,
     limit: usize,
 ) -> Result<Vec<FileSearchMatch>, ToolError> {
     if !base_path.exists() {
@@ -137,15 +172,19 @@ fn search_files(
         }
 
         let path = entry.path();
-        if !extensions.is_empty() && !extension_matches(path, &extensions) {
-            continue;
-        }
-
         let rel_path = path
             .strip_prefix(base_path)
             .unwrap_or(path)
             .to_string_lossy()
-            .to_string();
+            .replace('\\', "/");
+        if should_exclude(&rel_path, &exclude_patterns) {
+            continue;
+        }
+
+        if !extensions.is_empty() && !extension_matches(path, &extensions) {
+            continue;
+        }
+
         let name = file_name(path);
 
         let score = match score_match(&query_norm, &rel_path, &name) {
@@ -167,6 +206,12 @@ fn search_files(
     Ok(results)
 }
 
+/// True when `rel_path` matches at least one of the exclude globs.
+fn should_exclude(rel_path: &str, exclude_patterns: &[String]) -> bool {
+    let is_hit = |glob: &String| matches_glob(rel_path, glob);
+    exclude_patterns.iter().any(is_hit)
+}
+
 fn extension_matches(path: &Path, extensions: &[String]) -> bool {
     let Some(ext) = path.extension().and_then(|e| e.to_str()) else {
         return false;
@@ -323,6 +368,46 @@ mod tests {
         assert!(!result.content.contains("notes.md"));
     }
 
+    /// A caller-supplied `exclude` glob hides matches beneath that directory.
+    #[tokio::test]
+    async fn test_file_search_exclude_filter() {
+        let tmp = tempdir().expect("tempdir");
+        let root = tmp.path();
+        let skipped_dir = root.join("fixtures");
+        std::fs::create_dir_all(&skipped_dir).expect("mkdir");
+        std::fs::write(skipped_dir.join("needle.txt"), "no\n").expect("write");
+        std::fs::write(root.join("needle.txt"), "yes\n").expect("write");
+
+        let ctx = ToolContext::new(root.to_path_buf());
+        let input = json!({"query": "needle", "exclude": ["fixtures/**"]});
+        let result = FileSearchTool.execute(input, &ctx).await.expect("execute");
+        let listing = &result.content;
+
+        assert!(result.success);
+        assert!(listing.contains("\"path\": \"needle.txt\""));
+        assert!(!listing.contains("fixtures/needle.txt"));
+    }
+
+    /// Without an `exclude` argument the built-in globs hide `target/` contents.
+    #[tokio::test]
+    async fn test_file_search_default_excludes_build_artifacts() {
+        let tmp = tempdir().expect("tempdir");
+        let root = tmp.path();
+        let build_dir = root.join("target");
+        std::fs::create_dir_all(&build_dir).expect("mkdir");
+        std::fs::write(build_dir.join("needle.txt"), "no\n").expect("write");
+        std::fs::write(root.join("needle.txt"), "yes\n").expect("write");
+
+        let ctx = ToolContext::new(root.to_path_buf());
+        let input = json!({"query": "needle"});
+        let result = FileSearchTool.execute(input, &ctx).await.expect("execute");
+        let listing = &result.content;
+
+        assert!(result.success);
+        assert!(listing.contains("\"path\": \"needle.txt\""));
+        assert!(!listing.contains("target/needle.txt"));
+    }
+
     #[tokio::test]
     #[cfg(unix)]
     async fn test_file_search_does_not_follow_symlinked_files() {
diff --git a/crates/tui/src/tools/handle.rs b/crates/tui/src/tools/handle.rs
new file mode 100644
index 00000000..a6406748
--- /dev/null
+++ b/crates/tui/src/tools/handle.rs
@@ -0,0 +1,812 @@
+//! Symbolic handle storage and bounded reads.
+//!
+//! `var_handle` is the shared protocol that lets expensive environments
+//! (RLM sessions, sub-agent transcripts, large artifacts) hand the parent a
+//! small symbolic reference instead of copying the whole payload into the
+//! parent transcript.
+
+use std::collections::HashMap;
+use std::sync::Arc;
+
+use async_trait::async_trait;
+use serde::{Deserialize, Serialize};
+use serde_json::{Value, json};
+use sha2::{Digest, Sha256};
+use tokio::sync::Mutex;
+
+use crate::tools::spec::{
+    ApprovalRequirement, ToolCapability, ToolContext, ToolError, ToolResult, ToolSpec,
+};
+
+const DEFAULT_MAX_CHARS: usize = 12_000;
+const HARD_MAX_CHARS: usize = 50_000;
+#[allow(dead_code)] // Used by producers as they begin returning var_handle records.
+const REPR_PREVIEW_CHARS: usize = 160;
+
+pub type SharedHandleStore = Arc<Mutex<HandleStore>>;
+
+#[must_use] // Each call builds a fresh, empty store behind its own `Arc<Mutex<_>>`.
+pub fn new_shared_handle_store() -> SharedHandleStore {
+    SharedHandleStore::new(Mutex::new(HandleStore::default()))
+}
+
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
+pub struct VarHandle {
+    pub kind: String, // Record tag: the store writes "var_handle", `parse_handle` requires it.
+    pub session_id: String, // Together with `name`, the lookup key into `HandleStore`.
+    pub name: String,
+    #[serde(rename = "type")]
+    pub type_name: String, // Serialized as `type`; filled from `HandleValue::type_name`.
+    pub length: usize, // Filled from `HandleValue::length` when the payload is stored.
+    pub repr_preview: String, // Payload preview cut down via `REPR_PREVIEW_CHARS`.
+    pub sha256: String, // `sha256_hex` of the payload bytes; empty for string-form handles.
+}
+
+impl VarHandle {
+    #[must_use]
+    pub fn key(&self) -> HandleKey {
+        HandleKey {
+            session_id: self.session_id.clone(), // The key owns copies of both strings.
+            name: self.name.clone(),
+        }
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, Hash)] // `Hash` + `Eq`: used as the store's map key.
+pub struct HandleKey {
+    pub session_id: String, // Copied from `VarHandle::session_id` by `VarHandle::key`.
+    pub name: String, // Copied from `VarHandle::name` by `VarHandle::key`.
+}
+
+#[derive(Debug, Clone)]
+pub struct HandleRecord {
+    pub handle: VarHandle, // Metadata computed from `value` at insertion time.
+    pub value: HandleValue, // The full payload that projections read from.
+}
+
+#[allow(dead_code)] // Producers land in later v0.8.33 slices; handle_read is first.
+#[derive(Debug, Clone)]
+pub enum HandleValue {
+    Text(String), // Plain text payload; reported with handle type "str".
+    Json(Value), // Structured payload; handle type follows the JSON value kind.
+}
+
+#[allow(dead_code)] // Foundation methods used by upcoming RLM/agent session producers.
+impl HandleValue {
+    /// Entries for JSON arrays/objects, chars for text, serialized chars for other JSON.
+    fn length(&self) -> usize {
+        match self {
+            Self::Json(Value::Object(map)) => map.len(),
+            Self::Json(Value::Array(items)) => items.len(),
+            Self::Json(other) => other.to_string().chars().count(),
+            Self::Text(text) => text.chars().count(),
+        }
+    }
+    /// Type label recorded in the handle; text and JSON strings are both "str".
+    fn type_name(&self) -> String {
+        String::from(match self {
+            Self::Text(_) | Self::Json(Value::String(_)) => "str",
+            Self::Json(Value::Array(_)) => "list",
+            Self::Json(Value::Object(_)) => "dict",
+            Self::Json(Value::Bool(_)) => "bool",
+            Self::Json(Value::Number(_)) => "number",
+            Self::Json(Value::Null) => "null",
+        })
+    }
+    /// Bytes fed to the handle digest; empty if JSON serialization fails.
+    fn stable_bytes(&self) -> Vec<u8> {
+        match self {
+            Self::Json(value) => serde_json::to_vec(value).unwrap_or_default(),
+            Self::Text(text) => text.clone().into_bytes(),
+        }
+    }
+    /// Preview of the text, or of the serialized JSON, via `truncate_chars`.
+    fn repr_preview(&self) -> String {
+        match self {
+            Self::Json(value) => truncate_chars(&value.to_string(), REPR_PREVIEW_CHARS),
+            Self::Text(text) => truncate_chars(text, REPR_PREVIEW_CHARS),
+        }
+    }
+}
+
+#[derive(Debug, Default)]
+pub struct HandleStore {
+    records: HashMap<HandleKey, HandleRecord>, // One record per `(session_id, name)` pair.
+}
+
+#[allow(dead_code)] // Insertors are for producer tools; this PR wires the reader first.
+impl HandleStore {
+    /// Stores `text` under `(session_id, name)` and returns its handle.
+    #[must_use]
+    pub fn insert_text(
+        &mut self,
+        session_id: impl Into<String>,
+        name: impl Into<String>,
+        text: impl Into<String>,
+    ) -> VarHandle {
+        self.insert(session_id, name, HandleValue::Text(text.into()))
+    }
+    /// Stores a JSON `value` under `(session_id, name)` and returns its handle.
+    #[must_use]
+    pub fn insert_json(
+        &mut self,
+        session_id: impl Into<String>,
+        name: impl Into<String>,
+        value: Value,
+    ) -> VarHandle {
+        self.insert(session_id, name, HandleValue::Json(value))
+    }
+    /// Looks a record up by the handle's `session_id` and `name` only.
+    #[must_use]
+    pub fn get(&self, handle: &VarHandle) -> Option<&HandleRecord> {
+        self.records.get(&handle.key())
+    }
+    /// Builds the handle for `value` and stores both, replacing any same-key record.
+    fn insert(
+        &mut self,
+        session_id: impl Into<String>,
+        name: impl Into<String>,
+        value: HandleValue,
+    ) -> VarHandle {
+        let key = HandleKey {
+            session_id: session_id.into(),
+            name: name.into(),
+        };
+        let handle = VarHandle {
+            kind: "var_handle".to_string(),
+            session_id: key.session_id.clone(),
+            name: key.name.clone(),
+            type_name: value.type_name(),
+            length: value.length(),
+            repr_preview: value.repr_preview(),
+            sha256: sha256_hex(&value.stable_bytes()),
+        };
+        let record = HandleRecord {
+            handle: handle.clone(),
+            value,
+        };
+        self.records.insert(key, record);
+        handle
+    }
+}
+
+pub struct HandleReadTool; // Stateless; payloads are reached through `ToolContext`.
+
+#[async_trait]
+impl ToolSpec for HandleReadTool {
+    fn name(&self) -> &'static str {
+        "handle_read"
+    }
+
+    fn description(&self) -> &'static str {
+        "Read a bounded projection from a var_handle returned by tools such \
+         as RLM sessions, sub-agents, or large artifact producers. Provide \
+         exactly one projection: `slice` for char/line slices, `range` for \
+         one-based line ranges, `count` for metadata counts, or `jsonpath` \
+         for a small JSON-path projection. This retrieves from the handle's \
+         backing environment instead of asking the parent transcript to hold \
+         the full payload."
+    }
+
+    fn input_schema(&self) -> Value {
+        json!({
+            "type": "object",
+            "required": ["handle"],
+            "properties": {
+                "handle": {
+                    "description": "A var_handle object, or a compact `session_id/name` string.",
+                    "oneOf": [
+                        {
+                            "type": "object",
+                            "required": ["kind", "session_id", "name"],
+                            "properties": {
+                                "kind": { "type": "string", "const": "var_handle" },
+                                "session_id": { "type": "string" },
+                                "name": { "type": "string" },
+                                "type": { "type": "string" },
+                                "length": { "type": "integer" },
+                                "repr_preview": { "type": "string" },
+                                "sha256": { "type": "string" }
+                            }
+                        },
+                        { "type": "string" }
+                    ]
+                },
+                "slice": {
+                    "type": "object",
+                    "description": "Zero-based half-open slice over chars or lines.",
+                    "properties": {
+                        "start": { "type": "integer", "minimum": 0 },
+                        "end": { "type": "integer", "minimum": 0 },
+                        "unit": { "type": "string", "enum": ["chars", "lines"], "default": "chars" }
+                    }
+                },
+                "range": {
+                    "type": "object",
+                    "description": "One-based inclusive line range.",
+                    "required": ["start", "end"],
+                    "properties": {
+                        "start": { "type": "integer", "minimum": 1 },
+                        "end": { "type": "integer", "minimum": 1 }
+                    }
+                },
+                "count": {
+                    "type": "boolean",
+                    "description": "Return counts for the handle payload."
+                },
+                "jsonpath": {
+                    "type": "string",
+                    "description": "Small JSONPath subset: $, .field, [index], [*], and ['field']."
+                },
+                "max_chars": {
+                    "type": "integer",
+                    "description": "Maximum characters to return in this projection. Defaults to 12000; hard-capped at 50000."
+                }
+            }
+        })
+    }
+
+    fn capabilities(&self) -> Vec<ToolCapability> {
+        vec![ToolCapability::ReadOnly]
+    }
+
+    fn approval_requirement(&self) -> ApprovalRequirement {
+        ApprovalRequirement::Auto
+    }
+
+    fn supports_parallel(&self) -> bool {
+        true
+    }
+
+    async fn execute(&self, input: Value, context: &ToolContext) -> Result<ToolResult, ToolError> {
+        let handle = parse_handle(
+            input
+                .get("handle")
+                .ok_or_else(|| ToolError::missing_field("handle"))?,
+        )?;
+        let projection = parse_projection(&input)?; // Rejects calls without exactly one projection.
+        let max_chars = input
+            .get("max_chars")
+            .and_then(Value::as_u64) // Anything that is not an unsigned integer uses the default.
+            .map(|n| (n as usize).min(HARD_MAX_CHARS)) // Explicit values are capped, not rejected.
+            .unwrap_or(DEFAULT_MAX_CHARS);
+
+        let store = context.runtime.handle_store.lock().await; // Guard lives until the fn returns.
+        let record = store.get(&handle).ok_or_else(|| {
+            ToolError::invalid_input(format!(
+                "handle_read: no payload found for handle {}/{}",
+                handle.session_id, handle.name
+            ))
+        })?;
+        if !handle.sha256.is_empty() && handle.sha256 != record.handle.sha256 {
+            return Err(ToolError::invalid_input(
+                "handle_read: handle sha256 does not match stored payload",
+            )); // String-form handles have an empty sha256 and skip this check.
+        }
+
+        let output = match projection {
+            Projection::Count => count_projection(record),
+            Projection::Slice { start, end, unit } => {
+                slice_projection(record, start, end, unit, max_chars)
+            }
+            Projection::Range { start, end } => {
+                line_range_projection(record, start, end, max_chars)
+            }
+            Projection::JsonPath(path) => jsonpath_projection(record, &path, max_chars)?,
+        };
+
+        ToolResult::json(&output).map_err(|e| ToolError::execution_failed(e.to_string()))
+    }
+}
+
+#[derive(Debug, Clone, Copy)]
+enum SliceUnit {
+    Chars, // Selected by `slice.unit = "chars"`, which is also the default.
+    Lines, // Selected by `slice.unit = "lines"`.
+}
+
+enum Projection {
+    Count, // Requested with `count: true`.
+    Slice {
+        start: usize, // 0 when `slice.start` is missing.
+        end: Option<usize>, // `None` when `slice.end` is missing.
+        unit: SliceUnit,
+    },
+    Range {
+        start: usize, // Checked by `parse_projection` to be at least 1.
+        end: usize, // Checked by `parse_projection` to be at least `start`.
+    },
+    JsonPath(String), // Trimmed, non-empty path text.
+}
+
+/// Parses the `handle` argument: a full `var_handle` object, or the compact
+/// `session_id/name` string, which is split at the last `/` and carries no
+/// `sha256`. Both forms must name a non-blank session id and name, so a
+/// malformed compact handle is rejected here instead of as a missing payload.
+fn parse_handle(value: &Value) -> Result<VarHandle, ToolError> {
+    let handle = if let Some(raw) = value.as_str() {
+        let (session_id, name) = raw.rsplit_once('/').ok_or_else(|| {
+            ToolError::invalid_input("handle_read: string handle must use `session_id/name`")
+        })?;
+        VarHandle {
+            kind: "var_handle".to_string(),
+            session_id: session_id.to_string(),
+            name: name.to_string(),
+            type_name: String::new(),
+            length: 0,
+            repr_preview: String::new(),
+            sha256: String::new(),
+        }
+    } else {
+        serde_json::from_value::<VarHandle>(value.clone()).map_err(|e| {
+            ToolError::invalid_input(format!("handle_read: invalid var_handle object: {e}"))
+        })?
+    };
+    if handle.kind != "var_handle" {
+        let message = "handle_read: handle.kind must be `var_handle`";
+        return Err(ToolError::invalid_input(message));
+    }
+    if handle.session_id.trim().is_empty() || handle.name.trim().is_empty() {
+        let message = "handle_read: handle.session_id and handle.name must be non-empty";
+        return Err(ToolError::invalid_input(message));
+    }
+    Ok(handle)
+}
+
+/// Parses the one projection requested by a `handle_read` call: `slice`,
+/// `range`, `count: true`, or `jsonpath`. A key set to JSON `null` counts as
+/// absent, because callers often send `null` for optional arguments they do
+/// not use; `count: false` counts as absent as well.
+fn parse_projection(input: &Value) -> Result<Projection, ToolError> {
+    let slice = input.get("slice").filter(|value| !value.is_null());
+    let range = input.get("range").filter(|value| !value.is_null());
+    let jsonpath = input.get("jsonpath").filter(|value| !value.is_null());
+    let wants_count = input.get("count").and_then(Value::as_bool).unwrap_or(false);
+    let selected = [slice.is_some(), range.is_some(), jsonpath.is_some(), wants_count];
+    if selected.into_iter().filter(|chosen| *chosen).count() != 1 {
+        return Err(ToolError::invalid_input(
+            "handle_read: provide exactly one of `slice`, `range`, `count: true`, or `jsonpath`",
+        ));
+    }
+    if wants_count {
+        return Ok(Projection::Count);
+    }
+    if let Some(path) = jsonpath {
+        let path = path
+            .as_str()
+            .ok_or_else(|| ToolError::invalid_input("handle_read: jsonpath must be a string"))?
+            .trim();
+        if path.is_empty() {
+            return Err(ToolError::invalid_input(
+                "handle_read: jsonpath must not be empty",
+            ));
+        }
+        return Ok(Projection::JsonPath(path.to_string()));
+    }
+    if let Some(slice) = slice {
+        let start = slice.get("start").and_then(Value::as_u64).unwrap_or(0) as usize;
+        let end = slice.get("end").and_then(Value::as_u64).map(|n| n as usize);
+        if end.is_some_and(|end| end < start) {
+            return Err(ToolError::invalid_input(
+                "handle_read: slice.end must be greater than or equal to slice.start",
+            ));
+        }
+        let unit = match slice.get("unit").and_then(Value::as_str).unwrap_or("chars") {
+            "chars" => SliceUnit::Chars,
+            "lines" => SliceUnit::Lines,
+            other => {
+                return Err(ToolError::invalid_input(format!(
+                    "handle_read: unsupported slice.unit `{other}`"
+                )));
+            }
+        };
+        return Ok(Projection::Slice { start, end, unit });
+    }
+    let range =
+        range.ok_or_else(|| ToolError::invalid_input("handle_read: missing projection"))?;
+    let start = range
+        .get("start")
+        .and_then(Value::as_u64)
+        .ok_or_else(|| ToolError::missing_field("range.start"))? as usize;
+    let end = range
+        .get("end")
+        .and_then(Value::as_u64)
+        .ok_or_else(|| ToolError::missing_field("range.end"))? as usize;
+    if start == 0 || end == 0 || end < start {
+        return Err(ToolError::invalid_input(
+            "handle_read: range is one-based inclusive and end must be >= start",
+        ));
+    }
+    Ok(Projection::Range { start, end })
+}
+
+fn count_projection(record: &HandleRecord) -> Value {
+    match &record.value {
+        HandleValue::Text(text) => json!({
+            "handle": record.handle,
+            "projection": "count",
+            "chars": text.chars().count(), // Unicode scalar values, not bytes
+            "lines": text.lines().count(), // per `str::lines`: a trailing newline adds no line
+            "bytes": text.len(), // UTF-8 encoded length
+        }),
+        HandleValue::Json(value) => json!({
+            "handle": record.handle,
+            "projection": "count",
+            "json_type": json_type(value),
+            "length": record.handle.length, // read from the handle, not recomputed here
+            "bytes": value.to_string().len(), // length of the `Display` rendering
+        }),
+    }
+}
+
+/// Builds the `slice` projection: a zero-based, end-exclusive window over the
+/// record's text, measured in chars or lines.
+///
+/// `start` and `end` are clamped to the available total and a missing `end`
+/// means "through the end", so out-of-range requests yield empty content
+/// rather than an error. The clamped bounds are echoed back under `meta`, and
+/// the content itself is capped by `bounded_text_projection`.
+fn slice_projection(
+    record: &HandleRecord,
+    start: usize,
+    end: Option<usize>,
+    unit: SliceUnit,
+    max_chars: usize,
+) -> Value {
+    let text = record_text(record);
+    let (raw, meta) = match unit {
+        SliceUnit::Chars => {
+            let total = text.chars().count();
+            let upto = end.unwrap_or(total).min(total);
+            let from = start.min(total);
+            let meta = json!({
+                "unit": "chars",
+                "start": from,
+                "end": upto,
+                "total_chars": total,
+            });
+            (char_slice(&text, from, upto), meta)
+        }
+        SliceUnit::Lines => {
+            let rows: Vec<&str> = text.lines().collect();
+            let total = rows.len();
+            let upto = end.unwrap_or(total).min(total);
+            let from = start.min(total);
+            // An empty or inverted window (including a start past the end) has no content.
+            let joined = if from < upto {
+                rows[from..upto].join("\n")
+            } else {
+                String::new()
+            };
+            let meta = json!({
+                "unit": "lines",
+                "start": from,
+                "end": upto,
+                "total_lines": total,
+            });
+            (joined, meta)
+        }
+    };
+    bounded_text_projection(record, "slice", raw, max_chars, meta)
+}
+
+/// Builds the `range` projection over the record's text, addressed by
+/// one-based, inclusive line numbers `start..=end`.
+///
+/// Bounds past the last line are clamped instead of rejected. `meta` echoes
+/// the requested bounds next to the `shown_*` bounds that were actually used.
+fn line_range_projection(
+    record: &HandleRecord,
+    start: usize,
+    end: usize,
+    max_chars: usize,
+) -> Value {
+    let text = record_text(record);
+    let rows: Vec<&str> = text.lines().collect();
+    let total = rows.len();
+    // One-based inclusive `start..=end` maps to the zero-based half-open `from..upto`.
+    let (from, upto) = (start.saturating_sub(1).min(total), end.min(total));
+    // `get` returns `None` for an inverted window, which becomes empty content.
+    let raw = rows
+        .get(from..upto)
+        .map(|window| window.join("\n"))
+        .unwrap_or_default();
+    let meta = json!({
+        "start": start,
+        "end": end,
+        "shown_start": from + 1,
+        "shown_end": upto,
+        "total_lines": total,
+    });
+    bounded_text_projection(record, "range", raw, max_chars, meta)
+}
+
+fn jsonpath_projection(
+    record: &HandleRecord,
+    path: &str,
+    max_chars: usize,
+) -> Result<Value, ToolError> {
+    let HandleValue::Json(value) = &record.value else {
+        return Err(ToolError::invalid_input(
+            "handle_read: jsonpath projection requires a JSON handle",
+        ));
+    };
+    let matches = query_jsonpath(value, path)
+        .map_err(|e| ToolError::invalid_input(format!("handle_read: {e}")))?;
+    let mut payload = json!({
+        "handle": record.handle,
+        "projection": "jsonpath",
+        "jsonpath": path,
+        "count": matches.len(), // stays the full match count even if `matches` is emptied below
+        "matches": matches,
+        "truncated": false,
+    });
+    let rendered = serde_json::to_string(&payload).unwrap_or_default(); // whole payload
+    if rendered.chars().count() > max_chars {
+        payload["matches"] = json!([]); // over budget: swap the list for a text preview
+        payload["preview"] = json!(truncate_chars(&rendered, max_chars)); // may not parse
+        payload["truncated"] = json!(true);
+    }
+    Ok(payload)
+}
+
+fn bounded_text_projection(
+    record: &HandleRecord,
+    projection: &str,
+    raw: String,
+    max_chars: usize,
+    extra: Value,
+) -> Value {
+    let raw_chars = raw.chars().count(); // size before the `max_chars` cap is applied
+    let content = truncate_chars(&raw, max_chars);
+    let shown_chars = content.chars().count();
+    json!({
+        "handle": record.handle,
+        "projection": projection,
+        "content": content,
+        "truncated": shown_chars < raw_chars, // true only when the cap removed something
+        "shown_chars": shown_chars,
+        "omitted_chars": raw_chars.saturating_sub(shown_chars),
+        "meta": extra, // projection-specific details supplied by the caller
+    })
+}
+
+fn record_text(record: &HandleRecord) -> String {
+    match &record.value { // JSON handles are projected through their pretty-printed text
+        HandleValue::Text(text) => text.clone(), // text handles are used verbatim
+        HandleValue::Json(value) => serde_json::to_string_pretty(value).unwrap_or_default(),
+    }
+}
+
+/// Evaluates a small JSONPath subset against `root` and returns clones of the
+/// matches: `$`, `.field` (ASCII alphanumerics/underscore), `[index]`,
+/// `['field']` / `["field"]`, and `[*]`. Unsupported syntax is an `Err`.
+pub(crate) fn query_jsonpath(root: &Value, path: &str) -> Result<Vec<Value>, String> {
+    if !path.starts_with('$') {
+        return Err("jsonpath must start with `$`".to_string());
+    }
+    let mut idx = 1usize;
+    let bytes = path.as_bytes();
+    let mut current = vec![root];
+    while idx < bytes.len() {
+        match bytes[idx] {
+            b'.' => {
+                idx += 1;
+                if idx < bytes.len() && bytes[idx] == b'.' {
+                    return Err("recursive descent (`..`) is not supported".to_string());
+                }
+                let start = idx;
+                while idx < bytes.len()
+                    && (bytes[idx].is_ascii_alphanumeric() || bytes[idx] == b'_')
+                {
+                    idx += 1;
+                }
+                if start == idx {
+                    return Err("expected field name after `.`".to_string());
+                }
+                let field = &path[start..idx];
+                current = current.into_iter().filter_map(|v| v.get(field)).collect();
+            }
+            b'[' => {
+                let Some(close_rel) = path[idx + 1..].find(']') else {
+                    return Err("unterminated `[` segment".to_string());
+                };
+                let close = idx + 1 + close_rel;
+                let token = path[idx + 1..close].trim();
+                idx = close + 1;
+                current = apply_bracket_token(current, token)?;
+            }
+            _ => {
+                // `idx` always sits just past an ASCII byte here, so it is a char boundary;
+                // decode the real character instead of casting one UTF-8 byte to `char`.
+                let found = path[idx..].chars().next().unwrap_or('?');
+                return Err(format!("unexpected character `{found}` in jsonpath"));
+            }
+        }
+    }
+    Ok(current.into_iter().cloned().collect())
+}
+
+/// Applies one `[...]` segment to every candidate value.
+///
+/// `*` expands array items and object values, a quoted token selects an object
+/// field, and anything else must parse as a non-negative array index.
+/// Candidates that do not fit the segment are dropped, not reported as errors.
+fn apply_bracket_token<'a>(values: Vec<&'a Value>, token: &str) -> Result<Vec<&'a Value>, String> {
+    if token == "*" {
+        let mut expanded = Vec::new();
+        for candidate in values {
+            match candidate {
+                Value::Array(items) => expanded.extend(items),
+                Value::Object(map) => expanded.extend(map.values()),
+                _ => {}
+            }
+        }
+        return Ok(expanded);
+    }
+
+    if let Some(field) = quoted_field(token) {
+        return Ok(values.into_iter().filter_map(|v| v.get(field)).collect());
+    }
+
+    let Ok(index) = token.parse::<usize>() else {
+        return Err(format!("unsupported bracket token `{token}`"));
+    };
+    let picked = values.into_iter().filter_map(|v| v.get(index)).collect();
+    Ok(picked)
+}
+
+/// Returns the text between matching quotes when `token` is wrapped in a pair
+/// of `'...'` or `"..."`, and `None` for anything else (including a lone quote
+/// or mismatched quote characters). Escapes inside the quotes are not
+/// interpreted.
+fn quoted_field(token: &str) -> Option<&str> {
+    // Stripping the same quote from both ends needs at least two characters,
+    // so a token that is just one quote character yields `None`.
+    ['\'', '"']
+        .into_iter()
+        .find_map(|quote| token.strip_prefix(quote)?.strip_suffix(quote))
+}
+
+/// Collects the chars of `text` at zero-based positions `start..end`.
+/// An inverted or out-of-range window simply produces a shorter (or empty) string.
+fn char_slice(text: &str, start: usize, end: usize) -> String {
+    let wanted = end.saturating_sub(start);
+    text.chars().skip(start).take(wanted).collect()
+}
+
+/// Returns at most the first `max_chars` characters of `text`.
+///
+/// The limit counts `char`s (Unicode scalar values), not bytes, so the cut
+/// never lands inside a multi-byte UTF-8 sequence. A limit of zero yields an
+/// empty string, and text already within the limit is returned unchanged.
+fn truncate_chars(text: &str, max_chars: usize) -> String {
+    // `take` stops after `max_chars` items, like an index-checked loop would.
+    let kept = text.chars().take(max_chars);
+    kept.collect()
+}
+
+/// Returns the SHA-256 digest of `bytes` formatted as lowercase hex.
+#[allow(dead_code)] // Used when producer tools register handle payloads.
+fn sha256_hex(bytes: &[u8]) -> String {
+    let digest = Sha256::digest(bytes);
+    format!("{digest:x}")
+}
+
+fn json_type(value: &Value) -> &'static str {
+    match value {
+        Value::Null => "null",
+        Value::Bool(_) => "bool", // note: "bool", not "boolean"
+        Value::Number(_) => "number", // integers and floats are not distinguished
+        Value::String(_) => "string",
+        Value::Array(_) => "array",
+        Value::Object(_) => "object",
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use serde_json::json;
+
+    fn ctx() -> ToolContext {
+        ToolContext::new(".")
+    }
+
+    #[tokio::test]
+    async fn handle_read_slices_text_by_chars() {
+        let ctx = ctx();
+        let handle = {
+            let mut store = ctx.runtime.handle_store.lock().await;
+            store.insert_text("rlm:test", "matches", "abcdef")
+        };
+        // The store guard is dropped with the block above, before `execute` runs.
+        let result = HandleReadTool
+            .execute(
+                json!({"handle": handle, "slice": {"start": 1, "end": 4}}),
+                &ctx,
+            )
+            .await
+            .expect("execute");
+        let body: Value = serde_json::from_str(&result.content).expect("json");
+        assert_eq!(body["content"], "bcd"); // chars 1..4, end-exclusive
+        assert_eq!(body["truncated"], false);
+    }
+
+    #[tokio::test]
+    async fn handle_read_ranges_text_by_one_based_lines() {
+        let ctx = ctx();
+        let handle = {
+            let mut store = ctx.runtime.handle_store.lock().await;
+            store.insert_text("agent:test", "transcript", "one\ntwo\nthree\nfour")
+        };
+        // `range` bounds are one-based and inclusive: lines 2 through 3.
+        let result = HandleReadTool
+            .execute(
+                json!({"handle": handle, "range": {"start": 2, "end": 3}}),
+                &ctx,
+            )
+            .await
+            .expect("execute");
+        let body: Value = serde_json::from_str(&result.content).expect("json");
+        assert_eq!(body["content"], "two\nthree");
+        assert_eq!(body["meta"]["shown_start"], 2);
+        assert_eq!(body["meta"]["shown_end"], 3);
+    }
+
+    #[tokio::test]
+    async fn handle_read_counts_json_collections() {
+        let ctx = ctx();
+        let handle = {
+            let mut store = ctx.runtime.handle_store.lock().await;
+            store.insert_json("rlm:test", "items", json!([{"a": 1}, {"a": 2}]))
+        };
+        // `count: true` selects the count projection (type/length/bytes metadata).
+        let result = HandleReadTool
+            .execute(json!({"handle": handle, "count": true}), &ctx)
+            .await
+            .expect("execute");
+        let body: Value = serde_json::from_str(&result.content).expect("json");
+        assert_eq!(body["json_type"], "array");
+        assert_eq!(body["length"], 2);
+    }
+
+    #[tokio::test]
+    async fn handle_read_projects_jsonpath_subset() {
+        let ctx = ctx();
+        let handle = {
+            let mut store = ctx.runtime.handle_store.lock().await;
+            store.insert_json(
+                "rlm:test",
+                "items",
+                json!({"items": [{"name": "a"}, {"name": "b"}]}),
+            )
+        };
+        // `[*]` fans out over the array, then `.name` picks one field per item.
+        let result = HandleReadTool
+            .execute(
+                json!({"handle": handle, "jsonpath": "$.items[*].name"}),
+                &ctx,
+            )
+            .await
+            .expect("execute");
+        let body: Value = serde_json::from_str(&result.content).expect("json");
+        assert_eq!(body["matches"], json!(["a", "b"]));
+        assert_eq!(body["count"], 2);
+    }
+
+    #[tokio::test]
+    async fn handle_read_rejects_unbounded_projection_requests() {
+        let ctx = ctx();
+        let handle = {
+            let mut store = ctx.runtime.handle_store.lock().await;
+            store.insert_text("rlm:test", "body", "abc")
+        };
+        // No selector at all: the request must be rejected, not served unbounded.
+        let err = HandleReadTool
+            .execute(json!({"handle": handle}), &ctx)
+            .await
+            .expect_err("projection required");
+        assert!(err.to_string().contains("exactly one")); // text from `parse_projection`
+    }
+}
diff --git a/crates/tui/src/tools/mod.rs b/crates/tui/src/tools/mod.rs
index ce2ac86e..1a6d470f 100644
--- a/crates/tui/src/tools/mod.rs
+++ b/crates/tui/src/tools/mod.rs
@@ -23,6 +23,7 @@ pub mod fim;
 pub mod git;
 pub mod git_history;
 pub mod github;
+pub mod handle;
 pub mod image_ocr;
 pub mod js_execution;
 pub mod large_output_router;
diff --git a/crates/tui/src/tools/registry.rs b/crates/tui/src/tools/registry.rs
index e355a9ef..eff511e0 100644
--- a/crates/tui/src/tools/registry.rs
+++ b/crates/tui/src/tools/registry.rs
@@ -660,15 +660,22 @@ impl ToolRegistryBuilder {
         self.with_tool(Arc::new(RevertTurnTool))
     }
 
-    /// Include the RLM tool (`rlm`). Runs the full recursive language-model
-    /// loop on a long input (file or inline content); the long input never
-    /// enters the calling model's context window. The Python REPL exposes
-    /// `llm_query` / `llm_query_batched` / `rlm_query` / `rlm_query_batched`
-    /// helpers for sub-LLM work — that's where parallel fan-out belongs.
+    /// Include persistent RLM session tools.
     #[must_use]
-    pub fn with_rlm_tool(self, client: Option<DeepSeekClient>, root_model: String) -> Self {
-        use super::rlm::RlmTool;
-        self.with_tool(Arc::new(RlmTool::new(client, root_model)))
+    pub fn with_rlm_tool(self, client: Option<DeepSeekClient>, _root_model: String) -> Self {
+        use super::rlm::{RlmCloseTool, RlmConfigureTool, RlmEvalTool, RlmOpenTool};
+        self.with_tool(Arc::new(RlmOpenTool))
+            .with_tool(Arc::new(RlmEvalTool::new(client)))
+            .with_tool(Arc::new(RlmConfigureTool))
+            .with_tool(Arc::new(RlmCloseTool))
+    }
+
+    /// Include `handle_read`, the bounded projection reader for symbolic
+    /// `var_handle` payloads.
+    #[must_use]
+    pub fn with_handle_tools(self) -> Self {
+        use super::handle::HandleReadTool;
+        self.with_tool(Arc::new(HandleReadTool))
     }
 
     /// Include the review tool.
@@ -769,6 +776,7 @@ impl ToolRegistryBuilder {
             .with_test_runner_tool()
             .with_validation_tools()
             .with_tool_result_retrieval_tool()
+            .with_handle_tools()
             .with_runtime_task_tools()
             .with_revert_turn_tool()
             .with_pandoc_tools()
@@ -840,51 +848,14 @@ impl ToolRegistryBuilder {
         manager: super::subagent::SharedSubAgentManager,
         runtime: super::subagent::SubAgentRuntime,
     ) -> Self {
-        use super::subagent::{
-            AgentAssignTool, AgentCancelTool, AgentCloseTool, AgentListTool, AgentResultTool,
-            AgentResumeTool, AgentSendInputTool, AgentSpawnTool, AgentWaitTool,
-            DelegateToAgentTool,
-        };
+        use super::subagent::{AgentCloseTool, AgentEvalTool, AgentOpenTool};
 
-        self.with_tool(Arc::new(AgentSpawnTool::new(
+        self.with_tool(Arc::new(AgentOpenTool::new(
             manager.clone(),
             runtime.clone(),
         )))
-        .with_tool(Arc::new(AgentSpawnTool::with_name(
-            manager.clone(),
-            runtime.clone(),
-            "spawn_agent",
-        )))
-        .with_tool(Arc::new(DelegateToAgentTool::new(
-            manager.clone(),
-            runtime.clone(),
-        )))
-        .with_tool(Arc::new(AgentResultTool::new(manager.clone())))
-        .with_tool(Arc::new(AgentSendInputTool::new(
-            manager.clone(),
-            "send_input",
-        )))
-        .with_tool(Arc::new(AgentAssignTool::new(
-            manager.clone(),
-            "agent_assign",
-        )))
-        .with_tool(Arc::new(AgentAssignTool::new(
-            manager.clone(),
-            "assign_agent",
-        )))
-        .with_tool(Arc::new(AgentWaitTool::new(manager.clone(), "wait")))
-        .with_tool(Arc::new(AgentSendInputTool::new(
-            manager.clone(),
-            "agent_send_input",
-        )))
-        .with_tool(Arc::new(AgentWaitTool::new(manager.clone(), "agent_wait")))
-        .with_tool(Arc::new(AgentResumeTool::new(
-            manager.clone(),
-            runtime.clone(),
-        )))
-        .with_tool(Arc::new(AgentCloseTool::new(manager.clone())))
-        .with_tool(Arc::new(AgentCancelTool::new(manager.clone())))
-        .with_tool(Arc::new(AgentListTool::new(manager)))
+        .with_tool(Arc::new(AgentEvalTool::new(manager.clone())))
+        .with_tool(Arc::new(AgentCloseTool::new(manager)))
     }
 
     /// Build the registry with the given context.
diff --git a/crates/tui/src/tools/revert_turn.rs b/crates/tui/src/tools/revert_turn.rs
index 9234d1cd..68413e80 100644
--- a/crates/tui/src/tools/revert_turn.rs
+++ b/crates/tui/src/tools/revert_turn.rs
@@ -97,6 +97,17 @@ impl ToolSpec for RevertTurnTool {
                     )
                 })?
                 .clone();
+            if repo
+                .work_tree_matches_snapshot(&target.id)
+                .map_err(|e| format!("Snapshot comparison failed: {e}"))?
+            {
+                return Err(format!(
+                    "NoSnapshotForTurn: target '{}' ({}) already matches the current workspace. \
+                     Revert operates at completed turn boundaries; there is no distinct later snapshot to restore.",
+                    target.label,
+                    short_sha(target.id.as_str()),
+                ));
+            }
             repo.restore(&target.id)
                 .map_err(|e| format!("Restore failed: {e}"))?;
             Ok(format!(
@@ -189,6 +200,24 @@ mod tests {
         assert!(r.is_err());
     }
 
+    #[tokio::test]
+    async fn revert_turn_rejects_snapshot_matching_current_workspace() {
+        let tmp = tempdir().unwrap();
+        let workspace = tmp.path().join("ws");
+        std::fs::create_dir_all(&workspace).unwrap();
+        let _guard = scoped_home(tmp.path());
+
+        let repo = SnapshotRepo::open_or_init(&workspace).unwrap();
+        std::fs::write(workspace.join("a.txt"), b"unchanged").unwrap();
+        repo.snapshot("pre-turn:1").unwrap();
+
+        let tool = RevertTurnTool;
+        let ctx = ToolContext::new(workspace);
+        let r = tool.execute(json!({}), &ctx).await.expect("execute");
+        assert!(!r.success);
+        assert!(r.content.contains("NoSnapshotForTurn"), "{}", r.content);
+    }
+
     #[tokio::test]
     async fn revert_turn_no_snapshots_returns_error_result() {
         let tmp = tempdir().unwrap();
diff --git a/crates/tui/src/tools/rlm.rs b/crates/tui/src/tools/rlm.rs
index 2c7058b4..9d1f4cdf 100644
--- a/crates/tui/src/tools/rlm.rs
+++ b/crates/tui/src/tools/rlm.rs
@@ -1,443 +1,592 @@
-//! `rlm_process` tool — heavy-lift recursive language model as a tool call.
+//! Persistent RLM session tools.
 //!
-//! Where `rlm_query` is a parallel fanout primitive (N prompts → N answers,
-//! stateless), `rlm_process` runs the full recursive-language-model loop
-//! against a long input. The input is loaded into a Python REPL as the
-//! `PROMPT` variable; a sub-agent writes code to chunk it, calls
-//! `llm_query()` / `sub_rlm()` for sub-LLM work, and returns a final string
-//! via `FINAL()`. The model never has to put the long input in its own
-//! context window — it just calls the tool with `task` + `file_path` (or
-//! inline `content`) and reads the synthesized answer back.
-//!
-//! Use when the input genuinely doesn't fit in working context: a whole
-//! file, a long transcript, a multi-document corpus. For short prompts or
-//! parallel fanout, prefer `rlm_query`.
+//! v0.8.33 replaces the old one-shot `rlm` tool with a head/hands surface:
+//! `rlm_open` creates a named Python kernel over a large context,
+//! `rlm_eval` runs bounded probes against it, `rlm_configure` adjusts runtime
+//! feedback, and `rlm_close` tears it down.
+
+use std::sync::Arc;
+use std::time::Instant;
 
 use async_trait::async_trait;
 use serde_json::{Value, json};
 
 use crate::client::DeepSeekClient;
-use crate::rlm::turn::{RlmTermination, run_rlm_turn_with_root};
+use crate::repl::PythonRuntime;
+use crate::rlm::RlmBridge;
+use crate::rlm::session::{
+    ContextMeta, OutputFeedback, RlmSession, derive_session_name, write_context_file,
+};
+use crate::tools::fetch_url::FetchUrlTool;
+use crate::tools::handle::VarHandle;
 use crate::tools::spec::{
     ApprovalRequirement, ToolCapability, ToolContext, ToolError, ToolResult, ToolSpec,
 };
-use crate::utils::spawn_supervised;
 
-/// Default child model — cheap and fast.
 const DEFAULT_CHILD_MODEL: &str = "deepseek-v4-flash";
-/// Default `sub_rlm` recursion budget — paper experiments use 1.
-const DEFAULT_MAX_DEPTH: u32 = 1;
-/// Hard cap on how many chars of inline `content` we'll accept. Larger
-/// inputs should come in via `file_path` so they never enter the caller's
-/// context in the first place.
 const MAX_INLINE_CONTENT_CHARS: usize = 200_000;
+const FULL_STDOUT_HEAD_CHARS: usize = 4_096;
+const FULL_STDOUT_TAIL_CHARS: usize = 1_024;
+const HARD_SUB_RLM_DEPTH_CAP: u32 = 3;
 
-pub struct RlmTool {
-    /// Production HTTP client. `None` when no API key is configured.
-    client: Option<DeepSeekClient>,
-    /// Root model to drive the RLM loop. Set at registration time; matches
-    /// whatever model the parent session is using.
-    root_model: String,
-}
-
-impl RlmTool {
-    #[must_use]
-    pub fn new(client: Option<DeepSeekClient>, root_model: String) -> Self {
-        Self { client, root_model }
-    }
-}
+pub struct RlmOpenTool;
 
 #[async_trait]
-impl ToolSpec for RlmTool {
+impl ToolSpec for RlmOpenTool {
     fn name(&self) -> &'static str {
-        "rlm"
+        "rlm_open"
     }
 
     fn description(&self) -> &'static str {
-        "Specialty tool for processing long inputs that don't fit in your \
-         own context window. Loads the input into a sandboxed Python REPL \
-         as `PROMPT`; a sub-agent writes Python that chunks the input and \
-         calls in-REPL helpers (`llm_query`, `llm_query_batched`, \
-         `rlm_query`, `rlm_query_batched`) to process it, then returns a \
-         synthesized answer. \n\n\
-         Use this tool when the input is genuinely large or when a Python \
-         map-reduce pass plus child LLM calls is the right shape: whole \
-         files, long transcripts, multi-document corpora, bulk semantic \
-         classification, or decomposition/critique work. For exact counts \
-         or structured aggregates, compute them directly in Python inside \
-         the REPL and report the deterministic result instead of asking a \
-         child LLM to guess. For whole-input map-reduce, use the REPL \
-         helpers `chunk_context()` and `chunk_coverage()` so the result \
-         states what was covered. \n\n\
-         Provide `task` (what to do) plus exactly one of `file_path` \
-         (workspace-relative, preferred — keeps the long input out of \
-         your context entirely) or `content` (inline, capped at 200k \
-         chars). The Python helpers (`llm_query`, `rlm_query`, etc.) live \
-         INSIDE the REPL — they are not separately-callable tools. \n\n\
-         Returns the final synthesized answer plus an RLM report showing \
-         input size, iterations, duration, sub-LLM calls, and trace summary."
+        "Open a persistent RLM context. Loads `file_path`, `content`, or `url` \
+         into a named Python kernel and returns only metadata: name, length, \
+         preview, and sha256. Use this for large or unfamiliar inputs so the \
+         parent transcript holds a handle, not the body."
     }
 
     fn input_schema(&self) -> Value {
         json!({
             "type": "object",
-            "required": ["task"],
             "properties": {
-                "task": {
+                "name": {
                     "type": "string",
-                    "description": "What to do with the input (e.g. \"Summarize the security model\", \"Extract all API endpoints\", \"Categorize each row by sentiment\"). The sub-agent uses this as its objective."
+                    "description": "Caller-chosen context name, unique within this parent session. Defaults to a slug from the source."
                 },
                 "file_path": {
                     "type": "string",
-                    "description": "Workspace-relative path to a file to load as PROMPT. Preferred — keeps the long input out of your context. Mutually exclusive with `content`."
+                    "description": "Workspace-relative file to load."
                 },
                 "content": {
                     "type": "string",
-                    "description": "Inline content to load as PROMPT. Use only when the input isn't a file you can point at. Capped at 200k chars."
+                    "description": "Inline content to load. Capped at 200k chars."
                 },
-                "max_depth": {
-                    "type": "integer",
-                    "description": "Recursion budget for `sub_rlm()` calls. 0 disables recursion; default 1 matches paper experiments."
+                "url": {
+                    "type": "string",
+                    "description": "HTTP/HTTPS URL to fetch through fetch_url and load."
                 }
             }
         })
     }
 
     fn capabilities(&self) -> Vec<ToolCapability> {
-        // Network for the LLM calls; ExecutesCode because the sub-agent
-        // runs Python in the REPL (which can do filesystem operations
-        // within its sandbox).
+        vec![
+            ToolCapability::ReadOnly,
+            ToolCapability::Network,
+            ToolCapability::ExecutesCode,
+        ]
+    }
+
+    fn approval_requirement(&self) -> ApprovalRequirement {
+        ApprovalRequirement::Auto
+    }
+
+    async fn execute(&self, input: Value, context: &ToolContext) -> Result<ToolResult, ToolError> {
+        let source_count = ["file_path", "content", "url"]
+            .iter()
+            .filter(|key| input.get(**key).and_then(Value::as_str).is_some())
+            .count();
+        if source_count != 1 {
+            return Err(ToolError::invalid_input(
+                "rlm_open: provide exactly one of `file_path`, `content`, or `url`",
+            ));
+        }
+
+        let (body, source_type, source_hint) = load_source(&input, context).await?;
+        if body.trim().is_empty() {
+            return Err(ToolError::invalid_input(
+                "rlm_open: input is empty after loading",
+            ));
+        }
+
+        let name = input
+            .get("name")
+            .and_then(Value::as_str)
+            .map(str::trim)
+            .filter(|name| !name.is_empty())
+            .map(ToOwned::to_owned)
+            .unwrap_or_else(|| derive_session_name(source_hint.as_deref()));
+        let name_taken = || {
+            ToolError::invalid_input(format!("rlm_open: context name `{name}` already exists"))
+        };
+        if context.runtime.rlm_sessions.lock().await.contains_key(&name) {
+            return Err(name_taken());
+        }
+        let context_path = write_context_file(&body).map_err(|e| {
+            ToolError::execution_failed(format!("rlm_open: failed to stage context: {e}"))
+        })?;
+        let kernel = PythonRuntime::spawn_with_context(&context_path)
+            .await
+            .map_err(|e| ToolError::execution_failed(format!("rlm_open: {e}")))?;
+        let context_meta = ContextMeta::from_body(&body, source_type);
+        let session = RlmSession::new(name.clone(), kernel, context_meta.clone(), context_path);
+        let id = session.id.clone();
+        // The registry lock was released while staging/spawning, so re-check under the
+        // inserting lock; a blind `insert` would silently replace a concurrent session.
+        // NOTE(review): the losing session is dropped here - confirm Drop stops its kernel.
+        let mut sessions = context.runtime.rlm_sessions.lock().await;
+        if sessions.contains_key(&name) {
+            return Err(name_taken());
+        }
+        sessions.insert(name.clone(), Arc::new(tokio::sync::Mutex::new(session)));
+
+        ToolResult::json(&json!({
+            "name": name,
+            "id": id,
+            "length": context_meta.length,
+            "type": context_meta.type_name,
+            "preview_500": context_meta.preview_500,
+            "sha256": context_meta.sha256,
+        }))
+        .map_err(|e| ToolError::execution_failed(e.to_string()))
+    }
+}
+
+pub struct RlmEvalTool {
+    client: Option<DeepSeekClient>, // `None`: `execute` runs the kernel without an `RlmBridge`
+}
+
+impl RlmEvalTool {
+    #[must_use]
+    pub fn new(client: Option<DeepSeekClient>) -> Self {
+        Self { client } // stored as given; no validation happens at construction
+    }
+}
+
+#[async_trait]
+impl ToolSpec for RlmEvalTool {
+    fn name(&self) -> &'static str {
+        "rlm_eval"
+    }
+
+    fn description(&self) -> &'static str {
+        "Run one Python REPL block against a named RLM context. Returns a \
+         bounded projection of stdout/stderr plus metadata. If the code calls \
+         FINAL/finalize, the final value is stored as a var_handle retrievable \
+         with handle_read instead of copied unbounded into the parent context."
+    }
+
+    fn input_schema(&self) -> Value {
+        json!({
+            "type": "object",
+            "required": ["name", "code"],
+            "properties": {
+                "name": { "type": "string", "description": "RLM context name from rlm_open." },
+                "code": { "type": "string", "description": "Python code to execute. Do not include markdown fences." }
+            }
+        })
+    }
+
+    fn capabilities(&self) -> Vec<ToolCapability> {
         vec![ToolCapability::Network, ToolCapability::ExecutesCode]
     }
 
     fn approval_requirement(&self) -> ApprovalRequirement {
-        // Same level as parallel_fanout: the model decided to invoke this, the
-        // user already enabled tools by being in Agent/YOLO mode, and
-        // every concrete side-effect (file read, LLM call) is bounded.
         ApprovalRequirement::Auto
     }
 
-    fn supports_parallel(&self) -> bool {
-        // Each call spins its own sidecar on a kernel-assigned port and
-        // its own per-turn state file, so two calls don't interfere.
-        true
+    async fn execute(&self, input: Value, context: &ToolContext) -> Result<ToolResult, ToolError> {
+        let name = required_non_empty_str(&input, "name")?;
+        let code = required_non_empty_str(&input, "code")?;
+        let session = get_session(context, name).await?;
+        let mut session = session.lock().await;
+        let config = session.config.clone();
+
+        let Some(kernel) = session.kernel.as_mut() else {
+            return Err(ToolError::invalid_input(format!(
+                "rlm_eval: context `{name}` is closed"
+            )));
+        };
+
+        let started = Instant::now();
+        let (round, child_usage) = if let Some(client) = self.client.clone() {
+            let bridge = RlmBridge::new(
+                Arc::new(client),
+                DEFAULT_CHILD_MODEL.to_string(),
+                config.sub_rlm_max_depth.min(HARD_SUB_RLM_DEPTH_CAP),
+            );
+            let usage_handle = bridge.usage_handle();
+            let round = kernel
+                .run(code, Some(&bridge))
+                .await
+                .map_err(|e| ToolError::execution_failed(format!("rlm_eval: {e}")))?;
+            let usage = usage_handle.lock().await.clone();
+            (round, usage)
+        } else {
+            let round = kernel
+                .run(code, None::<&RlmBridge>)
+                .await
+                .map_err(|e| ToolError::execution_failed(format!("rlm_eval: {e}")))?;
+            (round, Default::default())
+        };
+
+        session.rpc_count = session.rpc_count.saturating_add(round.rpc_count);
+        session.total_duration += round.elapsed;
+        session.last_used_at = Instant::now();
+
+        let final_handle = if let Some(value) = round.final_value.clone() {
+            session.final_count = session.final_count.saturating_add(1);
+            let handle_name = format!("final_{}", session.final_count);
+            let handle = {
+                let mut store = context.runtime.handle_store.lock().await;
+                store.insert_text(session.id.clone(), handle_name, value)
+            };
+            Some(handle)
+        } else {
+            None
+        };
+
+        let had_error = round.has_error;
+        let rpc_count = round.rpc_count;
+        let duration_ms = round.elapsed.as_millis() as u64;
+        let stdout_preview = match config.output_feedback {
+            OutputFeedback::Full => Some(preview_output(&round.full_stdout)),
+            OutputFeedback::Metadata => None,
+        };
+        let stderr_preview = match config.output_feedback {
+            OutputFeedback::Full if !round.stderr.is_empty() => Some(preview_output(&round.stderr)),
+            _ => None,
+        };
+
+        let mut output = json!({
+            "name": session.name,
+            "id": session.id,
+            "duration_ms": duration_ms,
+            "rpc_count": rpc_count,
+            "had_error": had_error,
+            "new_vars": [],
+            "final": final_handle,
+        });
+        if let Some(stdout_preview) = stdout_preview {
+            output["stdout_preview"] = json!(stdout_preview);
+        }
+        if let Some(stderr_preview) = stderr_preview {
+            output["stderr_preview"] = json!(stderr_preview);
+        }
+        if let Some(confidence) = round.final_confidence.clone() {
+            output["confidence"] = confidence;
+        }
+
+        let metadata = json!({
+            "tool": "rlm_eval",
+            "duration_ms": started.elapsed().as_millis() as u64,
+            "child_input_tokens": child_usage.input_tokens,
+            "child_output_tokens": child_usage.output_tokens,
+            "child_prompt_cache_hit_tokens": child_usage.prompt_cache_hit_tokens,
+            "child_prompt_cache_miss_tokens": child_usage.prompt_cache_miss_tokens,
+            "child_model": DEFAULT_CHILD_MODEL,
+        });
+
+        Ok(ToolResult::json(&output)
+            .map_err(|e| ToolError::execution_failed(e.to_string()))?
+            .with_metadata(metadata))
+    }
+}
+
+pub struct RlmConfigureTool;
+
+#[async_trait]
+impl ToolSpec for RlmConfigureTool {
+    fn name(&self) -> &'static str {
+        "rlm_configure"
+    }
+
+    fn description(&self) -> &'static str {
+        "Configure a named RLM context: output feedback, child query timeout, \
+         recursive sub-RLM depth, and explicit session sharing."
+    }
+
+    fn input_schema(&self) -> Value {
+        json!({
+            "type": "object",
+            "required": ["name"],
+            "properties": {
+                "name": { "type": "string", "description": "RLM context name from rlm_open." },
+                "output_feedback": { "type": "string", "enum": ["full", "metadata"], "description": "`full` returns bounded stdout/stderr previews from rlm_eval; `metadata` omits them." },
+                "sub_query_timeout_secs": { "type": "integer", "description": "Child query timeout in seconds; values outside 1-600 are clamped into that range." },
+                "sub_rlm_max_depth": { "type": "integer", "minimum": 0, "maximum": 3, "description": "Recursive sub-RLM depth; values above the hard cap are clamped to it." },
+                "share_session": { "type": "boolean" }
+            }
+        })
+    }
+
+    fn capabilities(&self) -> Vec<ToolCapability> {
+        vec![ToolCapability::ReadOnly]
     }
 
     async fn execute(&self, input: Value, context: &ToolContext) -> Result<ToolResult, ToolError> {
-        let Some(client) = self.client.clone() else {
-            return Err(ToolError::not_available(
-                "rlm_process requires an active DeepSeek client".to_string(),
-            ));
-        };
+        let name = required_non_empty_str(&input, "name")?;
+        let session = get_session(context, name).await?;
+        let mut session = session.lock().await;
 
-        let task = input
-            .get("task")
-            .and_then(|v| v.as_str())
-            .ok_or_else(|| ToolError::MissingField {
-                field: "task".to_string(),
-            })?
-            .trim();
-        if task.is_empty() {
-            return Err(ToolError::invalid_input("rlm: `task` is empty"));
-        }
-
-        let file_path = input.get("file_path").and_then(|v| v.as_str());
-        let content = input.get("content").and_then(|v| v.as_str());
-
-        let body = match (file_path, content) {
-            (Some(_), Some(_)) => {
-                return Err(ToolError::invalid_input(
-                    "rlm: pass `file_path` OR `content`, not both",
-                ));
-            }
-            (None, None) => {
-                return Err(ToolError::invalid_input(
-                    "rlm: requires `file_path` (preferred) or `content`",
-                ));
-            }
-            (Some(path), None) => {
-                let resolved = context.resolve_path(path)?;
-                tokio::fs::read_to_string(&resolved).await.map_err(|e| {
-                    ToolError::ExecutionFailed {
-                        message: format!("read {}: {e}", resolved.display()),
-                    }
-                })?
-            }
-            (None, Some(c)) => {
-                if c.chars().count() > MAX_INLINE_CONTENT_CHARS {
+        if let Some(value) = input.get("output_feedback").and_then(Value::as_str) {
+            session.config.output_feedback = match value {
+                "full" => OutputFeedback::Full,
+                "metadata" => OutputFeedback::Metadata,
+                other => {
                     return Err(ToolError::invalid_input(format!(
-                        "rlm: inline `content` is {} chars (cap {MAX_INLINE_CONTENT_CHARS}). Pass `file_path` for larger inputs.",
-                        c.chars().count()
+                        "rlm_configure: invalid output_feedback `{other}`"
                     )));
                 }
-                c.to_string()
-            }
-        };
-
-        if body.trim().is_empty() {
-            return Err(ToolError::invalid_input(
-                "rlm: input is empty after loading",
-            ));
+            };
         }
-        let input_chars = body.chars().count();
-        let input_lines = body.lines().count();
-
-        // Pin child calls to Flash so model-generated tool args cannot quietly
-        // turn fanout work into Pro-billed requests. The RLM root still uses
-        // the session model; child helper calls are the cheap batch layer.
-        let child_model = DEFAULT_CHILD_MODEL.to_string();
-
-        let max_depth = input
-            .get("max_depth")
-            .and_then(|v| v.as_u64())
-            .map(|n| n.min(u64::from(u32::MAX)) as u32)
-            .unwrap_or(DEFAULT_MAX_DEPTH);
-
-        // The tool framework doesn't expose a per-tool event stream, and
-        // we don't want RLM's progress events to interleave with the
-        // parent agent's stream. Drain into a no-op channel.
-        let (tx, mut rx) = tokio::sync::mpsc::channel(64);
-        let drain = spawn_supervised(
-            "rlm-progress-drain",
-            std::panic::Location::caller(),
-            async move { while rx.recv().await.is_some() {} },
-        );
-
-        // The big body lives only in the REPL as `context`. The small
-        // `task` rides along as `root_prompt` and is shown to the root
-        // LLM each iteration so it never forgets the objective.
-        let result = run_rlm_turn_with_root(
-            &client,
-            self.root_model.clone(),
-            body,
-            Some(task.to_string()),
-            child_model.clone(),
-            tx,
-            max_depth,
-        )
-        .await;
-
-        drain.abort();
-
-        if let Some(err) = result.error {
-            return Err(ToolError::ExecutionFailed {
-                message: format!(
-                    "rlm: {err} (iterations={}, termination={:?})",
-                    result.iterations, result.termination
-                ),
-            });
+        if let Some(timeout) = input.get("sub_query_timeout_secs").and_then(Value::as_u64) {
+            session.config.sub_query_timeout_secs = timeout.clamp(1, 600);
+        }
+        if let Some(depth) = input.get("sub_rlm_max_depth").and_then(Value::as_u64) {
+            session.config.sub_rlm_max_depth = depth.min(u64::from(HARD_SUB_RLM_DEPTH_CAP)) as u32;
+        }
+        if let Some(share) = input.get("share_session").and_then(Value::as_bool) {
+            session.config.share_session = share;
         }
 
-        if result.answer.trim().is_empty() {
-            return Err(ToolError::ExecutionFailed {
-                message: format!(
-                    "rlm: empty answer (termination={:?}, iterations={})",
-                    result.termination, result.iterations
-                ),
-            });
-        }
-
-        // Surface the termination reason and a brief per-round trace so the
-        // user can verify the sub-agent actually engaged with `context`
-        // through sub-LLM calls — not just inferred an answer from the
-        // preview.
-        let footer = match result.termination {
-            RlmTermination::Final => String::new(),
-            RlmTermination::NoCode => format!(
-                "\n\n[warning: sub-agent failed to engage the REPL after {} iterations — answer is the model's last raw response]",
-                result.iterations
-            ),
-            RlmTermination::Exhausted => format!(
-                "\n\n[warning: sub-agent hit the {}-iteration cap without FINAL()]",
-                result.iterations
-            ),
-            RlmTermination::Error => String::new(),
-        };
-
-        let report = format!(
-            "RLM report:\n- input: {input_lines} line(s), {input_chars} char(s)\n- iterations: {}\n- duration: {}ms\n- sub-LLM RPCs: {}\n- termination: {:?}\n\nAnswer:\n",
-            result.iterations,
-            result.duration.as_millis(),
-            result.total_rpcs,
-            result.termination,
-        );
-
-        let trace_summary = if result.trace.is_empty() {
-            String::from("\n\n[trace: no REPL rounds executed]")
-        } else {
-            let mut s = String::from("\n\n[RLM trace]");
-            for r in &result.trace {
-                let head = r
-                    .code_summary
-                    .lines()
-                    .next()
-                    .unwrap_or(r.code_summary.as_str())
-                    .chars()
-                    .take(80)
-                    .collect::<String>();
-                s.push_str(&format!(
-                    "\n  round {}: {} sub-LLM call(s), {}ms{} — {}",
-                    r.round,
-                    r.rpc_count,
-                    r.elapsed_ms,
-                    if r.had_error { " (error)" } else { "" },
-                    head
-                ));
-            }
-            s
-        };
-
-        let trace_json: Vec<_> = result
-            .trace
-            .iter()
-            .map(|r| {
-                json!({
-                    "round": r.round,
-                    "rpc_count": r.rpc_count,
-                    "elapsed_ms": r.elapsed_ms,
-                    "had_error": r.had_error,
-                    "code_summary": r.code_summary,
-                    "stdout_preview": r.stdout_preview,
-                })
-            })
-            .collect();
-
-        // The `child_*` keys are the contract the engine reads in
-        // `tool_routing::accrue_child_token_cost_if_any` to roll
-        // sub-LLM token usage into the session-cost counter. RLM
-        // spawns its own DeepSeek calls under `child_model`; without
-        // this accrual the dashboard under-reports a session that
-        // uses RLM heavily by 10-20× because only the parent turn's
-        // tokens hit `accrue_session_cost` (#524).
-        let metadata = json!({
-            "iterations": result.iterations,
-            "duration_ms": result.duration.as_millis() as u64,
-            "input_tokens": result.usage.input_tokens,
-            "output_tokens": result.usage.output_tokens,
-            "child_input_tokens": result.usage.input_tokens,
-            "child_output_tokens": result.usage.output_tokens,
-            "child_prompt_cache_hit_tokens": result.usage.prompt_cache_hit_tokens,
-            "child_prompt_cache_miss_tokens": result.usage.prompt_cache_miss_tokens,
-            "child_model": child_model,
-            "termination": format!("{:?}", result.termination).to_lowercase(),
-            "max_depth": max_depth,
-            "context_chars": input_chars,
-            "context_lines": input_lines,
-            "total_rpcs": result.total_rpcs,
-            "trace": trace_json,
-        });
-
-        Ok(ToolResult::success(format!(
-            "{report}{}{}{}",
-            result.answer, footer, trace_summary
-        ))
-        .with_metadata(metadata))
+        ToolResult::json(&json!({
+            "name": session.name,
+            "current_config": session.config,
+        }))
+        .map_err(|e| ToolError::execution_failed(e.to_string()))
     }
 }
 
+pub struct RlmCloseTool;
+
+#[async_trait]
+impl ToolSpec for RlmCloseTool {
+    fn name(&self) -> &'static str {
+        "rlm_close"
+    }
+
+    fn description(&self) -> &'static str {
+        "Close a named RLM context, tear down its Python kernel, and return \
+         usage/lifecycle metadata."
+    }
+
+    fn input_schema(&self) -> Value {
+        json!({
+            "type": "object",
+            "required": ["name"],
+            "properties": {
+                "name": { "type": "string", "description": "RLM context name from rlm_open." }
+            }
+        })
+    }
+
+    fn capabilities(&self) -> Vec<ToolCapability> {
+        vec![ToolCapability::ReadOnly]
+    }
+
+    async fn execute(&self, input: Value, context: &ToolContext) -> Result<ToolResult, ToolError> {
+        let name = required_non_empty_str(&input, "name")?;
+        let removed = {
+            let mut sessions = context.runtime.rlm_sessions.lock().await;
+            sessions.remove(name)
+        }; // registry lock is released here, before the session itself is locked
+        let Some(session) = removed else {
+            return Err(ToolError::invalid_input(format!(
+                "rlm_close: unknown context `{name}`"
+            )));
+        };
+
+        let mut session = session.lock().await; // waits for any call still holding this session
+        let kernel = session.kernel.take(); // detach the kernel; the session keeps `None`
+        let output = json!({
+            "name": session.name,
+            "id": session.id,
+            "rpc_count": session.rpc_count,
+            "total_duration_ms": session.total_duration.as_millis() as u64,
+            "peak_var_count": session.peak_var_count,
+            "created_ms_ago": session.created_at.elapsed().as_millis() as u64,
+            "context_path": session.context_path,
+        });
+        drop(session); // unlock the session before awaiting kernel shutdown
+
+        if let Some(kernel) = kernel {
+            kernel.shutdown().await;
+        }
+
+        ToolResult::json(&output).map_err(|e| ToolError::execution_failed(e.to_string()))
+    }
+}
+
+async fn load_source(
+    input: &Value,
+    context: &ToolContext,
+) -> Result<(String, String, Option<String>), ToolError> {
+    if let Some(path) = input.get("file_path").and_then(Value::as_str) {
+        let resolved = context.resolve_path(path)?;
+        let body = tokio::fs::read_to_string(&resolved).await.map_err(|e| {
+            ToolError::execution_failed(format!("rlm_open: read {}: {e}", resolved.display()))
+        })?;
+        return Ok((body, "file".to_string(), Some(path.to_string())));
+    }
+
+    if let Some(content) = input.get("content").and_then(Value::as_str) {
+        if content.chars().count() > MAX_INLINE_CONTENT_CHARS {
+            return Err(ToolError::invalid_input(format!(
+                "rlm_open: inline content is {} chars (cap {MAX_INLINE_CONTENT_CHARS})",
+                content.chars().count()
+            )));
+        }
+        return Ok((content.to_string(), "content".to_string(), None));
+    }
+
+    let url = input
+        .get("url")
+        .and_then(Value::as_str)
+        .ok_or_else(|| ToolError::invalid_input("rlm_open: missing source"))?;
+    let result = FetchUrlTool
+        .execute(json!({"url": url, "format": "raw"}), context)
+        .await?;
+    let parsed: Value = serde_json::from_str(&result.content).map_err(|e| {
+        ToolError::execution_failed(format!("rlm_open: fetch_url returned invalid JSON: {e}"))
+    })?;
+    let body = parsed
+        .get("content")
+        .and_then(Value::as_str)
+        .ok_or_else(|| ToolError::execution_failed("rlm_open: fetched body missing content"))?
+        .to_string();
+    let source_type = parsed
+        .get("content_type")
+        .and_then(Value::as_str)
+        .unwrap_or("url")
+        .to_string();
+    Ok((body, source_type, Some(url.to_string())))
+}
+
+async fn get_session(
+    context: &ToolContext,
+    name: &str,
+) -> Result<Arc<tokio::sync::Mutex<RlmSession>>, ToolError> {
+    let sessions = context.runtime.rlm_sessions.lock().await;
+    sessions.get(name).cloned().ok_or_else(|| {
+        ToolError::invalid_input(format!("unknown RLM context `{name}`; call rlm_open first"))
+    })
+}
+
+fn required_non_empty_str<'a>(input: &'a Value, field: &str) -> Result<&'a str, ToolError> {
+    let value = input
+        .get(field)
+        .and_then(Value::as_str)
+        .ok_or_else(|| ToolError::missing_field(field))?
+        .trim();
+    if value.is_empty() {
+        return Err(ToolError::invalid_input(format!(
+            "rlm: `{field}` must not be empty"
+        )));
+    }
+    Ok(value)
+}
+
+fn preview_output(text: &str) -> String {
+    let total = text.chars().count();
+    if total <= FULL_STDOUT_HEAD_CHARS + FULL_STDOUT_TAIL_CHARS {
+        return text.to_string();
+    }
+    let head: String = text.chars().take(FULL_STDOUT_HEAD_CHARS).collect();
+    let tail: String = text
+        .chars()
+        .skip(total.saturating_sub(FULL_STDOUT_TAIL_CHARS))
+        .collect();
+    format!(
+        "{head}\n... [{} chars truncated, retrieve via handle_read when returned as a handle] ...\n{tail}",
+        total.saturating_sub(FULL_STDOUT_HEAD_CHARS + FULL_STDOUT_TAIL_CHARS)
+    )
+}
+
+#[allow(dead_code)]
+fn _assert_var_handle_shape(_: Option<VarHandle>) {}
+
 #[cfg(test)]
 mod tests {
     use super::*;
-
-    fn tool() -> RlmTool {
-        RlmTool::new(None, "deepseek-v4-pro".to_string())
-    }
+    use crate::tools::spec::ToolContext;
 
     fn ctx() -> ToolContext {
-        use std::path::PathBuf;
-        ToolContext::with_auto_approve(
-            PathBuf::from("."),
-            false,
-            PathBuf::from("notes.txt"),
-            PathBuf::from("mcp.json"),
-            true,
-        )
+        ToolContext::new(".")
     }
 
     #[test]
-    fn name_and_schema() {
-        let t = tool();
-        assert_eq!(t.name(), "rlm");
-        let schema = t.input_schema();
-        assert!(schema["properties"]["task"].is_object());
-        assert!(schema["properties"]["file_path"].is_object());
-        assert!(schema["properties"]["content"].is_object());
-        assert!(schema["properties"]["max_depth"].is_object());
-        let required = schema["required"].as_array().unwrap();
-        assert!(required.iter().any(|v| v == "task"));
-    }
-
-    #[test]
-    fn approval_is_auto_so_calls_are_unattended() {
-        assert_eq!(tool().approval_requirement(), ApprovalRequirement::Auto);
-    }
-
-    #[test]
-    fn capabilities_include_network_and_executes_code() {
-        let caps = tool().capabilities();
-        assert!(caps.contains(&ToolCapability::Network));
-        assert!(caps.contains(&ToolCapability::ExecutesCode));
-    }
-
-    #[test]
-    fn supports_parallel_dispatch() {
-        assert!(tool().supports_parallel());
-    }
-
-    #[test]
-    fn description_steers_without_suppressing_rlm_use() {
-        let t = tool();
-        let description = t.description();
-        assert!(
-            description.contains("Use this tool when"),
-            "description should positively explain the RLM fit"
-        );
-        assert!(
-            !description.contains("DO NOT use"),
-            "avoid training the model to avoid an available tool"
-        );
-        assert!(
-            !description.contains("slower and more expensive"),
-            "cost caveats belong in verification guidance, not tool suppression"
-        );
+    fn schema_uses_new_tool_names() {
+        assert_eq!(RlmOpenTool.name(), "rlm_open");
+        assert_eq!(RlmEvalTool::new(None).name(), "rlm_eval");
+        assert_eq!(RlmConfigureTool.name(), "rlm_configure");
+        assert_eq!(RlmCloseTool.name(), "rlm_close");
     }
 
     #[tokio::test]
-    async fn returns_not_available_without_client() {
-        let t = tool();
+    async fn rlm_session_open_eval_close_lifecycle() {
         let ctx = ctx();
-        let res = t
-            .execute(json!({"task": "x", "content": "y"}), &ctx)
+        RlmOpenTool
+            .execute(
+                json!({"name": "sample", "content": "alpha\nbeta\ngamma"}),
+                &ctx,
+            )
             .await
-            .expect_err("must error");
-        assert!(matches!(res, ToolError::NotAvailable { .. }));
+            .expect("open");
+
+        let eval = RlmEvalTool::new(None)
+            .execute(json!({"name": "sample", "code": "print('ok')"}), &ctx)
+            .await
+            .expect("eval");
+        let eval_json: Value = serde_json::from_str(&eval.content).expect("eval json");
+        assert_eq!(eval_json["stdout_preview"], "ok\n");
+
+        let close = RlmCloseTool
+            .execute(json!({"name": "sample"}), &ctx)
+            .await
+            .expect("close");
+        assert!(close.content.contains("sample"));
     }
 
     #[tokio::test]
-    async fn rejects_missing_task() {
-        let t = RlmTool::new(None, "x".into());
+    async fn rlm_eval_final_returns_handle() {
         let ctx = ctx();
-        let res = t
-            .execute(json!({"content": "abc"}), &ctx)
+        RlmOpenTool
+            .execute(json!({"name": "finals", "content": "body"}), &ctx)
             .await
-            .expect_err("must error");
-        // Without a client we hit NotAvailable first. Re-check ordering by
-        // injecting an obviously-bad payload that would trip earlier.
-        assert!(matches!(
-            res,
-            ToolError::NotAvailable { .. } | ToolError::MissingField { .. }
-        ));
+            .expect("open");
+
+        let eval = RlmEvalTool::new(None)
+            .execute(
+                json!({"name": "finals", "code": "finalize('done', confidence=0.8)"}),
+                &ctx,
+            )
+            .await
+            .expect("eval");
+        let eval_json: Value = serde_json::from_str(&eval.content).expect("eval json");
+        assert_eq!(eval_json["final"]["kind"], "var_handle");
+        assert_eq!(eval_json["final"]["name"], "final_1");
+        assert_eq!(eval_json["confidence"], 0.8);
+
+        RlmCloseTool
+            .execute(json!({"name": "finals"}), &ctx)
+            .await
+            .expect("close");
     }
 
     #[tokio::test]
-    async fn rejects_both_path_and_content() {
-        // Even without a client, the input-shape check should fire if we
-        // bypass the client guard. Simpler: just verify the schema lists
-        // the two as alternatives via descriptions.
-        let schema = tool().input_schema();
-        let path_desc = schema["properties"]["file_path"]["description"]
-            .as_str()
-            .unwrap();
-        assert!(path_desc.to_lowercase().contains("mutually exclusive"));
+    async fn rlm_configure_metadata_omits_stdout() {
+        let ctx = ctx();
+        RlmOpenTool
+            .execute(json!({"name": "quiet", "content": "body"}), &ctx)
+            .await
+            .expect("open");
+        RlmConfigureTool
+            .execute(
+                json!({"name": "quiet", "output_feedback": "metadata", "sub_rlm_max_depth": 99}),
+                &ctx,
+            )
+            .await
+            .expect("configure");
+
+        let eval = RlmEvalTool::new(None)
+            .execute(json!({"name": "quiet", "code": "print('hidden')"}), &ctx)
+            .await
+            .expect("eval");
+        let eval_json: Value = serde_json::from_str(&eval.content).expect("eval json");
+        assert!(eval_json.get("stdout_preview").is_none());
+
+        RlmCloseTool
+            .execute(json!({"name": "quiet"}), &ctx)
+            .await
+            .expect("close");
     }
 }
diff --git a/crates/tui/src/tools/search.rs b/crates/tui/src/tools/search.rs
index 4acc5845..c1fb5bbc 100644
--- a/crates/tui/src/tools/search.rs
+++ b/crates/tui/src/tools/search.rs
@@ -213,9 +213,16 @@ impl ToolSpec for GrepFilesTool {
             }
         }
 
-        // Build result
+        let matches_json: Vec<Value> = results
+            .iter()
+            .map(|item| grep_match_to_json(item, context_lines))
+            .collect();
+
+        // Build result. When context_lines == 1, return the single context
+        // line as a string instead of a one-item array. That keeps the common
+        // "show just the adjacent line" case easy for model callers to read.
         let result = json!({
-            "matches": results,
+            "matches": matches_json,
             "total_matches": total_matches,
             "files_searched": files_searched,
             "truncated": total_matches > max_results,
@@ -225,6 +232,20 @@ impl ToolSpec for GrepFilesTool {
     }
 }
 
+fn grep_match_to_json(item: &GrepMatch, context_lines: usize) -> Value {
+    if context_lines == 1 {
+        json!({
+            "file": item.file,
+            "line_number": item.line_number,
+            "line": item.line,
+            "context_before": item.context_before.first().cloned().unwrap_or_default(),
+            "context_after": item.context_after.first().cloned().unwrap_or_default(),
+        })
+    } else {
+        json!(item)
+    }
+}
+
 /// Collect files to search based on include/exclude patterns
 fn collect_files(
     root: &Path,
@@ -315,7 +336,7 @@ fn should_include(path: &str, patterns: &[String]) -> bool {
 
 /// Simple glob pattern matching
 /// Supports: * (any chars), ** (any path), ? (single char)
-fn matches_glob(path: &str, pattern: &str) -> bool {
+pub(crate) fn matches_glob(path: &str, pattern: &str) -> bool {
     // Handle ** for any path
     if pattern.contains("**") {
         let parts: Vec<&str> = pattern.split("**").collect();
@@ -502,6 +523,34 @@ mod tests {
         assert!(result.success);
         assert!(result.content.contains("line2")); // context before
         assert!(result.content.contains("line4")); // context after
+
+        let parsed: Value = serde_json::from_str(&result.content).unwrap();
+        let matches = parsed["matches"].as_array().unwrap();
+        assert_eq!(matches.len(), 1);
+        assert_eq!(matches[0]["context_before"], "line2");
+        assert_eq!(matches[0]["context_after"], "line4");
+        assert!(matches[0]["context_before"].is_string());
+        assert!(matches[0]["context_after"].is_string());
+    }
+
+    #[tokio::test]
+    async fn test_grep_files_multi_line_context_remains_arrays() {
+        let tmp = tempdir().expect("tempdir");
+        let ctx = ToolContext::new(tmp.path().to_path_buf());
+
+        fs::write(tmp.path().join("test.txt"), "a\nb\nMATCH\nd\ne\n").expect("write");
+
+        let tool = GrepFilesTool;
+        let result = tool
+            .execute(json!({"pattern": "MATCH", "context_lines": 2}), &ctx)
+            .await
+            .expect("execute");
+
+        let parsed: Value = serde_json::from_str(&result.content).unwrap();
+        let matches = parsed["matches"].as_array().unwrap();
+        assert_eq!(matches.len(), 1);
+        assert_eq!(matches[0]["context_before"], json!(["a", "b"]));
+        assert_eq!(matches[0]["context_after"], json!(["d", "e"]));
     }
 
     #[tokio::test]
diff --git a/crates/tui/src/tools/shell.rs b/crates/tui/src/tools/shell.rs
index 27773e43..6eab3a18 100644
--- a/crates/tui/src/tools/shell.rs
+++ b/crates/tui/src/tools/shell.rs
@@ -1586,6 +1586,7 @@ async fn execute_foreground_via_background(
     command: &str,
     timeout_ms: u64,
     stdin_data: Option<&str>,
+    tty: bool,
     policy_override: Option<ExecutionSandboxPolicy>,
     extra_env: HashMap<String, String>,
 ) -> Result<ShellResult> {
@@ -1602,7 +1603,7 @@ async fn execute_foreground_via_background(
             timeout_ms,
             true,
             stdin_data,
-            false,
+            tty,
             policy_override,
             extra_env,
         )?
@@ -1706,6 +1707,10 @@ impl ToolSpec for ExecShellTool {
                 "tty": {
                     "type": "boolean",
                     "description": "Allocate a pseudo-terminal for interactive programs (implies background)"
+                },
+                "combined_output": {
+                    "type": "boolean",
+                    "description": "Capture stdout and stderr as one chronological PTY stream (default false). In foreground mode, waits for completion; in background mode, implies tty."
                 }
             },
             "required": ["command"]
@@ -1733,7 +1738,8 @@ impl ToolSpec for ExecShellTool {
         let timeout_ms = optional_u64(&input, "timeout_ms", 120_000).min(600_000);
         let background = optional_bool(&input, "background", false);
         let interactive = optional_bool(&input, "interactive", false);
-        let tty = optional_bool(&input, "tty", false);
+        let combined_output = optional_bool(&input, "combined_output", false);
+        let tty = optional_bool(&input, "tty", false) || (combined_output && background);
         let stdin_data = input
             .get("stdin")
             .or_else(|| input.get("input"))
@@ -1746,9 +1752,9 @@ impl ToolSpec for ExecShellTool {
                 "Interactive commands cannot run in background mode.",
             ));
         }
-        if interactive && tty {
+        if interactive && (tty || combined_output) {
             return Ok(ToolResult::error(
-                "Interactive mode cannot be combined with TTY sessions.",
+                "Interactive mode cannot be combined with TTY or combined_output sessions.",
             ));
         }
         if interactive && stdin_data.is_some() {
@@ -1969,6 +1975,7 @@ impl ToolSpec for ExecShellTool {
                 command,
                 timeout_ms,
                 stdin_data.as_deref(),
+                combined_output,
                 policy_override,
                 extra_env,
             )
@@ -2067,6 +2074,7 @@ impl ToolSpec for ExecShellTool {
                     "stderr_summary": stderr_summary,
                     "safety_level": format!("{:?}", safety.level),
                     "interactive": interactive,
+                    "combined_output": combined_output,
                     "canceled": was_cancelled,
                     "execpolicy": execpolicy_decision.as_ref().map(|decision| match decision {
                         ExecPolicyDecision::Allow => json!({
diff --git a/crates/tui/src/tools/shell/tests.rs b/crates/tui/src/tools/shell/tests.rs
index 4e71c29c..1c5970c3 100644
--- a/crates/tui/src/tools/shell/tests.rs
+++ b/crates/tui/src/tools/shell/tests.rs
@@ -403,6 +403,29 @@ async fn test_exec_shell_metadata_includes_summaries() {
     assert!(meta.get("stdout_truncated").is_some());
 }
 
+#[cfg(not(windows))]
+#[tokio::test]
+async fn test_exec_shell_combined_output_uses_single_stream() {
+    let tmp = tempdir().expect("tempdir");
+    let ctx = ToolContext::new(tmp.path());
+    let tool = ExecShellTool;
+    let command = "printf 'out\\n'; printf 'err\\n' >&2";
+
+    let result = tool
+        .execute(json!({"command": command, "combined_output": true}), &ctx)
+        .await
+        .expect("execute");
+    assert!(result.success, "{}", result.content);
+    assert!(result.content.contains("out"), "{}", result.content);
+    assert!(result.content.contains("err"), "{}", result.content);
+
+    let meta = result.metadata.expect("metadata");
+    assert_eq!(
+        meta.get("combined_output").and_then(Value::as_bool),
+        Some(true)
+    );
+}
+
 #[tokio::test]
 async fn test_exec_shell_foreground_timeout_guides_background_rerun() {
     let tmp = tempdir().expect("tempdir");
diff --git a/crates/tui/src/tools/spec.rs b/crates/tui/src/tools/spec.rs
index 55b5cb5f..21c91fa5 100644
--- a/crates/tui/src/tools/spec.rs
+++ b/crates/tui/src/tools/spec.rs
@@ -16,7 +16,9 @@ use tokio_util::sync::CancellationToken;
 use crate::features::Features;
 use crate::lsp::LspManager;
 use crate::network_policy::NetworkPolicyDecider;
+use crate::rlm::session::{SharedRlmSessionStore, new_shared_rlm_session_store};
 use crate::sandbox::backend::SandboxBackend;
+use crate::tools::handle::{SharedHandleStore, new_shared_handle_store};
 use crate::tools::shell::{SharedShellManager, new_shared_shell_manager};
 #[allow(unused_imports)]
 pub use deepseek_tools::{
@@ -30,7 +32,7 @@ pub use deepseek_tools::{
 /// contexts keep working. Tools that need durable task/automation state fail
 /// closed with a clear "not available" error when the relevant service is not
 /// attached.
-#[derive(Clone, Default)]
+#[derive(Clone)]
 pub struct RuntimeToolServices {
     pub shell_manager: Option<SharedShellManager>,
     pub task_manager: Option<crate::task_manager::SharedTaskManager>,
@@ -42,6 +44,27 @@ pub struct RuntimeToolServices {
     /// tool-side hook events. `None` outside the live engine — test
     /// contexts that don't care about hooks get a no-op.
     pub hook_executor: Option<std::sync::Arc<crate::hooks::HookExecutor>>,
+    /// Per-session backing store for `var_handle` payloads. Cloned tool
+    /// contexts share this Arc so handles survive across turns.
+    pub handle_store: SharedHandleStore,
+    /// Per-session persistent RLM kernels, keyed by caller-chosen context name.
+    pub rlm_sessions: SharedRlmSessionStore,
+}
+
+impl Default for RuntimeToolServices {
+    fn default() -> Self {
+        Self {
+            shell_manager: None,
+            task_manager: None,
+            automations: None,
+            task_data_dir: None,
+            active_task_id: None,
+            active_thread_id: None,
+            hook_executor: None,
+            handle_store: new_shared_handle_store(),
+            rlm_sessions: new_shared_rlm_session_store(),
+        }
+    }
 }
 
 impl std::fmt::Debug for RuntimeToolServices {
@@ -54,6 +77,8 @@ impl std::fmt::Debug for RuntimeToolServices {
             .field("active_task_id", &self.active_task_id)
             .field("active_thread_id", &self.active_thread_id)
             .field("hook_executor", &self.hook_executor.is_some())
+            .field("handle_store", &true)
+            .field("rlm_sessions", &true)
             .finish()
     }
 }
diff --git a/crates/tui/src/tools/subagent/mod.rs b/crates/tui/src/tools/subagent/mod.rs
index abfb25bd..2b56d339 100644
--- a/crates/tui/src/tools/subagent/mod.rs
+++ b/crates/tui/src/tools/subagent/mod.rs
@@ -3,6 +3,11 @@
 //! Provides tools to spawn background sub-agents, query their status,
 //! and retrieve results. Sub-agents run with a filtered toolset and
 //! inherit the workspace configuration from the main session.
+//!
+//! v0.8.33's new model-facing surface is `agent_open` / `agent_eval` /
+//! `agent_close`. Some older structs and manager helpers remain in this
+//! module while the durable runtime is being reused by the new surface.
+#![allow(dead_code)]
 
 use std::collections::{HashMap, VecDeque};
 use std::fs;
@@ -24,6 +29,7 @@ use crate::config::MAX_SUBAGENTS;
 use crate::core::events::Event;
 use crate::llm_client::LlmClient;
 use crate::models::{ContentBlock, Message, MessageRequest, SystemPrompt, Tool};
+use crate::tools::handle::VarHandle;
 use crate::tools::plan::{PlanState, SharedPlanState};
 use crate::tools::registry::{ToolRegistry, ToolRegistryBuilder};
 use crate::tools::spec::{
@@ -64,6 +70,7 @@ const TOOL_TIMEOUT: Duration = Duration::from_secs(30);
 const STEP_API_TIMEOUT: Duration = Duration::from_secs(120);
 const RESULT_POLL_INTERVAL: Duration = Duration::from_millis(250);
 const DEFAULT_RESULT_TIMEOUT_MS: u64 = 30_000;
+#[allow(dead_code)] // Legacy agent_wait clamp; new agent_eval uses DEFAULT/MAX.
 const MIN_WAIT_TIMEOUT_MS: u64 = 10_000;
 const MAX_RESULT_TIMEOUT_MS: u64 = 3_600_000;
 const COMPLETED_AGENT_RETENTION: Duration = Duration::from_secs(60 * 60);
@@ -407,7 +414,10 @@ pub enum SubAgentStatus {
 /// Snapshot of sub-agent state for tool results.
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct SubAgentResult {
+    pub name: String,
     pub agent_id: String,
+    pub context_mode: String,
+    pub fork_context: bool,
     pub agent_type: SubAgentType,
     pub assignment: SubAgentAssignment,
     #[serde(default)]
@@ -432,6 +442,7 @@ fn is_false(b: &bool) -> bool {
 
 #[derive(Debug, Clone, Default)]
 pub(crate) struct SubAgentSpawnOptions {
+    pub name: Option<String>,
     pub model: Option<String>,
     pub nickname: Option<String>,
     pub fork_context: bool,
@@ -452,6 +463,7 @@ impl WaitMode {
         }
     }
 
+    #[allow(dead_code)] // Legacy wait metadata while registry moves to agent_eval.
     fn as_str(self) -> &'static str {
         match self {
             Self::Any => "any",
@@ -479,6 +491,7 @@ struct SubAgentInput {
 
 #[derive(Debug, Clone)]
 struct SpawnRequest {
+    session_name: Option<String>,
     prompt: String,
     agent_type: SubAgentType,
     assignment: SubAgentAssignment,
@@ -497,6 +510,9 @@ struct SpawnRequest {
     /// When true, seed the child with the parent's system prompt and message
     /// prefix before appending the child task.
     fork_context: bool,
+    /// Optional recursion budget for descendants opened by this child.
+    /// `0` means the child may not call `agent_open` recursively.
+    max_depth: Option<u32>,
 }
 
 #[derive(Debug, Clone)]
@@ -511,6 +527,10 @@ struct AssignRequest {
 #[derive(Debug, Clone, Serialize, Deserialize)]
 struct PersistedSubAgent {
     id: String,
+    #[serde(default, skip_serializing_if = "Option::is_none")]
+    session_name: Option<String>,
+    #[serde(default)]
+    fork_context: bool,
     agent_type: SubAgentType,
     prompt: String,
     assignment: SubAgentAssignment,
@@ -789,6 +809,8 @@ impl SubAgentRuntime {
 /// A running sub-agent instance.
 pub struct SubAgent {
     pub id: String,
+    pub session_name: String,
+    pub fork_context: bool,
     pub agent_type: SubAgentType,
     pub prompt: String,
     pub assignment: SubAgentAssignment,
@@ -824,9 +846,12 @@ impl SubAgent {
         session_boot_id: String,
     ) -> Self {
         let id = format!("agent_{}", &Uuid::new_v4().to_string()[..8]);
+        let session_name = id.clone();
 
         Self {
             id,
+            session_name,
+            fork_context: false,
             agent_type,
             prompt,
             assignment,
@@ -847,7 +872,10 @@ impl SubAgent {
     #[must_use]
     pub fn snapshot(&self) -> SubAgentResult {
         SubAgentResult {
+            name: self.session_name.clone(),
             agent_id: self.id.clone(),
+            context_mode: if self.fork_context { "forked" } else { "fresh" }.to_string(),
+            fork_context: self.fork_context,
             agent_type: self.agent_type.clone(),
             assignment: self.assignment.clone(),
             model: self.model.clone(),
@@ -928,6 +956,8 @@ impl SubAgentManager {
         for agent in self.agents.values() {
             agents.push(PersistedSubAgent {
                 id: agent.id.clone(),
+                session_name: Some(agent.session_name.clone()),
+                fork_context: agent.fork_context,
                 agent_type: agent.agent_type.clone(),
                 prompt: agent.prompt.clone(),
                 assignment: agent.assignment.clone(),
@@ -998,6 +1028,11 @@ impl SubAgentManager {
             };
             let agent = SubAgent {
                 id: persisted.id.clone(),
+                session_name: persisted
+                    .session_name
+                    .filter(|name| !name.trim().is_empty())
+                    .unwrap_or_else(|| persisted.id.clone()),
+                fork_context: persisted.fork_context,
                 agent_type: persisted.agent_type,
                 prompt: persisted.prompt,
                 assignment: persisted.assignment,
@@ -1126,6 +1161,22 @@ impl SubAgentManager {
             input_tx,
             self.current_session_boot_id.clone(),
         );
+        // An explicit session name must be unique across both existing session
+        // names and existing agent ids: `resolve_agent_ref` matches ids before
+        // names, so a name equal to another agent's id would silently address
+        // that other agent. Blank names fall through and keep the default.
+        let requested_name = options.name.as_deref().map(str::trim);
+        if let Some(name) = requested_name.filter(|name| !name.is_empty()) {
+            if self
+                .agents
+                .values()
+                .any(|existing| existing.session_name == name || existing.id == name)
+            {
+                return Err(anyhow!("Sub-agent session name '{name}' is already in use"));
+            }
+            agent.session_name = name.to_string();
+        }
+        agent.fork_context = options.fork_context;
         let agent_id = agent.id.clone();
         let started_at = agent.started_at;
         let max_steps = self.max_steps;
@@ -1175,6 +1226,29 @@ impl SubAgentManager {
         Ok(agent.snapshot())
     }
 
+    /// Resolve either a durable agent id or a model-facing session name.
+    fn resolve_agent_ref(&self, agent_ref: &str) -> Result<String> {
+        let agent_ref = agent_ref.trim();
+        if self.agents.contains_key(agent_ref) {
+            return Ok(agent_ref.to_string());
+        }
+
+        let matches = self
+            .agents
+            .values()
+            .filter(|agent| agent.session_name == agent_ref)
+            .map(|agent| agent.id.clone())
+            .collect::<Vec<_>>();
+
+        match matches.as_slice() {
+            [id] => Ok(id.clone()),
+            [] => Err(anyhow!("Agent session {agent_ref} not found")),
+            _ => Err(anyhow!(
+                "Agent session name '{agent_ref}' is ambiguous; use an agent_id"
+            )),
+        }
+    }
+
     /// Cancel a running sub-agent.
     pub fn cancel(&mut self, agent_id: &str) -> Result<SubAgentResult> {
         let (snapshot, changed) = {
@@ -1202,6 +1276,7 @@ impl SubAgentManager {
     }
 
     /// Resume a non-running sub-agent by restarting it with the original assignment.
+    #[allow(dead_code)] // Legacy agent_resume path; retained until registry migration.
     pub fn resume(
         &mut self,
         manager_handle: SharedSubAgentManager,
@@ -1505,6 +1580,86 @@ impl SubAgentManager {
 /// Thread-safe wrapper for `SubAgentManager`.
 pub type SharedSubAgentManager = Arc<RwLock<SubAgentManager>>;
 
+/// Model-facing session projection returned by the v0.8.33 sub-agent API.
+#[derive(Debug, Clone, Serialize, Deserialize)]
+pub struct SubAgentSessionProjection {
+    pub name: String,
+    pub agent_id: String,
+    pub status: String,
+    pub terminal: bool,
+    pub context_mode: String,
+    pub fork_context: bool,
+    pub prefix_cache: SubAgentPrefixCacheProjection,
+    pub transcript_handle: VarHandle,
+    pub snapshot: SubAgentResult,
+    #[serde(default, skip_serializing_if = "is_false")]
+    pub timed_out: bool,
+}
+
+#[derive(Debug, Clone, Serialize, Deserialize)]
+pub struct SubAgentPrefixCacheProjection {
+    pub mode: String,
+    pub parent_prefix: String,
+    pub deepseek_prefix_cache_reuse: String,
+}
+
+fn subagent_prefix_cache_projection(snapshot: &SubAgentResult) -> SubAgentPrefixCacheProjection {
+    if snapshot.fork_context {
+        SubAgentPrefixCacheProjection {
+            mode: "forked".to_string(),
+            parent_prefix: "preserved_byte_identical_when_available".to_string(),
+            deepseek_prefix_cache_reuse: "optimized_for_existing_parent_prefill".to_string(),
+        }
+    } else {
+        SubAgentPrefixCacheProjection {
+            mode: "fresh".to_string(),
+            parent_prefix: "not_inherited".to_string(),
+            deepseek_prefix_cache_reuse: "independent_child_prefill".to_string(),
+        }
+    }
+}
+
+async fn subagent_session_projection(
+    snapshot: SubAgentResult,
+    timed_out: bool,
+    context: &ToolContext,
+) -> SubAgentSessionProjection {
+    let transcript_payload = json!({
+        "kind": "subagent_session_snapshot",
+        "agent_id": snapshot.agent_id.clone(),
+        "name": snapshot.name.clone(),
+        "status": subagent_status_name(&snapshot.status),
+        "context_mode": snapshot.context_mode.clone(),
+        "fork_context": snapshot.fork_context,
+        "result": snapshot.result.clone(),
+        "steps_taken": snapshot.steps_taken,
+        "duration_ms": snapshot.duration_ms,
+        "assignment": snapshot.assignment.clone(),
+        "snapshot": snapshot.clone(),
+    });
+    let transcript_handle = {
+        let mut store = context.runtime.handle_store.lock().await;
+        store.insert_json(
+            format!("agent:{}", snapshot.agent_id),
+            "transcript",
+            transcript_payload,
+        )
+    };
+
+    SubAgentSessionProjection {
+        name: snapshot.name.clone(),
+        agent_id: snapshot.agent_id.clone(),
+        status: subagent_status_name(&snapshot.status).to_string(),
+        terminal: snapshot.status != SubAgentStatus::Running,
+        context_mode: snapshot.context_mode.clone(),
+        fork_context: snapshot.fork_context,
+        prefix_cache: subagent_prefix_cache_projection(&snapshot),
+        transcript_handle,
+        snapshot,
+        timed_out,
+    }
+}
+
 fn default_state_path(workspace: &Path) -> PathBuf {
     workspace
         .join(".deepseek")
@@ -1552,6 +1707,143 @@ pub fn new_shared_subagent_manager(workspace: PathBuf, max_agents: usize) -> Sha
 
 // === Tool Implementations ===
 
+/// Open a named background sub-agent session.
+#[allow(dead_code)] // Registered by the adjacent v0.8.33 registry surface update.
+pub struct AgentOpenTool {
+    manager: SharedSubAgentManager,
+    runtime: SubAgentRuntime,
+}
+
+impl AgentOpenTool {
+    #[allow(dead_code)] // Registered by the adjacent v0.8.33 registry surface update.
+    #[must_use]
+    pub fn new(manager: SharedSubAgentManager, runtime: SubAgentRuntime) -> Self {
+        Self { manager, runtime }
+    }
+}
+
+#[async_trait]
+impl ToolSpec for AgentOpenTool {
+    fn name(&self) -> &'static str {
+        "agent_open"
+    }
+
+    fn description(&self) -> &'static str {
+        concat!(
+            "Open a named child sub-agent session for focused background work. Returns the session name, status, agent_id, context_mode, prefix_cache metadata, and a handle_read-compatible transcript_handle. ",
+            "Use agent_eval to fetch or wait on the session, and agent_close to cancel/close it.\n\n",
+            "Context control is explicit: omit fork_context or set it false for a fresh child with an independent prefill; set fork_context=true for perspective fanout over the current parent context. ",
+            "Forked children preserve the parent system prompt and leading message prefix byte-identically where the runtime has that prefix, so DeepSeek can reuse its prefix cache before the child-specific task is appended.\n\n",
+            "Sub-agent results are self-reports. Re-verify claimed side effects such as file edits, commands, network writes, tests, or git operations before reporting them as facts."
+        )
+    }
+
+    fn input_schema(&self) -> Value {
+        json!({
+            "type": "object",
+            "properties": {
+                "name": {
+                    "type": "string",
+                    "description": "Stable model-facing session name. Defaults to the generated agent_id when omitted."
+                },
+                "session_name": {
+                    "type": "string",
+                    "description": "Alias for name"
+                },
+                "prompt": {
+                    "type": "string",
+                    "description": "Initial task description for the child session"
+                },
+                "message": {
+                    "type": "string",
+                    "description": "Alias for prompt"
+                },
+                "objective": {
+                    "type": "string",
+                    "description": "Alias for prompt"
+                },
+                "items": {
+                    "type": "array",
+                    "description": "Structured input items (text, mention, skill, local_image, image)",
+                    "items": { "type": "object" }
+                },
+                "type": {
+                    "type": "string",
+                    "description": "Sub-agent type: general, explore, plan, review, implementer, verifier, custom"
+                },
+                "agent_type": {
+                    "type": "string",
+                    "description": "Alias for type"
+                },
+                "role": {
+                    "type": "string",
+                    "description": "Role alias: worker, explorer, awaiter, default"
+                },
+                "agent_role": {
+                    "type": "string",
+                    "description": "Alias for role"
+                },
+                "allowed_tools": {
+                    "type": "array",
+                    "items": { "type": "string" },
+                    "description": "Explicit tool allowlist (required for custom type)"
+                },
+                "model": {
+                    "type": "string",
+                    "description": "Optional DeepSeek model id for this child"
+                },
+                "cwd": {
+                    "type": "string",
+                    "description": "Optional working directory for the child; must be inside the parent workspace"
+                },
+                "resident_file": {
+                    "type": "string",
+                    "description": "Optional file path for cache-aware resident mode"
+                },
+                "fork_context": {
+                    "type": "boolean",
+                    "description": "false (default): fresh child with independent context/prefill. true: forked child that preserves the parent's byte-identical system/message prefix where available, then appends this task for DeepSeek prefix-cache reuse."
+                },
+                "max_depth": {
+                    "type": "integer",
+                    "minimum": 0,
+                    "maximum": 3,
+                    "description": "Recursive child-agent budget for this session. 0 blocks agent_open from the child; 1-3 allow that many descendant levels."
+                }
+            }
+        })
+    }
+
+    fn capabilities(&self) -> Vec<ToolCapability> {
+        vec![
+            ToolCapability::ExecutesCode,
+            ToolCapability::RequiresApproval,
+        ]
+    }
+
+    fn approval_requirement(&self) -> ApprovalRequirement {
+        ApprovalRequirement::Required
+    }
+
+    async fn execute(&self, input: Value, context: &ToolContext) -> Result<ToolResult, ToolError> {
+        let spawn_tool = AgentSpawnTool::new(self.manager.clone(), self.runtime.clone());
+        let result = spawn_tool.execute(input, context).await?;
+        let snapshot: SubAgentResult = serde_json::from_str(&result.content).map_err(|e| {
+            ToolError::execution_failed(format!("agent_open projection failed: {e}"))
+        })?;
+        let projection = subagent_session_projection(snapshot, false, context).await;
+        let mut tool_result = ToolResult::json(&projection)
+            .map_err(|e| ToolError::execution_failed(e.to_string()))?;
+        tool_result.metadata = Some(json!({
+            "status": projection.status,
+            "terminal": projection.terminal,
+            "context_mode": projection.context_mode,
+            "prefix_cache": projection.prefix_cache,
+        }));
+        Ok(tool_result)
+    }
+}
+
 /// Tool to spawn a background sub-agent.
 pub struct AgentSpawnTool {
     manager: SharedSubAgentManager,
@@ -1725,6 +2017,9 @@ impl ToolSpec for AgentSpawnTool {
         // optionally overrides cwd if the caller passed one (used for the
         // parallel-worktree pattern).
         let mut child_runtime = self.runtime.background_runtime();
+        if let Some(max_depth) = spawn_request.max_depth {
+            child_runtime.max_spawn_depth = child_runtime.spawn_depth.saturating_add(max_depth);
+        }
         if let Some(cwd) = validated_cwd {
             child_runtime.context.workspace = cwd;
         }
@@ -1790,6 +2085,7 @@ impl ToolSpec for AgentSpawnTool {
                 spawn_request.assignment,
                 spawn_request.allowed_tools,
                 SubAgentSpawnOptions {
+                    name: spawn_request.session_name.clone(),
                     model: Some(effective_model),
                     nickname: None,
                     fork_context: spawn_request.fork_context,
@@ -1843,13 +2139,143 @@ impl ToolSpec for AgentSpawnTool {
     }
 }
 
+/// Evaluate/fetch a child session boundary for the v0.8.33 sub-agent API.
+#[allow(dead_code)] // Registered by the adjacent v0.8.33 registry surface update.
+pub struct AgentEvalTool {
+    manager: SharedSubAgentManager,
+}
+
+impl AgentEvalTool {
+    #[allow(dead_code)] // Registered by the adjacent v0.8.33 registry surface update.
+    #[must_use]
+    pub fn new(manager: SharedSubAgentManager) -> Self {
+        Self { manager }
+    }
+}
+
+#[async_trait]
+impl ToolSpec for AgentEvalTool {
+    fn name(&self) -> &'static str {
+        "agent_eval"
+    }
+
+    fn description(&self) -> &'static str {
+        "Fetch or wait on a child sub-agent session. Optionally deliver a message/items to a running session, then return the latest session projection. With block=true (default), waits for the session to reach a terminal boundary; block=false is a non-blocking status fetch."
+    }
+
+    fn input_schema(&self) -> Value {
+        json!({
+            "type": "object",
+            "properties": {
+                "name": {
+                    "type": "string",
+                    "description": "Session name returned by agent_open"
+                },
+                "agent_id": {
+                    "type": "string",
+                    "description": "Generated agent id returned by agent_open"
+                },
+                "id": {
+                    "type": "string",
+                    "description": "Alias for agent_id"
+                },
+                "message": {
+                    "type": "string",
+                    "description": "Optional message to deliver before evaluating the session"
+                },
+                "input": {
+                    "type": "string",
+                    "description": "Alias for message"
+                },
+                "items": {
+                    "type": "array",
+                    "description": "Structured input items (text, mention, skill, local_image, image)",
+                    "items": { "type": "object" }
+                },
+                "interrupt": {
+                    "type": "boolean",
+                    "description": "When sending input, prioritize it over pending inputs"
+                },
+                "block": {
+                    "type": "boolean",
+                    "description": "Wait for a terminal boundary before returning (default true)"
+                },
+                "timeout_ms": {
+                    "type": "integer",
+                    "description": "Max wait time in milliseconds (default: 30000, clamped to 1000-3600000)"
+                }
+            }
+        })
+    }
+
+    fn capabilities(&self) -> Vec<ToolCapability> {
+        vec![ToolCapability::ReadOnly]
+    }
+
+    async fn execute(&self, input: Value, context: &ToolContext) -> Result<ToolResult, ToolError> {
+        let agent_ref = input
+            .get("name")
+            .or_else(|| input.get("agent_id"))
+            .or_else(|| input.get("id"))
+            .and_then(Value::as_str)
+            .map(str::trim)
+            .filter(|value| !value.is_empty())
+            .ok_or_else(|| ToolError::missing_field("name"))?;
+        let message = parse_optional_text_or_items(&input, &["message", "input"], "items")?;
+        let interrupt = optional_bool(&input, "interrupt", false);
+        let block = optional_bool(&input, "block", true);
+        let timeout_ms = optional_u64(&input, "timeout_ms", DEFAULT_RESULT_TIMEOUT_MS)
+            .clamp(1000, MAX_RESULT_TIMEOUT_MS);
+
+        let agent_id = {
+            let manager = self.manager.read().await;
+            manager
+                .resolve_agent_ref(agent_ref)
+                .map_err(|e| ToolError::execution_failed(e.to_string()))?
+        };
+
+        if let Some(message) = message {
+            let mut manager = self.manager.write().await;
+            manager
+                .send_input(&agent_id, message, interrupt)
+                .map_err(|e| ToolError::execution_failed(e.to_string()))?;
+        }
+
+        let (snapshot, timed_out) = if block {
+            wait_for_result(&self.manager, &agent_id, Duration::from_millis(timeout_ms)).await?
+        } else {
+            let manager = self.manager.read().await;
+            (
+                manager
+                    .get_result(&agent_id)
+                    .map_err(|e| ToolError::execution_failed(e.to_string()))?,
+                false,
+            )
+        };
+
+        let projection = subagent_session_projection(snapshot, timed_out, context).await;
+        let mut result = ToolResult::json(&projection)
+            .map_err(|e| ToolError::execution_failed(e.to_string()))?;
+        result.metadata = Some(json!({
+            "status": if timed_out { "TimedOut".to_string() } else { projection.status.clone() },
+            "timed_out": timed_out,
+            "terminal": projection.terminal,
+            "context_mode": projection.context_mode,
+            "timeout_ms": timeout_ms
+        }));
+        Ok(result)
+    }
+}
+
 /// Tool to fetch a sub-agent's result.
+#[allow(dead_code)] // Legacy surface superseded by agent_eval.
 pub struct AgentResultTool {
     manager: SharedSubAgentManager,
 }
 
 impl AgentResultTool {
     /// Create a new result tool.
+    #[allow(dead_code)] // Legacy surface superseded by agent_eval.
     #[must_use]
     pub fn new(manager: SharedSubAgentManager) -> Self {
         Self { manager }
@@ -1933,12 +2359,14 @@ impl ToolSpec for AgentResultTool {
 }
 
 /// Tool to cancel a sub-agent.
+#[allow(dead_code)] // Legacy surface superseded by agent_close.
 pub struct AgentCancelTool {
     manager: SharedSubAgentManager,
 }
 
 impl AgentCancelTool {
     /// Create a new cancel tool.
+    #[allow(dead_code)] // Legacy surface superseded by agent_close.
     #[must_use]
     pub fn new(manager: SharedSubAgentManager) -> Self {
         Self { manager }
@@ -1991,6 +2419,7 @@ impl ToolSpec for AgentCancelTool {
 }
 
 /// Tool to list all sub-agents.
+#[allow(dead_code)] // Legacy surface superseded by named agent_open/eval/close sessions.
 pub struct AgentListTool {
     manager: SharedSubAgentManager,
 }
@@ -2011,11 +2440,11 @@ impl AgentCloseTool {
 #[async_trait]
 impl ToolSpec for AgentCloseTool {
     fn name(&self) -> &'static str {
-        "close_agent"
+        "agent_close"
     }
 
     fn description(&self) -> &'static str {
-        "Close a running sub-agent. Alias for agent_cancel."
+        "Close a child sub-agent session by cancelling it if still running. Returns the final session projection with transcript_handle metadata."
     }
 
     fn input_schema(&self) -> Value {
@@ -2024,7 +2453,11 @@ impl ToolSpec for AgentCloseTool {
             "properties": {
                 "id": {
                     "type": "string",
-                    "description": "Agent id returned by agent_spawn"
+                    "description": "Agent id returned by agent_open"
+                },
+                "name": {
+                    "type": "string",
+                    "description": "Session name returned by agent_open"
                 },
                 "agent_id": {
                     "type": "string",
@@ -2045,27 +2478,30 @@ impl ToolSpec for AgentCloseTool {
         ApprovalRequirement::Required
     }
 
-    async fn execute(&self, input: Value, _context: &ToolContext) -> Result<ToolResult, ToolError> {
+    async fn execute(&self, input: Value, context: &ToolContext) -> Result<ToolResult, ToolError> {
         let agent_id = input
-            .get("id")
+            .get("name")
+            .or_else(|| input.get("id"))
             .or_else(|| input.get("agent_id"))
             .and_then(|v| v.as_str())
             .ok_or_else(|| ToolError::missing_field("id"))?;
+        let agent_id = {
+            let manager = self.manager.read().await;
+            manager
+                .resolve_agent_ref(agent_id)
+                .map_err(|e| ToolError::execution_failed(e.to_string()))?
+        };
         let mut manager = self.manager.write().await;
         let result = manager
-            .cancel(agent_id)
+            .cancel(&agent_id)
             .map_err(|e| ToolError::execution_failed(format!("Failed to close sub-agent: {e}")))?;
-        let tool_result =
-            ToolResult::json(&result).map_err(|e| ToolError::execution_failed(e.to_string()))?;
-        Ok(wrap_with_deprecation_notice(
-            tool_result,
-            "close_agent",
-            "agent_cancel",
-        ))
+        let projection = subagent_session_projection(result, false, context).await;
+        ToolResult::json(&projection).map_err(|e| ToolError::execution_failed(e.to_string()))
     }
 }
 
 /// Tool to resume an existing sub-agent.
+#[allow(dead_code)] // Legacy surface superseded by agent_open/eval.
 pub struct AgentResumeTool {
     manager: SharedSubAgentManager,
     runtime: SubAgentRuntime,
@@ -2073,6 +2509,7 @@ pub struct AgentResumeTool {
 
 impl AgentResumeTool {
     /// Create a new resume tool.
+    #[allow(dead_code)] // Legacy surface superseded by agent_open/eval.
     #[must_use]
     pub fn new(manager: SharedSubAgentManager, runtime: SubAgentRuntime) -> Self {
         Self { manager, runtime }
@@ -2132,6 +2569,7 @@ impl ToolSpec for AgentResumeTool {
 
 impl AgentListTool {
     /// Create a new list tool.
+    #[allow(dead_code)] // Legacy surface superseded by named agent_open/eval/close sessions.
     #[must_use]
     pub fn new(manager: SharedSubAgentManager) -> Self {
         Self { manager }
@@ -2181,6 +2619,7 @@ impl ToolSpec for AgentListTool {
 }
 
 /// Tool to send input to a running sub-agent.
+#[allow(dead_code)] // Legacy surface superseded by agent_eval.
 pub struct AgentSendInputTool {
     manager: SharedSubAgentManager,
     name: &'static str,
@@ -2188,6 +2627,7 @@ pub struct AgentSendInputTool {
 
 impl AgentSendInputTool {
     /// Create a new send-input tool.
+    #[allow(dead_code)] // Legacy surface superseded by agent_eval.
     #[must_use]
     pub fn new(manager: SharedSubAgentManager, name: &'static str) -> Self {
         Self { manager, name }
@@ -2277,6 +2717,7 @@ impl ToolSpec for AgentSendInputTool {
 }
 
 /// Tool to update assignment metadata for a sub-agent.
+#[allow(dead_code)] // Legacy surface superseded by agent_eval/open metadata.
 pub struct AgentAssignTool {
     manager: SharedSubAgentManager,
     name: &'static str,
@@ -2284,6 +2725,7 @@ pub struct AgentAssignTool {
 
 impl AgentAssignTool {
     /// Create a new assignment tool.
+    #[allow(dead_code)] // Legacy surface superseded by agent_eval/open metadata.
     #[must_use]
     pub fn new(manager: SharedSubAgentManager, name: &'static str) -> Self {
         Self { manager, name }
@@ -2371,6 +2813,7 @@ impl ToolSpec for AgentAssignTool {
 }
 
 /// Tool to wait for sub-agents to complete.
+#[allow(dead_code)] // Legacy surface superseded by agent_eval.
 pub struct AgentWaitTool {
     manager: SharedSubAgentManager,
     name: &'static str,
@@ -2378,6 +2821,7 @@ pub struct AgentWaitTool {
 
 impl AgentWaitTool {
     /// Create a new wait tool.
+    #[allow(dead_code)] // Legacy surface superseded by agent_eval.
     #[must_use]
     pub fn new(manager: SharedSubAgentManager, name: &'static str) -> Self {
         Self { manager, name }
@@ -2517,6 +2961,7 @@ impl ToolSpec for AgentWaitTool {
 
 /// Compatibility delegate tool. It routes through `agent_spawn`, but defaults
 /// to `fork_context=true` because delegation is usually continuation work.
+#[allow(dead_code)] // Legacy alias superseded by agent_open(fork_context=true).
 pub struct DelegateToAgentTool {
     manager: SharedSubAgentManager,
     runtime: SubAgentRuntime,
@@ -2524,6 +2969,7 @@ pub struct DelegateToAgentTool {
 
 impl DelegateToAgentTool {
     /// Create a new delegation tool.
+    #[allow(dead_code)] // Legacy alias superseded by agent_open(fork_context=true).
     #[must_use]
     pub fn new(manager: SharedSubAgentManager, runtime: SubAgentRuntime) -> Self {
         Self { manager, runtime }
@@ -2855,7 +3301,8 @@ async fn run_subagent(
     mut input_rx: mpsc::UnboundedReceiver<SubAgentInput>,
 ) -> Result<SubAgentResult> {
     let system_prompt = build_subagent_system_prompt(&agent_type, &assignment);
-    let fork_context = fork_context
+    let fork_context_enabled = fork_context;
+    let fork_context = fork_context_enabled
         .then_some(runtime.fork_context.as_ref())
         .flatten();
     let request_system = subagent_request_system_prompt(&system_prompt, fork_context);
@@ -2911,7 +3358,15 @@ async fn run_subagent(
                 });
             }
             return Ok(SubAgentResult {
+                name: agent_id.clone(),
                 agent_id: agent_id.clone(),
+                context_mode: if fork_context_enabled {
+                    "forked"
+                } else {
+                    "fresh"
+                }
+                .to_string(),
+                fork_context: fork_context_enabled,
                 agent_type: agent_type.clone(),
                 assignment: assignment.clone(),
                 model: runtime.model.clone(),
@@ -2984,7 +3439,10 @@ async fn run_subagent(
                     });
                 }
                 return Ok(SubAgentResult {
+                    name: agent_id.clone(),
                     agent_id: agent_id.clone(),
+                    context_mode: if fork_context_enabled { "forked" } else { "fresh" }.to_string(),
+                    fork_context: fork_context_enabled,
                     agent_type: agent_type.clone(),
                     assignment: assignment.clone(),
                     model: runtime.model.clone(),
@@ -3121,7 +3579,15 @@ async fn run_subagent(
     release_resident_leases_for(&agent_id);
 
     Ok(SubAgentResult {
+        name: agent_id.clone(),
         agent_id,
+        context_mode: if fork_context_enabled {
+            "forked"
+        } else {
+            "fresh"
+        }
+        .to_string(),
+        fork_context: fork_context_enabled,
         agent_type,
         assignment,
         model: runtime.model.clone(),
@@ -3160,6 +3626,7 @@ async fn wait_for_result(
     }
 }
 
+#[allow(dead_code)] // Legacy agent_wait helper; agent_eval uses wait_for_result.
 async fn wait_for_agents(
     manager: &SharedSubAgentManager,
     ids: &[String],
@@ -3369,6 +3836,9 @@ fn parse_spawn_request(input: &Value) -> Result<SpawnRequest, ToolError> {
         "items",
         "prompt",
     )?;
+    let session_name = optional_input_str(input, &["name", "session_name"])
+        .map(validate_session_name)
+        .transpose()?;
 
     let type_input = optional_input_str(input, &["type", "agent_type", "agent_name"]);
     let role_input = optional_input_str(input, &["role", "agent_role"]);
@@ -3444,8 +3914,28 @@ fn parse_spawn_request(input: &Value) -> Result<SpawnRequest, ToolError> {
     let fork_context =
         parse_optional_bool(input, &["fork_context", "forkContext", "inherit_context"])
             .unwrap_or(false);
+    let max_depth = input
+        .get("max_depth")
+        .or_else(|| input.get("maxDepth"))
+        .or_else(|| input.get("max_spawn_depth"))
+        .and_then(Value::as_u64)
+        .map(|depth| {
+            u32::try_from(depth)
+                .map_err(|_| ToolError::invalid_input("max_depth must be between 0 and 3"))
+                .and_then(|depth| {
+                    if depth <= 3 {
+                        Ok(depth)
+                    } else {
+                        Err(ToolError::invalid_input(
+                            "max_depth must be between 0 and 3",
+                        ))
+                    }
+                })
+        })
+        .transpose()?;
 
     Ok(SpawnRequest {
+        session_name,
         prompt: prompt.clone(),
         agent_type,
         assignment: SubAgentAssignment::new(prompt, role),
@@ -3454,9 +3944,31 @@ fn parse_spawn_request(input: &Value) -> Result<SpawnRequest, ToolError> {
         cwd,
         resident_file,
         fork_context,
+        max_depth,
     })
 }
 
+/// Trim and validate a session name: non-blank ASCII letters, digits, '-', '_', or '.'.
+fn validate_session_name(name: &str) -> Result<String, ToolError> {
+    let candidate = name.trim();
+    if candidate.is_empty() {
+        return Err(ToolError::invalid_input("name cannot be blank"));
+    }
+    // Interior whitespace is checked first so it gets its own, more specific message.
+    if candidate.chars().any(char::is_whitespace) {
+        return Err(ToolError::invalid_input(
+            "name must not contain whitespace; use letters, numbers, '-', '_', or '.'",
+        ));
+    }
+    let allowed = |ch: char| ch.is_ascii_alphanumeric() || matches!(ch, '-' | '_' | '.');
+    if !candidate.chars().all(allowed) {
+        return Err(ToolError::invalid_input(
+            "name may only contain ASCII letters, numbers, '-', '_', or '.'",
+        ));
+    }
+    Ok(candidate.to_string())
+}
+
 fn parse_optional_bool(input: &Value, names: &[&str]) -> Option<bool> {
     names
         .iter()
@@ -3983,9 +4495,10 @@ const GENERAL_AGENT_INTRO: &str = concat!(
 );
 
 const EXPLORE_AGENT_INTRO: &str = concat!(
-    "You are an exploration sub-agent. Map the relevant code quickly and stay read-only.\n",
-    "Use list_dir/file_search, grep_files, and read_file; stop once evidence is sufficient.\n",
-    "EVIDENCE is load-bearing: cite `path:line-range` for each finding.\n",
+    "You are an exploration sub-agent (role: `explore`). Map the relevant code quickly and stay read-only.\n",
+    "Orient first: confirm the workspace/project root, read relevant AGENTS.md/README guidance when the tree is unfamiliar, then search only the likely scope.\n",
+    "Use list_dir/file_search, grep_files, and read_file; use RLM only for long inputs or many semantic slices, not basic path discovery.\n",
+    "DeepSeek V4 can hold broad evidence, but your value is compressed reconnaissance: cite `path:line-range` for each finding and stop once evidence is sufficient.\n",
     "CHANGES will almost always be \"None.\" for an explorer.\n\n"
 );
 
diff --git a/crates/tui/src/tools/subagent/tests.rs b/crates/tui/src/tools/subagent/tests.rs
index 97ae5f8c..164ba00f 100644
--- a/crates/tui/src/tools/subagent/tests.rs
+++ b/crates/tui/src/tools/subagent/tests.rs
@@ -7,7 +7,10 @@ fn make_assignment() -> SubAgentAssignment {
 
 fn make_snapshot(status: SubAgentStatus) -> SubAgentResult {
     SubAgentResult {
+        name: "agent_test".to_string(),
         agent_id: "agent_test".to_string(),
+        context_mode: "fresh".to_string(),
+        fork_context: false,
         agent_type: SubAgentType::General,
         assignment: make_assignment(),
         model: "deepseek-v4-flash".to_string(),
@@ -176,36 +179,43 @@ fn test_agent_type_prompts_include_shared_output_contract_once() {
 }
 
 #[test]
-fn agent_spawn_description_warns_parent_to_verify_self_reports_within_budget() {
+fn explore_prompt_orients_before_searching() {
+    let prompt = SubAgentType::Explore.system_prompt();
+    assert!(prompt.contains("role: `explore`"));
+    assert!(prompt.contains("AGENTS.md/README"));
+    assert!(prompt.contains("workspace/project root"));
+    assert!(prompt.contains("compressed reconnaissance"));
+}
+
+#[test]
+fn agent_open_description_explains_fresh_vs_forked_context_and_trust_model() {
     let tmp = tempdir().expect("tempdir");
     let manager = new_shared_subagent_manager(tmp.path().to_path_buf(), 1);
-    let tool = AgentSpawnTool::new(manager, stub_runtime());
+    let tool = AgentOpenTool::new(manager, stub_runtime());
     let description = tool.description();
 
-    assert!(
-        description
-            .contains("## Trust model: subagent results are self-reports, not verified facts")
-    );
-    assert!(description.contains("`agent_result` returns the child's narrative summary"));
-    assert!(description.contains("| Side effect | Re-verify with |"));
-    assert!(description.contains("If the child returns a verifiable handle"));
-    for row in [
-        "| URL claimed posted/written | `fetch_url` and check the response |",
-        "| File claimed created | `read_file` or `list_dir` |",
-        "| File claimed edited | `read_file` and check the change is present |",
-        "| HTTP POST/PUT response | inspect status code and body |",
-        "| Git operation | `git_status` / `git_diff` |",
-        "| Test claimed passing | `run_tests` |",
-        "| Process claimed started | `exec_shell` (e.g. `pgrep`, `lsof -i`) |",
-    ] {
-        assert!(description.contains(row));
-    }
+    assert!(description.contains("fresh child with an independent prefill"));
+    assert!(description.contains("fork_context=true"));
+    assert!(description.contains("byte-identically"));
+    assert!(description.contains("DeepSeek can reuse its prefix cache"));
+    assert!(description.contains("Sub-agent results are self-reports"));
     assert!(
         estimate_tool_description_tokens_conservative(description) <= 1024,
-        "agent_spawn description exceeds the conservative 1024-token budget"
+        "agent_open description exceeds the conservative 1024-token budget"
     );
 }
 
+#[test]
+fn new_session_tools_use_open_eval_close_names() {
+    // Pin the exact names the three session tools report: agent_open,
+    // agent_eval and agent_close.
+    let manager = Arc::new(RwLock::new(SubAgentManager::new(PathBuf::from("."), 1)));
+    let open_tool = AgentOpenTool::new(manager.clone(), stub_runtime());
+    assert_eq!(open_tool.name(), "agent_open");
+    assert_eq!(AgentEvalTool::new(manager.clone()).name(), "agent_eval");
+    assert_eq!(AgentCloseTool::new(manager).name(), "agent_close");
+}
+
 #[test]
 fn test_implementer_allowed_tools_include_writes() {
     // Implementer is the write-heavy role; the deprecated
@@ -288,6 +298,66 @@ fn test_parse_spawn_request_accepts_fork_context() {
     assert!(parsed.fork_context);
 }
 
+#[test]
+fn test_parse_spawn_request_accepts_session_name_for_agent_open() {
+    let input = json!({
+        "name": "review.parser",
+        "prompt": "inspect parser",
+        "fork_context": true,
+        "max_depth": 0
+    });
+    let parsed = parse_spawn_request(&input).expect("open request should parse");
+    assert_eq!(parsed.session_name.as_deref(), Some("review.parser"));
+    assert!(parsed.fork_context);
+    assert_eq!(parsed.max_depth, Some(0));
+}
+
+#[test]
+fn test_parse_spawn_request_rejects_invalid_session_name() {
+    let input = json!({
+        "name": "bad name",
+        "prompt": "inspect parser"
+    });
+    let err = parse_spawn_request(&input).expect_err("space in name should fail");
+    assert!(err.to_string().contains("name must not contain whitespace"));
+}
+
+#[test]
+fn test_parse_spawn_request_rejects_out_of_range_max_depth() {
+    let input = json!({
+        "name": "review.parser",
+        "prompt": "inspect parser",
+        "max_depth": 4
+    });
+    let err = parse_spawn_request(&input).expect_err("max_depth should be capped at schema range");
+    assert!(
+        err.to_string()
+            .contains("max_depth must be between 0 and 3")
+    );
+}
+
+#[tokio::test]
+async fn session_projection_exposes_forked_prefix_cache_contract() {
+    let mut snapshot = make_snapshot(SubAgentStatus::Running);
+    snapshot.name = "fanout_review".to_string();
+    snapshot.context_mode = "forked".to_string();
+    snapshot.fork_context = true;
+
+    let ctx = ToolContext::new(".");
+    let projection = subagent_session_projection(snapshot, false, &ctx).await;
+
+    assert_eq!(projection.name, "fanout_review");
+    assert_eq!(projection.context_mode, "forked");
+    assert!(projection.fork_context);
+    assert_eq!(projection.prefix_cache.mode, "forked");
+    assert_eq!(
+        projection.prefix_cache.parent_prefix,
+        "preserved_byte_identical_when_available"
+    );
+    assert_eq!(projection.transcript_handle.kind, "var_handle");
+    assert_eq!(projection.transcript_handle.name, "transcript");
+}
+
 #[test]
 fn test_delegate_defaults_to_fork_context() {
     let input = with_default_fork_context(json!({ "prompt": "review current work" }), true);
@@ -427,23 +497,6 @@ fn test_parse_assign_request_requires_update_fields() {
     );
 }
 
-#[test]
-fn test_send_input_schema_does_not_require_message_field() {
-    let manager = Arc::new(RwLock::new(SubAgentManager::new(PathBuf::from("."), 1)));
-    let schema = AgentSendInputTool::new(manager, "send_input").input_schema();
-    let required = schema
-        .get("required")
-        .and_then(Value::as_array)
-        .cloned()
-        .unwrap_or_default();
-    assert!(
-        !required
-            .iter()
-            .any(|entry| entry.as_str().is_some_and(|name| name == "message")),
-        "send_input schema should allow items-only payloads"
-    );
-}
-
 #[test]
 fn test_build_allowed_tools_independent_of_allow_shell() {
     // v0.6.6: allow_shell no longer filters at the build_allowed_tools
@@ -880,83 +933,6 @@ fn test_interrupted_status_name_and_summary() {
     assert!(summarize_subagent_result(&snapshot).contains(SUBAGENT_RESTART_REASON));
 }
 
-// === Deprecation notice tests ===
-
-/// Helper: build a plain ToolResult with a JSON payload.
-fn make_plain_result(payload: serde_json::Value) -> crate::tools::spec::ToolResult {
-    crate::tools::spec::ToolResult::json(&payload).expect("json result")
-}
-
-#[test]
-fn test_wrap_with_deprecation_notice_adds_deprecation_block() {
-    let result = make_plain_result(json!({"agent_id": "abc"}));
-    let wrapped = wrap_with_deprecation_notice(result, "spawn_agent", "agent_spawn");
-
-    let meta = wrapped.metadata.expect("metadata should be present");
-    let dep = &meta["_deprecation"];
-    assert_eq!(dep["this_tool"], "spawn_agent");
-    assert_eq!(dep["use_instead"], "agent_spawn");
-    assert_eq!(dep["removed_in"], DEPRECATION_REMOVAL_VERSION);
-    assert!(
-        dep["message"]
-            .as_str()
-            .unwrap_or("")
-            .contains("spawn_agent")
-    );
-}
-
-#[test]
-fn test_wrap_with_deprecation_notice_preserves_existing_metadata() {
-    let result = make_plain_result(json!({"agent_id": "abc"}))
-        .with_metadata(json!({"status": "Running", "snapshot": {}}));
-    let wrapped = wrap_with_deprecation_notice(result, "close_agent", "agent_cancel");
-
-    let meta = wrapped.metadata.expect("metadata should be present");
-    // Existing metadata key must survive.
-    assert_eq!(meta["status"], "Running");
-    // Deprecation block must be present alongside.
-    assert_eq!(meta["_deprecation"]["this_tool"], "close_agent");
-    assert_eq!(meta["_deprecation"]["use_instead"], "agent_cancel");
-}
-
-#[test]
-fn test_canonical_agent_send_input_has_no_deprecation() {
-    let manager = Arc::new(RwLock::new(SubAgentManager::new(PathBuf::from("."), 1)));
-    // The canonical name "agent_send_input" must NOT receive a deprecation notice.
-    // We verify this by inspecting the tool's name — the deprecation branch
-    // only fires when name == "send_input".
-    let tool = AgentSendInputTool::new(manager.clone(), "agent_send_input");
-    assert_eq!(tool.name(), "agent_send_input");
-
-    let alias = AgentSendInputTool::new(manager, "send_input");
-    assert_eq!(alias.name(), "send_input");
-}
-
-#[test]
-fn test_wrap_with_deprecation_notice_all_alias_mappings() {
-    let cases = [
-        ("spawn_agent", "agent_spawn"),
-        ("delegate_to_agent", "agent_spawn"),
-        ("close_agent", "agent_cancel"),
-        ("send_input", "agent_send_input"),
-    ];
-
-    for (alias, canonical) in cases {
-        let result = make_plain_result(json!({"ok": true}));
-        let wrapped = wrap_with_deprecation_notice(result, alias, canonical);
-        let meta = wrapped.metadata.expect("metadata for alias {alias}");
-        assert_eq!(meta["_deprecation"]["this_tool"], alias, "alias={alias}");
-        assert_eq!(
-            meta["_deprecation"]["use_instead"], canonical,
-            "alias={alias}"
-        );
-        assert_eq!(
-            meta["_deprecation"]["removed_in"], DEPRECATION_REMOVAL_VERSION,
-            "alias={alias}"
-        );
-    }
-}
-
 // === v0.6.6 — sub-agent authority unification ===
 
 #[test]
diff --git a/crates/tui/src/tui/app.rs b/crates/tui/src/tui/app.rs
index 880eba2c..a719fda7 100644
--- a/crates/tui/src/tui/app.rs
+++ b/crates/tui/src/tui/app.rs
@@ -203,8 +203,7 @@ impl ReasoningEffort {
 #[derive(Debug, Clone, Copy, PartialEq, Eq)]
 pub enum SidebarFocus {
     Auto,
-    Plan,
-    Todos,
+    Work,
     Tasks,
     Agents,
     Context,
@@ -250,8 +249,7 @@ impl SidebarFocus {
     #[must_use]
     pub fn from_setting(value: &str) -> Self {
         match value.trim().to_ascii_lowercase().as_str() {
-            "plan" => Self::Plan,
-            "todos" => Self::Todos,
+            "work" | "plan" | "todos" => Self::Work,
             "tasks" => Self::Tasks,
             "agents" | "subagents" | "sub-agents" => Self::Agents,
             "context" | "session" => Self::Context,
@@ -264,8 +262,7 @@ impl SidebarFocus {
     pub fn as_setting(self) -> &'static str {
         match self {
             Self::Auto => "auto",
-            Self::Plan => "plan",
-            Self::Todos => "todos",
+            Self::Work => "work",
             Self::Tasks => "tasks",
             Self::Agents => "agents",
             Self::Context => "context",
@@ -4002,19 +3999,6 @@ pub enum AppAction {
     },
     /// Send a message to the AI (normal chat mode).
     SendMessage(String),
-    /// Run a Recursive Language Model (RLM) turn — Algorithm 1 from
-    /// Zhang et al. (arXiv:2512.24601). The prompt is stored in the REPL;
-    /// the root LLM only sees metadata.
-    Rlm {
-        /// The user's prompt — stored in REPL, NOT in LLM context.
-        prompt: String,
-        /// Model for the root LLM.
-        model: String,
-        /// Model for sub-LLM (llm_query) calls.
-        child_model: String,
-        /// Recursion budget for `sub_rlm()` calls.
-        max_depth: u32,
-    },
     ListSubAgents,
     FetchModels,
     CacheWarmup,
@@ -4140,6 +4124,18 @@ mod tests {
         assert!(app.trust_mode);
     }
 
+    #[test]
+    fn sidebar_focus_accepts_work_and_maps_legacy_trackers_to_work() {
+        for alias in ["work", "plan", "todos"] {
+            assert_eq!(SidebarFocus::from_setting(alias), SidebarFocus::Work, "{alias}");
+        }
+        assert_eq!(SidebarFocus::from_setting("auto"), SidebarFocus::Auto);
+        assert_eq!(SidebarFocus::from_setting("tasks"), SidebarFocus::Tasks);
+        assert_eq!(SidebarFocus::from_setting("agents"), SidebarFocus::Agents);
+        assert_eq!(SidebarFocus::from_setting("context"), SidebarFocus::Context);
+        assert_eq!(SidebarFocus::Work.as_setting(), "work");
+    }
+
     #[test]
     fn composer_strips_raw_sgr_mouse_report_when_mouse_capture_is_enabled() {
         let mut app = App::new(test_options(false), &Config::default());
diff --git a/crates/tui/src/tui/history.rs b/crates/tui/src/tui/history.rs
index 6f06f5cd..871480b8 100644
--- a/crates/tui/src/tui/history.rs
+++ b/crates/tui/src/tui/history.rs
@@ -309,7 +309,7 @@ impl HistoryCell {
     /// Render the cell in transcript mode: full content, no caps, no
     /// "Alt+V for details" affordances.
     ///
-    /// Use this for the pager (`v` / `Ctrl+O`), clipboard exports, and any
+    /// Use this for full-detail pagers, clipboard exports, and any
     /// surface that wants the complete body rather than the live summary.
     /// For most variants (User / Assistant / System) this matches `lines()`;
     /// `Thinking` and `Tool` are where the live and transcript surfaces
@@ -1247,19 +1247,21 @@ impl GenericToolCell {
             return lines;
         }
 
-        // Issue #409: `agent_spawn` already gets a dedicated `DelegateCard`
+        // Issue #409: sub-agent open already gets a dedicated `DelegateCard`
         // that owns the live action tree, status, and final summary. The
         // generic tool block for the same call duplicates that signal at
         // 3-4 lines per spawn — N parallel spawns multiply the noise. In
         // live mode, render one compact summary line and let the
         // DelegateCard be the source of truth. Transcript mode keeps the
         // full block so session replay remains complete.
-        if matches!(mode, RenderMode::Live) && self.name == "agent_spawn" {
+        if matches!(mode, RenderMode::Live)
+            && matches!(self.name.as_str(), "agent_open" | "agent_spawn")
+        {
             return self.render_agent_spawn_compact(low_motion);
         }
 
         let mut lines = Vec::new();
-        // Map the actual tool name (e.g. `agent_spawn`, `apply_patch`) to a
+        // Map the actual tool name (e.g. `agent_open`, `apply_patch`) to a
         // family rather than the catch-all `"Tool"` title — this is what
         // gives a `GenericToolCell` the right verb glyph (◐ delegate, ⋮⋮
         // fanout, etc.) instead of falling back to the neutral bullet.
@@ -1343,13 +1345,13 @@ impl GenericToolCell {
         wrap_card_rail(lines)
     }
 
-    /// Render `agent_spawn` as a single compact summary line for live
+    /// Render `agent_open`/legacy `agent_spawn` as a single compact summary line for live
     /// mode (#409). The companion `DelegateCard` already carries the
     /// live action tree, status, and final summary; this line is just
     /// the pointer that says "a spawn happened, here's the agent id".
     ///
     /// Output shape (header):
-    ///   `◐ delegate · agent_spawn  agent-abc12  [running]`
+    ///   `◐ delegate · agent_open  agent-abc12  [running]`
     /// Falls back to a placeholder when the spawn is still pending and
     /// no agent id has been assigned yet.
     fn render_agent_spawn_compact(&self, low_motion: bool) -> Vec<Line<'static>> {
@@ -1438,7 +1440,7 @@ fn render_spillover_annotation(path: &std::path::Path, width: u16) -> Line<'stat
     ])
 }
 
-/// Pull the `agent_id` field out of an `agent_spawn` tool output. The
+/// Pull the `agent_id` field out of a sub-agent open tool output. The
 /// tool emits structured JSON shaped like
 /// `{"agent_id": "agent-abc12", "nickname": "...", "model": "..."}` so we
 /// look for the `agent_id` key and return its string value.
@@ -2160,9 +2162,9 @@ fn render_thinking(
         };
     if needs_affordance {
         let label = if streaming {
-            "thinking continues; press Ctrl+O for full text"
+            "thinking continues; Ctrl+O opens Activity Detail"
         } else {
-            "thinking collapsed; press Ctrl+O for full text"
+            "thinking collapsed; Ctrl+O opens Activity Detail"
         };
         lines.push(Line::from(vec![
             Span::styled(REASONING_RAIL.to_string(), rail_style),
@@ -3646,7 +3648,7 @@ mod tests {
             .iter()
             .flat_map(|line| line.spans.iter().map(|span| span.content.as_ref()))
             .collect::<String>();
-        assert!(text.contains("thinking collapsed; press Ctrl+O for full text"));
+        assert!(text.contains("thinking collapsed; Ctrl+O opens Activity Detail"));
         assert!(text.contains("thinking"));
     }
 
@@ -3694,7 +3696,7 @@ mod tests {
             .flat_map(|line| line.spans.iter().map(|span| span.content.as_ref()))
             .collect::<String>();
         assert!(
-            text.contains("thinking continues; press Ctrl+O for full text"),
+            text.contains("thinking continues; Ctrl+O opens Activity Detail"),
             "streaming-truncation affordance missing, got: {text}"
         );
         // The most recent line must be the visible tail (head dropped).
@@ -4345,11 +4347,11 @@ mod tests {
             "live thinking must drop the tail when collapsed"
         );
         assert!(
-            live_text.contains("press Ctrl+O for full text"),
+            live_text.contains("Ctrl+O opens Activity Detail"),
             "live thinking must offer the pager affordance"
         );
         assert!(
-            !transcript_text.contains("press Ctrl+O for full text"),
+            !transcript_text.contains("Ctrl+O opens Activity Detail"),
             "transcript thinking must not include the live affordance"
         );
     }
@@ -4381,7 +4383,7 @@ mod tests {
             "short thinking must render identically on both surfaces"
         );
         assert!(
-            !live_text.contains("press Ctrl+O for full text"),
+            !live_text.contains("Ctrl+O opens Activity Detail"),
             "short thinking must not show the collapse affordance"
         );
     }
diff --git a/crates/tui/src/tui/keybindings.rs b/crates/tui/src/tui/keybindings.rs
index 10f0ad7b..c58437fb 100644
--- a/crates/tui/src/tui/keybindings.rs
+++ b/crates/tui/src/tui/keybindings.rs
@@ -242,7 +242,7 @@ pub const KEYBINDINGS: &[KeybindingEntry] = &[
         section: KeybindingSection::Modes,
     },
     KeybindingEntry {
-        chord: "Alt+! / Alt+@ / Alt+# / Alt+4 / Alt+$ / Alt+0",
+        chord: "Alt+! / Alt+@ / Alt+# / Alt+$ / Alt+0",
         description_id: crate::localization::MessageId::KbFocusSidebar,
         section: KeybindingSection::Modes,
     },
@@ -335,6 +335,23 @@ mod tests {
         );
     }
 
+    #[test]
+    fn ctrl_o_help_copy_matches_activity_detail_behavior() {
+        let ctrl_o = KEYBINDINGS
+            .iter()
+            .find(|entry| entry.chord == "Ctrl+O")
+            .expect("Ctrl+O keybinding should be documented");
+
+        assert_eq!(
+            ctrl_o.description_id,
+            crate::localization::MessageId::KbThinkingPager
+        );
+        assert_eq!(
+            crate::localization::tr(crate::localization::Locale::En, ctrl_o.description_id,),
+            "Open Activity Detail"
+        );
+    }
+
     #[test]
     fn section_rank_is_a_total_order() {
         let sections = [
diff --git a/crates/tui/src/tui/sidebar.rs b/crates/tui/src/tui/sidebar.rs
index c4305345..f2630f91 100644
--- a/crates/tui/src/tui/sidebar.rs
+++ b/crates/tui/src/tui/sidebar.rs
@@ -1,4 +1,4 @@
-//! Sidebar rendering — Plan / Todos / Tasks / Agents panels.
+//! Sidebar rendering — Work / Tasks / Agents / Context panels.
 //!
 //! Extracted from `tui/ui.rs` (P1.2). The sidebar appears to the right of
 //! the chat transcript when the available width allows it. Each section
@@ -21,8 +21,8 @@ use crate::tools::plan::StepStatus;
 use crate::tools::subagent::SubAgentStatus;
 use crate::tools::todo::TodoStatus;
 
-use super::app::{App, SidebarFocus};
-use super::history::{HistoryCell, ToolCell, ToolStatus};
+use super::app::{App, SidebarFocus, TaskPanelEntry};
+use super::history::{HistoryCell, ToolCell, ToolStatus, summarize_tool_output};
 use super::subagent_routing::active_fanout_counts;
 use super::ui::truncate_line_to_width;
 
@@ -30,6 +30,7 @@ use super::ui::truncate_line_to_width;
 /// Must be large enough that accumulated f64 error across hundreds of turns
 /// does not prematurely hide the session+agents breakdown.
 const COST_EQ_TOLERANCE: f64 = 1e-6;
+const RECENT_TOOL_SCAN_LIMIT: usize = 24;
 
 pub fn render_sidebar(f: &mut Frame, area: Rect, app: &App) {
     if area.width < 24 || area.height < 8 {
@@ -43,8 +44,7 @@ pub fn render_sidebar(f: &mut Frame, area: Rect, app: &App) {
 
     match app.sidebar_focus {
         SidebarFocus::Auto => render_sidebar_auto(f, area, app),
-        SidebarFocus::Plan => render_sidebar_plan(f, area, app),
-        SidebarFocus::Todos => render_sidebar_todos(f, area, app),
+        SidebarFocus::Work => render_sidebar_work(f, area, app),
         SidebarFocus::Tasks => render_sidebar_tasks(f, area, app),
         SidebarFocus::Agents => render_sidebar_subagents(f, area, app),
         SidebarFocus::Context => render_context_panel(f, area, app),
@@ -52,45 +52,22 @@ pub fn render_sidebar(f: &mut Frame, area: Rect, app: &App) {
 }
 
 /// Build the Auto-mode panel stack. Empty panels collapse to zero height so
-/// non-empty ones get the full sidebar real estate. Without this, Plan got
-/// clipped because Todos/Tasks/Agents each reserved 25% of the height even
-/// when they had nothing to show. Plan is always rendered (it owns the
-/// session-wide empty-state hint).
+/// non-empty ones get the full sidebar real estate. Work appears when it has
+/// useful content, or as the one quiet empty state when nothing else is active.
 fn render_sidebar_auto(f: &mut Frame, area: Rect, app: &App) {
-    #[derive(Clone, Copy)]
-    enum Panel {
-        Plan,
-        Todos,
-        Tasks,
-        Agents,
-        Context,
-    }
-
-    let todos_empty = app
-        .todos
-        .try_lock()
-        .map(|todos| todos.snapshot().items.is_empty())
-        .unwrap_or(false); // assume non-empty when locked so we don't hide updating data
+    let work_has_content = sidebar_work_summary(app).has_useful_content();
     let tasks_empty = app.runtime_turn_id.is_none() && app.task_panel.is_empty();
     let agents_empty = app.subagent_cache.is_empty()
         && app.agent_progress.is_empty()
         && active_fanout_counts(app).is_none()
         && !foreground_rlm_running(app);
 
-    let mut visible: Vec<Panel> = Vec::with_capacity(5);
-    visible.push(Panel::Plan);
-    if !todos_empty {
-        visible.push(Panel::Todos);
-    }
-    if !tasks_empty {
-        visible.push(Panel::Tasks);
-    }
-    if !agents_empty {
-        visible.push(Panel::Agents);
-    }
-    if app.context_panel {
-        visible.push(Panel::Context);
-    }
+    let visible = auto_sidebar_panels(AutoSidebarState {
+        work_has_content,
+        tasks_empty,
+        agents_empty,
+        context_enabled: app.context_panel,
+    });
 
     let constraints: Vec<Constraint> = match visible.len() {
         1 => vec![Constraint::Min(0)],
@@ -122,246 +99,412 @@ fn render_sidebar_auto(f: &mut Frame, area: Rect, app: &App) {
 
     for (panel, rect) in visible.iter().zip(sections.iter()) {
         match panel {
-            Panel::Plan => render_sidebar_plan(f, *rect, app),
-            Panel::Todos => render_sidebar_todos(f, *rect, app),
-            Panel::Tasks => render_sidebar_tasks(f, *rect, app),
-            Panel::Agents => render_sidebar_subagents(f, *rect, app),
-            Panel::Context => render_context_panel(f, *rect, app),
+            AutoSidebarPanel::Work => render_sidebar_work(f, *rect, app),
+            AutoSidebarPanel::Tasks => render_sidebar_tasks(f, *rect, app),
+            AutoSidebarPanel::Agents => render_sidebar_subagents(f, *rect, app),
+            AutoSidebarPanel::Context => render_context_panel(f, *rect, app),
         }
     }
 }
 
-/// The Plan section is the **single source of truth for the
-/// `update_plan` tool's output** (#408). It is intentionally distinct
-/// from the Todos section: todos are checklist work items the user
-/// or model is tracking; plan steps are the model's higher-level
-/// strategy as recorded by `update_plan`. The panel also hosts two
-/// session-wide indicators that don't fit the other sections — Goal
-/// (`/goal`) and the cycle counter (#124) — because they share the
-/// "what's the agent trying to do, big-picture" theme.
-///
-/// When the panel is fully empty (no goal, no cycles, no plan) it
-/// renders as a quiet section with a single dim hint at the bottom
-/// rather than the blunt "No active plan" placeholder it used to show.
-/// That kept the user wondering whether the panel was broken; the
-/// hint instead tells them what the panel is for and how to populate
-/// it.
-fn render_sidebar_plan(f: &mut Frame, area: Rect, app: &App) {
-    if area.height < 3 {
-        return;
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+enum AutoSidebarPanel {
+    Work,
+    Tasks,
+    Agents,
+    Context,
+}
+
+#[derive(Debug, Clone, Copy)]
+struct AutoSidebarState {
+    work_has_content: bool,
+    tasks_empty: bool,
+    agents_empty: bool,
+    context_enabled: bool,
+}
+
+fn auto_sidebar_panels(state: AutoSidebarState) -> Vec<AutoSidebarPanel> {
+    let nothing_else_active = state.tasks_empty && state.agents_empty && !state.context_enabled;
+    let mut visible = Vec::with_capacity(4);
+
+    if state.work_has_content || nothing_else_active {
+        visible.push(AutoSidebarPanel::Work);
+    }
+    if !state.tasks_empty {
+        visible.push(AutoSidebarPanel::Tasks);
+    }
+    if !state.agents_empty {
+        visible.push(AutoSidebarPanel::Agents);
+    }
+    if state.context_enabled {
+        visible.push(AutoSidebarPanel::Context);
     }
 
-    let theme = Theme::for_palette_mode(app.ui_theme.mode);
-    let content_width = area.width.saturating_sub(4) as usize;
-    let mut lines: Vec<Line<'static>> = Vec::with_capacity(usize::from(area.height).max(4));
+    visible
+}
 
-    // === Goal Mode (#397) — gold outline matching todo items ===
-    if let Some(ref objective) = app.goal.goal_objective {
-        lines.push(Line::from(Span::styled(
-            format!(
-                "◆ {}",
-                truncate_line_to_width(objective, content_width.max(1))
-            ),
-            Style::default()
-                .fg(palette::STATUS_WARNING)
-                .add_modifier(ratatui::style::Modifier::BOLD),
-        )));
-        if let Some(budget) = app.goal.goal_token_budget {
-            let used = app.session.total_conversation_tokens;
-            let pct = if budget > 0 {
-                ((used as f64 / budget as f64) * 100.0).min(100.0)
-            } else {
-                0.0
-            };
-            let bar_width = content_width.min(20);
-            let filled = ((pct / 100.0) * bar_width as f64) as usize;
-            let bar = format!(
-                "[{}{}] {:.0}%",
-                "█".repeat(filled),
-                "░".repeat(bar_width.saturating_sub(filled)),
-                pct
-            );
-            lines.push(Line::from(Span::styled(
-                format!("  tokens: {used}/{budget} {}", bar),
-                Style::default().fg(palette::TEXT_MUTED),
-            )));
-        }
-        // Gold separator
-        lines.push(Line::from(Span::styled(
-            "─".repeat(content_width.min(24)),
-            Style::default().fg(palette::STATUS_WARNING),
-        )));
+#[derive(Debug, Clone)]
+struct SidebarWorkChecklistItem {
+    id: u32,
+    content: String,
+    status: TodoStatus,
+}
+
+#[derive(Debug, Clone)]
+struct SidebarWorkStrategyStep {
+    text: String,
+    status: StepStatus,
+    elapsed: String,
+}
+
+#[derive(Debug, Clone, Default)]
+struct SidebarWorkSummary {
+    goal_objective: Option<String>,
+    goal_token_budget: Option<u32>,
+    tokens_used: u32,
+    cycle_count: u32,
+    checklist_completion_pct: u8,
+    checklist_items: Vec<SidebarWorkChecklistItem>,
+    strategy_explanation: Option<String>,
+    strategy_steps: Vec<SidebarWorkStrategyStep>,
+    state_updating: bool,
+}
+
+impl SidebarWorkSummary {
+    fn has_strategy(&self) -> bool {
+        self.strategy_explanation
+            .as_deref()
+            .is_some_and(|s| !s.trim().is_empty())
+            || !self.strategy_steps.is_empty()
     }
 
-    // Cycle indicator (issue #124). Only shown once a boundary has fired —
-    // first-time users with cycle_count == 0 don't need this row of chrome.
-    if app.cycle_count > 0 {
-        lines.push(Line::from(Span::styled(
-            format!(
-                "cycles: {} (active: {})",
-                app.cycle_count,
-                app.cycle_count.saturating_add(1)
-            ),
-            Style::default().fg(theme.plan_summary_color),
-        )));
+    fn has_useful_content(&self) -> bool {
+        self.goal_objective
+            .as_deref()
+            .is_some_and(|s| !s.trim().is_empty())
+            || self.cycle_count > 0
+            || !self.checklist_items.is_empty()
+            || self.has_strategy()
+            || self.state_updating
     }
 
-    match app.plan_state.try_lock() {
-        Ok(plan) => {
-            if plan.is_empty() {
-                // The blunt "No active plan" placeholder used to land
-                // here on every render with no plan steps, even when the
-                // user had a goal set or had cycled — making the panel
-                // look broken. After #408 we instead emit a quiet hint
-                // that explains what the panel is for, but only when
-                // *all* of the panel's signals are empty so we don't
-                // crowd a panel that already has a goal / cycle
-                // indicator above.
-                let nothing_above = app.goal.goal_objective.is_none() && app.cycle_count == 0;
-                if nothing_above {
-                    lines.push(Line::from(Span::styled(
-                        plan_panel_empty_hint(content_width.max(1)),
-                        Style::default().fg(palette::TEXT_MUTED).italic(),
-                    )));
-                }
-            } else {
-                let (pending, in_progress, completed) = plan.counts();
-                let total = pending + in_progress + completed;
-                lines.push(Line::from(vec![
-                    Span::styled(
-                        format!("{}%", plan.progress_percent()),
-                        Style::default().fg(theme.plan_progress_color).bold(),
-                    ),
-                    Span::styled(
-                        format!(" complete ({completed}/{total})"),
-                        Style::default().fg(theme.plan_summary_color),
-                    ),
-                ]));
-
-                if let Some(explanation) = plan.explanation() {
-                    lines.push(Line::from(Span::styled(
-                        truncate_line_to_width(explanation, content_width.max(1)),
-                        Style::default().fg(theme.plan_explanation_color),
-                    )));
-                }
-
-                let usable_rows = area.height.saturating_sub(3) as usize;
-                let max_steps = usable_rows.saturating_sub(lines.len());
-                for step in plan.steps().iter().take(max_steps) {
-                    let (prefix, color) = match &step.status {
-                        StepStatus::Pending => ("[ ]", theme.plan_pending_color),
-                        StepStatus::InProgress => ("[~]", theme.plan_in_progress_color),
-                        StepStatus::Completed => ("[x]", theme.plan_completed_color),
-                    };
-                    let mut text = format!("{prefix} {}", step.text);
-                    let elapsed = step.elapsed_str();
-                    if !elapsed.is_empty() {
-                        let _ = write!(text, " ({elapsed})");
-                    }
-                    lines.push(Line::from(Span::styled(
-                        truncate_line_to_width(&text, content_width.max(1)),
-                        Style::default().fg(color),
-                    )));
-                }
-
-                let remaining = plan.steps().len().saturating_sub(max_steps);
-                if remaining > 0 {
-                    lines.push(Line::from(Span::styled(
-                        format!("+{remaining} more steps"),
-                        Style::default().fg(theme.plan_summary_color),
-                    )));
-                }
+    fn strategy_counts(&self) -> (usize, usize, usize) {
+        let mut pending = 0;
+        let mut in_progress = 0;
+        let mut completed = 0;
+        for step in &self.strategy_steps {
+            match step.status {
+                StepStatus::Pending => pending += 1,
+                StepStatus::InProgress => in_progress += 1,
+                StepStatus::Completed => completed += 1,
             }
         }
-        Err(_) => {
-            lines.push(Line::from(Span::styled(
-                "Plan state updating...",
-                Style::default().fg(theme.plan_summary_color),
-            )));
+        (pending, in_progress, completed)
+    }
+
+    fn strategy_progress_percent(&self) -> u8 {
+        if self.strategy_steps.is_empty() {
+            return 0;
         }
+        let completed = self
+            .strategy_steps
+            .iter()
+            .filter(|step| step.status == StepStatus::Completed)
+            .count();
+        let percent = completed.saturating_mul(100) / self.strategy_steps.len();
+        u8::try_from(percent).unwrap_or(u8::MAX)
     }
-
-    render_sidebar_section(f, area, "Plan", lines, app);
 }
 
-/// One-line hint shown when the Plan section has nothing to display
-/// (no goal, no cycle, no steps). Ellipsizes for narrow widths so
-/// even a 24-column sidebar doesn't wrap mid-word. Visible across
-/// modes — the panel's role doesn't change between Plan / Agent /
-/// YOLO; only its content does.
-#[must_use]
-fn plan_panel_empty_hint(content_width: usize) -> String {
-    let full = "tracks update_plan / /goal / cycles";
-    truncate_line_to_width(full, content_width)
-}
-
-fn render_sidebar_todos(f: &mut Frame, area: Rect, app: &App) {
-    if area.height < 3 {
-        return;
-    }
-
-    let content_width = area.width.saturating_sub(4) as usize;
-    let mut lines: Vec<Line<'static>> = Vec::with_capacity(usize::from(area.height).max(4));
+fn sidebar_work_summary(app: &App) -> SidebarWorkSummary {
+    let mut summary = SidebarWorkSummary {
+        goal_objective: app.goal.goal_objective.clone(),
+        goal_token_budget: app.goal.goal_token_budget,
+        tokens_used: app.session.total_conversation_tokens,
+        cycle_count: app.cycle_count,
+        ..SidebarWorkSummary::default()
+    };
 
     match app.todos.try_lock() {
         Ok(todos) => {
             let snapshot = todos.snapshot();
-            if snapshot.items.is_empty() {
-                lines.push(Line::from(Span::styled(
-                    "No todos",
-                    Style::default().fg(palette::TEXT_MUTED),
-                )));
-            } else {
-                let total = snapshot.items.len();
-                let completed = snapshot
-                    .items
-                    .iter()
-                    .filter(|item| item.status == TodoStatus::Completed)
-                    .count();
-                lines.push(Line::from(vec![
-                    Span::styled(
-                        format!("{}%", snapshot.completion_pct),
-                        Style::default().fg(palette::STATUS_SUCCESS).bold(),
-                    ),
-                    Span::styled(
-                        format!(" complete ({completed}/{total})"),
-                        Style::default().fg(palette::TEXT_MUTED),
-                    ),
-                ]));
-
-                let usable_rows = area.height.saturating_sub(3) as usize;
-                let max_items = usable_rows.saturating_sub(lines.len());
-                for item in snapshot.items.iter().take(max_items) {
-                    let (prefix, color) = match item.status {
-                        TodoStatus::Pending => ("[ ]", palette::TEXT_MUTED),
-                        TodoStatus::InProgress => ("[~]", palette::STATUS_WARNING),
-                        TodoStatus::Completed => ("[x]", palette::STATUS_SUCCESS),
-                    };
-                    let text = format!("{prefix} #{} {}", item.id, item.content);
-                    lines.push(Line::from(Span::styled(
-                        truncate_line_to_width(&text, content_width.max(1)),
-                        Style::default().fg(color),
-                    )));
-                }
-
-                let remaining = snapshot.items.len().saturating_sub(max_items);
-                if remaining > 0 {
-                    lines.push(Line::from(Span::styled(
-                        format!("+{remaining} more todos"),
-                        Style::default().fg(palette::TEXT_MUTED),
-                    )));
-                }
-            }
+            summary.checklist_completion_pct = snapshot.completion_pct;
+            summary.checklist_items = snapshot
+                .items
+                .into_iter()
+                .map(|item| SidebarWorkChecklistItem {
+                    id: item.id,
+                    content: item.content,
+                    status: item.status,
+                })
+                .collect();
         }
         Err(_) => {
-            lines.push(Line::from(Span::styled(
-                "Todo list updating...",
-                Style::default().fg(palette::TEXT_MUTED),
-            )));
+            summary.state_updating = true;
         }
     }
 
-    render_sidebar_section(f, area, "Todos", lines, app);
+    match app.plan_state.try_lock() {
+        Ok(plan) => {
+            if !plan.is_empty() {
+                summary.strategy_explanation = plan.explanation().map(str::to_string);
+                summary.strategy_steps = plan
+                    .steps()
+                    .iter()
+                    .map(|step| SidebarWorkStrategyStep {
+                        text: step.text.clone(),
+                        status: step.status.clone(),
+                        elapsed: step.elapsed_str(),
+                    })
+                    .collect();
+            }
+        }
+        Err(_) => {
+            summary.state_updating = true;
+        }
+    }
+
+    summary
+}
+
+fn work_panel_lines(
+    summary: &SidebarWorkSummary,
+    content_width: usize,
+    max_rows: usize,
+    palette_mode: palette::PaletteMode,
+) -> Vec<Line<'static>> {
+    let theme = Theme::for_palette_mode(palette_mode);
+    let mut lines: Vec<Line<'static>> = Vec::with_capacity(max_rows.max(4));
+
+    push_work_goal_lines(summary, content_width, max_rows, &mut lines);
+
+    if summary.state_updating && lines.len() < max_rows {
+        lines.push(Line::from(Span::styled(
+            "Work state updating...",
+            Style::default().fg(palette::TEXT_MUTED),
+        )));
+    }
+
+    push_work_checklist_lines(summary, content_width, max_rows, &mut lines);
+    push_work_strategy_lines(summary, content_width, max_rows, &mut lines, &theme);
+
+    if summary.cycle_count > 0 && lines.len() < max_rows {
+        lines.push(Line::from(Span::styled(
+            format!(
+                "cycles: {} (active: {})",
+                summary.cycle_count,
+                summary.cycle_count.saturating_add(1)
+            ),
+            Style::default().fg(palette::TEXT_MUTED),
+        )));
+    }
+
+    if lines.is_empty() {
+        lines.push(Line::from(Span::styled(
+            work_panel_empty_hint(content_width),
+            Style::default().fg(palette::TEXT_MUTED).italic(),
+        )));
+    }
+
+    lines
+}
+
+fn push_work_goal_lines(
+    summary: &SidebarWorkSummary,
+    content_width: usize,
+    max_rows: usize,
+    lines: &mut Vec<Line<'static>>,
+) {
+    let Some(objective) = summary.goal_objective.as_deref() else {
+        return;
+    };
+    if objective.trim().is_empty() || lines.len() >= max_rows {
+        return;
+    }
+
+    lines.push(Line::from(Span::styled(
+        format!(
+            "◆ {}",
+            truncate_line_to_width(objective, content_width.saturating_sub(2).max(1))
+        ),
+        Style::default()
+            .fg(palette::STATUS_WARNING)
+            .add_modifier(ratatui::style::Modifier::BOLD),
+    )));
+
+    if let Some(budget) = summary.goal_token_budget
+        && lines.len() < max_rows
+    {
+        let pct = if budget > 0 {
+            ((summary.tokens_used as f64 / budget as f64) * 100.0).min(100.0)
+        } else {
+            0.0
+        };
+        let bar_width = content_width.min(20);
+        let filled = ((pct / 100.0) * bar_width as f64) as usize;
+        let bar = format!(
+            "[{}{}] {:.0}%",
+            "█".repeat(filled),
+            "░".repeat(bar_width.saturating_sub(filled)),
+            pct
+        );
+        lines.push(Line::from(Span::styled(
+            truncate_line_to_width(
+                &format!("tokens: {}/{} {}", summary.tokens_used, budget, bar),
+                content_width,
+            ),
+            Style::default().fg(palette::TEXT_MUTED),
+        )));
+    }
+}
+
+fn push_work_checklist_lines(
+    summary: &SidebarWorkSummary,
+    content_width: usize,
+    max_rows: usize,
+    lines: &mut Vec<Line<'static>>,
+) {
+    if summary.checklist_items.is_empty() || lines.len() >= max_rows {
+        return;
+    }
+
+    let total = summary.checklist_items.len();
+    let completed = summary
+        .checklist_items
+        .iter()
+        .filter(|item| item.status == TodoStatus::Completed)
+        .count();
+    lines.push(Line::from(vec![
+        Span::styled(
+            format!("{}%", summary.checklist_completion_pct),
+            Style::default().fg(palette::STATUS_SUCCESS).bold(),
+        ),
+        Span::styled(
+            format!(" complete ({completed}/{total})"),
+            Style::default().fg(palette::TEXT_MUTED),
+        ),
+    ]));
+
+    let reserve_for_strategy = if summary.has_strategy() { 2 } else { 0 };
+    let max_items = max_rows
+        .saturating_sub(lines.len())
+        .saturating_sub(reserve_for_strategy)
+        .min(summary.checklist_items.len());
+    for item in summary.checklist_items.iter().take(max_items) {
+        let (prefix, color) = match item.status {
+            TodoStatus::Pending => ("[ ]", palette::TEXT_MUTED),
+            TodoStatus::InProgress => ("[~]", palette::STATUS_WARNING),
+            TodoStatus::Completed => ("[x]", palette::STATUS_SUCCESS),
+        };
+        let text = format!("{prefix} #{} {}", item.id, item.content);
+        lines.push(Line::from(Span::styled(
+            truncate_line_to_width(&text, content_width),
+            Style::default().fg(color),
+        )));
+    }
+
+    let remaining = summary.checklist_items.len().saturating_sub(max_items);
+    if remaining > 0 && lines.len() < max_rows {
+        lines.push(Line::from(Span::styled(
+            format!("+{remaining} more checklist items"),
+            Style::default().fg(palette::TEXT_MUTED),
+        )));
+    }
+}
+
+fn push_work_strategy_lines(
+    summary: &SidebarWorkSummary,
+    content_width: usize,
+    max_rows: usize,
+    lines: &mut Vec<Line<'static>>,
+    theme: &Theme,
+) {
+    if !summary.has_strategy() || lines.len() >= max_rows {
+        return;
+    }
+
+    if summary.checklist_items.is_empty() && !summary.strategy_steps.is_empty() {
+        let (pending, in_progress, completed) = summary.strategy_counts();
+        let total = pending + in_progress + completed;
+        lines.push(Line::from(vec![
+            Span::styled(
+                "Strategy ",
+                Style::default().fg(theme.plan_summary_color).bold(),
+            ),
+            Span::styled(
+                format!("{}%", summary.strategy_progress_percent()),
+                Style::default().fg(theme.plan_progress_color).bold(),
+            ),
+            Span::styled(
+                format!(" complete ({completed}/{total})"),
+                Style::default().fg(theme.plan_summary_color),
+            ),
+        ]));
+    } else {
+        lines.push(Line::from(Span::styled(
+            "Strategy",
+            Style::default().fg(theme.plan_summary_color).bold(),
+        )));
+    }
+
+    if let Some(explanation) = summary.strategy_explanation.as_deref()
+        && lines.len() < max_rows
+    {
+        lines.push(Line::from(Span::styled(
+            truncate_line_to_width(explanation, content_width),
+            Style::default().fg(theme.plan_explanation_color),
+        )));
+    }
+
+    let max_steps = max_rows
+        .saturating_sub(lines.len())
+        .min(summary.strategy_steps.len());
+    for step in summary.strategy_steps.iter().take(max_steps) {
+        let (prefix, color) = match step.status {
+            StepStatus::Pending => ("[ ]", theme.plan_pending_color),
+            StepStatus::InProgress => ("[~]", theme.plan_in_progress_color),
+            StepStatus::Completed => ("[x]", theme.plan_completed_color),
+        };
+        let mut text = format!("{prefix} {}", step.text);
+        if !step.elapsed.is_empty() {
+            let _ = write!(text, " ({})", step.elapsed);
+        }
+        lines.push(Line::from(Span::styled(
+            truncate_line_to_width(&text, content_width),
+            Style::default().fg(color),
+        )));
+    }
+
+    let remaining = summary.strategy_steps.len().saturating_sub(max_steps);
+    if remaining > 0 && lines.len() < max_rows {
+        lines.push(Line::from(Span::styled(
+            format!("+{remaining} more strategy steps"),
+            Style::default().fg(theme.plan_summary_color),
+        )));
+    }
+}
+
+#[must_use]
+fn work_panel_empty_hint(content_width: usize) -> String {
+    truncate_line_to_width("No active work", content_width)
+}
+
+fn render_sidebar_work(f: &mut Frame, area: Rect, app: &App) {
+    if area.height < 3 {
+        return;
+    }
+
+    let content_width = area.width.saturating_sub(4) as usize;
+    let usable_rows = area.height.saturating_sub(3) as usize;
+    let summary = sidebar_work_summary(app);
+    let lines = work_panel_lines(
+        &summary,
+        content_width.max(1),
+        usable_rows,
+        app.ui_theme.mode,
+    );
+
+    render_sidebar_section(f, area, "Work", lines, app);
 }
 
 fn render_sidebar_tasks(f: &mut Frame, area: Rect, app: &App) {
@@ -370,7 +513,22 @@ fn render_sidebar_tasks(f: &mut Frame, area: Rect, app: &App) {
     }
 
     let content_width = area.width.saturating_sub(4) as usize;
-    let mut lines: Vec<Line<'static>> = Vec::with_capacity(usize::from(area.height).max(4));
+    let usable_rows = area.height.saturating_sub(3) as usize;
+    let lines = task_panel_lines(app, content_width.max(1), usable_rows.max(1));
+
+    render_sidebar_section(f, area, "Tasks", lines, app);
+}
+
+#[derive(Debug, Clone)]
+struct SidebarToolRow {
+    name: String,
+    status: ToolStatus,
+    summary: String,
+    duration_ms: Option<u64>,
+}
+
+fn task_panel_lines(app: &App, content_width: usize, max_rows: usize) -> Vec<Line<'static>> {
+    let mut lines: Vec<Line<'static>> = Vec::with_capacity(max_rows.max(4));
 
     if let Some(turn_id) = app.runtime_turn_id.as_ref() {
         let status = app
@@ -387,28 +545,29 @@ fn render_sidebar_tasks(f: &mut Frame, area: Rect, app: &App) {
         )));
     }
 
-    if app.task_panel.is_empty() {
-        lines.push(Line::from(Span::styled(
-            "No active tasks",
-            Style::default().fg(palette::TEXT_MUTED),
-        )));
-    } else {
-        let running = app
-            .task_panel
+    let active_rows = active_tool_rows(app);
+    if !active_rows.is_empty() && lines.len() < max_rows {
+        push_sidebar_label(&mut lines, "Live tools", palette::DEEPSEEK_SKY);
+        push_tool_rows(&mut lines, &active_rows, content_width, max_rows);
+    }
+
+    let background_rows = background_task_rows(app, &active_rows);
+    if !background_rows.is_empty() && lines.len() < max_rows {
+        let running = background_rows
             .iter()
             .filter(|task| task.status == "running")
             .count();
         lines.push(Line::from(vec![
             Span::styled(
-                if running == app.task_panel.len() {
-                    format!("{running} running")
+                if running == background_rows.len() {
+                    format!("Background jobs: {running} running")
                 } else {
-                    format!("{} active", app.task_panel.len())
+                    format!("Background jobs: {} active", background_rows.len())
                 },
                 Style::default().fg(palette::DEEPSEEK_SKY).bold(),
             ),
             Span::styled(
-                if running == app.task_panel.len() {
+                if running == background_rows.len() {
                     String::new()
                 } else {
                     format!(" ({running} running)")
@@ -417,9 +576,8 @@ fn render_sidebar_tasks(f: &mut Frame, area: Rect, app: &App) {
             ),
         ]));
 
-        let usable_rows = area.height.saturating_sub(3) as usize;
-        let max_items = usable_rows.saturating_sub(lines.len());
-        for task in app.task_panel.iter().take(max_items) {
+        let max_items = max_rows.saturating_sub(lines.len());
+        for task in background_rows.iter().take(max_items) {
             let color = match task.status.as_str() {
                 "queued" => palette::TEXT_MUTED,
                 "running" => palette::STATUS_WARNING,
@@ -430,7 +588,7 @@ fn render_sidebar_tasks(f: &mut Frame, area: Rect, app: &App) {
             };
             let duration = task
                 .duration_ms
-                .map(|ms| format!("{:.1}s", ms as f64 / 1000.0))
+                .map(format_duration_ms)
                 .unwrap_or_else(|| "-".to_string());
             let label = format!(
                 "{} {} {}",
@@ -455,7 +613,392 @@ fn render_sidebar_tasks(f: &mut Frame, area: Rect, app: &App) {
         }
     }
 
-    render_sidebar_section(f, area, "Tasks", lines, app);
+    if lines.len() < max_rows {
+        let recent_rows = recent_tool_rows(app, 4);
+        if !recent_rows.is_empty() {
+            push_sidebar_label(&mut lines, "Recent tools", palette::TEXT_DIM);
+            push_tool_rows(&mut lines, &recent_rows, content_width, max_rows);
+        }
+    }
+
+    if lines.is_empty()
+        || (lines.len() == 1
+            && app.runtime_turn_id.is_some()
+            && active_rows.is_empty()
+            && background_rows.is_empty())
+    {
+        lines.push(Line::from(Span::styled(
+            "No live tools or background jobs",
+            Style::default().fg(palette::TEXT_MUTED),
+        )));
+    }
+
+    lines
+}
+
+/// Append `label` to `lines` as a bold heading rendered in `color`.
+fn push_sidebar_label(lines: &mut Vec<Line<'static>>, label: &str, color: ratatui::style::Color) {
+    let heading_style = Style::default().fg(color).bold();
+    let heading = Span::styled(label.to_string(), heading_style);
+    lines.push(Line::from(heading));
+}
+
+/// Sidebar rows for the tool cells held by `app.active_cell`, editorially ordered with
+/// no row cap. Yields an empty list when there is no active cell.
+fn active_tool_rows(app: &App) -> Vec<SidebarToolRow> {
+    match app.active_cell.as_ref() {
+        None => Vec::new(),
+        Some(cell) => {
+            let live = cell.entries().iter().filter_map(sidebar_tool_row_from_cell);
+            editorial_tool_rows(live.collect(), usize::MAX)
+        }
+    }
+}
+
+/// Sidebar rows for recently recorded tool cells, scanning `app.history` from the end.
+///
+/// At most `RECENT_TOOL_SCAN_LIMIT` tool cells are collected before editorial ordering
+/// trims the result to `limit` rows.
+fn recent_tool_rows(app: &App, limit: usize) -> Vec<SidebarToolRow> {
+    let newest_first = app.history.iter().rev();
+    let tool_rows = newest_first.filter_map(sidebar_tool_row_from_cell);
+    let scanned: Vec<SidebarToolRow> = tool_rows.take(RECENT_TOOL_SCAN_LIMIT).collect();
+    editorial_tool_rows(scanned, limit)
+}
+
+/// Append sidebar lines for `rows` without letting `lines` grow past `max_rows`.
+///
+/// Each row contributes a headline (status marker, name, optional duration) and, when
+/// its summary is not blank and room remains, an indented summary line.
+fn push_tool_rows(
+    lines: &mut Vec<Line<'static>>,
+    rows: &[SidebarToolRow],
+    content_width: usize,
+    max_rows: usize,
+) {
+    // Summary lines carry a two-space indent, so they get two fewer columns (minimum one).
+    let summary_width = content_width.saturating_sub(2).max(1);
+    for row in rows {
+        if lines.len() >= max_rows {
+            break;
+        }
+        let (marker, color) = tool_status_marker(row.status);
+        let headline = match row.duration_ms {
+            Some(elapsed) => format!("{marker} {} {}", row.name, format_duration_ms(elapsed)),
+            None => format!("{marker} {}", row.name),
+        };
+        let headline = truncate_line_to_width(&headline, content_width);
+        lines.push(Line::from(Span::styled(headline, Style::default().fg(color))));
+        if row.summary.trim().is_empty() || lines.len() >= max_rows {
+            continue;
+        }
+        let detail = format!("  {}", truncate_line_to_width(&row.summary, summary_width));
+        let dim = Style::default().fg(palette::TEXT_DIM);
+        lines.push(Line::from(Span::styled(detail, dim)));
+    }
+}
+
+fn sidebar_tool_row_from_cell(cell: &HistoryCell) -> Option<SidebarToolRow> { // tool cell -> sidebar row
+    let HistoryCell::Tool(tool) = cell else {
+        return None; // non-tool history cells never appear in the tool lists
+    };
+    match tool {
+        ToolCell::Exec(exec) => Some(SidebarToolRow {
+            name: "run".to_string(),
+            status: exec.status,
+            summary: compact_join([
+                exec.command.clone(),
+                exec.output_summary.clone().unwrap_or_default(),
+                exec.output
+                    .as_deref()
+                    .map(first_nonempty_line)
+                    .unwrap_or_default()
+                    .to_string(),
+            ]),
+            duration_ms: exec.duration_ms.or_else(|| { // no recorded duration: derive one only while running
+                (exec.status == ToolStatus::Running).then(|| {
+                    u64::try_from(
+                        exec.started_at
+                            .map(|started| started.elapsed().as_millis())
+                            .unwrap_or_default(), // running with no start instant reports 0 ms
+                    )
+                    .unwrap_or(u64::MAX) // saturate if the u128 millisecond count exceeds u64
+                })
+            }),
+        }),
+        ToolCell::Exploring(explore) => {
+            let running = explore
+                .entries
+                .iter()
+                .filter(|entry| entry.status == ToolStatus::Running)
+                .count();
+            let status = if running > 0 { // any running entry wins, then any failure, else success
+                ToolStatus::Running
+            } else if explore
+                .entries
+                .iter()
+                .any(|entry| entry.status == ToolStatus::Failed)
+            {
+                ToolStatus::Failed
+            } else {
+                ToolStatus::Success
+            };
+            let first = explore.entries.first().map(|entry| entry.label.as_str()); // first entry's label, if any
+            Some(SidebarToolRow {
+                name: "workspace".to_string(),
+                status,
+                summary: compact_join([
+                    format!("{} item(s), {running} running", explore.entries.len()),
+                    first.unwrap_or_default().to_string(),
+                ]),
+                duration_ms: None,
+            })
+        }
+        ToolCell::PlanUpdate(plan) => Some(SidebarToolRow {
+            name: "update_plan".to_string(),
+            status: plan.status,
+            summary: plan
+                .explanation
+                .as_deref()
+                .or_else(|| plan.steps.first().map(|step| step.step.as_str())) // else the first step's text
+                .unwrap_or("")
+                .to_string(),
+            duration_ms: None,
+        }),
+        ToolCell::PatchSummary(patch) => Some(SidebarToolRow {
+            name: "patch".to_string(),
+            status: patch.status,
+            summary: compact_join([patch.path.clone(), patch.summary.clone()]),
+            duration_ms: None,
+        }),
+        ToolCell::Review(review) => Some(SidebarToolRow {
+            name: "review".to_string(),
+            status: review.status,
+            summary: review.target.clone(),
+            duration_ms: None,
+        }),
+        ToolCell::DiffPreview(diff) => Some(SidebarToolRow {
+            name: "diff".to_string(),
+            status: ToolStatus::Success, // fixed status: no status field is read from the diff cell
+            summary: diff.title.clone(),
+            duration_ms: None,
+        }),
+        ToolCell::Mcp(mcp) => Some(SidebarToolRow {
+            name: mcp.tool.clone(),
+            status: mcp.status,
+            summary: mcp
+                .content
+                .as_deref()
+                .map(summarize_tool_output)
+                .unwrap_or_default(),
+            duration_ms: None,
+        }),
+        ToolCell::ViewImage(image) => Some(SidebarToolRow {
+            name: "image".to_string(),
+            status: ToolStatus::Success, // fixed status: no status field is read from the image cell
+            summary: image.path.display().to_string(),
+            duration_ms: None,
+        }),
+        ToolCell::WebSearch(search) => Some(SidebarToolRow {
+            name: "web_search".to_string(),
+            status: search.status,
+            summary: compact_join([
+                search.query.clone(),
+                search.summary.clone().unwrap_or_default(),
+            ]),
+            duration_ms: None,
+        }),
+        ToolCell::Generic(generic) => Some(SidebarToolRow {
+            name: generic.name.clone(),
+            status: generic.status,
+            summary: compact_join([ // input summary, output summary, then summarized raw output
+                generic.input_summary.clone().unwrap_or_default(),
+                generic.output_summary.clone().unwrap_or_default(),
+                generic
+                    .output
+                    .as_deref()
+                    .map(summarize_tool_output)
+                    .unwrap_or_default(),
+            ]),
+            duration_ms: None,
+        }),
+    }
+}
+
+/// Background jobs that are not already shown as live tools, sorted by status rank, then id.
+fn background_task_rows(app: &App, active_rows: &[SidebarToolRow]) -> Vec<TaskPanelEntry> {
+    let keep = |task: &TaskPanelEntry| !background_task_duplicates_live_tool(task, active_rows);
+    let mut rows: Vec<_> = app.task_panel.iter().filter(|t| keep(*t)).cloned().collect();
+    rows.sort_by(|a, b| {
+        let (left, right) = (task_status_rank(&a.status), task_status_rank(&b.status));
+        left.cmp(&right).then_with(|| a.id.cmp(&b.id))
+    });
+    rows
+}
+
+/// Whether a running background `task` is already visible as a running live tool row.
+///
+/// RLM jobs (id prefixed `rlm-` or summary prefixed `RLM: `) match any running row whose
+/// name starts with `rlm_`. Jobs summarized as `shell: <command>` match a running `run` row
+/// whose whitespace-normalized summary contains the normalized command. Any other job,
+/// and any job that is not running, is never treated as a duplicate.
+fn background_task_duplicates_live_tool(
+    task: &TaskPanelEntry,
+    active_rows: &[SidebarToolRow],
+) -> bool {
+    if task.status != "running" {
+        return false;
+    }
+    let mut live = active_rows.iter().filter(|row| row.status == ToolStatus::Running);
+
+    if task.id.starts_with("rlm-") || task.prompt_summary.starts_with("RLM: ") {
+        return live.any(|row| row.name.starts_with("rlm_"));
+    }
+    match task.prompt_summary.strip_prefix("shell: ").map(normalize_activity_text) {
+        Some(command) if !command.is_empty() => live.any(|row| {
+            row.name == "run" && normalize_activity_text(&row.summary).contains(&command)
+        }),
+        _ => false,
+    }
+}
+
+/// Order and de-noise tool rows for the sidebar, keeping at most `limit` of them.
+///
+/// * Successful low-value tools (see `is_low_value_tool`) collapse into one row per tool
+///   name. A group seen more than once is renamed `"<name> x<count>"` and a non-blank
+///   summary gains a `"latest: "` prefix; the group keeps the first non-blank summary
+///   encountered in `rows`.
+/// * Any other successful row is dropped when an earlier successful row has the same
+///   `sidebar_row_identity`.
+/// * Survivors are sorted by `tool_row_rank`, with low-value groups placed one step
+///   later than that rank, and then by their position in `rows`.
+fn editorial_tool_rows(rows: Vec<SidebarToolRow>, limit: usize) -> Vec<SidebarToolRow> {
+    // (rank, position in `rows`, row); sorted on the first two fields at the end.
+    let mut ranked: Vec<(u8, usize, SidebarToolRow)> = Vec::new();
+    // (first position, representative row, occurrences) per low-value tool name.
+    let mut groups: Vec<(usize, SidebarToolRow, usize)> = Vec::new();
+    let mut seen_success: Vec<String> = Vec::new();
+
+    for (order, row) in rows.into_iter().enumerate() {
+        let succeeded = row.status == ToolStatus::Success;
+        // Fold repeated successful low-value calls into one group per tool name.
+        if succeeded && is_low_value_tool(&row.name) {
+            match groups.iter_mut().find(|(_, kept, _)| kept.name == row.name) {
+                Some((_, kept, count)) => {
+                    *count += 1;
+                    if kept.summary.trim().is_empty() && !row.summary.trim().is_empty() {
+                        kept.summary = row.summary;
+                    }
+                }
+                None => groups.push((order, row, 1)),
+            }
+            continue;
+        }
+
+        // Successful rows whose identity was already seen are duplicates; failed and
+        // running rows are always kept.
+        if succeeded {
+            let key = sidebar_row_identity(&row);
+            if seen_success.contains(&key) {
+                continue;
+            }
+            seen_success.push(key);
+        }
+        ranked.push((tool_row_rank(&row), order, row));
+    }
+
+    for (order, mut row, count) in groups {
+        if count > 1 {
+            row.name = format!("{} x{count}", row.name);
+            if !row.summary.trim().is_empty() {
+                row.summary = format!("latest: {}", row.summary);
+            }
+        }
+        // Grouped rows sort one step after the rank they would otherwise receive.
+        ranked.push((tool_row_rank(&row).saturating_add(1), order, row));
+    }
+
+    ranked.sort_by_key(|(rank, order, _)| (*rank, *order));
+    ranked
+        .into_iter()
+        .take(limit)
+        .map(|(_, _, row)| row)
+        .collect()
+}
+
+/// Dedup key for a row: the trimmed tool name, a newline, then the summary with its
+/// whitespace normalized.
+fn sidebar_row_identity(row: &SidebarToolRow) -> String {
+    let name = row.name.trim();
+    let summary = normalize_activity_text(&row.summary);
+    format!("{name}\n{summary}")
+}
+
+fn normalize_activity_text(text: &str) -> String {
+    text.split_whitespace().collect::<Vec<_>>().join(" ") // trim ends; collapse whitespace runs to one space
+}
+
+/// Sort rank for a tool row (lower sorts first): failed, running, success, low-value success.
+fn tool_row_rank(row: &SidebarToolRow) -> u8 {
+    match row.status {
+        ToolStatus::Failed => 0,
+        ToolStatus::Running => 1,
+        ToolStatus::Success => 2 + u8::from(is_low_value_tool(&row.name)),
+    }
+}
+
+/// Sort rank for a background job status string; lower ranks are listed first.
+///
+/// Known statuses rank in the order running, failed, queued, completed, canceled;
+/// anything else ranks after all of them.
+fn task_status_rank(status: &str) -> u8 {
+    const ORDER: [&str; 5] = ["running", "failed", "queued", "completed", "canceled"];
+    let known = ORDER.iter().position(|candidate| *candidate == status);
+    // Indices into `ORDER` are 0..=4, so the cast cannot truncate; 5 marks "unknown".
+    known.map_or(5, |index| index as u8)
+}
+
+/// Whether the first whitespace-delimited word of `name` is one of the low-value tool names.
+fn is_low_value_tool(name: &str) -> bool {
+    matches!(
+        name.split_whitespace().next().unwrap_or(name),
+        "read_file" | "grep_files" | "file_search" | "find" | "checklist_update"
+    )
+}
+
+/// Trim every part, drop blanks and repeats (first occurrence wins), and join with " · ".
+fn compact_join(parts: impl IntoIterator<Item = String>) -> String {
+    let mut kept: Vec<String> = Vec::new();
+    for piece in parts.into_iter().map(|raw| raw.trim().to_owned()) {
+        if !piece.is_empty() && !kept.contains(&piece) {
+            kept.push(piece);
+        }
+    }
+    kept.join(" · ")
+}
+
+/// First line of `text` that is non-empty after trimming (returned trimmed), or `""`.
+fn first_nonempty_line(text: &str) -> &str {
+    let mut trimmed_lines = text.lines().map(str::trim);
+    let first = trimmed_lines.find(|line| !line.is_empty());
+    first.unwrap_or("")
+}
+
+fn tool_status_marker(status: ToolStatus) -> (&'static str, ratatui::style::Color) {
+    match status { // (bracketed marker text, palette color) for each tool status
+        ToolStatus::Running => ("[~]", palette::STATUS_WARNING),
+        ToolStatus::Success => ("[x]", palette::STATUS_SUCCESS),
+        ToolStatus::Failed => ("[!]", palette::STATUS_ERROR),
+    }
+}
+
+/// Format milliseconds: whole `ms` below one second, otherwise seconds to one decimal.
+fn format_duration_ms(ms: u64) -> String {
+    match ms {
+        0..=999 => format!("{ms}ms"),
+        _ => format!("{:.1}s", ms as f64 / 1000.0),
+    }
 }
 
 fn render_sidebar_subagents(f: &mut Frame, area: Rect, app: &App) {
@@ -464,11 +1007,7 @@ fn render_sidebar_subagents(f: &mut Frame, area: Rect, app: &App) {
     }
 
     let content_width = area.width.saturating_sub(4) as usize;
-
-    // Demoted to navigator (issue #128): the in-transcript DelegateCard /
-    // FanoutCard now carries the live action tree and dot-grid. The sidebar
-    // shows just count + role-mix so the user can scan parallel work at a
-    // glance and scroll to the matching transcript card for detail.
+    let usable_rows = area.height.saturating_sub(3) as usize;
     let cached_ids: std::collections::HashSet<&str> = app
         .subagent_cache
         .iter()
@@ -506,7 +1045,8 @@ fn render_sidebar_subagents(f: &mut Frame, area: Rect, app: &App) {
         foreground_rlm_running,
         role_counts,
     };
-    let lines = subagent_navigator_lines(&summary, content_width);
+    let rows = sidebar_agent_rows(app);
+    let lines = subagent_panel_lines(&summary, &rows, content_width, usable_rows.max(1));
 
     render_sidebar_section(f, area, "Agents", lines, app);
 }
@@ -525,25 +1065,104 @@ pub struct SidebarSubagentSummary {
     pub role_counts: std::collections::BTreeMap<String, usize>,
 }
 
+#[derive(Debug, Clone)]
+pub struct SidebarAgentRow { // one sub-agent entry as listed by `subagent_panel_lines`
+    pub id: String, // agent id; the detail line shows it truncated to 10 columns
+    pub name: String, // display name: nickname when set, else the agent name or the id
+    pub role: String, // agent type text, or "agent" for progress-only rows
+    pub status: String, // status word such as "running", "done", "failed"
+    pub progress: Option<String>, // latest progress text or a summary of the result
+    pub steps_taken: u32, // omitted from the detail line when zero
+    pub duration_ms: Option<u64>, // rendered with `format_duration_ms` when present
+}
+
 fn foreground_rlm_running(app: &App) -> bool {
     app.active_cell.as_ref().is_some_and(|active| {
         active.entries().iter().any(|entry| {
             matches!(
                 entry,
                 HistoryCell::Tool(ToolCell::Generic(generic))
-                    if generic.name == "rlm" && generic.status == ToolStatus::Running
+                    if matches!(
+                        generic.name.as_str(),
+                        "rlm_open" | "rlm_eval" | "rlm_configure" | "rlm_close" | "rlm"
+                    ) && generic.status == ToolStatus::Running
             )
         })
     })
 }
 
-/// Build the demoted navigator lines from a summary projection. Public
-/// for the snapshot test in this module.
-pub fn subagent_navigator_lines(
+/// Build one sidebar row per known sub-agent.
+///
+/// Agents in `subagent_cache` come first, in cache order. Their progress text is the
+/// `agent_progress` entry for the agent when one exists, otherwise a non-blank summary of
+/// the agent's result. Progress entries whose id is absent from the cache follow as
+/// placeholder rows: role `"agent"`, status `"running"`, zero steps, the id doubling as
+/// the name, and a duration measured from `agent_activity_started_at` when that is set.
+fn sidebar_agent_rows(app: &App) -> Vec<SidebarAgentRow> {
+    let mut rows: Vec<SidebarAgentRow> = Vec::new();
+    let mut cached_ids: std::collections::HashSet<&str> = std::collections::HashSet::new();
+
+    for agent in app.subagent_cache.iter() {
+        cached_ids.insert(agent.agent_id.as_str());
+        // Prefer live progress text; fall back to a non-blank summary of the final result.
+        let live_progress = app.agent_progress.get(&agent.agent_id).cloned();
+        let progress = live_progress.or_else(|| {
+            let summary = agent.result.as_deref().map(summarize_tool_output)?;
+            (!summary.trim().is_empty()).then_some(summary)
+        });
+        rows.push(SidebarAgentRow {
+            id: agent.agent_id.clone(),
+            name: agent.nickname.clone().unwrap_or_else(|| agent.name.clone()),
+            role: agent.agent_type.as_str().to_string(),
+            status: subagent_status_text(&agent.status).to_string(),
+            progress,
+            steps_taken: agent.steps_taken,
+            duration_ms: Some(agent.duration_ms),
+        });
+    }
+
+    // Progress reported for agents that are not in the cache.
+    for (id, progress) in app.agent_progress.iter() {
+        if cached_ids.contains(id.as_str()) {
+            continue;
+        }
+        // Saturate instead of wrapping if the elapsed milliseconds overflow `u64`.
+        let elapsed_ms = app.agent_activity_started_at.map(|started| {
+            u64::try_from(started.elapsed().as_millis()).unwrap_or(u64::MAX)
+        });
+        rows.push(SidebarAgentRow {
+            id: id.clone(),
+            name: id.clone(),
+            role: "agent".to_string(),
+            status: "running".to_string(),
+            progress: Some(progress.clone()),
+            steps_taken: 0,
+            duration_ms: elapsed_ms,
+        });
+    }
+
+    rows
+}
+
+fn subagent_status_text(status: &SubAgentStatus) -> &'static str {
+    match status { // sidebar status word; payloads of Interrupted/Failed are ignored here
+        SubAgentStatus::Running => "running",
+        SubAgentStatus::Completed => "done",
+        SubAgentStatus::Interrupted(_) => "interrupted",
+        SubAgentStatus::Failed(_) => "failed",
+        SubAgentStatus::Cancelled => "canceled",
+    }
+}
+
+/// Build sub-agent sidebar lines from summary + per-agent rows. Public
+/// for the snapshot tests in this module.
+pub fn subagent_panel_lines(
     summary: &SidebarSubagentSummary,
+    rows: &[SidebarAgentRow],
     content_width: usize,
+    max_rows: usize,
 ) -> Vec<Line<'static>> {
-    let mut lines: Vec<Line<'static>> = Vec::with_capacity(4);
+    let mut lines: Vec<Line<'static>> = Vec::with_capacity(max_rows.max(4));
 
     let fanout_total = summary.fanout_total.unwrap_or(0);
     if summary.cached_total == 0
@@ -599,6 +1218,45 @@ pub fn subagent_navigator_lines(
         )));
     }
 
+    for row in rows {
+        if lines.len() >= max_rows {
+            break;
+        }
+        let (marker, color) = agent_status_marker(row.status.as_str());
+        let label = format!("{marker} {} {}", row.role, row.name);
+        lines.push(Line::from(Span::styled(
+            truncate_line_to_width(&label, content_width.max(1)),
+            Style::default().fg(color),
+        )));
+
+        if lines.len() >= max_rows {
+            break;
+        }
+        let mut detail_parts = Vec::new();
+        detail_parts.push(truncate_line_to_width(&row.id, 10));
+        if row.steps_taken > 0 {
+            detail_parts.push(format!("{} step(s)", row.steps_taken));
+        }
+        if let Some(duration) = row.duration_ms {
+            detail_parts.push(format_duration_ms(duration));
+        }
+        if let Some(progress) = row.progress.as_deref()
+            && !progress.trim().is_empty()
+        {
+            detail_parts.push(summarize_tool_output(progress));
+        }
+        lines.push(Line::from(Span::styled(
+            format!(
+                "  {}",
+                truncate_line_to_width(
+                    &detail_parts.join(" · "),
+                    content_width.saturating_sub(2).max(1)
+                )
+            ),
+            Style::default().fg(palette::TEXT_DIM),
+        )));
+    }
+
     if summary.foreground_rlm_running {
         lines.push(Line::from(vec![
             Span::styled("RLM", Style::default().fg(palette::DEEPSEEK_SKY).bold()),
@@ -609,14 +1267,19 @@ pub fn subagent_navigator_lines(
         ]));
     }
 
-    lines.push(Line::from(Span::styled(
-        "(see transcript card for detail)",
-        Style::default().fg(palette::TEXT_MUTED).italic(),
-    )));
-
     lines
 }
 
+fn agent_status_marker(status: &str) -> (&'static str, ratatui::style::Color) {
+    match status { // matches the status words emitted by `subagent_status_text`
+        "running" => ("[~]", palette::STATUS_WARNING),
+        "done" => ("[x]", palette::STATUS_SUCCESS),
+        "failed" => ("[!]", palette::STATUS_ERROR),
+        "canceled" | "interrupted" => ("[-]", palette::TEXT_MUTED),
+        _ => ("[ ]", palette::TEXT_MUTED), // any other status word gets a blank marker
+    }
+}
+
 /// Session-context panel (#504) — consolidated session state overview.
 ///
 /// Surfaces at-a-glance: working set, token usage / context %, running
@@ -812,8 +1475,47 @@ fn render_sidebar_section(
 
 #[cfg(test)]
 mod tests {
-    use super::{SidebarSubagentSummary, plan_panel_empty_hint, subagent_navigator_lines};
+    use super::{
+        AutoSidebarPanel, AutoSidebarState, SidebarAgentRow, SidebarSubagentSummary,
+        SidebarWorkChecklistItem, SidebarWorkStrategyStep, SidebarWorkSummary, auto_sidebar_panels,
+        subagent_panel_lines, task_panel_lines, work_panel_empty_hint, work_panel_lines,
+    };
+    use crate::config::Config;
+    use crate::palette::PaletteMode;
+    use crate::tools::plan::StepStatus;
+    use crate::tools::todo::TodoStatus;
+    use crate::tui::active_cell::ActiveCell;
+    use crate::tui::app::{App, TaskPanelEntry, TuiOptions};
+    use crate::tui::history::{
+        ExecCell, ExecSource, GenericToolCell, HistoryCell, ToolCell, ToolStatus,
+    };
     use ratatui::text::Line;
+    use std::path::PathBuf;
+
+    fn create_test_app() -> App { // App built from fixed options and the default Config
+        let options = TuiOptions {
+            model: "deepseek-v4-pro".to_string(),
+            workspace: PathBuf::from("."),
+            config_path: None,
+            config_profile: None,
+            allow_shell: false,
+            use_alt_screen: true,
+            use_mouse_capture: false,
+            use_bracketed_paste: true,
+            max_subagents: 1,
+            skills_dir: PathBuf::from("."),
+            memory_path: PathBuf::from("memory.md"),
+            notes_path: PathBuf::from("notes.txt"),
+            mcp_config_path: PathBuf::from("mcp.json"),
+            use_memory: false,
+            start_in_agent_mode: false,
+            skip_onboarding: true,
+            yolo: false,
+            resume_session_id: None, // no session is resumed
+            initial_input: None,
+        };
+        App::new(options, &Config::default())
+    }
 
     fn lines_to_text(lines: &[Line<'static>]) -> Vec<String> {
         lines
@@ -827,57 +1529,339 @@ mod tests {
             .collect()
     }
 
-    // ---- #408 Plan panel empty-state hint ----
-
     #[test]
-    fn plan_panel_empty_hint_mentions_panels_role() {
-        // The hint replaces the old "No active plan" placeholder; it
-        // should explain what the panel tracks so the user can tell
-        // whether the panel is broken vs simply unused this turn.
-        let hint = plan_panel_empty_hint(80);
-        assert!(
-            hint.contains("update_plan"),
-            "hint should name the tool: {hint:?}"
-        );
-        assert!(
-            hint.contains("/goal") || hint.contains("goal"),
-            "hint should mention /goal: {hint:?}"
-        );
+    fn auto_sidebar_does_not_reserve_empty_work_when_other_panels_are_active() {
+        let panels = auto_sidebar_panels(AutoSidebarState {
+            work_has_content: false,
+            tasks_empty: false,
+            agents_empty: true,
+            context_enabled: false,
+        });
+
+        assert_eq!(panels, vec![AutoSidebarPanel::Tasks]);
     }
 
     #[test]
-    fn plan_panel_empty_hint_truncates_to_narrow_widths() {
-        // Width 16 forces an ellipsis; the hint should still fit.
-        let hint = plan_panel_empty_hint(16);
+    fn auto_sidebar_uses_work_as_single_empty_state() {
+        let panels = auto_sidebar_panels(AutoSidebarState {
+            work_has_content: false,
+            tasks_empty: true,
+            agents_empty: true,
+            context_enabled: false,
+        });
+
+        assert_eq!(panels, vec![AutoSidebarPanel::Work]);
+    }
+
+    #[test]
+    fn work_panel_empty_hint_stays_quiet_and_truncates() {
+        let hint = work_panel_empty_hint(10);
         assert!(
-            hint.chars().count() <= 16,
-            "hint width {} > 16: {hint:?}",
+            hint.chars().count() <= 10,
+            "hint width {} > 10: {hint:?}",
             hint.chars().count()
         );
+        assert!(
+            !hint.contains("update_plan"),
+            "hint should be quiet: {hint:?}"
+        );
     }
 
     #[test]
-    fn plan_panel_empty_hint_does_not_say_no_active_plan() {
-        // Regression guard: the placeholder used to say "No active
-        // plan" which made the panel look broken. The hint should
-        // never re-introduce that wording.
-        let hint = plan_panel_empty_hint(80);
+    fn work_panel_renders_checklist_as_primary_progress_surface() {
+        let summary = SidebarWorkSummary {
+            checklist_completion_pct: 33,
+            checklist_items: vec![
+                SidebarWorkChecklistItem {
+                    id: 1,
+                    content: "Plan it out".to_string(),
+                    status: TodoStatus::Completed,
+                },
+                SidebarWorkChecklistItem {
+                    id: 2,
+                    content: "Wire the thing".to_string(),
+                    status: TodoStatus::InProgress,
+                },
+                SidebarWorkChecklistItem {
+                    id: 3,
+                    content: "Run gates".to_string(),
+                    status: TodoStatus::Pending,
+                },
+            ],
+            strategy_explanation: Some("Keep the UI unified".to_string()),
+            strategy_steps: vec![
+                SidebarWorkStrategyStep {
+                    text: "Simplify sidebar".to_string(),
+                    status: StepStatus::Completed,
+                    elapsed: String::new(),
+                },
+                SidebarWorkStrategyStep {
+                    text: "Update prompts".to_string(),
+                    status: StepStatus::Pending,
+                    elapsed: String::new(),
+                },
+            ],
+            ..SidebarWorkSummary::default()
+        };
+
+        let text = lines_to_text(&work_panel_lines(&summary, 80, 16, PaletteMode::Dark));
+
         assert!(
-            !hint.to_ascii_lowercase().contains("no active plan"),
-            "hint regressed to old placeholder: {hint:?}"
+            text[0].starts_with("33% complete (1/3)"),
+            "checklist should lead: {text:?}"
+        );
+        assert!(
+            text.iter().any(|line| line.contains("[~] #2 Wire")),
+            "in-progress checklist item should be visible: {text:?}"
+        );
+        assert!(
+            !text.iter().any(|line| line.contains("50% complete")),
+            "strategy progress must not render as a second progress bar when checklist exists: {text:?}"
+        );
+    }
+
+    #[test]
+    fn work_panel_includes_strategy_only_when_plan_state_is_non_empty() {
+        let empty_text = lines_to_text(&work_panel_lines( // default summary: no plan state at all
+            &SidebarWorkSummary::default(),
+            80,
+            16,
+            PaletteMode::Dark,
+        ));
+        assert!(
+            !empty_text.iter().any(|line| line.contains("Strategy")),
+            "empty plan state should not show strategy: {empty_text:?}"
+        );
+
+        let summary = SidebarWorkSummary { // only the explanation is set; everything else is default
+            strategy_explanation: Some("High-level sequencing".to_string()),
+            ..SidebarWorkSummary::default()
+        };
+        let text = lines_to_text(&work_panel_lines(&summary, 80, 16, PaletteMode::Dark));
+        assert!(
+            text.iter().any(|line| line == "Strategy"),
+            "non-empty plan should show strategy label: {text:?}"
+        );
+        assert!(
+            text.iter()
+                .any(|line| line.contains("High-level sequencing")),
+            "non-empty plan explanation should render: {text:?}"
+        );
+    }
+
+    #[test]
+    fn tasks_panel_renders_active_tool_rows_before_background_empty_state() {
+        let mut app = create_test_app();
+        let mut active = ActiveCell::new();
+        active.push_tool( // one running generic tool in the active cell
+            "tool-1",
+            HistoryCell::Tool(ToolCell::Generic(GenericToolCell {
+                name: "agent_eval".to_string(),
+                status: ToolStatus::Running,
+                input_summary: Some("agent_id: agent_af58ba3a".to_string()),
+                output: None,
+                prompts: None,
+                spillover_path: None,
+                output_summary: None,
+                is_diff: false,
+            })),
+        );
+        app.active_cell = Some(active);
+        app.runtime_turn_id = Some("turn_abcdef123456".to_string());
+        app.runtime_turn_status = Some("in_progress".to_string());
+
+        let text = lines_to_text(&task_panel_lines(&app, 64, 8));
+
+        assert!(text[0].contains("turn ")); // first line carries the turn header
+        assert!(text[0].contains("in_progress"));
+        assert!(
+            text.iter().any(|line| line == "Live tools"),
+            "live section missing: {text:?}"
+        );
+        assert!(
+            text.iter().any(|line| line.contains("[~] agent_eval")),
+            "active agent_eval row missing: {text:?}"
+        );
+        assert!(
+            !text.iter().any(|line| line.contains("No active tasks")),
+            "old empty state should not render during active tools: {text:?}"
+        );
+    }
+
+    #[test]
+    fn tasks_panel_renders_recent_completed_tool_rows() {
+        let mut app = create_test_app();
+        app.history // a single successful read_file cell, with no active cell set
+            .push(HistoryCell::Tool(ToolCell::Generic(GenericToolCell {
+                name: "read_file".to_string(),
+                status: ToolStatus::Success,
+                input_summary: Some("deepseek-tui/CHANGELOG.md".to_string()),
+                output: Some("done".to_string()),
+                prompts: None,
+                spillover_path: None,
+                output_summary: Some("Reading CHANGELOG.md".to_string()),
+                is_diff: false,
+            })));
+
+        let text = lines_to_text(&task_panel_lines(&app, 64, 8));
+
+        assert!(
+            text.iter().any(|line| line == "Recent tools"),
+            "recent section missing: {text:?}"
+        );
+        assert!(
+            text.iter().any(|line| line.contains("[x] read_file")),
+            "recent read_file row missing: {text:?}"
+        );
+    }
+
+    #[test]
+    fn tasks_panel_does_not_double_count_running_shell_job_as_live_and_background() {
+        let mut app = create_test_app();
+        let mut active = ActiveCell::new();
+        active.push_tool( // live side: a running shell command in the active cell
+            "shell-1",
+            HistoryCell::Tool(ToolCell::Exec(ExecCell {
+                command: "cargo test --workspace".to_string(),
+                status: ToolStatus::Running,
+                output: None,
+                started_at: Some(std::time::Instant::now()),
+                duration_ms: None,
+                source: ExecSource::Assistant,
+                interaction: None,
+                output_summary: None,
+            })),
+        );
+        app.active_cell = Some(active);
+        app.task_panel.push(TaskPanelEntry { // background side: the same command as a running job
+            id: "job_123".to_string(),
+            status: "running".to_string(),
+            prompt_summary: "shell: cargo test --workspace".to_string(),
+            duration_ms: Some(12_000),
+        });
+
+        let text = lines_to_text(&task_panel_lines(&app, 80, 10));
+        let command_lines = text // number of rendered lines that mention the command
+            .iter()
+            .filter(|line| line.contains("cargo test --workspace"))
+            .count();
+
+        assert!(
+            text.iter().any(|line| line == "Live tools"),
+            "live shell row missing: {text:?}"
+        );
+        assert_eq!(
+            command_lines, 1,
+            "running shell command should not render as both live and background: {text:?}"
+        );
+        assert!(
+            !text.iter().any(|line| line.contains("Background jobs")),
+            "duplicate background shell row should be hidden: {text:?}"
+        );
+    }
+
+    #[test]
+    fn tasks_panel_collapses_repeated_low_value_recent_tools_after_failures() {
+        let mut app = create_test_app();
+        for path in ["src/a.rs", "src/b.rs", "src/c.rs"] {
+            app.history
+                .push(HistoryCell::Tool(ToolCell::Generic(GenericToolCell {
+                    name: "read_file".to_string(),
+                    status: ToolStatus::Success,
+                    input_summary: Some(path.to_string()),
+                    output: Some("ok".to_string()),
+                    prompts: None,
+                    spillover_path: None,
+                    output_summary: None,
+                    is_diff: false,
+                })));
+        }
+        app.history
+            .push(HistoryCell::Tool(ToolCell::Generic(GenericToolCell {
+                name: "checklist_update".to_string(),
+                status: ToolStatus::Success,
+                input_summary: Some("mark item 2 done".to_string()),
+                output: Some("updated".to_string()),
+                prompts: None,
+                spillover_path: None,
+                output_summary: None,
+                is_diff: false,
+            })));
+        app.history
+            .push(HistoryCell::Tool(ToolCell::Generic(GenericToolCell {
+                name: "grep_files".to_string(),
+                status: ToolStatus::Failed,
+                input_summary: Some("pattern: Activity Detail".to_string()),
+                output: Some("regex parse error".to_string()),
+                prompts: None,
+                spillover_path: None,
+                output_summary: Some("regex parse error".to_string()),
+                is_diff: false,
+            })));
+        // History: three read_file successes, one checklist_update, one failed grep.
+        let text = lines_to_text(&task_panel_lines(&app, 80, 12));
+        let failed_index = text
+            .iter()
+            .position(|line| line.contains("[!] grep_files"))
+            .expect("failed grep row should stay visible");
+        let read_group_index = text
+            .iter()
+            .position(|line| line.contains("[x] read_file x3"))
+            .expect("repeated read_file rows should collapse");
+        // The failure must come first and the three reads fold into one "x3" row.
+        assert!(
+            failed_index < read_group_index,
+            "failure should sort above low-value success noise: {text:?}"
+        );
+        assert_eq!(
+            text.iter()
+                .filter(|line| line.contains("[x] read_file"))
+                .count(),
+            1,
+            "read_file should render once after grouping: {text:?}"
+        );
+        assert!(
+            text.iter().any(|line| line.contains("regex parse error")),
+            "failure detail should remain visible: {text:?}"
+        );
+    }
+
+    #[test]
+    fn tasks_panel_keeps_duration_and_status_on_recent_shell_rows() {
+        let mut app = create_test_app();
+        app.history.push(HistoryCell::Tool(ToolCell::Exec(ExecCell {
+            command: "cargo check".to_string(),
+            status: ToolStatus::Success,
+            output: Some("Finished".to_string()),
+            started_at: None,
+            duration_ms: Some(1_250),
+            source: ExecSource::Assistant,
+            interaction: None,
+            output_summary: None,
+        })));
+        // A finished command with 1_250 ms recorded should be labelled "[x] run 1.2s".
+        let text = lines_to_text(&task_panel_lines(&app, 80, 8));
+
+        assert!(
+            text.iter().any(|line| line.contains("[x] run 1.2s")),
+            "status marker and duration should stay in the row label: {text:?}"
+        );
+        assert!(
+            text.iter().any(|line| line.contains("cargo check")),
+            "current command summary should stay visible: {text:?}"
         );
     }
 
     #[test]
     fn navigator_empty_state_says_no_agents() {
         let summary = SidebarSubagentSummary::default();
-        let lines = subagent_navigator_lines(&summary, 32);
+        let lines = subagent_panel_lines(&summary, &[], 32, 8);
         let text = lines_to_text(&lines);
         assert_eq!(text, vec!["No agents".to_string()]);
     }
 
     #[test]
-    fn navigator_running_state_renders_count_role_and_navigator_hint() {
+    fn agents_panel_running_state_renders_count_role_and_rows() {
         // Two general agents (one running, one done) + one explore (running).
         let mut role_counts = std::collections::BTreeMap::new();
         role_counts.insert("general".to_string(), 2);
@@ -891,7 +1875,27 @@ mod tests {
             foreground_rlm_running: false,
             role_counts,
         };
-        let text = lines_to_text(&subagent_navigator_lines(&summary, 64));
+        let rows = vec![
+            SidebarAgentRow {
+                id: "agent_a5e674dc".to_string(),
+                name: "check-docs-mcp".to_string(),
+                role: "explore".to_string(),
+                status: "running".to_string(),
+                progress: Some("step 2/3: running tool 'read_file'".to_string()),
+                steps_taken: 2,
+                duration_ms: Some(22_000),
+            },
+            SidebarAgentRow {
+                id: "agent_850aa63f".to_string(),
+                name: "check-install-docs".to_string(),
+                role: "general".to_string(),
+                status: "done".to_string(),
+                progress: Some("SUMMARY: docs checked".to_string()),
+                steps_taken: 5,
+                duration_ms: Some(21_000),
+            },
+        ];
+        let text = lines_to_text(&subagent_panel_lines(&summary, &rows, 64, 12));
         assert!(text[0].contains("2 running"), "header: {:?}", text[0]);
         assert!(text[0].contains("/ 3"), "total in header: {:?}", text[0]);
         assert!(
@@ -900,8 +1904,13 @@ mod tests {
             text[1]
         );
         assert!(
-            text.iter().any(|l| l.contains("transcript card")),
-            "navigator hint must defer to transcript: {text:?}",
+            text.iter()
+                .any(|l| l.contains("[~] explore check-docs-mcp")),
+            "running row missing: {text:?}",
+        );
+        assert!(
+            text.iter().any(|l| l.contains("step 2/3")),
+            "progress detail missing: {text:?}",
         );
     }
 
@@ -917,7 +1926,7 @@ mod tests {
             role_counts: std::collections::BTreeMap::new(),
         };
 
-        let text = lines_to_text(&subagent_navigator_lines(&summary, 64));
+        let text = lines_to_text(&subagent_panel_lines(&summary, &[], 64, 8));
 
         assert!(text[0].contains("1 running"), "header: {:?}", text[0]);
         assert!(text[0].contains("/ 6"), "fanout total: {:?}", text[0]);
@@ -936,7 +1945,7 @@ mod tests {
             foreground_rlm_running: false,
             role_counts,
         };
-        let text = lines_to_text(&subagent_navigator_lines(&summary, 32));
+        let text = lines_to_text(&subagent_panel_lines(&summary, &[], 32, 8));
         assert!(text[0].contains("1 done"), "settled header: {:?}", text[0]);
     }
 
@@ -956,7 +1965,7 @@ mod tests {
             foreground_rlm_running: false,
             role_counts,
         };
-        let lines = subagent_navigator_lines(&summary, 16);
+        let lines = subagent_panel_lines(&summary, &[], 16, 8);
         let role_line: &str = lines[1]
             .spans
             .first()
@@ -974,7 +1983,7 @@ mod tests {
             foreground_rlm_running: true,
             ..SidebarSubagentSummary::default()
         };
-        let text = lines_to_text(&subagent_navigator_lines(&summary, 64));
+        let text = lines_to_text(&subagent_panel_lines(&summary, &[], 64, 8));
 
         assert!(!text[0].contains("No agents"), "header: {:?}", text);
         assert!(
diff --git a/crates/tui/src/tui/subagent_routing.rs b/crates/tui/src/tui/subagent_routing.rs
index 914f76c7..cece93c6 100644
--- a/crates/tui/src/tui/subagent_routing.rs
+++ b/crates/tui/src/tui/subagent_routing.rs
@@ -142,7 +142,7 @@ pub(super) fn handle_subagent_mailbox(app: &mut App, seq: u64, message: &Mailbox
     };
 
     let dispatch_kind = app.pending_subagent_dispatch.as_deref();
-    let is_fanout = matches!(dispatch_kind, Some("rlm"));
+    let is_fanout = matches!(dispatch_kind, Some("rlm_open" | "rlm_eval" | "rlm"));
 
     if is_fanout {
         // Reuse the active fanout card for sibling spawns; otherwise create
@@ -154,7 +154,7 @@ pub(super) fn handle_subagent_mailbox(app: &mut App, seq: u64, message: &Mailbox
             card.claim_pending_worker(&agent_id, AgentLifecycle::Running);
             app.subagent_card_index.insert(agent_id, idx);
         } else {
-            let mut card = FanoutCard::new(dispatch_kind.unwrap_or("rlm").to_string());
+            let mut card = FanoutCard::new(dispatch_kind.unwrap_or("rlm_eval").to_string());
             card.upsert_worker(&agent_id, AgentLifecycle::Running);
             app.add_message(HistoryCell::SubAgent(SubAgentCell::Fanout(card)));
             let idx = app.history.len().saturating_sub(1);
diff --git a/crates/tui/src/tui/ui.rs b/crates/tui/src/tui/ui.rs
index 66b4c511..c4d853cb 100644
--- a/crates/tui/src/tui/ui.rs
+++ b/crates/tui/src/tui/ui.rs
@@ -102,7 +102,8 @@ use super::approval::{
     ApprovalMode, ApprovalRequest, ApprovalView, ElevationRequest, ElevationView, ReviewDecision,
 };
 use super::history::{
-    HistoryCell, ToolCell, ToolStatus, history_cells_from_message, summarize_tool_output,
+    HistoryCell, ToolCell, ToolStatus, TranscriptRenderOptions, history_cells_from_message,
+    summarize_tool_output,
 };
 use super::slash_menu::{
     apply_slash_menu_selection, try_autocomplete_slash_command, visible_slash_menu_entries,
@@ -433,6 +434,8 @@ pub async fn run_tui(config: &Config, options: TuiOptions) -> Result<()> {
         // #456: plumb the App's HookExecutor so `exec_shell` can surface
         // the configured `shell_env` hooks. Wrapped in Arc once and shared.
         hook_executor: Some(std::sync::Arc::new(app.hooks.clone())),
+        handle_store: app.runtime_services.handle_store.clone(),
+        rlm_sessions: app.runtime_services.rlm_sessions.clone(),
     };
     refresh_active_task_panel(&mut app, &task_manager).await;
 
@@ -687,7 +690,11 @@ fn active_rlm_task_entries(app: &App) -> Vec<TaskPanelEntry> {
             let HistoryCell::Tool(ToolCell::Generic(generic)) = entry else {
                 return None;
             };
-            if generic.name != "rlm" || generic.status != ToolStatus::Running {
+            if !matches!(
+                generic.name.as_str(),
+                "rlm_open" | "rlm_eval" | "rlm_configure" | "rlm_close" | "rlm"
+            ) || generic.status != ToolStatus::Running
+            {
                 return None;
             }
             let summary = generic
@@ -1074,9 +1081,17 @@ async fn run_event_loop(
                         // Note this dispatch so the next sub-agent `Started`
                         // mailbox envelope routes into the right card kind
                         // (delegate vs fanout).
-                        if matches!(name.as_str(), "agent_spawn" | "rlm" | "delegate") {
+                        if matches!(
+                            name.as_str(),
+                            "agent_open"
+                                | "agent_spawn"
+                                | "rlm_open"
+                                | "rlm_eval"
+                                | "rlm"
+                                | "delegate"
+                        ) {
                             app.pending_subagent_dispatch = Some(name.clone());
-                            if name == "rlm" {
+                            if matches!(name.as_str(), "rlm_open" | "rlm_eval" | "rlm") {
                                 // New fanout invocation — children should
                                 // group under a fresh card, not the
                                 // previous fanout's leftover.
@@ -1115,7 +1130,9 @@ async fn run_event_loop(
                         // poll. Also merge shell jobs (#373).
                         if matches!(
                             name.as_str(),
-                            "agent_spawn"
+                            "agent_open"
+                                | "agent_spawn"
+                                | "agent_close"
                                 | "agent_cancel"
                                 | "todo_write"
                                 | "task_shell_start"
@@ -1126,7 +1143,9 @@ async fn run_event_loop(
                         }
                         if matches!(
                             name.as_str(),
-                            "agent_spawn"
+                            "agent_open"
+                                | "agent_eval"
+                                | "agent_close"
                                 | "agent_cancel"
                                 | "agent_wait"
                                 | "agent_result"
@@ -2028,9 +2047,7 @@ async fn run_event_loop(
             if app.use_mouse_capture
                 && let Event::Mouse(mouse) = evt
             {
-                if app.is_loading
-                    && matches!(mouse.kind, MouseEventKind::Moved | MouseEventKind::Drag(_))
-                {
+                if should_drop_loading_mouse_motion(app, mouse) {
                     continue;
                 }
                 let events = handle_mouse_event(app, mouse);
@@ -2470,7 +2487,7 @@ async fn run_event_loop(
                 KeyCode::Char('o')
                     if key.modifiers.contains(KeyModifiers::CONTROL)
                         && app.input.is_empty()
-                        && open_thinking_pager(app) =>
+                        && open_activity_detail_pager(app) =>
                 {
                     continue;
                 }
@@ -2482,8 +2499,8 @@ async fn run_event_loop(
                 }
                 KeyCode::Char('1') if key.modifiers.contains(KeyModifiers::ALT) => {
                     if key.modifiers.contains(KeyModifiers::CONTROL) {
-                        app.set_sidebar_focus(SidebarFocus::Plan);
-                        app.status_message = Some("Sidebar focus: plan".to_string());
+                        app.set_sidebar_focus(SidebarFocus::Work);
+                        app.status_message = Some("Sidebar focus: work".to_string());
                     } else {
                         app.set_mode(AppMode::Plan);
                     }
@@ -2491,8 +2508,8 @@ async fn run_event_loop(
                 }
                 KeyCode::Char('2') if key.modifiers.contains(KeyModifiers::ALT) => {
                     if key.modifiers.contains(KeyModifiers::CONTROL) {
-                        app.set_sidebar_focus(SidebarFocus::Todos);
-                        app.status_message = Some("Sidebar focus: todos".to_string());
+                        app.set_sidebar_focus(SidebarFocus::Tasks);
+                        app.status_message = Some("Sidebar focus: tasks".to_string());
                     } else {
                         app.set_mode(AppMode::Agent);
                     }
@@ -2500,8 +2517,8 @@ async fn run_event_loop(
                 }
                 KeyCode::Char('3') if key.modifiers.contains(KeyModifiers::ALT) => {
                     if key.modifiers.contains(KeyModifiers::CONTROL) {
-                        app.set_sidebar_focus(SidebarFocus::Tasks);
-                        app.status_message = Some("Sidebar focus: tasks".to_string());
+                        app.set_sidebar_focus(SidebarFocus::Agents);
+                        app.status_message = Some("Sidebar focus: agents".to_string());
                     } else {
                         app.set_mode(AppMode::Yolo);
                     }
@@ -2512,26 +2529,23 @@ async fn run_event_loop(
                     continue;
                 }
                 KeyCode::Char('!') if key.modifiers.contains(KeyModifiers::ALT) => {
-                    app.set_sidebar_focus(SidebarFocus::Plan);
-                    app.status_message = Some("Sidebar focus: plan".to_string());
+                    app.set_sidebar_focus(SidebarFocus::Work);
+                    app.status_message = Some("Sidebar focus: work".to_string());
                     continue;
                 }
                 KeyCode::Char('@') if key.modifiers.contains(KeyModifiers::ALT) => {
-                    app.set_sidebar_focus(SidebarFocus::Todos);
-                    app.status_message = Some("Sidebar focus: todos".to_string());
-                    continue;
-                }
-                KeyCode::Char('#') if key.modifiers.contains(KeyModifiers::ALT) => {
                     app.set_sidebar_focus(SidebarFocus::Tasks);
                     app.status_message = Some("Sidebar focus: tasks".to_string());
                     continue;
                 }
-                KeyCode::Char('$') if key.modifiers.contains(KeyModifiers::ALT) => {
+                KeyCode::Char('#') if key.modifiers.contains(KeyModifiers::ALT) => {
                     app.set_sidebar_focus(SidebarFocus::Agents);
                     app.status_message = Some("Sidebar focus: agents".to_string());
                     continue;
                 }
-                KeyCode::Char('%') if key.modifiers.contains(KeyModifiers::ALT) => {
+                KeyCode::Char('$') | KeyCode::Char('%')
+                    if key.modifiers.contains(KeyModifiers::ALT) =>
+                {
                     app.set_sidebar_focus(SidebarFocus::Context);
                     app.status_message = Some("Sidebar focus: context".to_string());
                     continue;
@@ -5151,22 +5165,6 @@ async fn apply_command_result(
                 let queued = build_queued_message(app, content);
                 submit_or_steer_message(app, config, engine_handle, queued).await?;
             }
-            AppAction::Rlm {
-                prompt,
-                model,
-                child_model,
-                max_depth,
-            } => {
-                app.status_message = Some("RLM turn starting...".to_string());
-                let _ = engine_handle
-                    .send(Op::Rlm {
-                        content: prompt,
-                        model,
-                        child_model,
-                        max_depth,
-                    })
-                    .await;
-            }
             AppAction::ListSubAgents => {
                 let _ = engine_handle.send(Op::ListSubAgents).await;
             }
@@ -7688,7 +7686,7 @@ fn collect_active_tool_status(cell: &HistoryCell, snapshot: &mut ActiveToolStatu
             // status. RLM is different today: it is a foreground tool call,
             // so keep it in the live tool footer until the async RLM
             // workbench lands (#513).
-            if generic.name == "agent_spawn" {
+            if matches!(generic.name.as_str(), "agent_open" | "agent_spawn") {
                 return;
             }
             snapshot.record(format!("tool {}", generic.name), generic.status, None);
@@ -8381,6 +8379,21 @@ pub(crate) fn truncate_line_to_width(text: &str, max_width: usize) -> String {
     out
 }
 
+/// Returns true when a mouse event should be discarded during a loading turn.
+/// `Moved` is always dropped while loading; `Drag` is dropped unless a
+/// transcript-selection or scrollbar drag is in progress. Other kinds (and
+/// every event when not loading) are kept.
+fn should_drop_loading_mouse_motion(app: &App, mouse: MouseEvent) -> bool {
+    let drag_in_progress = app.viewport.transcript_selection.dragging
+        || app.viewport.transcript_scrollbar_dragging;
+    app.is_loading
+        && match mouse.kind {
+            MouseEventKind::Moved => true,
+            MouseEventKind::Drag(_) => !drag_in_progress,
+            _ => false,
+        }
+}
+
 fn handle_mouse_event(app: &mut App, mouse: MouseEvent) -> Vec<ViewEvent> {
     if app.view_stack.top_kind() == Some(ModalKind::ContextMenu) {
         if matches!(mouse.kind, MouseEventKind::Down(MouseButton::Right)) {
@@ -9003,21 +9016,63 @@ fn open_pager_for_last_message(app: &mut App) -> bool {
     true
 }
 
-/// Open a pager showing the full thinking block. Targets the cell at the
-/// current selection if it's a Thinking cell; otherwise falls back to the
-/// most recent Thinking cell across the virtual transcript (history +
-/// in-flight `active_cell`). Bound to Ctrl+O so users can read reasoning
-/// content that's been collapsed in calm-mode rendering.
-///
-/// The virtual-index lookup matters: after `ThinkingComplete` fires the
-/// finalized thinking entry sits in `active_cell` with `streaming = false`
-/// until the active cell flushes to history. During that window the
-/// transcript already renders the "thinking collapsed; press Ctrl+O for
-/// full text" affordance, so the handler must address active-cell entries
-/// or the affordance becomes a lie.
+/// Compatibility wrapper for the old test name. The user-facing Ctrl+O
+/// surface is now Activity Detail, not a thinking-only pager.
+#[cfg(test)]
 fn open_thinking_pager(app: &mut App) -> bool {
-    let selected_cell = app
+    open_activity_detail_pager(app)
+}
+
+/// Open a pager for the activity the user is most likely asking about.
+///
+/// Ctrl+O uses this path. Target order: an explicitly selected activity cell,
+/// then a live activity in the current turn, then the most recent meaningful
+/// activity across history + active cells. Tool activity is rendered through
+/// the compact live view so Activity Detail does not become a raw-output dump;
+/// Alt+V remains the direct full tool-detail surface. Always returns `true`,
+/// setting a status message instead of opening a pager when nothing matches.
+fn open_activity_detail_pager(app: &mut App) -> bool {
+    let Some(idx) = activity_target_cell_index(app) else {
+        app.status_message = Some("No activity detail available".to_string());
+        return true;
+    };
+
+    let width = app
         .viewport
+        .last_transcript_area
+        .map(|area| area.width)
+        .unwrap_or(80);
+    let Some(text) = activity_detail_text(app, idx, width) else {
+        app.status_message = Some("No activity detail available".to_string());
+        return true;
+    };
+    app.view_stack.push(PagerView::from_text(
+        "Activity Detail",
+        &text,
+        width.saturating_sub(2),
+    ));
+    true
+}
+
+/// Pick the virtual cell index that Activity Detail should show.
+///
+/// Preference order: the selected transcript cell when it is a meaningful
+/// activity, then the best entry of the active cell, then the newest
+/// meaningful activity anywhere in the virtual transcript.
+fn activity_target_cell_index(app: &App) -> Option<usize> {
+    let is_activity = |idx: usize| {
+        app.cell_at_virtual_index(idx)
+            .is_some_and(is_meaningful_activity_cell)
+    };
+
+    selected_transcript_cell_index(app)
+        .filter(|&selected| is_activity(selected))
+        .or_else(|| current_activity_cell_index(app))
+        .or_else(|| (0..app.virtual_cell_count()).rev().find(|&idx| is_activity(idx)))
+}
+
+fn selected_transcript_cell_index(app: &App) -> Option<usize> {
+    app.viewport
         .transcript_selection
         .ordered_endpoints()
         .and_then(|(start, _)| {
@@ -9028,45 +9083,226 @@ fn open_thinking_pager(app: &mut App) -> bool {
                 .and_then(|meta| meta.cell_line())
                 .map(|(cell_index, _)| cell_index)
         })
-        .filter(|&idx| {
-            matches!(
-                app.cell_at_virtual_index(idx),
-                Some(crate::tui::history::HistoryCell::Thinking { .. })
-            )
-        });
+}
 
-    let target_idx = selected_cell.or_else(|| {
-        (0..app.virtual_cell_count()).rev().find(|&idx| {
-            matches!(
-                app.cell_at_virtual_index(idx),
-                Some(crate::tui::history::HistoryCell::Thinking { .. })
-            )
-        })
-    });
+/// Locate the most relevant entry of the in-flight active cell.
+///
+/// Ranks are tried in priority order (0, then 1, then 2); within a rank the
+/// last matching entry wins. The result is a virtual index, i.e. offset by
+/// the number of finalized history cells. `None` without an active cell or
+/// when no entry has a rank.
+fn current_activity_cell_index(app: &App) -> Option<usize> {
+    let entries = app.active_cell.as_ref()?.entries();
+    let offset = app.history.len();
+    (0u8..=2).find_map(|wanted| {
+        entries
+            .iter()
+            .rposition(|cell| activity_cell_rank(cell) == Some(wanted))
+            .map(|entry_idx| offset + entry_idx)
+    })
+}
 
-    let Some(idx) = target_idx else {
-        app.status_message = Some("No thinking blocks to expand".to_string());
-        return true;
-    };
+fn is_meaningful_activity_cell(cell: &HistoryCell) -> bool {
+    activity_cell_rank(cell).is_some() // "meaningful" == has an activity rank
+}
 
-    let width = app
-        .viewport
-        .last_transcript_area
-        .map(|area| area.width)
-        .unwrap_or(80);
-    let text = {
-        let Some(cell) = app.cell_at_virtual_index(idx) else {
-            app.status_message = Some("No thinking blocks to expand".to_string());
-            return true;
-        };
-        history_cell_to_text(cell, width)
-    };
-    app.view_stack.push(PagerView::from_text(
-        "Thinking",
-        &text,
-        width.saturating_sub(2),
+/// Priority of a cell for Activity Detail: 0 = live (streaming thinking,
+/// running tool, any sub-agent), 1 = failure (failed tool, error), 2 = settled
+/// (finished thinking, successful or status-less tool). `None` for other cells.
+fn activity_cell_rank(cell: &HistoryCell) -> Option<u8> {
+    let rank = match cell {
+        HistoryCell::Thinking { streaming, .. } => if *streaming { 0 } else { 2 },
+        HistoryCell::Tool(tool) => match tool_status_for_activity(tool) {
+            Some(ToolStatus::Running) => 0,
+            Some(ToolStatus::Failed) => 1,
+            Some(ToolStatus::Success) | None => 2,
+        },
+        HistoryCell::SubAgent(_) => 0,
+        HistoryCell::Error { .. } => 1,
+        _ => return None,
+    };
+    Some(rank)
+}
+
+fn activity_detail_text(app: &App, cell_index: usize, width: u16) -> Option<String> {
+    let cell = app.cell_at_virtual_index(cell_index)?;
+    let mut sections = Vec::new();
+    // Optional header: runtime turn id (truncated to width 24) and its status.
+    if let Some(turn_id) = app.runtime_turn_id.as_ref() {
+        let status = app.runtime_turn_status.as_deref().unwrap_or("in progress");
+        sections.push(format!(
+            "Turn: {} ({status})",
+            truncate_line_to_width(turn_id, 24)
+        ));
+    }
+    // The activity label is always present; status and chunk lines are optional.
+    sections.push(format!(
+        "Activity: {}",
+        activity_cell_label(app, cell_index, cell)
     ));
-    true
+
+    if let Some(status) = activity_status_line(cell) {
+        sections.push(status);
+    }
+
+    if let Some((position, total)) = thinking_chunk_position(app, cell_index) {
+        sections.push(format!("Thinking chunk: {position} of {total}"));
+    }
+    // An empty section separates the header from the rendered cell body.
+    sections.push(String::new());
+    sections.push(activity_cell_to_text(cell, width));
+    Some(sections.join("\n"))
+}
+
+/// Short label for a cell; tools prefer their detail-target label.
+fn activity_cell_label(app: &App, cell_index: usize, cell: &HistoryCell) -> String {
+    let tool_label = || detail_target_label(app, cell_index);
+    match cell {
+        HistoryCell::Tool(_) => tool_label().unwrap_or_else(|| "tool activity".into()),
+        HistoryCell::Thinking { .. } => "thinking".into(),
+        HistoryCell::Error { .. } => "error".into(),
+        HistoryCell::SubAgent(_) => "sub-agent".into(),
+        _ => "message".into(),
+    }
+}
+
+/// Build the `Status: …` line for a cell: running/done for thinking, the
+/// status label for tools (each with a duration suffix when one is known),
+/// and the `Debug` form of the severity for errors. `None` for other cells.
+fn activity_status_line(cell: &HistoryCell) -> Option<String> {
+    let (mut line, duration) = match cell {
+        HistoryCell::Thinking {
+            streaming,
+            duration_secs,
+            ..
+        } => {
+            let state = if *streaming { "running" } else { "done" };
+            (
+                format!("Status: {state}"),
+                duration_secs.as_ref().map(|secs| format!("{secs:.1}s")),
+            )
+        }
+        HistoryCell::Tool(tool) => {
+            let status = tool_status_for_activity(tool)?;
+            (
+                format!("Status: {}", activity_status_label(status)),
+                tool_duration_for_activity(tool).map(format_activity_duration_ms),
+            )
+        }
+        HistoryCell::Error { severity, .. } => return Some(format!("Status: {:?}", severity)),
+        _ => return None,
+    };
+    if let Some(duration) = duration {
+        line.push_str(" · ");
+        line.push_str(&duration);
+    }
+    Some(line)
+}
+
+/// Collapse a tool cell into a single status for Activity Detail.
+///
+/// Exploring cells aggregate their entries: any running entry wins, then any
+/// failed entry, otherwise success. Diff previews and image views always
+/// count as success. Every current variant maps to `Some`.
+fn tool_status_for_activity(tool: &ToolCell) -> Option<ToolStatus> {
+    let status = match tool {
+        ToolCell::Exploring(cell) => {
+            let any_with = |wanted: ToolStatus| {
+                cell.entries.iter().any(|entry| entry.status == wanted)
+            };
+            if any_with(ToolStatus::Running) {
+                ToolStatus::Running
+            } else if any_with(ToolStatus::Failed) {
+                ToolStatus::Failed
+            } else {
+                ToolStatus::Success
+            }
+        }
+        ToolCell::DiffPreview(_) | ToolCell::ViewImage(_) => ToolStatus::Success,
+        ToolCell::Exec(cell) => cell.status,
+        ToolCell::PlanUpdate(cell) => cell.status,
+        ToolCell::PatchSummary(cell) => cell.status,
+        ToolCell::Review(cell) => cell.status,
+        ToolCell::Mcp(cell) => cell.status,
+        ToolCell::WebSearch(cell) => cell.status,
+        ToolCell::Generic(cell) => cell.status,
+    };
+    Some(status)
+}
+
+/// Duration in milliseconds to show next to a tool's status, if any.
+///
+/// Only exec cells carry timing. A recorded `duration_ms` wins; otherwise a
+/// running command reports the time elapsed since `started_at`, saturating at
+/// `u64::MAX`. A running command without a start time yields `None` rather
+/// than a fabricated `0ms`.
+fn tool_duration_for_activity(tool: &ToolCell) -> Option<u64> {
+    let ToolCell::Exec(cell) = tool else {
+        return None;
+    };
+    let running_since = cell.started_at.filter(|_| cell.status == ToolStatus::Running);
+    cell.duration_ms.or_else(|| {
+        running_since.map(|t| u64::try_from(t.elapsed().as_millis()).unwrap_or(u64::MAX))
+    })
+}
+
+fn activity_status_label(status: ToolStatus) -> &'static str {
+    match status {
+        ToolStatus::Running => "running",
+        ToolStatus::Success => "done", // shown as "done", not "success"
+        ToolStatus::Failed => "failed",
+    }
+}
+
+/// Render milliseconds as `NNNms` below one second, else seconds with one decimal.
+fn format_activity_duration_ms(ms: u64) -> String {
+    match ms {
+        0..=999 => format!("{ms}ms"),
+        _ => format!("{:.1}s", ms as f64 / 1000.0),
+    }
+}
+
+/// For a thinking cell, return its 1-based ordinal among all thinking cells in
+/// the virtual transcript together with the total count of thinking cells.
+/// Returns `None` when `cell_index` does not refer to a thinking cell.
+fn thinking_chunk_position(app: &App, cell_index: usize) -> Option<(usize, usize)> {
+    let is_thinking = |idx: usize| {
+        matches!(
+            app.cell_at_virtual_index(idx),
+            Some(HistoryCell::Thinking { .. })
+        )
+    };
+    if !is_thinking(cell_index) {
+        return None;
+    }
+    let thinking_indices = (0..app.virtual_cell_count()).filter(|&idx| is_thinking(idx));
+    let (mut position, mut total) = (None, 0usize);
+    for idx in thinking_indices {
+        total += 1;
+        if idx == cell_index {
+            position = Some(total);
+        }
+    }
+    position.map(|pos| (pos, total))
+}
+
+/// Render a cell as newline-joined plain text for the Activity Detail pager.
+///
+/// Tool cells are rendered with calm, low-motion transcript options; every
+/// other cell uses its regular transcript rendering.
+fn activity_cell_to_text(cell: &HistoryCell, width: u16) -> String {
+    let rendered = if matches!(cell, HistoryCell::Tool(_)) {
+        let compact = TranscriptRenderOptions {
+            calm_mode: true,
+            low_motion: true,
+            ..TranscriptRenderOptions::default()
+        };
+        cell.lines_with_options(width, compact)
+    } else {
+        cell.transcript_lines(width)
+    };
+    let plain: Vec<_> = rendered.iter().map(line_to_plain).collect();
+    plain.join("\n")
 }
 
 fn open_tool_details_pager(app: &mut App) -> bool {
@@ -9233,19 +9469,44 @@ fn selected_detail_footer_label(app: &App) -> Option<String> {
     if app.viewport.transcript_selection.is_active() {
         return None;
     }
-    let cell_index = app.detail_cell_index_for_viewport(
-        app.viewport.last_transcript_top,
-        app.viewport.last_transcript_visible.max(1),
-        app.viewport.transcript_cache.line_meta(),
-    )?;
-    let label = detail_target_label(app, cell_index)?;
+    let cell_index = activity_footer_target_cell_index(app)?;
+    let cell = app.cell_at_virtual_index(cell_index)?;
+    let label = truncate_line_to_width(&activity_cell_label(app, cell_index, cell), 30);
+    let raw_hint = if app.cell_has_detail_target(cell_index) {
+        format!(" · {} raw", tool_details_shortcut_label())
+    } else {
+        String::new()
+    };
     Some(format!(
-        "{} details: {}",
-        tool_details_shortcut_label(),
-        truncate_line_to_width(&label, 34)
+        "{} Activity: {label}{raw_hint}",
+        activity_shortcut_label()
     ))
 }
 
+/// Chooses the cell described by the Activity footer hint: the first meaningful activity cell
+/// owning a line in the `last_transcript_top` / `last_transcript_visible` window of the cached
+/// transcript lines, falling back to `activity_target_cell_index` when that window has none.
+fn activity_footer_target_cell_index(app: &App) -> Option<usize> {
+    let viewport = &app.viewport;
+    let line_meta = viewport.transcript_cache.line_meta();
+    let first = viewport
+        .last_transcript_top
+        .min(line_meta.len().saturating_sub(1));
+    let visible = viewport.last_transcript_visible.max(1);
+    let past_last = first.saturating_add(visible).min(line_meta.len());
+
+    line_meta
+        .iter()
+        .skip(first)
+        .take(past_last - first)
+        .filter_map(|meta| meta.cell_line().map(|(cell_index, _)| cell_index))
+        .find(|&cell_index| {
+            app.cell_at_virtual_index(cell_index)
+                .is_some_and(is_meaningful_activity_cell)
+        })
+        .or_else(|| activity_target_cell_index(app))
+}
+
 fn detail_target_label(app: &App, cell_index: usize) -> Option<String> {
     if let Some(detail) = app.tool_detail_record_for_cell(cell_index) {
         return Some(detail.tool_name.clone());
@@ -9322,6 +9583,10 @@ fn tool_details_shortcut_label() -> &'static str {
     }
 }
 
+fn activity_shortcut_label() -> &'static str {
+    "Ctrl+O"
+}
+
 /// Modifier predicate for the v0.8.30 family of `Alt+<letter>` transcript-
 /// nav shortcuts (`Alt+G` / `Alt+Shift+G` / `Alt+[` / `Alt+]` / `Alt+?` /
 /// `Alt+L` / `Alt+V`). Requires `Alt` and disallows `Ctrl` / `Super` so the
diff --git a/crates/tui/src/tui/ui/tests.rs b/crates/tui/src/tui/ui/tests.rs
index 78ee2d93..9c2b0157 100644
--- a/crates/tui/src/tui/ui/tests.rs
+++ b/crates/tui/src/tui/ui/tests.rs
@@ -449,6 +449,35 @@ fn mouse_selection_autocopies_on_release_without_ctrl_c() {
     );
 }
 
+#[test]
+fn loading_mouse_filter_keeps_active_drags() {
+    let mut app = create_test_app();
+    app.is_loading = true;
+
+    let moved = MouseEvent {
+        kind: MouseEventKind::Moved,
+        column: 3,
+        row: 2,
+        modifiers: KeyModifiers::NONE,
+    };
+    let drag = MouseEvent {
+        kind: MouseEventKind::Drag(MouseButton::Left),
+        column: 5,
+        row: 2,
+        modifiers: KeyModifiers::NONE,
+    };
+    // Before this test sets any drag flag, both plain motion and drag events are dropped.
+    assert!(should_drop_loading_mouse_motion(&app, moved));
+    assert!(should_drop_loading_mouse_motion(&app, drag));
+    // An active transcript-selection drag lets the drag event through.
+    app.viewport.transcript_selection.dragging = true;
+    assert!(!should_drop_loading_mouse_motion(&app, drag));
+    // With the selection drag cleared, an active scrollbar drag alone does the same.
+    app.viewport.transcript_selection.dragging = false;
+    app.viewport.transcript_scrollbar_dragging = true;
+    assert!(!should_drop_loading_mouse_motion(&app, drag));
+}
+
 #[test]
 fn jump_to_latest_button_click_scrolls_to_tail() {
     let mut app = create_test_app();
@@ -1732,7 +1761,10 @@ fn make_subagent(
     status: crate::tools::subagent::SubAgentStatus,
 ) -> crate::tools::subagent::SubAgentResult {
     crate::tools::subagent::SubAgentResult {
+        name: id.to_string(),
         agent_id: id.to_string(),
+        context_mode: "fresh".to_string(),
+        fork_context: false,
         agent_type: crate::tools::subagent::SubAgentType::General,
         assignment: crate::tools::subagent::SubAgentAssignment {
             objective: format!("objective-{id}"),
@@ -2762,6 +2794,15 @@ fn first_line_for_cell(app: &App, cell_index: usize) -> usize {
         .expect("cell should have rendered line")
 }
 
+fn pop_pager_body(app: &mut App) -> String {
+    let mut view = app.view_stack.pop().expect("pager view");
+    let pager = view
+        .as_any_mut()
+        .downcast_mut::<PagerView>()
+        .expect("top view should be pager");
+    pager.body_text()
+}
+
 #[test]
 fn detail_target_prefers_visible_tool_card() {
     let mut app = create_test_app();
@@ -2824,13 +2865,42 @@ fn detail_target_prefers_visible_tool_card() {
     app.viewport.last_transcript_visible = 6;
 
     assert_eq!(detail_target_cell_index(&app), Some(1));
-    let expected = format!("{} details: file_search", tool_details_shortcut_label());
+    let expected = format!(
+        "{} Activity: file_search · {} raw",
+        activity_shortcut_label(),
+        tool_details_shortcut_label()
+    );
     assert_eq!(
         selected_detail_footer_label(&app).as_deref(),
         Some(expected.as_str())
     );
 }
 
+#[test]
+fn activity_footer_hint_surfaces_visible_thinking_without_raw_tool_hint() {
+    let mut app = create_test_app();
+    app.history = vec![HistoryCell::Thinking {
+        content: "visible reasoning".to_string(),
+        streaming: false,
+        duration_secs: Some(1.4),
+    }];
+    app.resync_history_revisions();
+    let revisions = app.history_revisions.clone();
+    app.viewport.transcript_cache.ensure(
+        &app.history,
+        &revisions,
+        100,
+        app.transcript_render_options(),
+    );
+    app.viewport.last_transcript_top = first_line_for_cell(&app, 0);
+    app.viewport.last_transcript_visible = 4;
+
+    assert_eq!(
+        selected_detail_footer_label(&app).as_deref(),
+        Some("Ctrl+O Activity: thinking")
+    );
+}
+
 #[test]
 fn macos_option_v_glyph_is_treated_as_details_shortcut_only_on_macos() {
     let option_v = KeyEvent::new(KeyCode::Char('\u{221A}'), KeyModifiers::NONE);
@@ -3680,7 +3750,7 @@ fn orphan_during_active_keeps_subsequent_completion_routed_correctly() {
 
 #[test]
 fn tool_details_survive_active_cell_flush() {
-    // The pager / Ctrl+O resolves tool details by cell index. Flushing the
+    // Detail pagers resolve tool details by cell index. Flushing the
     // active cell must move detail records into `tool_details_by_cell` so
     // the pager keeps working after the turn settles.
     let mut app = create_test_app();
@@ -3985,7 +4055,7 @@ fn open_thinking_pager_finds_thinking_in_active_cell() {
     // `app.active_cell` with `streaming = false` until the active cell is
     // flushed to history (end-of-turn, or when an assistant text arrives).
     // During that window the transcript still renders the
-    // "thinking collapsed; press Ctrl+O for full text" affordance from
+    // "thinking collapsed; Ctrl+O opens Activity Detail" affordance from
     // `render_thinking`, so the handler must reach across the virtual
     // transcript — not just `app.history` — or the promise is a lie.
     // Regression guard for the v0.8.29 affordance/handler mismatch.
@@ -4015,6 +4085,123 @@ fn open_thinking_pager_finds_thinking_in_active_cell() {
     );
 }
 
+#[test]
+fn activity_detail_opens_selected_thinking_chunk() {
+    let mut app = create_test_app();
+    app.history = vec![
+        HistoryCell::Thinking {
+            content: "first chunk reasoning".to_string(),
+            streaming: false,
+            duration_secs: Some(0.8),
+        },
+        HistoryCell::Assistant {
+            content: "interlude".to_string(),
+            streaming: false,
+        },
+        HistoryCell::Thinking {
+            content: "second chunk reasoning".to_string(),
+            streaming: false,
+            duration_secs: Some(1.1),
+        },
+    ];
+    app.resync_history_revisions();
+    let revisions = app.history_revisions.clone();
+    app.viewport.transcript_cache.ensure(
+        &app.history,
+        &revisions,
+        100,
+        app.transcript_render_options(),
+    );
+    let line = first_line_for_cell(&app, 0);
+    let point = TranscriptSelectionPoint {
+        line_index: line,
+        column: 0,
+    };
+    app.viewport.transcript_selection.anchor = Some(point);
+    app.viewport.transcript_selection.head = Some(point);
+    // Selection anchor and head both sit on cell 0's first line; the pager must open.
+    assert!(open_activity_detail_pager(&mut app));
+    let body = pop_pager_body(&mut app);
+    // The body must describe the first thinking chunk (1 of 2) and omit the second one.
+    assert!(
+        body.contains("Activity: thinking"),
+        "activity label missing: {body}"
+    );
+    assert!(
+        body.contains("Thinking chunk: 1 of 2"),
+        "chunk position missing: {body}"
+    );
+    assert!(body.contains("first chunk reasoning"), "body: {body}");
+    assert!(
+        !body.contains("second chunk reasoning"),
+        "selected chunk should not fall through to latest thinking: {body}"
+    );
+}
+
+#[test]
+fn activity_detail_fallback_prefers_live_activity_context() {
+    let mut app = create_test_app();
+    let mut active = ActiveCell::new();
+    active.push_tool(
+        "active-1",
+        HistoryCell::Tool(ToolCell::Generic(GenericToolCell {
+            name: "agent_eval".to_string(),
+            status: ToolStatus::Running,
+            input_summary: Some("agent_id: agent_af58ba3a".to_string()),
+            output: None,
+            prompts: None,
+            spillover_path: None,
+            output_summary: None,
+            is_diff: false,
+        })),
+    );
+    app.active_cell = Some(active);
+    app.runtime_turn_id = Some("turn_live_123456789".to_string());
+    app.runtime_turn_status = Some("in_progress".to_string());
+
+    assert!(open_activity_detail_pager(&mut app));
+    let body = pop_pager_body(&mut app);
+
+    assert!(body.contains("Turn: turn_live_123456789"));
+    assert!(body.contains("Activity: tool agent_eval"));
+    assert!(body.contains("Status: running"));
+    assert!(body.contains("agent_id: agent_af58ba3a"));
+}
+
+#[test]
+fn activity_detail_fallback_uses_recent_meaningful_activity_without_full_tool_dump() {
+    let mut app = create_test_app();
+    let output = (0..20)
+        .map(|idx| format!("line {idx}"))
+        .collect::<Vec<_>>()
+        .join("\n");
+    app.history
+        .push(HistoryCell::Tool(ToolCell::Generic(GenericToolCell {
+            name: "read_file".to_string(),
+            status: ToolStatus::Success,
+            input_summary: Some("src/large.rs".to_string()),
+            output: Some(output),
+            prompts: None,
+            spillover_path: None,
+            output_summary: None,
+            is_diff: false,
+        })));
+
+    assert!(open_activity_detail_pager(&mut app));
+    let body = pop_pager_body(&mut app);
+
+    assert!(body.contains("Activity: tool read_file"));
+    assert!(body.contains("Status: done"));
+    assert!(
+        body.contains("Alt+V for details"),
+        "activity detail should stay bounded and point to Alt+V for raw detail: {body}"
+    );
+    assert!(
+        !body.contains("line 10"),
+        "middle of large raw output should not be dumped into Activity Detail: {body}"
+    );
+}
+
 #[test]
 fn engine_error_finalizes_active_thinking_block() {
     use crate::error_taxonomy::StreamError;
diff --git a/crates/tui/src/tui/views/mod.rs b/crates/tui/src/tui/views/mod.rs
index 845572ac..3a53b775 100644
--- a/crates/tui/src/tui/views/mod.rs
+++ b/crates/tui/src/tui/views/mod.rs
@@ -1044,7 +1044,7 @@ fn config_hint_for_key(key: &str) -> &'static str {
         "background_color" => "#RRGGBB | default",
         "default_mode" => "agent | plan | yolo",
         "sidebar_width" => "10..=50",
-        "sidebar_focus" => "auto | plan | todos | tasks | agents",
+        "sidebar_focus" => "auto | work | tasks | agents | context",
         "max_history" => "integer (0 allowed)",
         "default_model" => "deepseek-v4-pro | deepseek-v4-flash | deepseek-* | none/default",
         "mcp_config_path" => "path to mcp.json",
@@ -1516,7 +1516,10 @@ fn live_subagent_result(
     role: Option<&str>,
 ) -> SubAgentResult {
     SubAgentResult {
+        name: agent_id.to_string(),
         agent_id: agent_id.to_string(),
+        context_mode: "fresh".to_string(),
+        fork_context: false,
         agent_type,
         assignment: SubAgentAssignment {
             objective: summarize_tool_output(objective),
@@ -1938,7 +1941,10 @@ mod tests {
 
     fn manager_agent(id: &str, status: SubAgentStatus) -> SubAgentResult {
         SubAgentResult {
+            name: id.to_string(),
             agent_id: id.to_string(),
+            context_mode: "fresh".to_string(),
+            fork_context: false,
             agent_type: SubAgentType::Explore,
             assignment: SubAgentAssignment {
                 objective: "read the docs".to_string(),
diff --git a/crates/tui/src/tui/widgets/agent_card.rs b/crates/tui/src/tui/widgets/agent_card.rs
index e9504bef..dde137d3 100644
--- a/crates/tui/src/tui/widgets/agent_card.rs
+++ b/crates/tui/src/tui/widgets/agent_card.rs
@@ -283,7 +283,7 @@ impl FanoutCard {
         let mut lines = Vec::with_capacity(3);
         let header_status = self.aggregate_status();
         let title = format!("{} ({} workers)", self.kind, self.workers.len());
-        let family = if self.kind == "rlm" {
+        let family = if matches!(self.kind.as_str(), "rlm_open" | "rlm_eval" | "rlm") {
             ToolFamily::Rlm
         } else {
             ToolFamily::Fanout
diff --git a/crates/tui/src/tui/widgets/tool_card.rs b/crates/tui/src/tui/widgets/tool_card.rs
index 143262f1..de1ec4c0 100644
--- a/crates/tui/src/tui/widgets/tool_card.rs
+++ b/crates/tui/src/tui/widgets/tool_card.rs
@@ -69,7 +69,7 @@ pub fn tool_family_for_title(title: &str) -> ToolFamily {
 }
 
 /// Map an arbitrary tool name (as exposed to the model — e.g. `read_file`,
-/// `apply_patch`, `agent_spawn`) to a family. Used by `GenericToolCell`
+/// `apply_patch`, `agent_open`) to a family. Used by `GenericToolCell`
 /// where the `tool_family_for_title` shortcut isn't enough because every
 /// generic cell shares the title `"Tool"`.
 #[must_use]
@@ -79,8 +79,8 @@ pub fn tool_family_for_name(name: &str) -> ToolFamily {
         "edit_file" | "apply_patch" | "write_file" => ToolFamily::Patch,
         "exec_shell" | "exec_shell_wait" | "exec_shell_interact" => ToolFamily::Run,
         "grep_files" | "file_search" | "web_search" | "fetch_url" => ToolFamily::Find,
-        "agent_spawn" => ToolFamily::Delegate,
-        "rlm" => ToolFamily::Rlm,
+        "agent_open" | "agent_eval" | "agent_close" | "agent_spawn" => ToolFamily::Delegate,
+        "rlm_open" | "rlm_eval" | "rlm_configure" | "rlm_close" | "rlm" => ToolFamily::Rlm,
         _ => ToolFamily::Generic,
     }
 }
@@ -217,8 +217,8 @@ mod tests {
         assert_eq!(tool_family_for_name("apply_patch"), ToolFamily::Patch);
         assert_eq!(tool_family_for_name("exec_shell"), ToolFamily::Run);
         assert_eq!(tool_family_for_name("grep_files"), ToolFamily::Find);
-        assert_eq!(tool_family_for_name("agent_spawn"), ToolFamily::Delegate);
-        assert_eq!(tool_family_for_name("rlm"), ToolFamily::Rlm);
+        assert_eq!(tool_family_for_name("agent_open"), ToolFamily::Delegate);
+        assert_eq!(tool_family_for_name("rlm_eval"), ToolFamily::Rlm);
         assert_eq!(
             tool_family_for_name("totally_new_tool"),
             ToolFamily::Generic
diff --git a/docs/ARCHITECTURE.md b/docs/ARCHITECTURE.md
index ad39a438..7cf0eb2b 100644
--- a/docs/ARCHITECTURE.md
+++ b/docs/ARCHITECTURE.md
@@ -7,7 +7,7 @@ Current boundary note (v0.8.6):
 - Other workspace crates are being split out incrementally, but they are not yet the sole runtime source of truth.
 - The LSP subsystem (`crates/tui/src/lsp/`) is fully wired into the engine's post-tool-execution path
   (`core/engine/lsp_hooks.rs`), providing inline diagnostics after every edit_file/apply_patch/write_file.
-- The swarm agent system was removed in v0.8.5 in favour of sub-agents (agent_spawn) and RLM (rlm_query).
+- The swarm agent system was removed in v0.8.5. As of v0.8.33, the active orchestration surface consists of persistent sub-agent sessions (`agent_open` / `agent_eval` / `agent_close`) and persistent RLM sessions (`rlm_open` / `rlm_eval` / `rlm_configure` / `rlm_close`).
   No model-visible swarm tool remains in the active codebase.
 
 ## High-Level Overview
@@ -129,9 +129,9 @@ drives turns through Chat Completions.
   - `github.rs` - Read-only GitHub context and guarded comment/closure tools backed by `gh`
   - `automation.rs` - Model-visible scheduling tools over `AutomationManager`
   - `plan.rs` - Planning tools
-  - `subagent.rs` - Sub-agent spawning (replaces the removed `agent_swarm` surface)
+  - `subagent.rs` - Persistent sub-agent sessions (replaces the removed `agent_swarm` surface)
   - `spec.rs` - Tool specifications
-  - `rlm.rs` - Recursive Language Model (RLM) tool — sandboxed Python REPL with `llm_query()` helpers
+  - `rlm.rs` - Persistent Recursive Language Model (RLM) sessions — sandboxed Python REPLs with semantic helper calls and `var_handle` output support
 
 ### Extension Systems
 
diff --git a/docs/COMPETITIVE_ANALYSIS.md b/docs/COMPETITIVE_ANALYSIS.md
deleted file mode 100644
index 40007dad..00000000
--- a/docs/COMPETITIVE_ANALYSIS.md
+++ /dev/null
@@ -1,320 +0,0 @@
-# Competitive Analysis: DeepSeek TUI vs OpenCode vs Codex CLI
-
-Analysis of capabilities across three AI coding agents: OpenCode (`/Volumes/VIXinSSD/opencode`), Codex CLI (`/Volumes/VIXinSSD/codex-main`), and DeepSeek TUI (`/Volumes/VIXinSSD/deepseek-tui`).
-
-## Tool Matrix
-
-| Capability | OpenCode | Codex CLI | DeepSeek TUI |
-|---|---|---|---|
-| File read | ✅ Read | ✅ | ✅ file |
-| File write | ✅ Write | ✅ | ✅ file |
-| File edit | ✅ Edit (string replace) | ✅ apply_patch (diff format) | ✅ edit_file + apply_patch |
-| File glob | ✅ Glob | ✅ | ✅ file_search |
-| Code search | ✅ Grep + CodeSearch (Exa) | ✅ | ✅ grep_files + search |
-| Shell exec | ✅ Bash | ✅ exec/shell | ✅ shell |
-| Web fetch | ✅ WebFetch | ✅ | ✅ fetch_url |
-| Web search | ✅ WebSearch | ✅ WebSearchRequest | ✅ web_search |
-| Web browse | ❌ | ❌ | ✅ web_run |
-| LSP | ✅ Lsp (experimental) | ❌ | ✅ Post-edit diagnostics (auto) |
-| Task/todo tracking | ✅ TodoWrite | ✅ | ✅ todo_write |
-| Subagent spawn | ✅ Task | ✅ Collab/SpawnCsv | ✅ agent_spawn |
-| Skill system | ✅ Skill (multi-location discovery) | ✅ core-skills | ⚠️ Partial (.deepseek/skills/) |
-| Plan mode | ✅ plan-enter/exit | ✅ Plan mode | ✅ Plan mode |
-| User question | ✅ Question | ✅ request_user_input | ✅ user_input |
-| Patch apply | ✅ apply_patch (custom format) | ✅ apply_patch (diff format) | ✅ apply_patch |
-| Data validation | ❌ | ❌ | ✅ validate_data |
-| Finance | ❌ | ❌ | ✅ finance |
-| Git ops | Via Bash tool | ✅ git-utils | ✅ git module |
-| GitHub ops | Via Bash (gh) | ✅ | ✅ github |
-| Test running | ❌ | ✅ | ✅ test_runner |
-| Automation | ❌ | ❌ | ✅ automation |
-| Code review | ❌ | ✅ GuardianApproval | ✅ review |
-| Recall/archive | ❌ | ❌ | ✅ recall_archive |
-| Diagnostics | ❌ | ✅ | ✅ diagnostics |
-| Revert turn | ❌ | ❌ | ✅ revert_turn |
-| Image generation | ❌ | ✅ ImageGeneration | ❌ |
-| Browser use | ❌ | ✅ BrowserUse | ❌ (web_run is headless) |
-| Computer use | ❌ | ✅ ComputerUse | ❌ |
-| Realtime voice | ❌ | ✅ RealtimeConversation | ❌ |
-
----
-
-## High Priority Gaps
-
-These are capabilities that would most directly improve DeepSeek TUI's effectiveness as a coding agent.
-
-### 1. LSP Integration — ✅ IMPLEMENTED (Post-Edit Diagnostics)
-
-**Status:** Implemented in `crates/tui/src/lsp/` + `crates/tui/src/core/engine/lsp_hooks.rs`. Shipped as automatic post-edit diagnostics injection.
-
-**What DeepSeek TUI has:**
-
-- **Post-edit diagnostics hook:** After every successful `edit_file`, `write_file`, or `apply_patch`, the engine automatically requests diagnostics from the appropriate LSP server and injects compiler errors into the model's context as a synthetic message.
-- **Custom JSON-RPC stdio client** (`client.rs`): Implements the LSP wire protocol without `tower-lsp` dependency. Spawns LSP servers as child processes, handles `Content-Length` framing, routes `publishDiagnostics` notifications.
-- **Language registry** (`registry.rs`): Detects language from file extensions and maps to built-in defaults:
-  - Rust → `rust-analyzer`
-  - Go → `gopls serve`
-  - Python → `pyright-langserver --stdio`
-  - TypeScript/JavaScript → `typescript-language-server --stdio`
-  - C/C++ → `clangd`
-- **Configurable** via `[lsp]` table in `~/.deepseek/config.toml`: `enabled`, `poll_after_edit_ms` (default 5000), `max_diagnostics_per_file` (default 20), `include_warnings` (default false), and per-language `[lsp.servers]` overrides.
-- **Non-blocking by design:** Missing LSP binary, server crashes, or timeouts degrade silently to "no diagnostics this turn." Servers spawn lazily on first edit per language.
-- **Test infrastructure:** `FakeTransport` seam for CI testing without real LSP servers.
-
-**Remaining gap vs OpenCode:** OpenCode exposes LSP as a **model-callable tool** with 9 operations (goToDefinition, findReferences, hover, documentSymbol, workspaceSymbol, goToImplementation, prepareCallHierarchy, incomingCalls, outgoingCalls). DeepSeek TUI's LSP is currently passive (auto-fires after edits) rather than active (model can query on demand for navigation).
-
-**What DeepSeek TUI could still add:**
-
-A model-callable `lsp` tool in `crates/tui/src/tools/` that exposes the interactive LSP operations (goToDefinition, findReferences, hover, documentSymbol, workspaceSymbol). The transport infrastructure already exists — the gap is only the tool wrapper and the request/response cycle for LSP methods beyond `didOpen`/`didChange`/`publishDiagnostics`.
-
-### 2. Granular Permission System
-
-**What it is:** Allow/deny/ask rules keyed on tool name × file path pattern, with wildcard support, home-directory expansion, and cascading to pending requests.
-
-**Why it matters:** The current all-or-nothing approval model creates friction. Users can't express "always allow reads in `src/` but always ask for `.env` files." The ability to permanently approve a pattern reduces approval fatigue by 60–80% over a long session.
-
-**OpenCode implementation:** `packages/opencode/src/permission/index.ts` implements:
-
-- `Action`: `allow | deny | ask`
-- `Rule`: `{ permission: string, pattern: string, action: Action }`
-- `Ruleset`: ordered list of rules with last-match-wins semantics
-- Pattern expansion for `~/`, `$HOME/`
-- Wildcard matching on both permission names and path patterns
-- Reply modes: `once` (approve this one call), `always` (approve pattern forever), `reject` (deny this one)
-- Automatic cascading: an "always" reply auto-resolves pending requests for the same session
-- Distinct error types: `DeniedError` (rule-based), `RejectedError` (user said no), `CorrectedError` (user said no with feedback)
-
-Agent definitions inherit permission rulesets that can be user-overridden:
-```typescript
-build: {
-  permission: merge(defaults, { question: "allow", plan_enter: "allow" }, user),
-}
-plan: {
-  permission: merge(defaults, { edit: { "*": "deny" } }, user),
-}
-explore: {
-  permission: merge(defaults, { "*": "deny", grep: "allow", read: "allow", ... }, user),
-}
-```
-
-**What DeepSeek TUI would need:** A permission rule engine with the same dimension (tool name × path pattern × action), persistence to disk, and hook integration so approval decisions can cascade.
-
-### 3. Lifecycle Hooks
-
-**What it is:** User-defined shell commands or plugin functions that fire on specific lifecycle events — before a tool executes, after it completes, when permission is requested, at session start, when the user submits a prompt, and at session stop.
-
-**Why it matters:** Hooks are the escape hatch that lets users enforce invariants without polluting the system prompt. "Always run `cargo fmt` after writing a `.rs` file." "Warn me before any `rm -rf`." "Log every shell command to a file." They are composable, auditable, and don't consume context window tokens.
-
-**Codex CLI implementation:** `codex-rs/hooks/` defines six event types with typed request/response payloads:
-
-| Event | When it fires | Payload |
-|---|---|---|
-| `PreToolUse` | Before tool execution | tool name, input params, sandbox state |
-| `PostToolUse` | After tool execution | tool name, input, success/failure, duration, output preview |
-| `PermissionRequest` | When model requests permission | permission type, justification |
-| `SessionStart` | New session begins | session ID, cwd, source (new/resume) |
-| `UserPromptSubmit` | User sends a message | prompt text |
-| `Stop` | Session ending | reason |
-
-Each hook handler supports:
-- `matcher`: optional regex to filter which tool calls trigger the hook
-- `command`: shell command to run
-- `timeout_sec`: maximum runtime
-- `status_message`: shown to the user while the hook runs
-- `source_path` + `source`: tracks where the hook was defined (project hooks.json, user config, plugin)
-- Hooks can return `Success`, `FailedContinue`, or `FailedAbort` (blocks the operation)
-
-**What DeepSeek TUI would need:** Extend `crates/hooks/` to support the full event surface, add matcher-based filtering, and provide a `hooks.json` discovery mechanism similar to Codex CLI's.
-
-### 4. Persistent Memories
-
-**What it is:** Automatic extraction of user preferences, project conventions, and past decisions from conversations, stored as retrievable memories that are injected into new sessions.
-
-**Why it matters:** Across a long debugging session, the agent rediscovers the same facts: "this project uses Rust edition 2024," "tests run with `cargo test --workspace`," "the user prefers 4-space indentation." A memory system compounds value — each session builds on prior knowledge rather than starting from zero.
-
-**Codex CLI implementation:** The `MemoryTool` feature (experimental, behind `/experimental` menu) enables:
-- Memory generation: the model creates structured memories from conversation content
-- Memory retrieval: relevant memories are injected into new conversation context
-- The `Chronicle` feature adds passive screen-context memories via a sidecar process
-- Memories are stored in SQLite and surfaced in the TUI via `/memories` command
-
-**What DeepSeek TUI would need:** A memory extraction prompt, a vector or keyword-based retrieval system, and storage in the existing session/state infrastructure.
-
-### 5. Skill Auto-Discovery
-
-**What it is:** Automatic scanning of multiple locations for `SKILL.md` files that provide domain-specific instructions, scripts, and references. Skills are injected into the conversation on demand via a `skill` tool.
-
-**Why it matters:** Skills are how the community packages expertise. A "Rust refactoring" skill, a "Docker deployment" skill, a "GitHub Actions" skill — each provides specialized instructions without bloating the main system prompt. OpenCode's multi-location discovery means skills can be project-local, user-global, or pulled from URLs.
-
-**OpenCode implementation:** `packages/opencode/src/skill/index.ts` scans:
-
-1. `~/.claude/skills/**/SKILL.md` (Claude Code compatibility)
-2. `~/.agents/skills/**/SKILL.md` (Agents SDK compatibility)  
-3. Parent directories from cwd to workspace root for `.claude/skills/` and `.agents/skills/`
-4. Project config directories for `{skill,skills}/**/SKILL.md`
-5. User-configured paths (with `~/` expansion)
-6. User-configured URLs (pulled via discovery module)
-
-Skills are parsed for YAML frontmatter (`name`, `description`) and Markdown content. Duplicate names warn but don't error. Skills respect agent permissions — an agent can only load skills its permission ruleset allows.
-
-**What DeepSeek TUI would need:** Extend the existing `~/.deepseek/skills/` discovery to parent-directory walking, Claude Code compatibility paths, and URL-based skill sources. Add YAML frontmatter parsing.
-
----
-
-## Medium Priority Gaps
-
-These would meaningfully improve the agent experience but are less urgent.
-
-### 6. Agent Profiles with Permission Inheritance
-
-**What it is:** Named agent types (build, plan, general, explore) that inherit different tool permission sets. Users can define custom agents with specific models, temperatures, system prompts, and permission rules.
-
-**OpenCode implementation:** `packages/opencode/src/agent/agent.ts`:
-
-- `build`: full-access with ask on sensitive paths
-- `plan`: all edit tools denied, plan-exit allowed, plan file writes in `.opencode/plans/` allowed
-- `general`: subagent-only, todo-write denied
-- `explore`: read-only, grep/glob/read/bash/webfetch/websearch allowed
-- Plus hidden agents for internal tasks (compaction, title generation, summarization)
-
-Each agent carries its own `model`, `temperature`, `topP`, `prompt`, and `permission` ruleset. A `generate` function creates new agent configs dynamically from user descriptions.
-
-**What DeepSeek TUI would need:** Extend the mode system (Plan/Agent/YOLO) to support named agent profiles with per-profile tool filtering and model configuration.
-
-### 7. Shell Sandboxing
-
-**What it is:** OS-level sandbox enforcement for shell commands — network restrictions, filesystem read-only mounts, allowed/disallowed paths.
-
-**Codex CLI implementation:** `codex-rs/sandboxing/`:
-
-- macOS: Seatbelt (`sandboxing/src/seatbelt.rs`) with `.sbpl` policy files
-- Linux: bubblewrap (default) or Landlock (legacy fallback)
-- Windows: restricted token
-- Configurable sandbox policies per command
-- Integration tests can detect they're running under sandbox and early-exit
-
-**What DeepSeek TUI would need:** Extend `crates/execpolicy/` to support platform-specific sandbox enforcement. Start with macOS Seatbelt (most DeepSeek TUI users are on macOS).
-
-### 8. Tool Search / Deferred MCP Tool Exposure
-
-**What it is:** Instead of dumping all MCP tools into the system prompt (bloating context), expose a `tool_search` function that the model calls to discover relevant tools by name or description.
-
-**Codex CLI implementation:** `ToolSearch` feature (stable, default-enabled). `ToolSearchAlwaysDeferMcpTools` goes further — never exposes MCP tools directly, always requires search. This is critical when MCP servers expose hundreds of tools.
-
-**What DeepSeek TUI would need:** `tool_search_tool_regex` and `tool_search_tool_bm25` already exist as deferred tool discovery mechanisms. Extend them to gate MCP tool exposure behind on-demand search.
-
-### 9. ExecPolicy / Command Approval Rules
-
-**What it is:** A policy engine that evaluates shell commands against user-defined rules — prefix allowlists, network restrictions, pattern matching — and auto-approves, denies, or escalates.
-
-**Codex CLI implementation:** `codex-rs/execpolicy/src/`:
-
-- `Policy`: ordered list of `Rule` entries
-- `Rule`: prefix patterns (e.g., allow `cargo build*`, deny `rm *`)
-- `NetworkRule`: protocol-level network restrictions
-- `MatchOptions`: controls rule evaluation behavior
-- `Evaluation`: result of policy evaluation against a command
-
-Rules can be amended at runtime via `blocking_append_allow_prefix_rule`.
-
-**What DeepSeek TUI would need:** Extend `crates/execpolicy/` to support prefix rules, network rules, and runtime policy amendments.
-
-### 10. Dynamic Agent Generation
-
-**What it is:** On-the-fly generation of new agent configurations from natural language descriptions.
-
-**OpenCode implementation:** The `generate` function in `agent.ts` takes a description like "code reviewer that only reads files and reports issues" and returns an `{ identifier, whenToUse, systemPrompt }` object using a structured LLM call. Generated agents respect existing agent name collisions.
-
-**What DeepSeek TUI would need:** A model-callable tool or slash command that generates agent configs from descriptions and registers them for the session.
-
-### 11. Streaming Patch Events
-
-**What it is:** Structured progress events streamed while the model is generating `apply_patch` input, giving the user real-time feedback on what files will change.
-
-**Codex CLI implementation:** `ApplyPatchStreamingEvents` feature (under development) streams file-level progress as the model produces patch hunks. The `StreamingPatchParser` in `apply-patch/src/streaming_parser.rs` handles incremental parsing.
-
-**What DeepSeek TUI would need:** Extend `apply_patch.rs` to emit progress events during streaming model output.
-
----
-
-## Lower Priority Gaps
-
-Specialized features that are valuable but less critical for core coding workflow.
-
-| Capability | Where | Notes |
-|---|---|---|
-| Image Generation | Codex CLI `ImageGeneration` | Niche for coding; useful for documentation diagrams |
-| Browser Use | Codex CLI `BrowserUse` | Interactive browser automation (click, type, screenshot). DeepSeek TUI has `web_run` for headless |
-| Computer Use | Codex CLI `ComputerUse` | Full desktop automation. Desktop-app-gated |
-| Realtime Voice | Codex CLI `RealtimeConversation` | Voice conversation mode. Experimental |
-| Unified PTY Exec | Codex CLI `UnifiedExec` | Single PTY-backed shell with state snapshotting across turns |
-| Artifacts | Codex CLI `Artifact` | Native artifact rendering tools |
-| Goals | Codex CLI `Goals` | Persistent thread goals that survive compaction and session restarts |
-| Git Commit Attribution | Codex CLI `CodexGitCommit` | Model instructions for proper commit attribution |
-| CSV Agent Spawning | Codex CLI `SpawnCsv` | CSV-backed parallel agent job distribution |
-| Shell Snapshotting | Codex CLI `ShellSnapshot` | Save/restore shell state across turns |
-| Prevent Idle Sleep | Codex CLI `PreventIdleSleep` | Keep machine awake during long-running agent tasks |
-
----
-
-## Architectural Patterns
-
-### OpenCode
-
-**Client/Server Architecture:** The TUI is one client; the server can be driven remotely from a mobile app, desktop app, or web console. This decouples the agent runtime from the UI layer.
-
-**Plugin System:** `packages/opencode/src/plugin/` supports hot-loadable JS/TS plugins that add tools, models, auth providers, and chat middleware. Plugins receive a typed context with tool execution, auth, and filesystem access.
-
-**Multi-Provider:** Not coupled to any single AI provider. Models are configured with provider IDs and resolved through a provider registry. OAuth support for OpenAI Codex (ChatGPT subscription integration) in `plugin/codex.ts`.
-
-**Config Layering:** Config is loaded from multiple sources (global, project, env vars) and merged with well-defined precedence.
-
-### Codex CLI
-
-**App-Server Protocol:** `codex-rs/app-server-protocol/` defines a versioned RPC protocol (v2) between the TUI frontend and the agent backend. All new API development goes through v2 with strict naming conventions (`*Params`/`*Response`/`*Notification`, `resource/method` RPC naming).
-
-**Feature Flag System:** `codex-rs/features/` centralizes 60+ feature flags with lifecycle stages (UnderDevelopment, Experimental, Stable, Deprecated, Removed). Features have metadata (menu name, description, announcement text) and can carry custom config structs.
-
-**Bazel + Cargo Dual Build:** Codex CLI uses both Cargo (for development) and Bazel (for CI/release). The `find_resource!` macro and `cargo_bin()` helper abstract over runfile differences.
-
-**Snapshot Testing:** `codex-rs/tui/` extensively uses `insta` for UI snapshot tests. Any UI change requires corresponding snapshot coverage.
-
-**Core Modularity:** Explicit resistance to adding code to `codex-core`. New functionality goes into purpose-built crates (`codex-apply-patch`, `codex-memories`, `codex-sandboxing`) rather than growing the core crate.
-
-### DeepSeek TUI
-
-**RLM (Recursive Language Model):** Unique in this space. A sandboxed Python REPL where a sub-LLM can call helpers (`llm_query`, `llm_query_batched`, `rlm_query`) for batch processing, chunking, and recursive critique. Neither competitor has an equivalent.
-
-**Durable Tasks:** Restart-aware persistent task objects with evidence tracking (gate runs, PR attempts, timeline). Designed for long-running autonomous work that survives restarts.
-
-**Automations:** Scheduled recurring tasks with cron-style RRULE recurrence. Unique among the three.
-
----
-
-## What DeepSeek TUI Already Excels At
-
-- **LSP diagnostics** — automatic post-edit compiler/linter feedback injected into model context; neither competitor has passive LSP integration (OpenCode's is model-callable only)
-- **RLM** — batch/bulk LLM processing in a Python sandbox; no equivalent in either competitor
-- **Finance** — live stock/crypto quotes; unique in this space
-- **Automations** — scheduled recurring tasks with cron rules
-- **Durable tasks** — restart-aware with evidence tracking and gate verification
-- **Turn revert** — undo workspace changes per turn via side-git snapshots
-- **Data validation** — JSON/TOML validation tool
-- **Web run** — headless browser interaction (Codex CLI has Browser Use but it's desktop-app-gated)
-- **Parallel tool execution** — explicitly modeled as infrastructure
-- **Git/GitHub operations** — comprehensive git module with blame, log, diff, status plus full GitHub API via gh
-- **Project map** — high-level project structure generation
-
----
-
-## Recommended Implementation Order
-
-1. ~~**LSP tool**~~ — ✅ **DONE** (post-edit diagnostics). Remaining: model-callable navigation tool.
-2. **Path-pattern permissions** — reduces approval fatigue by 60–80% over long sessions.
-3. **Persistent memory** — compounds value across sessions; foundational for long-running projects.
-4. **Pre/Post-tool-use hooks** — escape hatch for user-defined guardrails without system prompt bloat.
-5. **Skill auto-discovery** — enables community skill ecosystem and Claude Code compatibility.
-6. **LSP navigation tool** — expose goToDefinition/findReferences/hover as model-callable tool. Infrastructure exists; add request/response methods + tool wrapper.
-7. **Agent profiles** — named agent types with model/permission inheritance.
-8. **Tool search for MCP** — keeps context window manageable when connecting to MCP servers with many tools.
-9. **Shell sandboxing** — security improvement, starting with macOS Seatbelt.
diff --git a/docs/CONFIGURATION.md b/docs/CONFIGURATION.md
index 970e8424..5e9cb27a 100644
--- a/docs/CONFIGURATION.md
+++ b/docs/CONFIGURATION.md
@@ -316,6 +316,10 @@ Common settings keys:
   context panel, `/cost`, `/tokens`, and long-turn notification summaries. The
   aliases `rmb` and `yuan` normalize to `cny`.
 - `default_mode` (agent, plan, yolo; legacy `normal` is accepted and normalized to `agent`)
+- `sidebar_focus` (`auto`, `work`, `tasks`, `agents`, `context`; default
+  `auto`): selects the right sidebar focus. `auto` prioritizes Work, Tasks,
+  Agents, then optional Context, and uses Work as the single quiet empty state.
+  Legacy `plan` and `todos` values are accepted and normalized to `work`.
 - `max_history` (number of submitted input history entries; cleared drafts are
   also kept locally for composer history search)
 - `default_model` (model name override)
@@ -392,8 +396,8 @@ If you are upgrading from older releases:
 - `managed_config_path` (string, optional): managed config file loaded after user/env config.
 - `requirements_path` (string, optional): requirements file used to enforce allowed approval/sandbox values.
 - `max_subagents` (int, optional): defaults to `10` and is clamped to `1..=20`.
-- `subagents.*` (optional): per-role/type model defaults for `agent_spawn` and
-  related sub-agent tools. Explicit tool `model` values win, then role/type
+- `subagents.*` (optional): per-role/type model defaults for `agent_open` and
+  related persistent sub-agent sessions. Explicit tool `model` values win, then role/type
   overrides, then the parent runtime model. Supported convenience keys are
   `default_model`, `worker_model`, `explorer_model`, `awaiter_model`,
   `review_model`, `custom_model`, and `max_concurrent`. The
diff --git a/docs/KEYBINDINGS.md b/docs/KEYBINDINGS.md
index 3db301f1..e717671e 100644
--- a/docs/KEYBINDINGS.md
+++ b/docs/KEYBINDINGS.md
@@ -16,6 +16,7 @@ Bindings are not (yet) user-configurable — tracked for a future release (#436,
 | `Shift-Tab`          | Cycle reasoning effort: off → high → max → off                 |
 | `Ctrl-R`             | Open the resume-session picker                                 |
 | `Ctrl-L`             | Refresh / clear the screen                                     |
+| `Ctrl-O`             | Open Activity Detail for the selected, live, or most recent activity when the composer is empty |
 | `Ctrl-Shift-E` / `Cmd-Shift-E` | Toggle the file-tree sidebar                          |
 | `Esc`                | Close topmost modal · cancel slash menu · dismiss toast        |
 
@@ -40,7 +41,7 @@ Editing the message you're about to send.
 | `Ctrl-S`                    | Stash current draft (`/stash list`, `/stash pop` to recover) |
 | `Alt-R`                    | Search prompt history (Alt-R to exit)                  |
 | `Tab`                       | Slash-command / `@`-mention completion (popup-aware)    |
-| `Ctrl-O`                    | Open external editor for the composer draft             |
+| `Ctrl-O`                    | Open external editor for the composer draft when the composer has focus |
 
 ### `@` mentions
 
@@ -69,7 +70,7 @@ When `[memory] enabled = true`, typing `# foo` and pressing `Enter` appends `foo
 |----------------------|-----------------------------------------------------|
 | `↑` / `↓` / `j` / `k`| Move selection                                     |
 | `Enter`              | Activate the selected item (open / focus / cancel) |
-| `Tab`                | Cycle to next sidebar panel (Files → Tasks → Agents → Todos) |
+| `Tab`                | Cycle to next sidebar panel (Work → Tasks → Agents → Context) |
 | `Esc`                | Return focus to composer                           |
 
 ## Slash-command palette (after `Ctrl-K` or typing `/`)
diff --git a/docs/MODES.md b/docs/MODES.md
index cf78af74..4b996166 100644
--- a/docs/MODES.md
+++ b/docs/MODES.md
@@ -18,7 +18,7 @@ Run `/mode` to open the mode picker, or switch directly with `/mode agent`,
 - **Agent**: multi-step tool use. Approvals for shell and paid tools (file writes are allowed without a prompt).
 - **YOLO**: enables shell + trust mode and auto-approves all tools. Use only in trusted repos.
 
-All three modes have access to the `rlm` tool. Inside its Python REPL, `llm_query_batched` fans out 1–16 cheap parallel child calls pinned to `deepseek-v4-flash`. The model reaches for it when work is decomposable.
+All three modes have access to persistent RLM sessions through `rlm_open`, `rlm_eval`, `rlm_configure`, and `rlm_close`. Inside an RLM Python REPL, `sub_query_batch` fans out 1–16 cheap parallel child calls pinned to `deepseek-v4-flash`. The model reaches for an RLM session when work is too large or repetitive for the parent transcript.
 
 ## Compatibility Notes
 
diff --git a/docs/SUBAGENTS.md b/docs/SUBAGENTS.md
index 25482dfb..053a88b6 100644
--- a/docs/SUBAGENTS.md
+++ b/docs/SUBAGENTS.md
@@ -1,23 +1,21 @@
 # Sub-Agents
 
-Sub-agents are background instances of the agent loop. The parent
-agent spawns one with a focused task, gets back an `agent_id`
-immediately, and continues working while the sub-agent runs to
-completion. Sub-agents inherit the parent's tool registry by default
-and run with `CancellationToken::child_token()`, so cancelling the
-parent cancels every descendant.
+Sub-agents are persistent background instances of the agent loop. The parent
+opens one with a focused task, gets back an `agent_id` and session name
+immediately, and continues working while the sub-agent runs to completion.
+Sub-agents inherit the parent's tool registry by default and run with
+`CancellationToken::child_token()`, so cancelling the parent cancels every
+descendant.
 
-This doc covers the role taxonomy. For the orchestration tool surface
-(`agent_spawn` / `agent_wait` / `agent_result` / `agent_cancel` /
-`agent_list` / `agent_send_input` / `agent_resume` / `agent_assign`)
-see `prompts/base.md` "Sub-Agent Strategy" and the in-line tool
-descriptions.
+This doc covers the role taxonomy. The active orchestration surface is
+`agent_open`, `agent_eval`, and `agent_close`; see `prompts/base.md`
+"Sub-Agent Strategy" and the in-line tool descriptions.
 
 ## Role taxonomy
 
-The `agent_type` field on `agent_spawn` selects a system-prompt
-posture for the child. Each role is a distinct stance toward the
-work — not just a different label.
+The `type` field on `agent_open` selects a system-prompt posture for the child
+(`agent_type` is accepted as a compatibility alias). Each role is a distinct
+stance toward the work — not just a different label.
 
 | Role          | Stance                                 | Writes? | Runs shell? | Typical use                                  |
 |---------------|----------------------------------------|---------|-------------|----------------------------------------------|
@@ -32,23 +30,22 @@ work — not just a different label.
 Each role's full system prompt lives in
 `crates/tui/src/tools/subagent/mod.rs` (search for
 `*_AGENT_PROMPT`). The prompt prefix loads automatically when the
-child agent boots; the parent's spawn prompt becomes the first
+child agent boots; the parent's assignment prompt becomes the first
 turn's user message.
 
 ## Context forking
 
-`agent_spawn` starts fresh by default: the child gets its role prompt
-plus the task you pass. Use `fork_context: true` when the child should
-continue from the parent's current request prefix instead. In fork
-mode the child request keeps the parent's system prompt and message
-history byte-identical, appends a structured state snapshot, then
-adds the sub-agent role instructions and task at the tail. That keeps
-DeepSeek prefix-cache reuse high while giving the child the context
-needed for continuation, review, summarization, or compaction work.
+`agent_open` starts fresh by default: the child gets its role prompt plus the
+task you pass. Use `fork_context: true` when the child should continue from
+the parent's current request prefix instead. In fork mode the runtime keeps the
+parent prefill/prompt prefix byte-identical where available, appends a
+structured state snapshot, then adds the sub-agent role instructions and task
+at the tail. That preserves DeepSeek prefix-cache reuse while giving the child
+the context needed for continuation, review, summarization, or compaction work.
 
-Use fresh spawns for independent exploration. Use forked spawns when
-the task depends on decisions, files, todos, or plan state already in
-the parent transcript.
+Use fresh sessions for independent exploration. Use forked sessions when the
+task depends on decisions, files, todos, or plan state already in the parent
+transcript.
 
 ### When to pick which role
 
@@ -56,8 +53,12 @@ the parent transcript.
   look", "design", or "verify". This is the right default; reach for
   a more specific role only when the posture matters.
 - **`explore`** — when the parent needs evidence before deciding what
-  to do next. Explorers are cheap and fast; spawn 2–3 in parallel
+  to do next. Explorers are cheap and fast; open 2–3 in parallel
   for independent regions.
+  They should orient first: confirm the project root, read relevant
+  `AGENTS.md`/`README.md` guidance in unfamiliar trees, search only the
+  likely scope, and return `path:line-range` evidence instead of a narrative
+  tour. The role name to use is `explore` or `explorer`.
 - **`plan`** — when the parent has an objective but no executable
   decomposition. Planners write artifacts (`update_plan` rows,
   `checklist_write` entries) but don't carry them out.
@@ -74,7 +75,7 @@ the parent transcript.
   candidates under RISKS.
 - **`custom`** — only when the parent needs to constrain the tool
   set explicitly. Pass the allowlist via the `allowed_tools` field
-  on `agent_spawn`.
+  on `agent_open`.
 
 ### Aliases
 
@@ -98,9 +99,9 @@ the next turn.
 
 The dispatcher caps concurrent sub-agents at 10 by default
 (configurable via `[subagents].max_concurrent` in `~/.deepseek/config.toml`,
-hard ceiling 20). When the parent hits the cap, `agent_spawn` returns
-an error with the cap value; the parent should `agent_wait` for
-completion or `agent_cancel` to free a slot before retrying.
+hard ceiling 20). When the parent hits the cap, `agent_open` returns
+an error with the cap value; the parent should use `agent_eval` to wait for
+completion or `agent_close` to free a slot before retrying.
 
 The cap counts only **running** agents — completed / failed /
 cancelled records persist for inspection but don't occupy a slot.
@@ -109,7 +110,7 @@ restart) also don't count against the cap.
 
 ## Lifecycle
 
-Each spawn produces a record that progresses through:
+Each opened session produces a record that progresses through:
 
 ```
 Pending → Running → (Completed | Failed(reason) | Cancelled | Interrupted(reason))
@@ -118,20 +119,18 @@ Pending → Running → (Completed | Failed(reason) | Cancelled | Interrupted(re
 `Interrupted` fires when the manager detects a `Running` agent
 whose task handle is gone — typically after a process restart that
 loaded the agent from `~/.deepseek/subagents.v1.json`. The parent
-can `agent_resume` to attempt continuation or treat it as a
+can open a replacement session with the same assignment or treat it as a
 terminal state.
 
 ### Session boundaries (#405)
 
 Each `SubAgentManager` instance assigns itself a fresh
-`session_boot_id` on construction. Every spawn stamps the agent
+`session_boot_id` on construction. Every new session stamps the agent
 with that id; the persisted state file carries it across restarts.
 
-`agent_list` defaults to **current-session only**: prior-session
-agents that aren't still running are filtered out. Pass
-`include_archived=true` to surface every record, with the
-`from_prior_session: true` flag so the model can tell archived
-records apart from live ones.
+`agent_eval` and the sidebar/status projections focus on current-session
+agents by default. Prior-session agents that are not still running are treated
+as archived records so the model does not mistake stale work for live work.
 
 Records that loaded from a pre-#405 persisted state file (no
 `session_boot_id` field) classify as prior-session because the
diff --git a/docs/TOOL_SURFACE.md b/docs/TOOL_SURFACE.md
index da3547dc..6b7ab033 100644
--- a/docs/TOOL_SURFACE.md
+++ b/docs/TOOL_SURFACE.md
@@ -15,7 +15,7 @@ chosen over the available shell equivalent. Companion to `crates/tui/src/prompts
   for the same backing operation are a model trap — the LLM will alternate
   between them and the cache hit rate suffers.
 
-## Current surface (v0.7.5)
+## Current surface (v0.8.33)
 
 ### File operations
 
@@ -27,6 +27,7 @@ chosen over the available shell equivalent. Companion to `crates/tui/src/prompts
 | `edit_file` | Search-and-replace inside a single file. Cheaper than a full rewrite. |
 | `apply_patch` | Apply a unified diff. The right tool for multi-hunk edits. |
 | `retrieve_tool_result` | Read summaries or slices of prior large tool outputs spilled to `~/.deepseek/tool_outputs/`; use `summary`, `head`, `tail`, `lines`, or `query` instead of replaying the whole result. |
+| `handle_read` | Read bounded projections from `var_handle` payloads held by live tool environments. This is the foundation for RLM sessions, sub-agent transcripts, and other large symbolic payloads. |
 
 ### Search
 
@@ -137,18 +138,57 @@ Large logs and command outputs should be artifacts with compact summaries in the
 
 ### Sub-agents
 
-`agent_spawn` plus the supporting tools (`agent_result` / `wait` / `send_input` /
-`agent_assign` / `agent_cancel` / `resume_agent` / `agent_list`).
+v0.8.33 begins moving large tool outputs toward symbolic handles: tools return
+small `var_handle` objects, and `handle_read` retrieves bounded slices, counts,
+or JSON projections from the backing environment. This keeps the parent
+transcript small while preserving a recovery path to the full payload.
+
+The active model-facing sub-agent surface is persistent and intentionally small:
+
+| Tool | Niche |
+|---|---|
+| `agent_open` | Open a named sub-agent session for independent work. Returns a session projection immediately so the parent can keep coordinating. |
+| `agent_eval` | Send follow-up input, block for completion, or fetch the current projection/transcript handle for an existing session. |
+| `agent_close` | Cancel or release a sub-agent session by name or id. |
+
 See `agent.txt` for the delegation protocol and
 [`SUBAGENTS.md`](SUBAGENTS.md) for the role taxonomy
 (`general` / `explore` / `plan` / `review` / `implementer` /
 `verifier` / `custom`).
 
-`agent_spawn` defaults to a fresh child conversation. Pass
-`fork_context: true` for continuation-style work that should inherit the
-parent's system prompt and message prefix for DeepSeek prefix-cache reuse.
-The deprecated `delegate_to_agent` compatibility wrapper routes through
-`agent_spawn` and defaults `fork_context` to true.
+`agent_open` defaults to a fresh child conversation. Pass
+`fork_context: true` for continuation-style work or multi-perspective reviews
+that should inherit the parent's context. In fork mode, the runtime preserves
+the parent prefill/prompt prefix byte-identically where available so DeepSeek's
+prefix cache can be reused, then appends the child role instructions and task.
+
+### Recursive LM sessions
+
+RLM is now persistent as well:
+
+| Tool | Niche |
+|---|---|
+| `rlm_open` | Open a named Python REPL over a file, inline content, or URL. |
+| `rlm_eval` | Run bounded Python against that session, using deterministic code and in-REPL semantic helpers such as `sub_query_batch`. |
+| `rlm_configure` | Adjust output feedback, child-query timeout/depth, and session-sharing settings. |
+| `rlm_close` | Shut down the Python runtime and return final session stats. |
+
+Large RLM outputs should come back as `var_handle`s. Use `handle_read` for
+bounded text slices, line ranges, counts, or JSONPath projections instead of
+replaying the full value into the parent transcript.
+
+### Session relay
+
+`/relay [focus]` asks the current agent to write `.deepseek/handoff.md` as a
+compact `# Session relay` artifact for the next thread. The `handoff.md`
+filename is kept for compatibility with existing prompt loading and older
+sessions; the user-facing name for the feature is relay / 接力.
+
+Aliases: `/batonpass`, `/接力`.
+
+Use it before a long break, compaction, or moving work to a fresh session. The
+relay should preserve the goal, current Work checklist item, changed files,
+decisions, verification state, and one concrete next action.
 
 ### Parallel fan-out: cost-class caps
 
@@ -157,55 +197,73 @@ reflect very different cost classes:
 
 | Tool | What each child does | Wall-clock | Token cost | Cap |
 |---|---|---|---|---|
-| `agent_spawn` | Full sub-agent loop (planning, tool calls, multi-turn streaming, can spawn children) | minutes | thousands of tokens | 10 in flight by default (`[subagents].max_concurrent`, hard ceiling 20) |
-| `rlm` helper `llm_query_batched` | One-shot non-streaming Chat Completions calls pinned to `deepseek-v4-flash` | seconds | ~hundreds of tokens | 16 per call |
+| `agent_open` | Full sub-agent loop (planning, tool calls, multi-turn streaming, can open children) | minutes | thousands of tokens | 10 in flight by default (`[subagents].max_concurrent`, hard ceiling 20) |
+| `rlm_eval` helper `sub_query_batch` | One-shot non-streaming Chat Completions calls pinned to `deepseek-v4-flash` inside a live RLM session | seconds | ~hundreds of tokens | 16 per call |
 
 The caps appear in each tool's description and error messages so the model
 (and the user) can choose the right tool for the job. If one sub-agent is
-enough but you need parallel lookups, prefer `rlm` with `llm_query_batched`; if each task needs
-its own tool-carrying agent loop, use `agent_spawn` (and cancel completed
-ones to free slots).
+enough but you need parallel semantic lookups over the same loaded context,
+prefer `rlm_eval` with `sub_query_batch`; if each task needs its own
+tool-carrying agent loop, use `agent_open` and close completed sessions to free
+slots.
 
-## Recently consolidated (v0.5.1)
+## Removed legacy aliases and surfaces
 
-Removed from the prompt as duplicates of equivalent tools (the underlying
-dispatchers still resolve them, so existing sessions don't break — they just
-no longer pollute the model's tool list):
+v0.8.33 removes the old model-facing sub-agent fan-out surface from active
+prompting and tool catalogs. Do not use these names in new active guidance:
+`agent_spawn`, `agent_wait`, `agent_result`, `agent_cancel`,
+`agent_send_input`, `agent_assign`, `agent_resume`, `agent_list`,
+`spawn_agent`, `delegate_to_agent`, `send_input`, and `close_agent`.
 
-- `spawn_agent` → use `agent_spawn`.
-- `close_agent` → use `agent_cancel`.
-- `assign_agent` → use `agent_assign`.
+The old one-shot `rlm` model-facing tool is also replaced by persistent
+`rlm_open` / `rlm_eval` / `rlm_configure` / `rlm_close` sessions.
 
-## Deprecation schedule (v0.6.2 → v0.8.0)
-
-The alias tools below still execute successfully but now attach a
-`_deprecation` block to every result they return. Models should migrate to
-the canonical name before v0.8.0, when the aliases will be removed.
-
-| Deprecated alias | Canonical name | Warning since | Removal |
-|---|---|---|---|
-| `spawn_agent` | `agent_spawn` | v0.6.2 | v0.8.0 |
-| `delegate_to_agent` | `agent_spawn` | v0.6.2 | v0.8.0 |
-| `close_agent` | `agent_cancel` | v0.6.2 | v0.8.0 |
-| `send_input` | `agent_send_input` | v0.6.2 | v0.8.0 |
-
-The `_deprecation` block shape:
+Historical compatibility results may include a `_deprecation` block shaped
+like this:
 
 ```json
 {
   "_deprecation": {
     "this_tool": "spawn_agent",
-    "use_instead": "agent_spawn",
-    "removed_in": "0.8.0",
-    "message": "Tool 'spawn_agent' is deprecated; switch to 'agent_spawn' before v0.8.0."
+    "use_instead": "agent_open",
+    "removed_in": "0.8.33",
+    "message": "Tool 'spawn_agent' is deprecated; switch to 'agent_open'."
   }
 }
 ```
 
-This block is merged into the tool result's `metadata` object alongside any
-other metadata keys (e.g. `status`, `timed_out`) so it does not displace
-existing metadata.  A one-line deprecation warning is also emitted to the
-audit log at `tracing::warn` level every time an alias is invoked.
+This is a legacy/compatibility note, not the active recommended surface.
+
+## Release smoke: verify the live names
+
+When validating a release, verify the model-visible registry names directly.
+Do not grep for internal handler function names; those are allowed to drift
+while the registry contract stays stable.
+
+Version smoke:
+
+```bash
+deepseek --version
+deepseek-tui --version
+```
+
+Tool-surface smoke:
+
+```bash
+rg -n '"handle_read"|"rlm_open"|"rlm_eval"|"rlm_configure"|"rlm_close"|"agent_open"|"agent_eval"|"agent_close"' crates/tui/src
+rg -n 'handle_read|rlm_open|rlm_eval|rlm_configure|rlm_close|agent_open|agent_eval|agent_close' docs crates/tui/src/prompts crates/tui/src/tools
+```
+
+The canonical v0.8.33 live names are:
+
+- `handle_read`
+- `rlm_open`, `rlm_eval`, `rlm_configure`, `rlm_close`
+- `agent_open`, `agent_eval`, `agent_close`
+
+Neither the registry nor active prompts/docs should advertise the legacy
+one-shot names `agent_spawn`, `agent_wait`, `agent_result`, or the old
+foreground `rlm` tool. Legacy/removal notes, historical changelog entries, and
+compatibility code may still mention them.
 
 ## Why we don't ship a single `bash` tool
 
diff --git a/web/lib/community-agent-tasks.ts b/web/lib/community-agent-tasks.ts
index 00c96d78..2847d779 100644
--- a/web/lib/community-agent-tasks.ts
+++ b/web/lib/community-agent-tasks.ts
@@ -1,6 +1,6 @@
 import { fetchFeed, fetchRepoStats } from "@/lib/github";
 import { curate } from "@/lib/deepseek";
-import { putDispatch } from "@/lib/kv";
+import { putDispatchWithKv } from "@/lib/kv";
 import {
   agentChat,
   TRIAGE_PROMPT,
@@ -32,6 +32,8 @@ export interface AgentEnv {
   MAINTAINER_GITHUB_PAT?: string;
 }
 
+const CRON_STATUS_TTL = 60 * 60 * 24 * 14;
+
 function dsEnv(env: AgentEnv): DeepSeekEnv {
   return {
     baseUrl: env.DEEPSEEK_BASE_URL ?? process.env.DEEPSEEK_BASE_URL,
@@ -49,10 +51,29 @@ export async function runCurate(env: AgentEnv): Promise<Record<string, unknown>>
       fetchFeed(env.GITHUB_TOKEN, 30),
     ]);
     const dispatch = await curate(env.DEEPSEEK_API_KEY, stats, feed, dsEnv(env));
-    await putDispatch(dispatch);
-    return { ok: true, headline: dispatch.headline };
+    await putDispatchWithKv(env.CURATED_KV, dispatch);
+    await env.CURATED_KV?.put(
+      "cron:curate:last",
+      JSON.stringify({
+        ok: true,
+        generatedAt: dispatch.generatedAt,
+        headline: dispatch.headline,
+      }),
+      { expirationTtl: CRON_STATUS_TTL }
+    );
+    return { ok: true, headline: dispatch.headline, stored: env.CURATED_KV ? "kv" : "memory" };
   } catch (e) {
-    return { ok: false, error: String(e) };
+    const error = String(e);
+    await env.CURATED_KV?.put(
+      "cron:curate:last",
+      JSON.stringify({
+        ok: false,
+        generatedAt: new Date().toISOString(),
+        error,
+      }),
+      { expirationTtl: CRON_STATUS_TTL }
+    );
+    return { ok: false, error };
   }
 }
 
diff --git a/web/lib/facts.generated.ts b/web/lib/facts.generated.ts
index e42fc4f1..c509eecf 100644
--- a/web/lib/facts.generated.ts
+++ b/web/lib/facts.generated.ts
@@ -18,8 +18,8 @@ export interface RepoFacts {
 }
 
 export const FACTS: RepoFacts = {
-  "generatedAt": "2026-05-12T19:02:49.213Z",
-  "version": "0.8.32",
+  "generatedAt": "2026-05-12T22:56:03.599Z",
+  "version": "0.8.33",
   "crates": [
     "agent",
     "app-server",
@@ -90,7 +90,7 @@ export const FACTS: RepoFacts = {
   ],
   "defaultModel": "deepseek-v4-pro",
   "nodeEngines": ">=18",
-  "toolCount": 64,
+  "toolCount": 68,
   "license": "MIT",
   "latestRelease": null
 };
diff --git a/web/lib/kv.ts b/web/lib/kv.ts
index f2bfcd4c..c6048b3a 100644
--- a/web/lib/kv.ts
+++ b/web/lib/kv.ts
@@ -6,7 +6,7 @@ import type { CuratedDispatch } from "./types";
 
 const MEM = new Map<string, string>();
 
-interface KVNamespace {
+export interface KVNamespace {
   get(key: string): Promise<string | null>;
   put(key: string, value: string, opts?: { expirationTtl?: number }): Promise<void>;
   list(opts?: { prefix?: string; limit?: number }): Promise<{ keys: { name: string }[] }>;
@@ -53,9 +53,13 @@ export async function getDispatch(): Promise<CuratedDispatch | null> {
 
 export async function putDispatch(d: CuratedDispatch): Promise<void> {
   const env = await getEnv();
+  await putDispatchWithKv(env.CURATED_KV, d);
+}
+
+export async function putDispatchWithKv(kv: KVNamespace | undefined, d: CuratedDispatch): Promise<void> {
   const value = JSON.stringify(d);
-  if (env.CURATED_KV) {
-    await env.CURATED_KV.put("dispatch:latest", value, { expirationTtl: 60 * 60 * 24 * 7 });
+  if (kv) {
+    await kv.put("dispatch:latest", value, { expirationTtl: 60 * 60 * 24 * 7 });
   } else {
     MEM.set("dispatch:latest", value);
   }