diff --git a/CLAUDE.md b/CLAUDE.md
index a321d21..6295a79 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -1062,3 +1062,12 @@ are usually marketing / human-PR docs, not agent guidance.
   `complete` and emits a single `Finish` chunk.
 - **Tool naming collisions** are silent — if you register two tools with the same
   `name()`, the second wins. Prefer unique, namespaced names (`fs.read`, `http.fetch`).
+- **Wire-shape types are codegen'd to TypeScript.** Rust types crossing the SPA
+  boundary (REST replies, WS frames) use `#[derive(ts_rs::TS)]` so the frontend
+  imports a generated `.ts` instead of hand-maintaining a duplicate. Annotations
+  live on the type in its owning domain crate (`harness-channel`,
+  `harness-project`, `harness-observability` — never `harness-core`).
+  Regenerate with `make ts-codegen` after changing an annotated type; the
+  output under `apps/jarvis-web/src/types/generated/` is committed to git so
+  the SPA-only build doesn't need a Rust toolchain. See
+  `docs/conventions/rust-ts-codegen.md`.
diff --git a/Cargo.lock b/Cargo.lock
index 9665f29..9a35933 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -2003,12 +2003,13 @@ dependencies = [
 
 [[package]]
 name = "harness-channel"
-version = "0.1.0"
+version = "0.2.0"
 dependencies = [
  "async-trait",
  "chrono",
  "serde",
  "serde_json",
+ "ts-rs",
  "uuid",
 ]
 
@@ -2100,7 +2101,7 @@ dependencies = [
 
 [[package]]
 name = "harness-observability"
-version = "0.1.0"
+version = "0.2.0"
 dependencies = [
  "async-trait",
  "serde",
@@ -2126,7 +2127,7 @@ dependencies = [
 
 [[package]]
 name = "harness-project"
-version = "0.1.0"
+version = "0.2.0"
 dependencies = [
  "async-trait",
  "chrono",
@@ -2134,6 +2135,7 @@ dependencies = [
  "serde",
  "serde_json",
  "tokio",
+ "ts-rs",
  "uuid",
 ]
 
@@ -2252,6 +2254,7 @@ name = "harness-tools"
 version = "0.2.0"
 dependencies = [
  "async-trait",
+ "blake3",
  "chrono",
  "diffy",
  "harness-channel",
@@ -5688,6 +5691,15 @@ dependencies = [
  "utf-8",
 ]
 
+[[package]]
+name = "termcolor"
+version = "1.4.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "06794f8f6c5c898b3275aebefa6b8a1cb24cd2c6c79397ab15774837a0bc5755"
+dependencies = [
+ "winapi-util",
+]
+
 [[package]]
 name = "thiserror"
 version = "1.0.69"
@@ -6253,6 +6265,29 @@ version = "0.2.5"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "e421abadd41a4225275504ea4d6566923418b7f05506fbc9c0fe86ba7396114b"
 
+[[package]]
+name = "ts-rs"
+version = "10.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e640d9b0964e9d39df633548591090ab92f7a4567bc31d3891af23471a3365c6"
+dependencies = [
+ "lazy_static",
+ "thiserror 2.0.18",
+ "ts-rs-macros",
+]
+
+[[package]]
+name = "ts-rs-macros"
+version = "10.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0e9d8656589772eeec2cf7a8264d9cda40fb28b9bc53118ceb9e8c07f8f38730"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+ "termcolor",
+]
+
 [[package]]
 name = "tungstenite"
 version = "0.24.0"
diff --git a/Cargo.toml b/Cargo.toml
index 2e75af5..ff73742 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -86,6 +86,13 @@ aes = "0.8"
 cbc = "0.1"
 rand = "0.8"
 base64 = "0.22"
+# Rust → TypeScript codegen for wire-shape types shared with the web
+# frontend. `cargo test --workspace` runs the export test `ts-rs`
+# generates for each `#[derive(TS)]` type marked `#[ts(export)]` and
+# writes one `.ts` file per type under
+# `apps/jarvis-web/src/types/generated/`. The frontend imports those
+# instead of duplicating them. See `docs/conventions/rust-ts-codegen.md`.
+ts-rs = { version = "10", features = ["serde-compat", "no-serde-warnings"] }
 open = "5"
 tiktoken-rs = "0.6"
 libc = "0.2"
diff --git a/Makefile b/Makefile
index 55c3ee1..b9476a9 100644
--- a/Makefile
+++ b/Makefile
@@ -84,6 +84,24 @@ test: ## Run the workspace test suite
 .PHONY: check
 check: lint test ## Run clippy + tests, what CI runs
 
+# ---------------------------------------------------------------------------
+# Rust → TypeScript type codegen (see docs/conventions/rust-ts-codegen.md)
+# ---------------------------------------------------------------------------
+# Every `#[derive(TS)]` type emits its own `<TypeName>.ts` under
+# `apps/jarvis-web/src/types/generated/` when the embedded export
+# test runs. Crates with annotated types today: harness-channel,
+# harness-project. Add more by following the convention doc.
+#
+# Output goes in git so the SPA-only Vite build doesn't need a
+# Rust toolchain. `make ts-codegen` is the canonical "I changed a
+# wire type, regenerate" target; CI's `make test` covers it as a
+# side effect.
+.PHONY: ts-codegen
+ts-codegen: ## Regenerate TS types from Rust (`#[derive(TS)]`)
+	$(CARGO) test -p harness-channel -p harness-project --lib --quiet
+	@printf "\ngenerated:\n"
+	@ls apps/jarvis-web/src/types/generated/ | sed 's/^/  /'
+
 # ---------------------------------------------------------------------------
 # Docker / Compose
 # ---------------------------------------------------------------------------
diff --git a/apps/jarvis-cli/src/main.rs b/apps/jarvis-cli/src/main.rs
index 282d668..68b3c04 100644
--- a/apps/jarvis-cli/src/main.rs
+++ b/apps/jarvis-cli/src/main.rs
@@ -73,6 +73,31 @@ pub struct Args {
     #[arg(long)]
     pub no_git_read: bool,
 
+    /// Enable the agent-maintained `memory.{list,read,write,delete}`
+    /// tools (M3.1). Off by default — opt in when you want the CLI
+    /// session to persist notes under `<workspace>/.jarvis/memory/`
+    /// and inject MEMORY.md into the system prompt at startup.
+    /// `memory.write` / `memory.delete` are approval-gated.
+    #[arg(long)]
+    pub enable_memory: bool,
+
+    /// Enable the P10 git-sync tools (`memory.sync`,
+    /// `memory.sync_status`). The memory dir must be a git working
+    /// tree with a configured remote; the tools wrap
+    /// `git pull --rebase && git push` so notes propagate between
+    /// machines / teammates. Off by default — only useful once
+    /// you've actually set up a remote.
+    #[arg(long)]
+    pub enable_memory_sync: bool,
+
+    /// Disable the `enter_plan_mode` tool. By default the tool is
+    /// registered so the model can volunteer to switch into Plan
+    /// Mode before risky changes (the CLI's `fs.edit` is on by
+    /// default, so coding-mode criteria are met). Pass this flag
+    /// to keep Plan-Mode entry strictly operator-driven.
+    #[arg(long, action = clap::ArgAction::SetTrue, default_value_t = false)]
+    pub no_enter_plan_mode: bool,
+
     /// Pipe mode: read the prompt from `--prompt` (or stdin if
     /// omitted), run one turn with `AlwaysDeny` so no tool that
     /// needs a human can fire, print the final assistant text,
diff --git a/apps/jarvis-cli/src/runner.rs b/apps/jarvis-cli/src/runner.rs
index e8baa0a..7e38e7a 100644
--- a/apps/jarvis-cli/src/runner.rs
+++ b/apps/jarvis-cli/src/runner.rs
@@ -151,6 +151,20 @@ pub(crate) async fn load_project_prelude(needle: &str) -> Result<String> {
     ))
 }
 
+fn resolve_memory_user_root() -> Option<std::path::PathBuf> {
+    // Explicit override wins; a blank value is the documented "disable" switch.
+    if let Ok(v) = std::env::var("JARVIS_MEMORY_USER_ROOT") {
+        let trimmed = v.trim();
+        return (!trimmed.is_empty()).then(|| std::path::PathBuf::from(trimmed));
+    }
+    // Otherwise `<home>/.jarvis`. Empty HOME / USERPROFILE counts as unset so
+    // we never hand back a cwd-relative `.jarvis`.
+    ["HOME", "USERPROFILE"]
+        .into_iter()
+        .find_map(|k| std::env::var_os(k).filter(|v| !v.is_empty()))
+        .map(|home| std::path::PathBuf::from(home).join(".jarvis"))
+}
+
 fn build_tools(args: &Args, workspace: &Path) -> ToolRegistry {
     let cfg = BuiltinsConfig {
         fs_root: workspace.to_path_buf(),
@@ -165,6 +179,21 @@ fn build_tools(args: &Args, workspace: &Path) -> ToolRegistry {
         enable_fs_write: args.allow_fs_write,
         enable_shell_exec: args.allow_shell,
         enable_git_read: !args.no_git_read,
+        // CLI defaults: enter_plan_mode on (coding REPL benefits from
+        // the model being able to volunteer a plan-first pass);
+        // memory tools off until opted in.
+        enable_enter_plan_mode: !args.no_enter_plan_mode,
+        enable_memory: args.enable_memory,
+        // P9: user-scope memory follows the operator across
+        // workspaces. Default to `~/.jarvis` so the same notes
+        // are visible from any CLI invocation; `JARVIS_MEMORY_USER_ROOT`
+        // overrides (e.g. point at a Dropbox path) and an empty
+        // value disables. No-op when `enable_memory == false`.
+        memory_user_root: resolve_memory_user_root(),
+        // P10: git-as-transport sync. No-op when `enable_memory`
+        // is false (the underlying tree only exists when memory
+        // tools are registered).
+        enable_memory_sync: args.enable_memory_sync,
         ..Default::default()
     };
     let mut tools = ToolRegistry::new();
@@ -615,6 +644,17 @@ async fn run_one_turn(
                             event.reason,
                         );
                     }
+                    AgentEvent::ModeChanged { mode } => {
+                        // CLI mirrors the WS handler: surface the
+                        // mode change inline so the operator sees
+                        // why the next turn behaves differently.
+                        if delta_open { println!(); delta_open = false; }
+                        eprintln!(
+                            "{} permission mode → {:?}",
+                            yellow("⇄"),
+                            mode,
+                        );
+                    }
                     AgentEvent::Error { message } => {
                         if delta_open { println!(); }
                         return TurnOutcome::Error(message);
diff --git a/apps/jarvis-web/src/components/AppChatPane.tsx b/apps/jarvis-web/src/components/AppChatPane.tsx
index f201130..94ab8f7 100644
--- a/apps/jarvis-web/src/components/AppChatPane.tsx
+++ b/apps/jarvis-web/src/components/AppChatPane.tsx
@@ -12,6 +12,7 @@ import { AskTextCard } from "./Chat/AskTextCard";
 import { ApprovalCard } from "./Approvals/ApprovalCard";
 import { BypassBanner } from "./Approvals/BypassBanner";
 import { ModeBadge } from "./Approvals/ModeBadge";
+import { ModeChangedToast } from "./Approvals/ModeChangedToast";
 import { PlanModeBanner } from "./Approvals/PlanModeBanner";
 import { PlanProposedCard } from "./Approvals/PlanProposedCard";
 import { ModelMenu } from "./ModelMenu/ModelMenu";
@@ -19,6 +20,7 @@ import { UsageBadge } from "./UsageBadge";
 import { ComposerShoulder } from "./ComposerShoulder";
 import { ComposerProjectRail } from "./Composer/ComposerProjectRail";
 import { OpenSidebarButton, WorkspacePanelMenu } from "./Workspace/WorkspaceToggles";
+import { BackgroundTasksButton } from "./BackgroundTasks/BackgroundTasksButton";
 import { pickedRouting } from "../services/socket";
 import { slashCommands } from "../services/slash_commands";
 import { useAppStore } from "../store/appStore";
@@ -48,6 +50,7 @@ export function AppChatPane() {
           <ChatHeader />
         </div>
         <div className="header-actions">
+          <BackgroundTasksButton />
           <WorkspacePanelMenu />
         </div>
       </header>
@@ -56,6 +59,7 @@ export function AppChatPane() {
       <BypassBanner />
       <PlanModeBanner />
       <FallbackBanner />
+      <ModeChangedToast />
 
       <MessageList />
 
diff --git a/apps/jarvis-web/src/components/Approvals/ModeChangedToast.test.tsx b/apps/jarvis-web/src/components/Approvals/ModeChangedToast.test.tsx
new file mode 100644
index 0000000..f23cb19
--- /dev/null
+++ b/apps/jarvis-web/src/components/Approvals/ModeChangedToast.test.tsx
@@ -0,0 +1,66 @@
+// Renders the M2.3 toast when the server reports a non-user
+// mode change. Operator-initiated changes (via:"user" / absent)
+// stay silent — verified separately so a future regression that
+// pops a toast on every click is caught.
+
+import { afterEach, beforeEach, describe, expect, it, vi } from "vitest";
+import { act, render, screen } from "@testing-library/react";
+import { useAppStore } from "../../store/appStore";
+import { ModeChangedToast } from "./ModeChangedToast";
+
+beforeEach(() => {
+  vi.useFakeTimers();
+  useAppStore.getState().setRecentModeChange(null);
+});
+afterEach(() => {
+  vi.useRealTimers();
+});
+
+describe("ModeChangedToast", () => {
+  it("renders when the change came from the agent (via:tool)", () => {
+    act(() => {
+      useAppStore.getState().setRecentModeChange({
+        mode: "plan",
+        via: "tool",
+        at: Date.now(),
+      });
+    });
+    render(<ModeChangedToast />);
+    expect(screen.getByRole("status")).toHaveTextContent(
+      /Agent.*switched permission mode to.*plan.*read-only/i,
+    );
+  });
+
+  it("stays silent for operator-initiated changes (via:user)", () => {
+    act(() => {
+      useAppStore.getState().setRecentModeChange({
+        mode: "auto",
+        via: "user",
+        at: Date.now(),
+      });
+    });
+    const { container } = render(<ModeChangedToast />);
+    expect(container).toBeEmptyDOMElement();
+  });
+
+  it("renders nothing when no recent change is recorded", () => {
+    const { container } = render(<ModeChangedToast />);
+    expect(container).toBeEmptyDOMElement();
+  });
+
+  it("can be dismissed via the × button", () => {
+    act(() => {
+      useAppStore.getState().setRecentModeChange({
+        mode: "plan",
+        via: "tool",
+        at: Date.now(),
+      });
+    });
+    render(<ModeChangedToast />);
+    const close = screen.getByLabelText("Dismiss");
+    act(() => {
+      close.click();
+    });
+    expect(useAppStore.getState().recentModeChange).toBeNull();
+  });
+});
diff --git a/apps/jarvis-web/src/components/Approvals/ModeChangedToast.tsx b/apps/jarvis-web/src/components/Approvals/ModeChangedToast.tsx
new file mode 100644
index 0000000..6587fa6
--- /dev/null
+++ b/apps/jarvis-web/src/components/Approvals/ModeChangedToast.tsx
@@ -0,0 +1,72 @@
+// M2.3 UX: transient toast that surfaces an out-of-band
+// permission-mode change. The mode-badge in the header updates
+// silently, which is fine when the operator clicked it
+// themselves — but when the agent self-switched via
+// `enter_plan_mode`, the user needs a visible cue or they'll
+// wonder why the next turn behaves differently.
+//
+// The store action only fires this when the `via` field is
+// present (server-emitted). Operator-initiated changes through
+// the same handler don't include `via` (or pass `via:"user"`),
+// so this stays dormant for the common case.
+//
+// Auto-clears after `AUTO_CLEAR_MS`. Sticky-style: a brand-new
+// change in the same window resets the timer and re-shows.
+
+import { useEffect, useState } from "react";
+import { useAppStore } from "../../store/appStore";
+
+const AUTO_CLEAR_MS = 6000;
+
+export function ModeChangedToast() {
+  const recent = useAppStore((s) => s.recentModeChange);
+  const clear = useAppStore((s) => s.setRecentModeChange);
+  const [hiddenAt, setHiddenAt] = useState<number | null>(null);
+
+  useEffect(() => {
+    if (!recent) return;
+    // A fresh change re-arms the toast: drop any earlier hide marker.
+    setHiddenAt(null);
+    const id = window.setTimeout(() => {
+      setHiddenAt(Date.now());
+      clear(null);
+    }, AUTO_CLEAR_MS);
+    return () => window.clearTimeout(id); // cancel the pending auto-clear on change / unmount
+  }, [recent, clear]);
+
+  // Operator-initiated changes (via:"user" or no via) are silent —
+  // the mode badge already reflects the click, no need to toast.
+  if (!recent) return null;
+  if (!recent.via || recent.via === "user") return null;
+  if (hiddenAt !== null && hiddenAt > recent.at) return null;
+
+  return (
+    <div className="mode-changed-toast" role="status" aria-live="polite">
+      <span className="mode-changed-toast-icon" aria-hidden="true">⇄</span>
+      <span className="mode-changed-toast-body">
+        {describe(recent.via)} switched permission mode to{" "}
+        <strong>{recent.mode}</strong>
+        {recent.mode === "plan" ? " — next turn will be read-only." : ""}
+      </span>
+      <button
+        type="button"
+        className="mode-changed-toast-close"
+        aria-label="Dismiss"
+        onClick={() => clear(null)}
+      >
+        ×
+      </button>
+    </div>
+  );
+}
+
+function describe(via: string): string {
+  switch (via) {
+    case "tool":
+      return "Agent";
+    case "plan_accepted":
+      return "Plan accept";
+    default:
+      return "Mode change";
+  }
+}
diff --git a/apps/jarvis-web/src/components/BackgroundTasks/BackgroundTasksButton.tsx b/apps/jarvis-web/src/components/BackgroundTasks/BackgroundTasksButton.tsx
new file mode 100644
index 0000000..c8fba68
--- /dev/null
+++ b/apps/jarvis-web/src/components/BackgroundTasks/BackgroundTasksButton.tsx
@@ -0,0 +1,39 @@
+// Header trigger for `<BackgroundTasksPanel>`. Lives next to
+// `<WorkspacePanelMenu>` in `<AppChatPane>`'s header-actions slot.
+// The panel itself is portal-free and renders right under the button
+// — the visible chrome is just an icon + label; click toggles open.
+
+import { useState } from "react";
+import { BackgroundTasksPanel } from "./BackgroundTasksPanel";
+
+export function BackgroundTasksButton() {
+  const [open, setOpen] = useState(false);
+  return (
+    <div className="bg-tasks-trigger-wrap">
+      <button
+        type="button"
+        className="bg-tasks-trigger"
+        aria-expanded={open}
+        aria-label="Background tasks"
+        title="Background tasks"
+        onClick={() => setOpen((v) => !v)}
+      >
+        <svg
+          width="16"
+          height="16"
+          viewBox="0 0 24 24"
+          fill="none"
+          stroke="currentColor"
+          strokeWidth="1.8"
+          strokeLinecap="round"
+          strokeLinejoin="round"
+          aria-hidden="true"
+        >
+          <circle cx="12" cy="12" r="9" />
+          <polyline points="12 7 12 12 15 14" />
+        </svg>
+      </button>
+      <BackgroundTasksPanel open={open} onClose={() => setOpen(false)} />
+    </div>
+  );
+}
diff --git a/apps/jarvis-web/src/components/BackgroundTasks/BackgroundTasksPanel.tsx b/apps/jarvis-web/src/components/BackgroundTasks/BackgroundTasksPanel.tsx
new file mode 100644
index 0000000..0c950b1
--- /dev/null
+++ b/apps/jarvis-web/src/components/BackgroundTasks/BackgroundTasksPanel.tsx
@@ -0,0 +1,165 @@
+// Background-tasks panel — a single "what's in flight right now"
+// view that aggregates chat turns, subagent runs, and (over time)
+// auto-mode picks / MCP / shell jobs into one list. Backed by the
+// `GET /v1/tasks` aggregator; polled while open and immediately
+// stopped when the panel closes so a quiet system doesn't pay for
+// idle fetches.
+
+import { useEffect, useRef, useState } from "react";
+import { apiUrl } from "../../services/api";
+import { useAppStore } from "../../store/appStore";
+
+// Safety-net poll: the server pushes `tasks_snapshot` frames at
+// every turn boundary (P7), so under normal use the panel gets
+// real-time updates and the poll just covers "first open" and
+// "WS hiccup" gaps. 15s is gentle on the backend while still
+// catching missed pushes within a typical usage window.
+const POLL_INTERVAL_MS = 15000;
+
+type TaskKind = "chat_run" | "subagent_run" | "requirement_run" | "mcp_server";
+
+interface TaskEntry {
+  kind: TaskKind;
+  id: string;
+  label: string;
+  status: string;
+  started_at: number;
+  updated_at: number;
+  // eslint-disable-next-line @typescript-eslint/no-explicit-any
+  detail: any;
+}
+
+interface TasksResponse {
+  items: TaskEntry[];
+  generated_at: number;
+}
+
+interface Props {
+  open: boolean;
+  onClose: () => void;
+}
+
+export function BackgroundTasksPanel({ open, onClose }: Props) {
+  // Pushed WS `tasks_snapshot` wins over the poll result whenever it is
+  // non-null. NOTE(review): that also means a stale push permanently
+  // masks fresher polled data — confirm the store clears it on WS loss.
+  const pushed = useAppStore((s) => s.backgroundTasksSnapshot);
+  const [polled, setPolled] = useState<TaskEntry[] | null>(null);
+  const [error, setError] = useState<string | null>(null);
+  const [loading, setLoading] = useState(false);
+  const timerRef = useRef<number | null>(null);
+  const tasks: TaskEntry[] =
+    (pushed as TaskEntry[] | null) ?? polled ?? [];
+
+  useEffect(() => {
+    if (!open) {
+      if (timerRef.current != null) {
+        window.clearInterval(timerRef.current);
+        timerRef.current = null;
+      }
+      return;
+    }
+    let cancelled = false;
+    async function fetchOnce() {
+      try {
+        setLoading(true);
+        const r = await fetch(apiUrl("/v1/tasks"));
+        if (!r.ok) {
+          if (!cancelled) setError(`HTTP ${r.status}`);
+          return;
+        }
+        const body = (await r.json()) as TasksResponse;
+        if (!cancelled) {
+          setPolled(body.items);
+          setError(null);
+        }
+      } catch (e) {
+        if (!cancelled) setError(String(e));
+      } finally {
+        if (!cancelled) setLoading(false);
+      }
+    }
+    void fetchOnce();
+    timerRef.current = window.setInterval(() => {
+      void fetchOnce();
+    }, POLL_INTERVAL_MS);
+    return () => {
+      cancelled = true;
+      if (timerRef.current != null) {
+        window.clearInterval(timerRef.current);
+        timerRef.current = null;
+      }
+    };
+  }, [open]);
+
+  if (!open) return null;
+
+  return (
+    <div className="bg-tasks-panel" role="dialog" aria-label="Background tasks">
+      <header className="bg-tasks-header">
+        <h2>Background tasks</h2>
+        <button
+          type="button"
+          onClick={onClose}
+          aria-label="Close"
+          className="bg-tasks-close"
+        >
+          ×
+        </button>
+      </header>
+      <div className="bg-tasks-body">
+        {error && (
+          <div className="bg-tasks-error" role="alert">
+            Failed to load: {error}
+          </div>
+        )}
+        {!error && tasks.length === 0 && !loading && (
+          <div className="bg-tasks-empty">No active work right now.</div>
+        )}
+        {tasks.length > 0 && (
+          <ul className="bg-tasks-list">
+            {tasks.map((t) => (
+              <li
+                key={`${t.kind}-${t.id}`}
+                className="bg-tasks-row"
+                data-kind={t.kind}
+                data-status={t.status}
+              >
+                <span className="bg-tasks-kind">{kindLabel(t.kind)}</span>
+                <span className="bg-tasks-label">{t.label}</span>
+                <span className="bg-tasks-status">{t.status}</span>
+                <span className="bg-tasks-age">{relativeAge(t.started_at)}</span>
+              </li>
+            ))}
+          </ul>
+        )}
+      </div>
+    </div>
+  );
+}
+
+function kindLabel(k: TaskKind): string {
+  switch (k) {
+    case "chat_run":
+      return "Chat";
+    case "subagent_run":
+      return "SubAgent";
+    case "requirement_run":
+      return "Requirement";
+    case "mcp_server":
+      return "MCP";
+    default:
+      return k;
+  }
+}
+
+function relativeAge(startedAt: number): string { // compact "time since start" label for a task row
+  const dt = Math.max(0, Date.now() - startedAt); // NOTE(review): assumes `startedAt` is epoch milliseconds — confirm against `/v1/tasks`; clamped so a future timestamp reads as 0
+  if (dt < 1000) return "just now";
+  const sec = Math.floor(dt / 1000);
+  if (sec < 60) return `${sec}s`;
+  const min = Math.floor(sec / 60);
+  if (min < 60) return `${min}m`;
+  const hr = Math.floor(min / 60);
+  return `${hr}h`; // hours are the coarsest unit; no day rollover
+}
diff --git a/apps/jarvis-web/src/components/Chat/CollapsedToolGroup.tsx b/apps/jarvis-web/src/components/Chat/CollapsedToolGroup.tsx
new file mode 100644
index 0000000..f990b81
--- /dev/null
+++ b/apps/jarvis-web/src/components/Chat/CollapsedToolGroup.tsx
@@ -0,0 +1,116 @@
+// Folded card for a run of consecutive assistant iterations whose
+// tool calls are all read-only (`fs.read`, `code.grep`, `git.*`,
+// `workspace.context`, etc.) and whose visible content is empty.
+//
+// Without this fold, a long investigation loop (read → grep → read
+// → grep → read → ... before finally writing a patch) bloats the
+// transcript with 5–10 near-identical "Read 1 file" rows the user
+// has to skim past. The fold collapses them into one summary row
+// like "▸ Read 6 files, ran 3 greps · 9 steps" with a click-to-
+// expand that re-shows the original `AssistantBubble`s inline.
+//
+// The fold rule is enforced upstream in `<MessageList>`; this
+// component just renders whatever it's handed. Folding is
+// strictly opt-in by the upstream classifier — anything that
+// touched a write/exec/mutating tool stays as its own bubble.
+
+import { useMemo, useState } from "react";
+import { useAppStore } from "../../store/appStore";
+import { AssistantBubble } from "./AssistantBubble";
+import {
+  aggregateStepStatus,
+  describeStep,
+} from "./toolStepSummary";
+import { t } from "../../utils/i18n";
+import type { UiMessage } from "../../store/types";
+
+interface Props {
+  /// Consecutive assistant `UiMessage`s being folded. Must each
+  /// carry only read-only tool calls and no visible content —
+  /// the classifier in `<MessageList>` is the source of truth for
+  /// that invariant.
+  messages: Array<Extract<UiMessage, { kind: "assistant" }>>;
+}
+
+export function CollapsedToolGroup({ messages }: Props) {
+  // Same Zustand discipline as ToolStepRow: subscribe to the raw
+  // map and derive the flat block list via useMemo so the selector
+  // doesn't churn on every store snapshot.
+  const allBlocks = useAppStore((s) => s.toolBlocks);
+  const blocks = useMemo(() => {
+    const flat = [];
+    for (const m of messages) {
+      for (const id of m.toolCallIds) {
+        const b = allBlocks[id];
+        if (b) flat.push(b);
+      }
+    }
+    return flat;
+  }, [messages, allBlocks]);
+
+  const [manualOpen, setManualOpen] = useState<boolean | null>(null);
+  const status = aggregateStepStatus(blocks);
+  // Auto-expand while anything in the run is still working so the
+  // user sees live progress, mirroring `ToolStepRow`'s pattern.
+  const defaultOpen = status === "running";
+  const open = manualOpen ?? defaultOpen;
+
+  if (blocks.length === 0) return null;
+  const summary = describeStep(blocks);
+  const badge =
+    status === "ok" || status === "empty"
+      ? null
+      : (({
+          running: t("running"),
+          denied: t("denied", ""),
+          error: t("error"),
+        } as Record<string, string>)[status] || status);
+
+  return (
+    <div
+      className="tool-step tool-step-grouped"
+      data-status={status}
+      data-open={open ? "true" : "false"}
+    >
+      <button
+        type="button"
+        className="tool-step-row"
+        onClick={() => setManualOpen(!open)}
+        aria-expanded={open}
+        title={open ? t("toolStepCollapse") : t("toolStepExpand")}
+      >
+        <span className="tool-step-chevron" aria-hidden="true">
+          <svg width="12" height="12" viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="2.4" strokeLinecap="round" strokeLinejoin="round">
+            <polyline points="9 18 15 12 9 6" />
+          </svg>
+        </span>
+        <span className="tool-step-summary">
+          {summary}
+          <span className="tool-step-step-count">
+            {" "}· {messages.length} steps
+          </span>
+        </span>
+        {badge ? <span className="tool-step-badge">{badge}</span> : null}
+      </button>
+      {open ? (
+        <div className="tool-step-body tool-step-body-grouped">
+          {messages.map((m, idx) => (
+            <AssistantBubble
+              key={m.uid}
+              uid={m.uid}
+              content={m.content}
+              reasoning={m.reasoning}
+              toolCallIds={m.toolCallIds}
+              finalised={m.finalised}
+              // First expanded child gets the full header; the
+              // rest stack as continuations so the expanded list
+              // reads as one logical run rather than N separate
+              // "Jarvis" bubbles.
+              continuation={idx > 0}
+            />
+          ))}
+        </div>
+      ) : null}
+    </div>
+  );
+}
diff --git a/apps/jarvis-web/src/components/Chat/MessageList.test.ts b/apps/jarvis-web/src/components/Chat/MessageList.test.ts
new file mode 100644
index 0000000..0756ad5
--- /dev/null
+++ b/apps/jarvis-web/src/components/Chat/MessageList.test.ts
@@ -0,0 +1,157 @@
+// Tests for the transcript folding classifier + grouper used by
+// `<MessageList>`. These are pure data-shape tests — no React
+// involved — so they stay fast and stable across UI tweaks.
+
+import { describe, expect, it } from "vitest";
+import { groupForFolding, isFoldable } from "./MessageList";
+import type { ToolBlockEntry, UiMessage } from "../../store/types";
+
+function block(over: Partial<ToolBlockEntry>): ToolBlockEntry {
+  return {
+    id: over.id ?? "t",
+    name: over.name ?? "fs.read",
+    args: over.args ?? {},
+    status: over.status ?? "ok",
+    output: over.output ?? null,
+    progress: over.progress ?? "",
+    decisionSource: null,
+    startedAt: 0,
+    finishedAt: 0,
+  };
+}
+
+function assistant(over: {
+  uid: string;
+  toolCallIds: string[];
+  content?: string;
+  reasoning?: string;
+  finalised?: boolean;
+}): UiMessage {
+  return {
+    uid: over.uid,
+    kind: "assistant",
+    content: over.content ?? "",
+    reasoning: over.reasoning ?? "",
+    toolCallIds: over.toolCallIds,
+    finalised: over.finalised ?? true,
+  };
+}
+
+function user(uid: string, content = "hi", userOrdinal = 1): UiMessage {
+  return { uid, kind: "user", content, userOrdinal };
+}
+
+describe("isFoldable", () => {
+  it("folds an assistant with one read-only tool call and no content", () => {
+    const m = assistant({ uid: "a", toolCallIds: ["t1"] });
+    const blocks = { t1: block({ id: "t1", name: "fs.read" }) };
+    expect(isFoldable(m, blocks)).toBe(true);
+  });
+
+  it("rejects when the assistant has visible content", () => {
+    const m = assistant({ uid: "a", toolCallIds: ["t1"], content: "thinking..." });
+    const blocks = { t1: block({ id: "t1", name: "fs.read" }) };
+    expect(isFoldable(m, blocks)).toBe(false);
+  });
+
+  it("rejects when any tool call is a write/exec tool", () => {
+    const m = assistant({ uid: "a", toolCallIds: ["t1", "t2"] });
+    const blocks = {
+      t1: block({ id: "t1", name: "fs.read" }),
+      t2: block({ id: "t2", name: "fs.edit" }),
+    };
+    expect(isFoldable(m, blocks)).toBe(false);
+  });
+
+  it("rejects when a referenced tool block is missing", () => {
+    const m = assistant({ uid: "a", toolCallIds: ["t1"] });
+    const blocks = {};
+    expect(isFoldable(m, blocks)).toBe(false);
+  });
+
+  it("rejects an assistant with no tool calls", () => {
+    const m = assistant({ uid: "a", toolCallIds: [] });
+    expect(isFoldable(m, {})).toBe(false);
+  });
+
+  it("rejects an unknown tool name (don't aggressively fold unknowns)", () => {
+    const m = assistant({ uid: "a", toolCallIds: ["t1"] });
+    const blocks = { t1: block({ id: "t1", name: "totally.new.mcp.tool" }) };
+    expect(isFoldable(m, blocks)).toBe(false);
+  });
+});
+
+describe("groupForFolding", () => {
+  it("folds 3 consecutive read-only iterations into one group", () => {
+    const msgs: UiMessage[] = [
+      user("u1"),
+      assistant({ uid: "a1", toolCallIds: ["t1"] }),
+      assistant({ uid: "a2", toolCallIds: ["t2"] }),
+      assistant({ uid: "a3", toolCallIds: ["t3"] }),
+      assistant({ uid: "a4", toolCallIds: ["t4"] }), // the final reply
+    ];
+    const blocks = {
+      t1: block({ id: "t1", name: "fs.read" }),
+      t2: block({ id: "t2", name: "code.grep" }),
+      t3: block({ id: "t3", name: "git.status" }),
+      t4: block({ id: "t4", name: "fs.edit" }), // not foldable → standalone
+    };
+    const groups = groupForFolding(msgs, blocks);
+    expect(groups.map((g) => g.kind)).toEqual(["single", "folded", "single"]);
+    if (groups[1].kind === "folded") {
+      expect(groups[1].messages.map((m) => m.uid)).toEqual(["a1", "a2", "a3"]);
+    }
+  });
+
+  it("leaves a sub-threshold run inline", () => {
+    const msgs: UiMessage[] = [
+      user("u1"),
+      assistant({ uid: "a1", toolCallIds: ["t1"] }),
+      assistant({ uid: "a2", toolCallIds: ["t2"] }), // only 2 read-only — below MIN_GROUP_SIZE
+      assistant({ uid: "a3", toolCallIds: ["t3"] }),
+    ];
+    const blocks = {
+      t1: block({ id: "t1", name: "fs.read" }),
+      t2: block({ id: "t2", name: "fs.read" }),
+      t3: block({ id: "t3", name: "fs.edit" }),
+    };
+    const groups = groupForFolding(msgs, blocks);
+    expect(groups.map((g) => g.kind)).toEqual([
+      "single",
+      "single",
+      "single",
+      "single",
+    ]);
+  });
+
+  it("does not fold across a non-foldable interruption", () => {
+    const msgs: UiMessage[] = [
+      assistant({ uid: "a1", toolCallIds: ["t1"] }),
+      assistant({ uid: "a2", toolCallIds: ["t2"] }),
+      assistant({ uid: "a3", toolCallIds: ["t3"], content: "I think we should..." }), // breaks the run
+      assistant({ uid: "a4", toolCallIds: ["t4"] }),
+      assistant({ uid: "a5", toolCallIds: ["t5"] }),
+      assistant({ uid: "a6", toolCallIds: ["t6"] }),
+    ];
+    const blocks = {
+      t1: block({ id: "t1", name: "fs.read" }),
+      t2: block({ id: "t2", name: "fs.read" }),
+      t3: block({ id: "t3", name: "fs.read" }),
+      t4: block({ id: "t4", name: "fs.read" }),
+      t5: block({ id: "t5", name: "fs.read" }),
+      t6: block({ id: "t6", name: "fs.read" }),
+    };
+    const groups = groupForFolding(msgs, blocks);
+    // a1+a2 are sub-threshold (only 2) → inline. a3 standalone.
+    // a4+a5+a6 hit threshold → folded.
+    expect(groups.map((g) => g.kind)).toEqual([
+      "single",
+      "single",
+      "single",
+      "folded",
+    ]);
+    if (groups[3].kind === "folded") {
+      expect(groups[3].messages.map((m) => m.uid)).toEqual(["a4", "a5", "a6"]);
+    }
+  });
+});
diff --git a/apps/jarvis-web/src/components/Chat/MessageList.tsx b/apps/jarvis-web/src/components/Chat/MessageList.tsx
index 9539d58..6d0e0aa 100644
--- a/apps/jarvis-web/src/components/Chat/MessageList.tsx
+++ b/apps/jarvis-web/src/components/Chat/MessageList.tsx
@@ -3,7 +3,17 @@
 // scroll-to-bottom strategy lives in `useStickToBottom` — see that
 // file's header for why a naive "scroll on every render" effect
 // doesn't work with the async XMarkdown subtree.
+//
+// MessageList is also the "view transformer" layer: before
+// rendering, it groups consecutive assistant iterations whose tool
+// calls are *all* read-only and whose visible content is empty
+// into a single `<CollapsedToolGroup>` card. This keeps a long
+// investigation loop (read → grep → read → grep → … before the
+// real edit) from drowning the transcript. The fold threshold is
+// `MIN_GROUP_SIZE` — small enough to be useful, large enough that
+// brief lookups don't get hidden behind an extra click.
 
+import { useMemo } from "react";
 import { useAppStore } from "../../store/appStore";
 import { useStickToBottom } from "../../hooks/useStickToBottom";
 import { UserBubble } from "./UserBubble";
@@ -11,20 +21,100 @@ import { AssistantBubble } from "./AssistantBubble";
 import { AgentLoadingFooter } from "./AgentLoadingFooter";
 import { WelcomeScreen } from "./WelcomeScreen";
 import { EmptyConvoHint } from "./EmptyConvoHint";
+import { CollapsedToolGroup } from "./CollapsedToolGroup";
 import { MarkdownView } from "./MarkdownView";
+import { isReadOnlyTool } from "./toolStepSummary";
 import { t } from "../../utils/i18n";
+import type { UiMessage, ToolBlockEntry } from "../../store/types";
+
+const MIN_GROUP_SIZE = 3;
+
+type AssistantMsg = Extract<UiMessage, { kind: "assistant" }>;
+
+type Group =
+  | { kind: "single"; message: UiMessage }
+  | { kind: "folded"; messages: AssistantMsg[] };
+
+/// Classifies one transcript entry for the fold rule. It passes
+/// only when it is an assistant message with at least one tool
+/// call, its visible body is empty (whitespace-only counts as
+/// empty), and every call id maps to a tool block whose tool is
+/// read-only. Reasoning text is not inspected here.
+///
+/// Exported for testing — see [`groupForFolding`].
+export function isFoldable(
+  m: UiMessage,
+  toolBlocks: Record<string, ToolBlockEntry>,
+): m is AssistantMsg {
+  if (m.kind !== "assistant") return false;
+  const { toolCallIds, content } = m;
+  // Cheap length check first; the body is only trimmed if it passes.
+  if (toolCallIds.length === 0 || content.trim().length > 0) return false;
+  return toolCallIds.every((callId) => {
+    const entry = toolBlocks[callId];
+    // An id without a block can't be classified safely, so it
+    // vetoes the fold just like a non-read-only tool does.
+    return !!entry && isReadOnlyTool(entry.name);
+  });
+}
+
+/// Single pass over `messages` that turns the flat transcript into
+/// render groups. Consecutive foldable assistant messages are
+/// collected into a run; a run of at least MIN_GROUP_SIZE becomes
+/// one `folded` group, while a shorter run is emitted as separate
+/// `single` entries. Every non-foldable message ends the current
+/// run and is emitted as its own `single` entry, in order.
+///
+/// Exported for testing, together with the `isFoldable`
+/// classifier; the rest of the SPA shouldn't call it directly.
+export function groupForFolding(
+  messages: UiMessage[],
+  toolBlocks: Record<string, ToolBlockEntry>,
+): Group[] {
+  const groups: Group[] = [];
+  let run: AssistantMsg[] = [];
+  // Emits whatever is pending in `run`, then starts a new run.
+  const closeRun = () => {
+    const shouldFold = run.length >= MIN_GROUP_SIZE;
+    if (shouldFold) groups.push({ kind: "folded", messages: run });
+    else for (const message of run) groups.push({ kind: "single", message });
+    run = [];
+  };
+  messages.forEach((entry) => {
+    if (!isFoldable(entry, toolBlocks)) {
+      closeRun();
+      groups.push({ kind: "single", message: entry });
+      return;
+    }
+    run.push(entry);
+  });
+  // The transcript may end in the middle of a run.
+  closeRun();
+  return groups;
+}
 
 export function MessageList() {
   const messages = useAppStore((s) => s.messages);
+  const toolBlocks = useAppStore((s) => s.toolBlocks);
   const activeId = useAppStore((s) => s.activeId);
   const emptyHint = useAppStore((s) => s.emptyHintIdShort);
   const { ref } = useStickToBottom<HTMLElement>({ activeId });
 
+  const groups = useMemo(
+    () => groupForFolding(messages, toolBlocks),
+    [messages, toolBlocks],
+  );
+
   return (
     <section id="messages" aria-live="polite" ref={ref}>
       {messages.length === 0 && !emptyHint && <WelcomeScreen />}
       {messages.length === 0 && emptyHint && <EmptyConvoHint idShort={emptyHint} />}
-      {messages.map((m, i) => {
+      {groups.map((g, gi) => {
+        if (g.kind === "folded") {
+          const head = g.messages[0];
+          return <CollapsedToolGroup key={`grp-${head.uid}`} messages={g.messages} />;
+        }
+        const m = g.message;
         if (m.kind === "user") {
           return (
             <UserBubble
@@ -45,8 +135,16 @@ export function MessageList() {
           // tool-call attribution but render them stacked under one
           // avatar + name header so the user doesn't see "Jarvis,
           // Jarvis, Jarvis" repeating down the page.
-          const prev = messages[i - 1];
-          const continuation = prev != null && prev.kind === "assistant";
+          //
+          // Continuation here is computed against the prior *group*,
+          // not the prior raw message: a folded read-only run
+          // immediately followed by a final reply still wants the
+          // reply to read as a continuation of the same Jarvis turn.
+          const prev = groups[gi - 1];
+          const continuation =
+            prev != null &&
+            (prev.kind === "folded" ||
+              (prev.kind === "single" && prev.message.kind === "assistant"));
           return (
             <AssistantBubble
               key={m.uid}
diff --git a/apps/jarvis-web/src/components/Chat/toolStepSummary.ts b/apps/jarvis-web/src/components/Chat/toolStepSummary.ts
index badab69..02c8b17 100644
--- a/apps/jarvis-web/src/components/Chat/toolStepSummary.ts
+++ b/apps/jarvis-web/src/components/Chat/toolStepSummary.ts
@@ -323,6 +323,44 @@ export function describeStep(blocks: ToolBlockEntry[]): string {
   return out;
 }
 
+/// Allow-list of tool names treated as read-only: they don't
+/// mutate the workspace, the network, or any external system.
+/// The MessageList transcript-folding rule consults it to decide
+/// whether consecutive assistant iterations that call *only*
+/// these tools (and show no visible content) may collapse into
+/// one summary card instead of flooding the conversation view.
+///
+/// Never add a tool that writes a file, runs a shell command,
+/// sends a channel message, or mutates a project / requirement /
+/// doc / memory / todo.
+const READ_ONLY_TOOL_NAMES: ReadonlySet<string> = new Set<string>([
+  "fs.read",
+  "fs.list",
+  "code.grep",
+  "grep",
+  "git.status",
+  "git.diff",
+  "git.log",
+  "git.show",
+  "workspace.context",
+  "project.checks",
+  "time.now",
+  "http.fetch",
+  "echo",
+  "doc.list",
+  "doc.search",
+  "doc.get",
+  "doc.draft.get",
+]);
+
+/// Whether `name` is on the read-only allow-list and may therefore
+/// be folded by the transcript "read-only run" rule. Unknown or
+/// newly added tools yield false, so a mutation can never end up
+/// hidden behind a "Read 5 files" summary by accident.
+export function isReadOnlyTool(name: string): boolean {
+  return READ_ONLY_TOOL_NAMES.has(name);
+}
+
 /// Aggregate status for the whole step. Drives the row's badge:
 ///   • any running   → "running"
 ///   • any error     → "error"
diff --git a/apps/jarvis-web/src/components/Composer/AutoActivatedSkillsChip.test.tsx b/apps/jarvis-web/src/components/Composer/AutoActivatedSkillsChip.test.tsx
new file mode 100644
index 0000000..074d9cd
--- /dev/null
+++ b/apps/jarvis-web/src/components/Composer/AutoActivatedSkillsChip.test.tsx
@@ -0,0 +1,50 @@
+// Composer chip surfaces server-predicted next-turn skill
+// auto-activations. Renders nothing when the list is empty so a
+// quiet session doesn't pay for chrome.
+
+import { beforeEach, describe, expect, it } from "vitest";
+import { act, render, screen } from "@testing-library/react";
+import { useAppStore } from "../../store/appStore";
+import { AutoActivatedSkillsChip } from "./AutoActivatedSkillsChip";
+
+beforeEach(() => {
+  useAppStore.getState().setAutoActivatedNextTurnSkills([]);
+});
+
+describe("AutoActivatedSkillsChip", () => {
+  it("renders nothing on an empty list", () => {
+    const { container } = render(<AutoActivatedSkillsChip />);
+    expect(container).toBeEmptyDOMElement();
+  });
+
+  it("renders one pill per skill name", () => {
+    act(() => {
+      useAppStore.getState().setAutoActivatedNextTurnSkills([
+        "rs-helper",
+        "tsx-helper",
+      ]);
+    });
+    render(<AutoActivatedSkillsChip />);
+    expect(screen.getByRole("status")).toHaveTextContent(
+      /Auto-activated for next turn/i,
+    );
+    expect(screen.getByText("rs-helper")).toBeInTheDocument();
+    expect(screen.getByText("tsx-helper")).toBeInTheDocument();
+  });
+
+  it("dedupes and skips blanks via store action", () => {
+    act(() => {
+      useAppStore.getState().setAutoActivatedNextTurnSkills([
+        "rs-helper",
+        "rs-helper",
+        "",
+        "  ",
+        "tsx-helper",
+      ]);
+    });
+    render(<AutoActivatedSkillsChip />);
+    expect(screen.getAllByRole("listitem")).toHaveLength(2); // no blank pills
+    expect(screen.getAllByText("rs-helper")).toHaveLength(1);
+    expect(screen.getAllByText("tsx-helper")).toHaveLength(1);
+  });
+});
diff --git a/apps/jarvis-web/src/components/Composer/AutoActivatedSkillsChip.tsx b/apps/jarvis-web/src/components/Composer/AutoActivatedSkillsChip.tsx
new file mode 100644
index 0000000..f560d42
--- /dev/null
+++ b/apps/jarvis-web/src/components/Composer/AutoActivatedSkillsChip.tsx
@@ -0,0 +1,33 @@
+// M3.3 UX: tiny notice above the composer telling the user which
+// skills *will* auto-activate on the next user turn given the
+// files the agent touched in the previous turn. Backed by the
+// `skill_auto_activated_for_next_turn` WS frame; falls back to
+// rendering nothing when no skills match — no chrome cost on
+// quiet sessions.
+//
+// Self-contained on purpose: the chip subscribes to its single
+// store field and renders inline; no portal, no popover. Sits
+// between the form opening tag and the input-wrapper in Composer
+// so it visually attaches to the input the user is about to type
+// into.
+
+import { useAppStore } from "../../store/appStore";
+
+export function AutoActivatedSkillsChip() {
+  const names = useAppStore((state) => state.autoActivatedNextTurnSkills);
+  // Nothing to announce → render no chrome at all.
+  if (!names?.length) return null;
+  const pills = names.map((skill) => (
+    <li key={skill} className="composer-auto-skills-pill" title={`Skill: ${skill}`}>
+      {skill}
+    </li>
+  ));
+  return (
+    <div className="composer-auto-skills" role="status" aria-live="polite">
+      <span className="composer-auto-skills-label">
+        Auto-activated for next turn:
+      </span>
+      <ul className="composer-auto-skills-list">{pills}</ul>
+    </div>
+  );
+}
diff --git a/apps/jarvis-web/src/components/Composer/Composer.tsx b/apps/jarvis-web/src/components/Composer/Composer.tsx
index 18817bc..11e7a9f 100644
--- a/apps/jarvis-web/src/components/Composer/Composer.tsx
+++ b/apps/jarvis-web/src/components/Composer/Composer.tsx
@@ -8,6 +8,7 @@ import { useEffect, useRef, useState } from "react";
 import { useAppStore } from "../../store/appStore";
 import { t } from "../../utils/i18n";
 import { SendButton, StopButton } from "../ComposerButtons";
+import { AutoActivatedSkillsChip } from "./AutoActivatedSkillsChip";
 import { SlashPalette, type SlashCommand } from "./SlashPalette";
 import { sendFrame, isOpen } from "../../services/socket";
 import { startConversationTurn } from "../../services/conversationSockets";
@@ -163,6 +164,7 @@ export function Composer({ slashCommands, pickedRouting, metaChildren }: Props)
       autoComplete="off"
       onSubmit={(e) => { e.preventDefault(); submit(); }}
     >
+      <AutoActivatedSkillsChip />
       <div className="input-wrapper">
         <textarea
           id="input"
diff --git a/apps/jarvis-web/src/components/Projects/WorkOverview/HealthCenter.tsx b/apps/jarvis-web/src/components/Projects/WorkOverview/HealthCenter.tsx
index 6917484..cbe8ddb 100644
--- a/apps/jarvis-web/src/components/Projects/WorkOverview/HealthCenter.tsx
+++ b/apps/jarvis-web/src/components/Projects/WorkOverview/HealthCenter.tsx
@@ -1,5 +1,5 @@
 import { useCallback, useEffect, useMemo, useState } from "react";
-import { useNavigate } from "react-router-dom";
+import { useNavigate, type NavigateFunction } from "react-router-dom";
 import { useAppStore } from "../../../store/appStore";
 import { t } from "../../../utils/i18n";
 import { resumeConversation } from "../../../services/conversations";
@@ -63,6 +63,33 @@ interface OptimizationMetric {
   hint: string[];
 }
 
+export interface HealthCenterState {
+  // Props passed through for child sections, plus refreshDiagnostics (not a prop)
+  overview: WorkOverview | null;
+  loading: boolean;
+  error: string | null;
+  onRefresh: () => void;
+  refreshDiagnostics: () => Promise<void>;
+  // Overall tone with its display label and summary text
+  tone: Tone;
+  toneLabel: string;
+  summary: string;
+  unavailable: boolean;
+  // Stats, scores and signals derived inside useHealthCenterState
+  qualityStats: QualitySignal;
+  optimizationScore: number;
+  optimizationMetrics: OptimizationMetric[];
+  direction: HarnessDirectionSnapshot | null;
+  signals: HealthSignal[];
+  // Auto-mode status, its pending/error flags, and the toggle handler
+  autoMode: AutoModeStatus | null;
+  autoPending: boolean;
+  autoError: string | null;
+  toggleAutoMode: () => Promise<void>;
+  // Router navigate function, exposed for action buttons
+  navigate: NavigateFunction;
+}
+
 function formatPercent(v: number | null): string {
   return v === null ? "—" : `${Math.round(v * 100)}%`;
 }
@@ -192,15 +219,21 @@ function topIssue(issues: Issue[]): Issue | null {
   return issues[0] ?? null;
 }
 
-export function HealthCenter({
-  overview,
-  quality,
-  overviewUnavailable,
-  qualityUnavailable,
-  loading,
-  error,
-  onRefresh,
-}: Props) {
+// Owns all data fetches + derivations for the health center. Called
+// once in `WorkOverviewPage`; the returned state is fanned out to
+// both `HealthCenterCompact` (top of page) and `HealthCenterDetails`
+// (the "Quality" tab) so we don't double-poll the auto-mode endpoint
+// or re-derive the optimization grid twice per render.
+export function useHealthCenterState(props: Props): HealthCenterState {
+  const {
+    overview,
+    quality,
+    overviewUnavailable,
+    qualityUnavailable,
+    loading,
+    error,
+    onRefresh,
+  } = props;
   const [orphans, setOrphans] = useState<OrphanWorktree[]>([]);
   const [stuck, setStuck] = useState<StuckRun[]>([]);
   const [autoMode, setAutoMode] = useState<AutoModeStatus | null>(null);
@@ -381,11 +414,11 @@ export function HealthCenter({
     },
   ];
 
-  const openConversation = (id: string) => {
+  const openConversation = useCallback((id: string) => {
     void resumeConversation(id);
-  };
+  }, []);
 
-  const toggleAutoMode = async () => {
+  const toggleAutoMode = useCallback(async () => {
     if (!autoMode?.configured || autoPending) return;
     setAutoPending(true);
     setAutoError(null);
@@ -397,7 +430,7 @@ export function HealthCenter({
     } finally {
       setAutoPending(false);
     }
-  };
+  }, [autoMode, autoPending]);
 
   const signals: HealthSignal[] = [];
   const failures = overview?.recent_failures ?? [];
@@ -485,16 +518,72 @@ export function HealthCenter({
     });
   }
 
+  return {
+    overview,
+    loading,
+    error,
+    onRefresh,
+    refreshDiagnostics,
+    tone,
+    toneLabel: healthLabel(tone),
+    summary: healthSummary(tone, overview, qualityStats, issues, unavailable),
+    unavailable,
+    qualityStats,
+    optimizationScore,
+    optimizationMetrics,
+    direction,
+    signals,
+    autoMode,
+    autoPending,
+    autoError,
+    toggleAutoMode,
+    navigate,
+  };
+}
+
+interface CompactProps {
+  state: HealthCenterState;
+  /// Triggered when the user clicks "view all" under a truncated
+  /// signals list. The page wires this to switch into the Quality tab
+  /// where the full list lives.
+  onExpandSignals?: () => void;
+}
+
+// Top-of-page strip: status pill + summary + KpiStrip +
+// AgentRuntimeStrip + top-3 Next Actions. Always visible.
+export function HealthCenterCompact({ state, onExpandSignals }: CompactProps) {
+  const {
+    tone,
+    toneLabel,
+    summary,
+    error,
+    autoError,
+    loading,
+    onRefresh,
+    refreshDiagnostics,
+    autoMode,
+    autoPending,
+    toggleAutoMode,
+    overview,
+    navigate,
+    signals,
+  } = state;
+  const visibleSignals = signals.slice(0, 3);
+  const hasMore = signals.length > visibleSignals.length;
+
   return (
-    <section className={"health-center health-center-" + tone} aria-label={t("healthCenterTitle")}>
+    <section
+      className={"health-center health-center-compact health-center-" + tone}
+      aria-label={t("healthCenterTitle")}
+    >
       <header className="health-center-head">
         <div className="health-center-title-block">
           <span className={"health-center-state tone-" + tone}>
             <span className="health-center-state-dot" aria-hidden="true" />
-            {healthLabel(tone)}
+            {toneLabel}
           </span>
           <h3>{t("healthCenterTitle")}</h3>
-          <p>{healthSummary(tone, overview, qualityStats, issues, unavailable)}</p>
+          <p>{summary}</p>
           {(error || autoError) && (
             <p className="health-center-error">
               {error
@@ -536,6 +625,60 @@ export function HealthCenter({
 
       <AgentRuntimeStrip status={autoMode} />
 
+      <div className="health-center-body">
+        <div className="health-center-signals">
+          <div className="health-center-section-label">
+            {t("healthCenterNextActions")}
+            {hasMore && onExpandSignals && (
+              <button
+                type="button"
+                className="health-center-section-link"
+                onClick={onExpandSignals}
+                title={t("healthCenterSignalsViewAllHint")}
+              >
+                {t("healthCenterSignalsViewAll", signals.length)}
+              </button>
+            )}
+          </div>
+          <ul className="health-signal-list">
+            {visibleSignals.map((signal) => (
+              <li
+                key={signal.label + signal.value + signal.detail}
+                className={"health-signal tone-" + signal.tone}
+              >
+                <span className="health-signal-label">{signal.label}</span>
+                <span className="health-signal-value tabular-nums">{signal.value}</span>
+                <span className="health-signal-detail" title={signal.detail}>
+                  {signal.detail}
+                </span>
+                {signal.action && (
+                  <button type="button" onClick={signal.action.onClick}>
+                    {signal.action.label}
+                  </button>
+                )}
+              </li>
+            ))}
+          </ul>
+        </div>
+      </div>
+    </section>
+  );
+}
+
+interface DetailsProps {
+  state: HealthCenterState;
+}
+
+// Quality-tab body: optimization grid + Direction components + the
+// full (untruncated) Next Actions list. Reuses the same derived
+// state — no extra fetches.
+export function HealthCenterDetails({ state }: DetailsProps) {
+  const { tone, optimizationMetrics, direction, signals } = state;
+  return (
+    <section
+      className={"health-center health-center-details health-center-" + tone}
+      aria-label={t("harnessEvolutionTitle")}
+    >
       <div className="health-optimization">
         <div className="health-center-section-label">
           <span className="harness-metric-label-with-hint">
@@ -594,8 +737,11 @@ export function HealthCenter({
         <div className="health-center-signals">
           <div className="health-center-section-label">{t("healthCenterNextActions")}</div>
           <ul className="health-signal-list">
-            {signals.slice(0, 5).map((signal) => (
-              <li key={signal.label + signal.value + signal.detail} className={"health-signal tone-" + signal.tone}>
+            {signals.map((signal) => (
+              <li
+                key={signal.label + signal.value + signal.detail}
+                className={"health-signal tone-" + signal.tone}
+              >
                 <span className="health-signal-label">{signal.label}</span>
                 <span className="health-signal-value tabular-nums">{signal.value}</span>
                 <span className="health-signal-detail" title={signal.detail}>
@@ -615,6 +761,19 @@ export function HealthCenter({
   );
 }
 
+// Backwards-compatible wrapper: one hook call feeding the compact
+// strip and the details section, rendered back to back. The
+// redesigned overview page does not use it; it stays for other callers.
+export function HealthCenter(props: Props) {
+  const shared = useHealthCenterState(props);
+  return (
+    <>
+      <HealthCenterCompact state={shared} />
+      <HealthCenterDetails state={shared} />
+    </>
+  );
+}
+
 function AutoModeControl({
   status,
   pending,
diff --git a/apps/jarvis-web/src/components/Projects/WorkOverview/WorkOverviewPage.tsx b/apps/jarvis-web/src/components/Projects/WorkOverview/WorkOverviewPage.tsx
index 2963b1a..822a631 100644
--- a/apps/jarvis-web/src/components/Projects/WorkOverview/WorkOverviewPage.tsx
+++ b/apps/jarvis-web/src/components/Projects/WorkOverview/WorkOverviewPage.tsx
@@ -1,12 +1,17 @@
-import { useEffect, useState } from "react";
+import { useEffect, useMemo, useState } from "react";
 import { Link, useNavigate } from "react-router-dom";
 import { useAppStore } from "../../../store/appStore";
 import { t } from "../../../utils/i18n";
 import { newConversation } from "../../../services/conversations";
 import type { WorkOverview, WindowDays } from "../../../services/workOverview";
 import { getAutoModeStatus, type AutoModeStatus } from "../../../services/autoMode";
+import { Tabs, type TabItem } from "../../ui/Tabs";
 import { useWorkOverview } from "./useWorkOverview";
-import { HealthCenter } from "./HealthCenter";
+import {
+  HealthCenterCompact,
+  HealthCenterDetails,
+  useHealthCenterState,
+} from "./HealthCenter";
 import { ThroughputChart } from "./ThroughputChart";
 import { ProjectLeaderboard } from "./ProjectLeaderboard";
 import { UsagePanel } from "./UsagePanel";
@@ -16,6 +21,27 @@ import { SubAgentRunsRail } from "./SubAgentRunsRail";
 
 const WINDOW_OPTIONS: WindowDays[] = [7, 30, 90];
 
+type OverviewTab =
+  | "overview"
+  | "quality"
+  | "usage"
+  | "activity"
+  | "observability";
+
+const TAB_IDS: OverviewTab[] = [
+  "overview",
+  "quality",
+  "usage",
+  "activity",
+  "observability",
+];
+
+function readTabFromHash(): OverviewTab {
+  // No `window`, an empty hash, or an unknown hash → "overview".
+  const hash = typeof window === "undefined" ? "" : window.location.hash;
+  return TAB_IDS.find((id) => "#" + id === hash) ?? "overview";
+}
+
 function pct(value: number | null | undefined): string {
   return value === null || value === undefined
     ? t("workOverviewDiagnoseNoData")
@@ -98,13 +124,50 @@ function projectIdsWithRunIssues(overview: WorkOverview | null): string[] {
 
 // Top-level dashboard shown on `/projects/overview`. Owns the
 // time-window state + the data hook; child panels just render slices
-// of the response.
+// of the response. Layout is two-tier:
+//
+//   1. Always-visible header: title row, ProjectLeaderboard,
+//      HealthCenterCompact (status + KPI strip + runtime + top-3
+//      next actions).
+//   2. Tab body: Overview / Quality / Usage / Activity / Observability —
+//      synced to URL hash so deep-links + back button work.
 export function WorkOverviewPage() {
   const [windowDays, setWindowDays] = useState<WindowDays>(7);
   const state = useWorkOverview(windowDays);
   const navigate = useNavigate();
   const projectsById = useAppStore((s) => s.projectsById);
   const setComposerValue = useAppStore((s) => s.setComposerValue);
+  const [activeTab, setActiveTab] = useState<OverviewTab>(() => readTabFromHash());
+  const healthState = useHealthCenterState({
+    overview: state.overview,
+    quality: state.quality,
+    overviewUnavailable: state.overviewUnavailable,
+    qualityUnavailable: state.qualityUnavailable,
+    loading: state.loading,
+    error: state.error,
+    onRefresh: state.refetch,
+  });
+
+  // Mirror the active tab into the URL hash. replaceState (not
+  // pushState) adds no history entry, so Back leaves the page; the
+  // current history.state is passed through so it isn't wiped.
+  useEffect(() => {
+    if (typeof window === "undefined") return;
+    const current = window.location.hash.replace(/^#/, "");
+    if (current === activeTab) return;
+    window.history.replaceState(window.history.state, "", "#" + activeTab);
+  }, [activeTab]);
+
+  // Pick up hash changes that came from elsewhere (manual edit,
+  // back/forward navigation across other state changes).
+  useEffect(() => {
+    if (typeof window === "undefined") return;
+    const onHashChange = () => {
+      setActiveTab(readTabFromHash());
+    };
+    window.addEventListener("hashchange", onHashChange);
+    return () => window.removeEventListener("hashchange", onHashChange);
+  }, []);
 
   const startDiagnosis = async () => {
     const issueProjectIds = projectIdsWithRunIssues(state.overview);
@@ -157,6 +220,46 @@ export function WorkOverviewPage() {
     return () => window.removeEventListener("keydown", onKey);
   }, [state.refetch]);
 
+  const tabItems: TabItem[] = useMemo(
+    () => [
+      {
+        id: "overview",
+        label: t("workOverviewTabOverview"),
+        content: <ThroughputChart overview={state.overview} />,
+      },
+      {
+        id: "quality",
+        label: t("workOverviewTabQuality"),
+        content: <HealthCenterDetails state={healthState} />,
+      },
+      {
+        id: "usage",
+        label: t("workOverviewTabUsage"),
+        content: (
+          <div className="work-insights-grid work-overview-tab-usage-grid">
+            <div className="work-insights-cell work-insights-cell-usage">
+              <UsagePanel windowDays={windowDays} />
+            </div>
+            <div className="work-insights-cell work-insights-cell-models">
+              <ModelComparisonPanel windowDays={windowDays} />
+            </div>
+          </div>
+        ),
+      },
+      {
+        id: "activity",
+        label: t("workOverviewTabActivity"),
+        content: <SubAgentRunsRail />,
+      },
+      {
+        id: "observability",
+        label: t("workOverviewTabObservability"),
+        content: <HarnessObservabilityPanel windowDays={windowDays} />,
+      },
+    ],
+    [healthState, state.overview, windowDays],
+  );
+
   return (
     <section className="work-overview" aria-label={t("workOverviewTitle")}>
       <div className="work-overview-header">
@@ -212,44 +315,18 @@ export function WorkOverviewPage() {
         <ProjectLeaderboard overview={state.overview} />
       </div>
 
-      <div id="work-overview-operational" className="work-overview-anchor">
-        <HealthCenter
-          overview={state.overview}
-          quality={state.quality}
-          overviewUnavailable={state.overviewUnavailable}
-          qualityUnavailable={state.qualityUnavailable}
-          loading={state.loading}
-          error={state.error}
-          onRefresh={state.refetch}
-        />
-      </div>
-
-      <section className="work-insights-group" aria-label={t("workInsightsTitle")}>
-        <header className="work-insights-head">
-          <div>
-            <h3>{t("workInsightsTitle")}</h3>
-            <p>{t("workInsightsSubtitle")}</p>
-          </div>
-        </header>
-        <div className="work-insights-grid">
-          <div
-            id="work-overview-throughput"
-            className="work-insights-cell work-insights-cell-throughput"
-          >
-            <ThroughputChart overview={state.overview} />
-          </div>
-          <div className="work-insights-cell work-insights-cell-usage">
-            <UsagePanel windowDays={windowDays} />
-          </div>
-          <div className="work-insights-cell work-insights-cell-models">
-            <ModelComparisonPanel windowDays={windowDays} />
-          </div>
-        </div>
-      </section>
-
-      <SubAgentRunsRail />
+      <HealthCenterCompact
+        state={healthState}
+        onExpandSignals={() => setActiveTab("quality")}
+      />
 
-      <HarnessObservabilityPanel windowDays={windowDays} />
+      <Tabs
+        ariaLabel={t("workOverviewTabsLabel")}
+        className="work-overview-tabs"
+        value={activeTab}
+        onChange={(id) => setActiveTab(id as OverviewTab)}
+        items={tabItems}
+      />
 
       {/* Footer kept for absolute timestamp (the banner already shows
           relative time, but exact wall-clock is useful for ops
diff --git a/apps/jarvis-web/src/components/Settings/sections/MemoryIncludesPanel.tsx b/apps/jarvis-web/src/components/Settings/sections/MemoryIncludesPanel.tsx
new file mode 100644
index 0000000..973cafb
--- /dev/null
+++ b/apps/jarvis-web/src/components/Settings/sections/MemoryIncludesPanel.tsx
@@ -0,0 +1,236 @@
+// P17 — Includes management embedded inside MemorySyncSection.
+//
+// Reads /v1/memory/includes for the active scope, shows each
+// directive with resolution status, lets the operator add/remove
+// directives and refresh git+ caches. Independent from the
+// sync backend choice (includes work whether sync is git, iCloud,
+// or none).
+
+import { useCallback, useEffect, useState } from "react";
+import { apiUrl } from "../../../services/api";
+
+type Scope = "workspace" | "user"; // sent as `scope` in the includes list / add / remove requests
+
+interface IncludeItem {
+  target: string; // directive text as displayed; echoed back in refresh / remove requests
+  kind: "local_path" | "git_url"; // only "git_url" rows get a Refresh button
+  resolves: boolean; // true → `path` is rendered; false → `error` (or "unresolved")
+  path?: string;
+  error?: string;
+}
+
+interface IncludesResponse {
+  scope: string;
+  memory_md: string; // not read by this panel
+  items: IncludeItem[]; // rendered one list row per entry
+}
+
+interface Props {
+  scope: Scope; // which memory scope's include directives this panel instance manages
+}
+
+// Include-directive manager for one memory scope. Lists the directives from
+// GET /v1/memory/includes with their resolution status and lets the operator
+// add, remove, or (git_url only) refresh them. A 503 from the list endpoint
+// replaces the whole panel with a "memory tools aren't enabled" notice.
+export function MemoryIncludesPanel({ scope }: Props) {
+  const [data, setData] = useState<IncludesResponse | null>(null);
+  const [loading, setLoading] = useState(false);
+  const [error, setError] = useState<string | null>(null);
+  const [unavailable, setUnavailable] = useState(false);
+  const [actionBusy, setActionBusy] = useState(false);
+  const [actionMessage, setActionMessage] = useState<{ ok: boolean; text: string } | null>(null);
+  const [newTarget, setNewTarget] = useState("");
+
+  const refresh = useCallback(async () => {
+    setLoading(true);
+    try {
+      const r = await fetch(apiUrl(`/v1/memory/includes?scope=${scope}`));
+      if (r.status === 503) {
+        setUnavailable(true);
+        setData(null);
+        return;
+      }
+      if (!r.ok) {
+        setError(`HTTP ${r.status}`);
+        return;
+      }
+      const body = (await r.json()) as IncludesResponse;
+      setUnavailable(false);
+      setData(body);
+      setError(null);
+    } catch (e) {
+      setError(String(e));
+    } finally {
+      setLoading(false);
+    }
+  }, [scope]);
+
+  useEffect(() => {
+    void refresh();
+  }, [refresh]);
+
+  // Sends one include action as JSON, reports the outcome via `actionMessage`
+  // and reloads the list on success. Resolves to `true` only for a 2xx reply
+  // and never rejects (network errors resolve to `false`), so callers must
+  // check the result before treating the action as done.
+  const callJson = useCallback(
+    async (method: string, path: string, body: unknown): Promise<boolean> => {
+      setActionBusy(true);
+      setActionMessage(null);
+      try {
+        const r = await fetch(apiUrl(path), {
+          method,
+          headers: { "Content-Type": "application/json" },
+          body: JSON.stringify(body),
+        });
+        const text = await r.text();
+        let parsed: unknown = text;
+        try {
+          parsed = JSON.parse(text);
+        } catch {
+          // raw — leave as-is
+        }
+        const obj = (parsed ?? {}) as Record<string, unknown>;
+        if (!r.ok) {
+          const detail = (typeof obj.error === "string" && obj.error) || `HTTP ${r.status}`;
+          setActionMessage({ ok: false, text: detail });
+          return false;
+        }
+        const summary =
+          (typeof obj.added === "string" && `Added ${obj.added}`) ||
+          (typeof obj.removed === "string" && `Removed ${obj.removed}`) ||
+          (typeof obj.target === "string" && `Refreshed ${obj.target}`) ||
+          "OK";
+        setActionMessage({ ok: true, text: summary });
+        await refresh();
+        return true;
+      } catch (e) {
+        setActionMessage({ ok: false, text: String(e) });
+        return false;
+      } finally {
+        setActionBusy(false);
+      }
+    },
+    [refresh],
+  );
+
+  if (unavailable) {
+    return (
+      <div className="memory-sync-empty">
+        Memory tools aren't enabled on this server, so includes are unavailable.
+      </div>
+    );
+  }
+
+  return (
+    <div className="memory-includes">
+      <div className="memory-includes-header">
+        <span className="memory-sync-label">Includes ({scope})</span>
+        <button
+          type="button"
+          className="memory-sync-btn ghost"
+          onClick={() => void refresh()}
+          disabled={loading}
+        >
+          {loading ? "…" : "Reload"}
+        </button>
+      </div>
+
+      {error && <div className="memory-sync-error" role="alert">{error}</div>}
+
+      {data && data.items.length === 0 && (
+        <div className="memory-includes-empty">No include directives yet.</div>
+      )}
+
+      {data && data.items.length > 0 && (
+        <ul className="memory-includes-list">
+          {data.items.map((item) => (
+            <li
+              key={item.target}
+              className={`memory-includes-item ${item.resolves ? "ok" : "fail"}`}
+            >
+              <div className="memory-includes-row">
+                <span className={`memory-includes-kind kind-${item.kind}`}>
+                  {item.kind === "git_url" ? "git" : "local"}
+                </span>
+                <code className="memory-includes-target">{item.target}</code>
+                <div className="memory-includes-actions">
+                  {item.kind === "git_url" && (
+                    <button
+                      type="button"
+                      className="memory-sync-btn ghost"
+                      disabled={actionBusy}
+                      onClick={() =>
+                        void callJson("POST", "/v1/memory/includes/refresh", {
+                          target: item.target,
+                        })
+                      }
+                      title="Re-clone the cached git copy"
+                    >
+                      Refresh
+                    </button>
+                  )}
+                  <button
+                    type="button"
+                    className="memory-sync-btn ghost"
+                    disabled={actionBusy}
+                    onClick={() =>
+                      void callJson("DELETE", "/v1/memory/includes", {
+                        target: item.target,
+                        scope,
+                      })
+                    }
+                    title="Remove this directive from MEMORY.md"
+                  >
+                    Remove
+                  </button>
+                </div>
+              </div>
+              {item.resolves ? (
+                <div className="memory-includes-detail">
+                  resolved → <code>{item.path}</code>
+                </div>
+              ) : (
+                <div className="memory-includes-detail memory-includes-err">
+                  {item.error || "unresolved"}
+                </div>
+              )}
+            </li>
+          ))}
+        </ul>
+      )}
+
+      <div className="memory-includes-add">
+        <input
+          type="text"
+          className="memory-sync-input"
+          placeholder="/abs/path/memory or git+https://host/r.git[#branch]"
+          value={newTarget}
+          onChange={(e) => setNewTarget(e.target.value)}
+          disabled={actionBusy}
+        />
+        <button
+          type="button"
+          className="memory-sync-btn"
+          disabled={actionBusy || !newTarget.trim()}
+          onClick={() =>
+            // Keep the typed target when the request fails so it can be fixed and retried.
+            void callJson("POST", "/v1/memory/includes", {
+              target: newTarget.trim(),
+              scope,
+            }).then((ok) => ok && setNewTarget(""))
+          }
+        >
+          {actionBusy ? "Adding…" : "Add include"}
+        </button>
+      </div>
+
+      {actionMessage && (
+        <div className={`memory-sync-result ${actionMessage.ok ? "ok" : "fail"}`} role="status">
+          {actionMessage.text}
+        </div>
+      )}
+    </div>
+  );
+}
diff --git a/apps/jarvis-web/src/components/Settings/sections/MemorySyncSection.tsx b/apps/jarvis-web/src/components/Settings/sections/MemorySyncSection.tsx
new file mode 100644
index 0000000..57c331c
--- /dev/null
+++ b/apps/jarvis-web/src/components/Settings/sections/MemorySyncSection.tsx
@@ -0,0 +1,354 @@
+// P14 — Settings → System → Memory Sync.
+//
+// One panel covering all three backend modes:
+// - `none`: shows "memory sync is off" with how-to-enable hint
+// - `git`: status (branch / remote / dirty), "Sync now" + setup form
+// - `icloud`: shows iCloud Drive path, setup button
+//
+// Talks to /v1/memory/sync_status (read) and /v1/memory/{sync,
+// sync_setup, sync_setup_icloud} (write). A 503 from the status
+// read means memory is disabled: the operator sees a clean
+// off-state instead of a broken page.
+
+import { useCallback, useEffect, useState } from "react";
+import { apiUrl } from "../../../services/api";
+import { Section } from "./Section";
+import { MemoryIncludesPanel } from "./MemoryIncludesPanel";
+
+interface SyncStatus {
+  backend: "none" | "git" | "icloud";
+  user_root: string | null; // null renders as "(unconfigured)" and hides the user includes panel
+  workspace_root: string | null; // null renders as "(unconfigured)"
+  user_scope?: GitUserScope | { error: string } | { raw: string }; // read only when backend is "git"
+}
+
+interface GitUserScope {
+  scope: string;
+  dir: string;
+  is_git_repo: boolean; // false → GitDetails shows the remote setup form instead of repo status
+  branch?: string;
+  remote_url?: string | null;
+  dirty?: boolean;
+  status?: string; // shown under a collapsible "git status" when non-blank
+  head?: string; // only the first 12 characters are displayed
+  setup_hint?: string; // shown under "Setup hint" on the setup form
+  hint?: string;
+}
+
+interface ActionResult {
+  ok: boolean; // selects the "ok" / "fail" styling of the result line
+  message: string;
+  raw?: unknown; // parsed (or raw-text) response body; kept in state but not rendered
+}
+
+interface Props {
+  embedded?: boolean; // true → render the bare pane without the <Section> wrapper
+}
+
+// Settings pane for memory sync. Loads /v1/memory/sync_status on mount,
+// renders the backend-specific controls (git / iCloud / none) and embeds the
+// include panels. `embedded` drops the <Section> wrapper for tabbed layouts.
+export function MemorySyncSection({ embedded }: Props = {}) {
+  const [status, setStatus] = useState<SyncStatus | null>(null);
+  const [loading, setLoading] = useState(false);
+  const [unavailable, setUnavailable] = useState(false);
+  const [error, setError] = useState<string | null>(null);
+  const [actionBusy, setActionBusy] = useState(false);
+  const [actionResult, setActionResult] = useState<ActionResult | null>(null);
+  const [remoteUrl, setRemoteUrl] = useState("");
+
+  const fetchStatus = useCallback(async () => {
+    setLoading(true);
+    try {
+      const r = await fetch(apiUrl("/v1/memory/sync_status"));
+      if (r.status === 503) {
+        setUnavailable(true);
+        setStatus(null);
+        setError(null); // drop any older failure so only the off-state notice shows
+        return;
+      }
+      if (!r.ok) {
+        setError(`HTTP ${r.status}`);
+        return;
+      }
+      const body = (await r.json()) as SyncStatus;
+      setUnavailable(false);
+      setStatus(body);
+      setError(null);
+    } catch (e) {
+      setError(String(e));
+    } finally {
+      setLoading(false);
+    }
+  }, []);
+
+  useEffect(() => {
+    void fetchStatus();
+  }, [fetchStatus]);
+
+  const doAction = useCallback(
+    async (path: string, body?: unknown): Promise<void> => {
+      setActionBusy(true);
+      setActionResult(null);
+      try {
+        const r = await fetch(apiUrl(path), {
+          method: "POST",
+          headers: body ? { "Content-Type": "application/json" } : {},
+          body: body ? JSON.stringify(body) : undefined,
+        });
+        const text = await r.text();
+        let parsed: unknown = text;
+        try {
+          parsed = JSON.parse(text);
+        } catch {
+          // raw text — keep as-is
+        }
+        if (!r.ok) {
+          const failure = extractError(parsed) || `HTTP ${r.status}`;
+          setActionResult({ ok: false, message: failure, raw: parsed });
+          return;
+        }
+        const message = extractMessage(parsed) || "ok";
+        // A 2xx reply can still report `push.ok === false`; don't style that as success.
+        const push = (parsed as { push?: { ok?: unknown } } | null)?.push;
+        setActionResult({ ok: push?.ok !== false, message, raw: parsed });
+        await fetchStatus();
+      } catch (e) {
+        setActionResult({ ok: false, message: String(e) });
+      } finally {
+        setActionBusy(false);
+      }
+    },
+    [fetchStatus],
+  );
+
+  // `user_scope` is a union: git details, or an `{ error }` / `{ raw }` payload.
+  // Narrow it here so the latter is shown as an error instead of being cast
+  // to GitUserScope and rendered as "not a git repo yet".
+  let gitScope: GitUserScope | null = null;
+  let gitScopeError: string | null = null;
+  const userScope = status?.user_scope;
+  if (userScope && "is_git_repo" in userScope) gitScope = userScope;
+  else if (userScope) gitScopeError = "error" in userScope ? userScope.error : userScope.raw;
+
+  const content = (
+    <>
+      {unavailable && (
+        <div className="memory-sync-empty">
+          Memory tools aren't enabled on this server. Set{" "}
+          <code>JARVIS_ENABLE_MEMORY=1</code> (or{" "}
+          <code>[agent].enable_memory = true</code> in config) and restart.
+        </div>
+      )}
+      {error && <div className="memory-sync-error" role="alert">Failed to load status: {error}</div>}
+      {!unavailable && status && (
+        <>
+          <div className="memory-sync-row">
+            <span className="memory-sync-label">Backend</span>
+            <BackendBadge backend={status.backend} />
+          </div>
+          <div className="memory-sync-row">
+            <span className="memory-sync-label">User root</span>
+            <code>{status.user_root ?? "(unconfigured)"}</code>
+          </div>
+          <div className="memory-sync-row">
+            <span className="memory-sync-label">Workspace root</span>
+            <code>{status.workspace_root ?? "(unconfigured)"}</code>
+          </div>
+
+          {status.backend === "git" && gitScope && (
+            <GitDetails
+              scope={gitScope}
+              busy={actionBusy}
+              remoteUrl={remoteUrl}
+              onRemoteUrlChange={setRemoteUrl}
+              onSync={() => doAction("/v1/memory/sync")}
+              onSetup={() => doAction("/v1/memory/sync_setup", { remote_url: remoteUrl, force: false })}
+            />
+          )}
+          {status.backend === "git" && gitScopeError !== null && (
+            <div className="memory-sync-error" role="alert">{gitScopeError}</div>
+          )}
+
+          {status.backend === "icloud" && (
+            <div className="memory-sync-icloud">
+              <p>
+                iCloud Drive syncs at the OS level — no manual push/pull needed.
+                Use the button below to create the <code>Jarvis</code> folder
+                inside iCloud Drive if it doesn't exist yet.
+              </p>
+              <button
+                type="button"
+                className="memory-sync-btn"
+                disabled={actionBusy}
+                onClick={() => doAction("/v1/memory/sync_setup_icloud")}
+              >
+                {actionBusy ? "Setting up…" : "Set up iCloud folder"}
+              </button>
+            </div>
+          )}
+
+          {status.backend === "none" && (
+            <div className="memory-sync-off">
+              Sync backend is set to <strong>none</strong>. Memory tools work
+              locally but nothing leaves this machine.
+              <br />
+              Set <code>JARVIS_MEMORY_SYNC_BACKEND=git</code> (or{" "}
+              <code>=icloud</code> on macOS) and restart to enable.
+            </div>
+          )}
+
+          {actionResult && (
+            <div className={`memory-sync-result ${actionResult.ok ? "ok" : "fail"}`} role="status">
+              {actionResult.message}
+            </div>
+          )}
+          <div className="memory-sync-footer">
+            <button
+              type="button"
+              className="memory-sync-btn ghost"
+              disabled={loading}
+              onClick={() => void fetchStatus()}
+            >
+              {loading ? "Refreshing…" : "Refresh"}
+            </button>
+          </div>
+
+          {/* P17 — include directives, independent of the sync
+              backend. Workspace + user shown side-by-side; the
+              user one only renders when user_root is configured. */}
+          <div className="memory-includes-wrap">
+            <MemoryIncludesPanel scope="workspace" />
+            {status.user_root && <MemoryIncludesPanel scope="user" />}
+          </div>
+        </>
+      )}
+    </>
+  );
+
+  if (embedded) return <div className="memory-sync-pane">{content}</div>;
+  return (
+    <Section
+      id="memory-sync"
+      titleKey="settingsMemorySyncTitle"
+      titleFallback="Memory Sync"
+      descKey="settingsMemorySyncDesc"
+      descFallback="Configure where agent-maintained memory is stored and how it syncs across machines."
+    >
+      <div className="memory-sync-pane">{content}</div>
+    </Section>
+  );
+}
+
+interface GitDetailsProps {
+  scope: GitUserScope;
+  busy: boolean; // disables the input and buttons while an action is in flight
+  remoteUrl: string;
+  onRemoteUrlChange: (v: string) => void;
+  onSync: () => void; // "Sync now" click (dir is already a git repo)
+  onSetup: () => void; // "Set up & push" click (dir is not a git repo yet)
+}
+
+// Git-backend detail pane. While the memory dir is not a git repo it renders
+// the remote-URL setup form; otherwise it shows branch / remote / HEAD /
+// dirty state plus a "Sync now" button. Missing branch, HEAD and dirty
+// values are shown as "—" rather than guessed.
+function GitDetails(props: GitDetailsProps) {
+  const { scope, busy, remoteUrl, onRemoteUrlChange, onSync, onSetup } = props;
+  // `dirty` is optional: a missing value is unknown, which must not read as "no".
+  const dirtyLabel = typeof scope.dirty === "boolean" ? (scope.dirty ? "yes" : "no") : "—";
+  if (!scope.is_git_repo) {
+    return (
+      <div className="memory-sync-setup">
+        <p>Memory dir is not a git repo yet. Connect it to a remote:</p>
+        <div className="memory-sync-form">
+          <input
+            type="text"
+            placeholder="git@github.com:me/jarvis-memory.git"
+            value={remoteUrl}
+            onChange={(e) => onRemoteUrlChange(e.target.value)}
+            disabled={busy}
+            className="memory-sync-input"
+          />
+          <button
+            type="button"
+            className="memory-sync-btn"
+            onClick={onSetup}
+            disabled={busy || !remoteUrl.trim()}
+          >
+            {busy ? "Setting up…" : "Set up & push"}
+          </button>
+        </div>
+        <details>
+          <summary>Setup hint</summary>
+          <pre>{scope.setup_hint ?? "—"}</pre>
+        </details>
+      </div>
+    );
+  }
+  return (
+    <div className="memory-sync-git">
+      <div className="memory-sync-row">
+        <span className="memory-sync-label">Branch</span>
+        <code>{scope.branch ?? "—"}</code>
+      </div>
+      <div className="memory-sync-row">
+        <span className="memory-sync-label">Remote</span>
+        <code>{scope.remote_url ?? "(none — set one with git remote add origin)"}</code>
+      </div>
+      <div className="memory-sync-row">
+        <span className="memory-sync-label">HEAD</span>
+        <code>{scope.head?.slice(0, 12) ?? "—"}</code>
+      </div>
+      <div className="memory-sync-row">
+        <span className="memory-sync-label">Dirty</span>
+        <code>{dirtyLabel}</code>
+      </div>
+      {scope.status && scope.status.trim() && (
+        <details>
+          <summary>git status</summary>
+          <pre>{scope.status}</pre>
+        </details>
+      )}
+      <button
+        type="button"
+        className="memory-sync-btn"
+        onClick={onSync}
+        disabled={busy}
+      >
+        {busy ? "Syncing…" : "Sync now"}
+      </button>
+    </div>
+  );
+}
+
+function BackendBadge(props: { backend: SyncStatus["backend"] }) { // labelled pill for the active backend
+  const caption = props.backend === "git" ? "Git" : props.backend === "icloud" ? "iCloud" : "None";
+  return <span className={`memory-sync-badge backend-${props.backend}`}>{caption}</span>;
+}
+
+// Picks a human-readable line out of a successful action reply. Precedence:
+// raw string body → `message` → `hint` → push outcome → `path`. Returns null
+// when nothing matches so the caller can fall back to its own default.
+function extractMessage(parsed: unknown): string | null {
+  if (typeof parsed === "string") return parsed;
+  if (!parsed || typeof parsed !== "object") return null;
+  const { message, hint, push, path } = parsed as Record<string, unknown>;
+  if (typeof message === "string") return message;
+  if (typeof hint === "string") return hint;
+  if (push && typeof push === "object") {
+    const { ok, stderr } = push as Record<string, unknown>;
+    if (ok === true) return "Synced successfully.";
+    // stderr is cut to its first 240 characters.
+    if (ok === false && typeof stderr === "string") return `Push failed: ${stderr.slice(0, 240)}`;
+  }
+  return typeof path === "string" ? `Set up at ${path}` : null;
+}
+
+// Returns the string `error` field of a parsed JSON object body, or null when absent.
+function extractError(parsed: unknown): string | null {
+  if (!parsed || typeof parsed !== "object") return null;
+  // A non-string `error` value is treated the same as a missing field.
+  const { error } = parsed as Record<string, unknown>;
+  return typeof error === "string" ? error : null;
+}
diff --git a/apps/jarvis-web/src/components/Settings/sections/SystemSection.tsx b/apps/jarvis-web/src/components/Settings/sections/SystemSection.tsx
index 98e4a7d..50189fa 100644
--- a/apps/jarvis-web/src/components/Settings/sections/SystemSection.tsx
+++ b/apps/jarvis-web/src/components/Settings/sections/SystemSection.tsx
@@ -9,6 +9,7 @@ import { WorkspaceSection } from "./WorkspaceSection";
 import { ServerSection } from "./ServerSection";
 import { ApiSection } from "./ApiSection";
 import { DiagnosticsSection } from "./DiagnosticsSection";
+import { MemorySyncSection } from "./MemorySyncSection";
 import { AboutSection } from "./AboutSection";
 import { t } from "../../../utils/i18n";
 
@@ -17,7 +18,7 @@ function tx(key: string, fallback: string): string {
   return v === key ? fallback : v;
 }
 
-export const SYSTEM_TABS = ["workspace", "server", "api", "diagnostics", "about"] as const;
+export const SYSTEM_TABS = ["workspace", "server", "api", "memory", "diagnostics", "about"] as const;
 export type SystemTab = (typeof SYSTEM_TABS)[number];
 export const DEFAULT_SYSTEM_TAB: SystemTab = "workspace";
 
@@ -43,6 +44,11 @@ export function SystemSection({ tab, onTabChange }: Props = {}) {
       label: tx("settingsTabApi", "Connection"),
       content: <ApiSection embedded />,
     },
+    {
+      id: "memory",
+      label: tx("settingsTabMemorySync", "Memory Sync"),
+      content: <MemorySyncSection embedded />,
+    },
     {
       id: "diagnostics",
       label: tx("settingsTabDiagnostics", "Diagnostics"),
diff --git a/apps/jarvis-web/src/components/Workspace/TodosRail.tsx b/apps/jarvis-web/src/components/Workspace/TodosRail.tsx
index 6cc04d0..3ca43b4 100644
--- a/apps/jarvis-web/src/components/Workspace/TodosRail.tsx
+++ b/apps/jarvis-web/src/components/Workspace/TodosRail.tsx
@@ -14,7 +14,7 @@
 // Two named exports follow the rail's convention:
 // `TodosCountSpan` for the header, `TodosList` for the body.
 
-import { useEffect, useState } from "react";
+import { useEffect, useMemo, useRef, useState } from "react";
 import { useAppStore } from "../../store/appStore";
 import type { TodoItem } from "../../store/appStore";
 import {
@@ -22,6 +22,7 @@ import {
   deleteTodo,
   listTodos,
   updateTodo,
+  type TodoPriority,
   type TodoStatus,
 } from "../../services/todos";
 import { t } from "../../utils/i18n";
@@ -46,6 +47,9 @@ function statusLabel(status: TodoStatus): string {
   return tx(key, fallback);
 }
 
+const ALL_STATUSES: TodoStatus[] = ["pending", "in_progress", "completed", "cancelled", "blocked"];
+const ALL_PRIORITIES: (TodoPriority | "")[] = ["", "low", "medium", "high"];
+
 export function TodosCountSpan() {
   const todos = useAppStore((s) => s.todos);
   return <span id="todos-count">{String(todos.length)}</span>;
@@ -57,6 +61,15 @@ export function TodosList() {
   const [draft, setDraft] = useState("");
   const [unavailable, setUnavailable] = useState(false);
   const [busy, setBusy] = useState(false);
+  const [loading, setLoading] = useState(true);
+
+  // Filters
+  const [filterStatus, setFilterStatus] = useState<TodoStatus | "">("");
+  const [filterPriority, setFilterPriority] = useState<TodoPriority | "">("");
+
+  // Batch selection
+  const [selectedIds, setSelectedIds] = useState<Set<string>>(new Set());
+  const batchBarRef = useRef<HTMLDivElement>(null);
 
   // Hydrate on mount. The server is the source of truth; live frames
   // keep us current after this initial fetch.
@@ -64,6 +77,7 @@ export function TodosList() {
     let cancelled = false;
     void listTodos().then((res) => {
       if (cancelled) return;
+      setLoading(false);
       if (res === null) {
         setUnavailable(true);
         return;
@@ -76,6 +90,14 @@ export function TodosList() {
     };
   }, [setTodos]);
 
+  const filtered = useMemo(() => {
+    return todos.filter((t) => {
+      if (filterStatus && t.status !== filterStatus) return false;
+      if (filterPriority && t.priority !== filterPriority) return false;
+      return true;
+    });
+  }, [todos, filterStatus, filterPriority]);
+
   const onAdd = async () => {
     const title = draft.trim();
     if (!title || busy) return;
@@ -90,6 +112,61 @@ export function TodosList() {
     }
   };
 
+  const toggleSelect = (id: string) => {
+    setSelectedIds((prev) => {
+      const next = new Set(prev);
+      if (next.has(id)) next.delete(id);
+      else next.add(id);
+      return next;
+    });
+  };
+
+  const selectAllVisible = () => {
+    setSelectedIds(new Set(filtered.map((t) => t.id)));
+  };
+
+  const clearSelection = () => setSelectedIds(new Set());
+
+  const batchDelete = async () => {
+    if (!selectedIds.size) return;
+    const msg = tx("todosBatchDeleteConfirm", `Delete ${selectedIds.size} selected TODOs?`);
+    if (!confirm(msg)) return;
+    const ids = Array.from(selectedIds);
+    setSelectedIds(new Set());
+    await Promise.all(
+      ids.map(async (id) => {
+        const ok = await deleteTodo(id);
+        if (ok) useAppStore.getState().removeTodo(id);
+      }),
+    );
+  };
+
+  const batchSetStatus = async (status: TodoStatus) => {
+    if (!selectedIds.size) return;
+    const ids = Array.from(selectedIds);
+    setSelectedIds(new Set());
+    await Promise.all(
+      ids.map(async (id) => {
+        const updated = await updateTodo(id, { status });
+        if (updated) useAppStore.getState().upsertTodo(updated);
+      }),
+    );
+  };
+
+  const batchSetPriority = async (priority: TodoPriority | "") => {
+    if (!selectedIds.size) return;
+    const ids = Array.from(selectedIds);
+    setSelectedIds(new Set());
+    await Promise.all(
+      ids.map(async (id) => {
+        const updated = await updateTodo(id, { priority: priority || "" });
+        if (updated) useAppStore.getState().upsertTodo(updated);
+      }),
+    );
+  };
+
+  const hasSelection = selectedIds.size > 0;
+
   if (unavailable) {
     return (
       <div className="rail-empty">
@@ -104,6 +181,20 @@ export function TodosList() {
     );
   }
 
+  if (loading) {
+    return (
+      <div className="todos-panel">
+        <div className="todos-skeleton-form" />
+        <div className="todos-skeleton-filters" />
+        <div className="todos-skeleton-list">
+          {Array.from({ length: 5 }).map((_, i) => (
+            <div key={i} className="todo-skeleton-row" />
+          ))}
+        </div>
+      </div>
+    );
+  }
+
   return (
     <div className="todos-panel">
       <form
@@ -128,33 +219,189 @@ export function TodosList() {
           {tx("todosAdd", "Add")}
         </button>
       </form>
-      {todos.length === 0 ? (
-        <div className="rail-empty">
-          <span>
-            {tx(
-              "todosEmpty",
-              "No TODOs yet. Add one above or let the agent surface follow-ups via todo.add.",
-            )}
-          </span>
+
+      {/* Filters */}
+      {todos.length > 0 && (
+        <div className="todos-filters">
+          <div className="todos-filter-group">
+            {ALL_STATUSES.map((s) => (
+              <button
+                key={s}
+                type="button"
+                className={`todos-filter-chip ${filterStatus === s ? "is-active" : ""} status-${s}`}
+                onClick={() => setFilterStatus((prev) => (prev === s ? "" : s))}
+                aria-pressed={filterStatus === s}
+              >
+                {statusLabel(s)}
+              </button>
+            ))}
+          </div>
+          <select
+            className="todos-filter-select"
+            value={filterPriority}
+            onChange={(e) => setFilterPriority(e.target.value as TodoPriority | "")}
+            aria-label={tx("todosFilterPriorityAria", "Filter by priority")}
+          >
+            <option value="">{tx("todosFilterAllPriorities", "All priorities")}</option>
+            <option value="low">{tx("todosPriorityLow", "Low")}</option>
+            <option value="medium">{tx("todosPriorityMedium", "Medium")}</option>
+            <option value="high">{tx("todosPriorityHigh", "High")}</option>
+          </select>
+          {(filterStatus || filterPriority) && (
+            <button
+              type="button"
+              className="todos-filter-clear"
+              onClick={() => {
+                setFilterStatus("");
+                setFilterPriority("");
+              }}
+            >
+              {tx("todosFilterClear", "Clear")}
+            </button>
+          )}
+        </div>
+      )}
+
+      {filtered.length === 0 ? (
+        <div className="rail-empty todos-empty">
+          {todos.length === 0 ? (
+            <>
+              <div className="todos-empty-icon" aria-hidden="true">
+                <svg width="32" height="32" viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="1.5" strokeLinecap="round" strokeLinejoin="round">
+                  <path d="M12 20h9" />
+                  <path d="M16.5 3.5a2.121 2.121 0 0 1 3 3L7 19l-4 1 1-4L16.5 3.5z" />
+                </svg>
+              </div>
+              <strong>{tx("todosEmptyTitle", "No TODOs yet")}</strong>
+              <span>
+                {tx(
+                  "todosEmpty",
+                  "Add one above or let the agent surface follow-ups via todo.add.",
+                )}
+              </span>
+            </>
+          ) : (
+            <>
+              <strong>{tx("todosNoMatches", "No matching TODOs")}</strong>
+              <span>{tx("todosNoMatchesHint", "Try adjusting your filters.")}</span>
+            </>
+          )}
         </div>
       ) : (
-        <ol className="todos-list" aria-label={tx("todosListAria", "Project TODOs")}>
-          {todos.map((item) => (
-            <TodoRow key={item.id} item={item} />
-          ))}
-        </ol>
+        <>
+          <ol className="todos-list" aria-label={tx("todosListAria", "Project TODOs")}>
+            {filtered.map((item) => (
+              <TodoRow
+                key={item.id}
+                item={item}
+                selected={selectedIds.has(item.id)}
+                onToggleSelect={() => toggleSelect(item.id)}
+                anySelected={hasSelection}
+              />
+            ))}
+          </ol>
+
+          {/* Batch action bar */}
+          {hasSelection && (
+            <div ref={batchBarRef} className="todos-batch-bar">
+              <div className="todos-batch-info">
+                <button type="button" className="todos-batch-check" onClick={selectAllVisible}>
+                  {tx("todosSelectAll", "Select all")}
+                </button>
+                <button type="button" className="todos-batch-check" onClick={clearSelection}>
+                  {tx("todosClearSelection", "Clear")}
+                </button>
+                <span className="todos-batch-count">
+                  {selectedIds.size} {tx("todosSelected", "selected")}
+                </span>
+              </div>
+              <div className="todos-batch-actions">
+                <span className="todos-batch-label">{tx("todosBatchMark", "Mark")}</span>
+                {ALL_STATUSES.map((s) => (
+                  <button
+                    key={s}
+                    type="button"
+                    className={`todos-batch-btn status-${s}`}
+                    onClick={() => void batchSetStatus(s)}
+                  >
+                    {statusLabel(s)}
+                  </button>
+                ))}
+                <span className="todos-batch-divider" />
+                {(["low", "medium", "high"] as TodoPriority[]).map((p) => (
+                  <button
+                    key={p}
+                    type="button"
+                    className={`todos-batch-btn priority-${p}`}
+                    onClick={() => void batchSetPriority(p)}
+                  >
+                    <PriorityIcon priority={p} />
+                    {tx(`todosPriority${p.charAt(0).toUpperCase() + p.slice(1)}`, p)}
+                  </button>
+                ))}
+                <button
+                  type="button"
+                  className="todos-batch-btn priority-clear"
+                  onClick={() => void batchSetPriority("")}
+                >
+                  {tx("todosPriorityClear", "—")}
+                </button>
+                <span className="todos-batch-divider" />
+                <button
+                  type="button"
+                  className="todos-batch-btn batch-delete"
+                  onClick={() => void batchDelete()}
+                >
+                  {tx("todosDeleteSelected", "Delete")}
+                </button>
+              </div>
+            </div>
+          )}
+        </>
       )}
     </div>
   );
 }
 
-function TodoRow({ item }: { item: TodoItem }) {
+function TodoRow({
+  item,
+  selected,
+  onToggleSelect,
+  anySelected,
+}: {
+  item: TodoItem;
+  selected: boolean;
+  onToggleSelect: () => void;
+  anySelected: boolean;
+}) {
   const status = item.status;
-  const onCycle = async () => {
-    const next = nextStatus(status);
-    const updated = await updateTodo(item.id, { status: next });
+  const [menuOpen, setMenuOpen] = useState(false);
+  const menuRef = useRef<HTMLDivElement>(null);
+
+  // Close menu on outside click
+  useEffect(() => {
+    if (!menuOpen) return;
+    const onDocClick = (e: MouseEvent) => {
+      if (!menuRef.current?.contains(e.target as Node)) {
+        setMenuOpen(false);
+      }
+    };
+    document.addEventListener("mousedown", onDocClick);
+    return () => document.removeEventListener("mousedown", onDocClick);
+  }, [menuOpen]);
+
+  const onSetStatus = async (s: TodoStatus) => {
+    setMenuOpen(false);
+    const updated = await updateTodo(item.id, { status: s });
     if (updated) useAppStore.getState().upsertTodo(updated);
   };
+
+  const onSetPriority = async (p: TodoPriority | "") => {
+    setMenuOpen(false);
+    const updated = await updateTodo(item.id, { priority: p || "" });
+    if (updated) useAppStore.getState().upsertTodo(updated);
+  };
+
   const onDelete = async () => {
     const tmpl = tx("todosDeleteConfirm", "Delete TODO {title}?");
     const msg = tmpl.includes("{title}") ? tmpl.replace("{title}", item.title) : `${tmpl} (${item.title})`;
@@ -162,29 +409,65 @@ function TodoRow({ item }: { item: TodoItem }) {
     const ok = await deleteTodo(item.id);
     if (ok) useAppStore.getState().removeTodo(item.id);
   };
+
   return (
-    <li className={`todo-item todo-item-${status}`}>
+    <li className={`todo-item todo-item-${status} ${selected ? "is-selected" : ""}`}>
+      {/* Batch checkbox */}
+      <label className={`todo-check ${anySelected ? "is-visible" : ""}`}>
+        <input
+          type="checkbox"
+          checked={selected}
+          onChange={onToggleSelect}
+          aria-label={tx("todosSelectAria", "Select TODO")}
+        />
+        <span className="todo-check-box" aria-hidden="true">
+          {selected && (
+            <svg width="10" height="10" viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="3" strokeLinecap="round" strokeLinejoin="round">
+              <path d="m5 12 4 4 10-10" />
+            </svg>
+          )}
+        </span>
+      </label>
+
       <button
         type="button"
         className="todo-status-button"
-        onClick={() => void onCycle()}
+        onClick={() => void onSetStatus(nextStatus(status))}
+        onContextMenu={(e) => {
+          e.preventDefault();
+          setMenuOpen(true);
+        }}
         aria-label={tx("todosCycleStatusAria", "Cycle status")}
-        title={tx("todosCycleStatus", "Cycle status")}
+        title={tx("todosCycleStatus", "Cycle status (right-click for menu)")}
       >
         <StatusIcon status={status} />
       </button>
+
       <div className="todo-item-body">
         <div className="todo-item-title">
-          <span>{item.title}</span>
+          <span className={status === "completed" || status === "cancelled" ? "is-struck" : ""}>
+            {item.title}
+          </span>
           {item.priority ? (
-            <span className={`todo-priority todo-priority-${item.priority}`}>
+            <span className={`todo-priority todo-priority-${item.priority}`} title={tx(`todosPriority${item.priority.charAt(0).toUpperCase() + item.priority.slice(1)}`, item.priority)}>
+              <PriorityIcon priority={item.priority} />
               {item.priority}
             </span>
           ) : null}
         </div>
         {item.notes ? <div className="todo-item-note">{item.notes}</div> : null}
       </div>
-      <span className="todo-status-label">{statusLabel(status)}</span>
+
+      <button
+        type="button"
+        className={`todo-status-label status-${status}`}
+        onClick={() => setMenuOpen((o) => !o)}
+        aria-haspopup="menu"
+        aria-expanded={menuOpen}
+      >
+        {statusLabel(status)}
+      </button>
+
       <button
         type="button"
         className="ghost-icon todo-delete"
@@ -207,6 +490,44 @@ function TodoRow({ item }: { item: TodoItem }) {
           <path d="m6 6 12 12" />
         </svg>
       </button>
+
+      {/* Quick-status dropdown */}
+      {menuOpen && (
+        <div ref={menuRef} className="todo-quick-menu">
+          <div className="todo-quick-menu-section">
+            <span className="todo-quick-menu-heading">{tx("todosQuickStatus", "Status")}</span>
+            <div className="todo-quick-menu-grid">
+              {ALL_STATUSES.map((s) => (
+                <button
+                  key={s}
+                  type="button"
+                  className={`todo-quick-menu-chip status-${s} ${s === status ? "is-active" : ""}`}
+                  onClick={() => void onSetStatus(s)}
+                >
+                  <StatusIcon status={s} />
+                  {statusLabel(s)}
+                </button>
+              ))}
+            </div>
+          </div>
+          <div className="todo-quick-menu-section">
+            <span className="todo-quick-menu-heading">{tx("todosQuickPriority", "Priority")}</span>
+            <div className="todo-quick-menu-grid">
+              {(["", "low", "medium", "high"] as const).map((p) => (
+                <button
+                  key={p || "none"}
+                  type="button"
+                  className={`todo-quick-menu-chip priority-${p || "none"} ${item.priority === p || (!item.priority && !p) ? "is-active" : ""}`}
+                  onClick={() => void onSetPriority(p)}
+                >
+                  {p ? <PriorityIcon priority={p} /> : <span className="priority-none-dot" />}
+                  {p ? tx(`todosPriority${p.charAt(0).toUpperCase() + p.slice(1)}`, p) : tx("todosPriorityNone", "None")}
+                </button>
+              ))}
+            </div>
+          </div>
+        </div>
+      )}
     </li>
   );
 }
@@ -276,3 +597,39 @@ function StatusIcon({ status }: { status: TodoStatus }) {
       );
   }
 }
+
+function PriorityIcon({ priority }: { priority: TodoPriority }) { // renders a 12x12 arrow glyph for a TODO priority
+  const common = { // SVG attributes shared by all three arrows
+    width: 12,
+    height: 12,
+    viewBox: "0 0 24 24",
+    fill: "none",
+    stroke: "currentColor", // inherits the surrounding text color
+    strokeWidth: 2.2,
+    strokeLinecap: "round" as const,
+    strokeLinejoin: "round" as const,
+  };
+  switch (priority) { // no default branch — presumably these three cases cover TodoPriority (TODO confirm)
+    case "high": // upward-pointing arrow
+      return (
+        <svg {...common}>
+          <path d="M12 19V5" />
+          <path d="m5 12 7-7 7 7" />
+        </svg>
+      );
+    case "medium": // rightward-pointing arrow
+      return (
+        <svg {...common}>
+          <path d="M5 12h14" />
+          <path d="m12 5 7 7-7 7" />
+        </svg>
+      );
+    case "low": // downward-pointing arrow
+      return (
+        <svg {...common}>
+          <path d="M12 5v14" />
+          <path d="m5 12 7 7 7-7" />
+        </svg>
+      );
+  }
+}
diff --git a/apps/jarvis-web/src/services/channels.ts b/apps/jarvis-web/src/services/channels.ts
index 2ac14db..4835549 100644
--- a/apps/jarvis-web/src/services/channels.ts
+++ b/apps/jarvis-web/src/services/channels.ts
@@ -3,21 +3,19 @@
 // Wraps `/v1/channels*`. Mirrors the conventions used by
 // `services/conversations.ts` etc. — fetch, surface 503 as null,
 // throw on other non-2xx so the UI surfaces actionable errors.
+//
+// `ChannelInstance` + `ChannelInstanceStatus` are re-exported from
+// the auto-generated bindings (`src/types/generated/`) — they're
+// the canonical wire-shape source of truth, regenerated by
+// `cargo test -p harness-channel`. Local aliases keep the legacy
+// import sites stable.
 
 import { apiUrl } from "./api";
+import type { ChannelInstance as GeneratedChannelInstance } from "../types/generated/ChannelInstance";
+import type { ChannelInstanceStatus } from "../types/generated/ChannelInstanceStatus";
 
-export type ChannelStatus = "enabled" | "disabled" | "unconfigured";
-
-export interface ChannelInstance {
-  id: string;
-  kind: string;
-  display_name: string;
-  status: ChannelStatus;
-  /** Kind-specific config blob. May contain `${env:NAME}` templates. */
-  config: Record<string, unknown>;
-  created_at: string;
-  updated_at: string;
-}
+export type ChannelStatus = ChannelInstanceStatus;
+export type ChannelInstance = GeneratedChannelInstance;
 
 /** Catalogue entry returned by `GET /v1/channels/kinds`. Drives the
  *  "Add channel" picker and the per-kind config form. */
diff --git a/apps/jarvis-web/src/services/frames/approvalFrames.ts b/apps/jarvis-web/src/services/frames/approvalFrames.ts
index d68fcf9..c12e3e3 100644
--- a/apps/jarvis-web/src/services/frames/approvalFrames.ts
+++ b/apps/jarvis-web/src/services/frames/approvalFrames.ts
@@ -28,9 +28,29 @@ export const approvalFrameHandlers: Record<string, (ev: any) => void> = {
   },
   permission_mode: (ev) => {
     appStore.getState().setPermissionMode(ev.mode ?? "ask");
+    // M2.3 UX: when the model itself switched the mode (via the
+    // `enter_plan_mode` tool), surface a transient toast so the
+    // operator isn't silently surprised on the next turn. The store
+    // records every `via`; the toast skips operator ("user") changes.
+    if (typeof ev?.via === "string") {
+      appStore.getState().setRecentModeChange?.({
+        mode: ev.mode ?? "ask",
+        via: ev.via,
+        at: Date.now(),
+      });
+    }
   },
   permission_rules_changed: () => {
     // Trigger any subscribed surface (Settings / Permissions) to refetch.
     appStore.getState().bumpPermissionRulesVersion?.();
   },
+  /// M3.3: server's prediction of which skills would auto-activate
+  /// on the next user turn given the agent's recently-touched
+  /// files. Emitted at end-of-turn (Done) and at session start;
+  /// payload `{skills: string[]}`. Empty array clears any stale
+  /// Composer chip when the user pivots and no files match.
+  skill_auto_activated_for_next_turn: (ev) => {
+    const names: string[] = Array.isArray(ev?.skills) ? ev.skills : [];
+    appStore.getState().setAutoActivatedNextTurnSkills(names);
+  },
 };
diff --git a/apps/jarvis-web/src/services/frames/lifecycleFrames.ts b/apps/jarvis-web/src/services/frames/lifecycleFrames.ts
index 41ac4af..bc8ef73 100644
--- a/apps/jarvis-web/src/services/frames/lifecycleFrames.ts
+++ b/apps/jarvis-web/src/services/frames/lifecycleFrames.ts
@@ -21,6 +21,16 @@ export const lifecycleFrameHandlers: Record<string, (ev: any) => void> = {
     // for the WorkOverview UsagePanel).
     recordUsageDaily(ev);
   },
+  tasks_snapshot: (ev) => {
+    // P7: server pushes a fresh BackgroundTasksPanel snapshot at
+    // every turn boundary so the panel can drop its tight 3s poll
+    // and rely on push for most updates. The frontend keeps a
+    // longer-interval safety poll for the panel's first-open case.
+    const items: unknown = ev?.items;
+    appStore
+      .getState()
+      .setBackgroundTasksSnapshot(Array.isArray(items) ? (items as unknown[]) : []);
+  },
   forked: (ev) => {
     appStore.getState().applyForked(ev.user_ordinal);
   },
diff --git a/apps/jarvis-web/src/store/slices/approvalSlice.ts b/apps/jarvis-web/src/store/slices/approvalSlice.ts
index 2405e0c..a0672f2 100644
--- a/apps/jarvis-web/src/store/slices/approvalSlice.ts
+++ b/apps/jarvis-web/src/store/slices/approvalSlice.ts
@@ -33,6 +33,22 @@ export interface ApprovalSlice {
   /// every component (Settings tab, future header chip) sees the
   /// same source of truth. Empty until the user toggles one.
   activeSkills: string[];
+  /// Most-recent mode change, with its source ("tool" when the
+  /// model self-switched via `enter_plan_mode`, "user" when the
+  /// operator clicked, "plan_accepted" after AcceptPlan, etc.).
+  /// `<ModeChangedToast>` watches this and auto-clears after a
+  /// few seconds — only the source != "user" path produces a
+  /// visible toast (an operator click shouldn't toast back at
+  /// themselves). `null` between events.
+  recentModeChange: { mode: PermissionMode; via: string; at: number } | null;
+  /// Skills the server predicts WILL auto-activate via the M3.3
+  /// path-match rule on the *next* user turn, given the files the
+  /// agent touched in the previous turn. Refreshed by the
+  /// `skill_auto_activated_for_next_turn` WS frame at end-of-turn;
+  /// cleared (server-side recomputes) at the next user message.
+  /// Lets the Composer chip warn the user "if you send now, X will
+  /// auto-activate" before they actually type.
+  autoActivatedNextTurnSkills: string[];
 
   // eslint-disable-next-line @typescript-eslint/no-explicit-any
   pushApprovalRequest: (id: string, name: string, args: any) => void;
@@ -53,6 +69,10 @@ export interface ApprovalSlice {
   bumpPermissionRulesVersion: () => void;
   setProposedPlan: (plan: string | null) => void;
   setActiveSkills: (names: string[]) => void;
+  setAutoActivatedNextTurnSkills: (names: string[]) => void;
+  setRecentModeChange: (
+    change: { mode: PermissionMode; via: string; at: number } | null,
+  ) => void;
 }
 
 export const createApprovalSlice: StateCreator<FullState, [], [], ApprovalSlice> = (set) => ({
@@ -61,6 +81,8 @@ export const createApprovalSlice: StateCreator<FullState, [], [], ApprovalSlice>
   permissionRulesVersion: 0,
   proposedPlan: null,
   activeSkills: [],
+  autoActivatedNextTurnSkills: [],
+  recentModeChange: null,
 
   pushApprovalRequest: (id, name, args) => {
     set((s) => {
@@ -121,4 +143,9 @@ export const createApprovalSlice: StateCreator<FullState, [], [], ApprovalSlice>
     const unique = Array.from(new Set(names.map((name) => name.trim()).filter(Boolean)));
     set({ activeSkills: unique });
   },
+  setAutoActivatedNextTurnSkills: (names) => {
+    const unique = Array.from(new Set(names.map((name) => name.trim()).filter(Boolean)));
+    set({ autoActivatedNextTurnSkills: unique });
+  },
+  setRecentModeChange: (change) => set({ recentModeChange: change }),
 });
diff --git a/apps/jarvis-web/src/store/slices/lifecycleSlice.ts b/apps/jarvis-web/src/store/slices/lifecycleSlice.ts
index d93cec0..28ae8eb 100644
--- a/apps/jarvis-web/src/store/slices/lifecycleSlice.ts
+++ b/apps/jarvis-web/src/store/slices/lifecycleSlice.ts
@@ -63,6 +63,16 @@ export interface LifecycleSlice {
     entry: Omit<TaskRailEntry, "startedAt" | "updatedAt"> & { startedAt?: number },
   ) => void;
   clearTasks: () => void;
+  /// Backend-pushed snapshot for the BackgroundTasksPanel
+  /// (`tasks_snapshot` WS frame).
+  /// `null` means "no push received yet — fall back to REST poll".
+  /// A non-null empty array means "the backend says nothing's in
+  /// flight", which the panel renders as the empty-state hint
+  /// rather than re-polling.
+  // eslint-disable-next-line @typescript-eslint/no-explicit-any
+  backgroundTasksSnapshot: any[] | null;
+  // eslint-disable-next-line @typescript-eslint/no-explicit-any
+  setBackgroundTasksSnapshot: (items: any[] | null) => void;
 }
 
 export const createLifecycleSlice: StateCreator<FullState, [], [], LifecycleSlice> = (set, get) => ({
@@ -76,6 +86,7 @@ export const createLifecycleSlice: StateCreator<FullState, [], [], LifecycleSlic
   conversationSurfaces: {},
   conversationRuns: {},
   conversationUnread: {},
+  backgroundTasksSnapshot: null,
 
   setActiveId: (id) => {
     set((s) => {
@@ -238,6 +249,7 @@ export const createLifecycleSlice: StateCreator<FullState, [], [], LifecycleSlic
     });
   },
   clearTasks: () => set({ tasks: [] }),
+  setBackgroundTasksSnapshot: (items) => set({ backgroundTasksSnapshot: items }),
 });
 
 function isRunActive(status: ConversationRunStatus | undefined): boolean {
diff --git a/apps/jarvis-web/src/styles.css b/apps/jarvis-web/src/styles.css
index c26dd01..4974001 100644
--- a/apps/jarvis-web/src/styles.css
+++ b/apps/jarvis-web/src/styles.css
@@ -16707,6 +16707,10 @@ select.settings-input {
 }
 
 .health-center-section-label {
+  display: flex;
+  align-items: baseline;
+  justify-content: space-between;
+  gap: 12px;
   margin-bottom: 8px;
   color: var(--text-soft);
   font-size: var(--fs-12);
@@ -16715,6 +16719,52 @@ select.settings-input {
   letter-spacing: 0;
 }
 
+.health-center-section-link {
+  appearance: none;
+  border: 0;
+  background: transparent;
+  padding: 2px 6px;
+  border-radius: var(--radius-sm, 6px);
+  color: var(--accent);
+  font-size: var(--fs-12);
+  font-weight: 650;
+  cursor: pointer;
+  transition: background 0.15s ease, color 0.15s ease;
+}
+.health-center-section-link:hover {
+  background: var(--panel-hover);
+}
+.health-center-section-link:focus-visible {
+  outline: 2px solid var(--accent);
+  outline-offset: 2px;
+}
+
+.health-center-details {
+  padding-top: 14px;
+}
+.health-center-details .health-optimization {
+  margin-top: 0;
+}
+
+.work-overview-tabs {
+  margin-top: 8px;
+}
+.work-overview-tabs .settings-tabs-list {
+  border-bottom-color: var(--border);
+}
+.work-overview-tabs .settings-tabs-panel {
+  gap: 16px;
+}
+.work-overview-tab-usage-grid {
+  grid-template-columns: minmax(0, 1fr) minmax(0, 1fr);
+  gap: 16px;
+}
+@media (max-width: 900px) {
+  .work-overview-tab-usage-grid {
+    grid-template-columns: minmax(0, 1fr);
+  }
+}
+
 .health-optimization {
   display: flex;
   min-width: 0;
@@ -23062,3 +23112,438 @@ select.settings-input {
     grid-template-columns: 1fr auto;
   }
 }
+
+/* --- Background-tasks panel (M2.2) --- */
+.bg-tasks-trigger-wrap {
+  position: relative;
+}
+.bg-tasks-trigger {
+  display: inline-flex;
+  align-items: center;
+  justify-content: center;
+  width: 28px;
+  height: 28px;
+  padding: 0;
+  background: transparent;
+  border: 1px solid var(--border);
+  border-radius: 6px;
+  color: var(--text-muted);
+  cursor: pointer;
+}
+.bg-tasks-trigger:hover {
+  color: var(--text);
+  background: var(--panel-hover);
+}
+.bg-tasks-trigger[aria-expanded="true"] {
+  color: var(--text);
+  background: var(--panel-hover);
+}
+.bg-tasks-panel {
+  position: absolute;
+  top: calc(100% + 7px);
+  right: 0;
+  z-index: 75;
+  width: 360px;
+  max-height: 480px;
+  display: flex;
+  flex-direction: column;
+  color: var(--text);
+  background: var(--panel);
+  border: 1px solid var(--border);
+  border-radius: 8px;
+  box-shadow: var(--shadow-popover);
+  overflow: hidden;
+}
+.bg-tasks-header {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  padding: 10px 12px;
+  border-bottom: 1px solid var(--border);
+}
+.bg-tasks-header h2 {
+  margin: 0;
+  font-size: var(--fs-14);
+  font-weight: 600;
+}
+.bg-tasks-close {
+  background: transparent;
+  border: none;
+  color: var(--text-muted);
+  cursor: pointer;
+  font-size: 18px;
+  line-height: 1;
+}
+.bg-tasks-body {
+  overflow-y: auto;
+  padding: 6px;
+}
+.bg-tasks-empty,
+.bg-tasks-error {
+  padding: 16px;
+  font-size: var(--fs-13);
+  color: var(--text-muted);
+  text-align: center;
+}
+.bg-tasks-error {
+  color: var(--danger, #c44);
+}
+.bg-tasks-list {
+  list-style: none;
+  margin: 0;
+  padding: 0;
+  display: flex;
+  flex-direction: column;
+  gap: 2px;
+}
+.bg-tasks-row {
+  display: grid;
+  grid-template-columns: auto 1fr auto auto;
+  align-items: center;
+  gap: 8px;
+  padding: 6px 8px;
+  border-radius: 6px;
+  font-size: var(--fs-13);
+}
+.bg-tasks-row:hover {
+  background: var(--panel-hover);
+}
+.bg-tasks-kind {
+  display: inline-block;
+  padding: 1px 6px;
+  font-size: var(--fs-12);
+  font-weight: 500;
+  color: var(--text-muted);
+  background: var(--panel-hover);
+  border-radius: 4px;
+}
+.bg-tasks-label {
+  overflow: hidden;
+  text-overflow: ellipsis;
+  white-space: nowrap;
+  color: var(--text);
+}
+.bg-tasks-status {
+  font-size: var(--fs-12);
+  color: var(--text-muted);
+}
+.bg-tasks-age {
+  font-size: var(--fs-12);
+  color: var(--text-muted);
+  font-variant-numeric: tabular-nums;
+}
+
+/* --- Composer auto-activated skills chip (M3.3 UX) --- */
+.composer-auto-skills {
+  display: flex;
+  align-items: center;
+  gap: 8px;
+  margin-bottom: 6px;
+  padding: 4px 10px;
+  background: var(--panel);
+  border: 1px solid var(--border);
+  border-radius: 6px;
+  font-size: var(--fs-12);
+  color: var(--text-muted);
+}
+.composer-auto-skills-label {
+  flex-shrink: 0;
+}
+.composer-auto-skills-list {
+  display: flex;
+  flex-wrap: wrap;
+  gap: 4px;
+  margin: 0;
+  padding: 0;
+  list-style: none;
+}
+.composer-auto-skills-pill {
+  padding: 1px 6px;
+  background: var(--panel-hover);
+  border-radius: 4px;
+  color: var(--text);
+  font-weight: 500;
+}
+
+/* --- Mode-changed toast (M2.3 UX) --- */
+.mode-changed-toast {
+  display: flex;
+  align-items: center;
+  gap: 10px;
+  margin: 8px 16px;
+  padding: 8px 12px;
+  background: var(--panel);
+  border: 1px solid var(--border);
+  border-left: 3px solid var(--accent, #5b8def);
+  border-radius: 6px;
+  font-size: var(--fs-13);
+  color: var(--text);
+  box-shadow: var(--shadow-popover);
+  animation: mode-toast-in 0.18s ease-out;
+}
+@keyframes mode-toast-in {
+  from { opacity: 0; transform: translateY(-4px); }
+  to { opacity: 1; transform: translateY(0); }
+}
+.mode-changed-toast-icon {
+  font-size: 14px;
+  color: var(--accent, #5b8def);
+}
+.mode-changed-toast-body {
+  flex: 1;
+  line-height: 1.4;
+}
+.mode-changed-toast-body strong {
+  font-weight: 600;
+}
+.mode-changed-toast-close {
+  background: transparent;
+  border: none;
+  color: var(--text-muted);
+  cursor: pointer;
+  font-size: 16px;
+  line-height: 1;
+  padding: 0 4px;
+}
+.mode-changed-toast-close:hover {
+  color: var(--text);
+}
+
+/* --- Memory Sync settings panel (P14) --- */
+.memory-sync-pane {
+  display: flex;
+  flex-direction: column;
+  gap: 10px;
+  font-size: var(--fs-13);
+}
+.memory-sync-row {
+  display: flex;
+  align-items: center;
+  gap: 12px;
+  padding: 6px 10px;
+  background: var(--panel);
+  border: 1px solid var(--border);
+  border-radius: 6px;
+}
+.memory-sync-label {
+  flex-shrink: 0;
+  width: 110px;
+  color: var(--text-muted);
+}
+.memory-sync-row code,
+.memory-sync-pane code {
+  font-family: var(--font-mono, ui-monospace);
+  font-size: var(--fs-12);
+  background: var(--panel-hover);
+  padding: 2px 6px;
+  border-radius: 4px;
+  word-break: break-all;
+}
+.memory-sync-badge {
+  padding: 2px 10px;
+  border-radius: 999px;
+  font-size: var(--fs-12);
+  font-weight: 500;
+}
+.memory-sync-badge.backend-git {
+  background: var(--accent-soft, #d8ecff);
+  color: var(--accent, #2563eb);
+}
+.memory-sync-badge.backend-icloud {
+  background: #ffe9d8;
+  color: #b45309;
+}
+.memory-sync-badge.backend-none {
+  background: var(--panel-hover);
+  color: var(--text-muted);
+}
+.memory-sync-empty,
+.memory-sync-off {
+  padding: 12px;
+  background: var(--panel);
+  border: 1px dashed var(--border);
+  border-radius: 6px;
+  color: var(--text-muted);
+  line-height: 1.5;
+}
+.memory-sync-error {
+  padding: 8px 12px;
+  background: var(--danger-soft, #fde7e7);
+  color: var(--danger, #c44);
+  border-radius: 6px;
+}
+.memory-sync-result {
+  padding: 8px 12px;
+  border-radius: 6px;
+  font-size: var(--fs-12);
+}
+.memory-sync-result.ok {
+  background: var(--success-soft, #e3f6e1);
+  color: var(--success, #2e7d32);
+}
+.memory-sync-result.fail {
+  background: var(--danger-soft, #fde7e7);
+  color: var(--danger, #c44);
+  white-space: pre-wrap;
+}
+.memory-sync-setup,
+.memory-sync-icloud,
+.memory-sync-git {
+  display: flex;
+  flex-direction: column;
+  gap: 10px;
+  padding: 10px;
+  background: var(--panel);
+  border: 1px solid var(--border);
+  border-radius: 6px;
+}
+.memory-sync-form {
+  display: flex;
+  gap: 8px;
+}
+.memory-sync-input {
+  flex: 1;
+  padding: 6px 10px;
+  border: 1px solid var(--border);
+  border-radius: 4px;
+  font-family: var(--font-mono, ui-monospace);
+  font-size: var(--fs-12);
+  background: var(--panel-hover);
+  color: var(--text);
+}
+.memory-sync-btn {
+  padding: 6px 14px;
+  border: 1px solid var(--border);
+  border-radius: 4px;
+  background: var(--accent, #2563eb);
+  color: white;
+  cursor: pointer;
+  font-size: var(--fs-13);
+}
+.memory-sync-btn:hover:not(:disabled) {
+  filter: brightness(1.1);
+}
+.memory-sync-btn:disabled {
+  opacity: 0.5;
+  cursor: not-allowed;
+}
+.memory-sync-btn.ghost {
+  background: transparent;
+  color: var(--text);
+}
+.memory-sync-footer {
+  display: flex;
+  justify-content: flex-end;
+  margin-top: 4px;
+}
+.memory-sync-pane details {
+  font-size: var(--fs-12);
+}
+.memory-sync-pane details pre {
+  background: var(--panel-hover);
+  padding: 8px;
+  border-radius: 4px;
+  overflow-x: auto;
+  white-space: pre-wrap;
+  word-break: break-all;
+}
+
+/* --- Memory Includes panel (P17) --- */
+.memory-includes-wrap {
+  display: flex;
+  flex-direction: column;
+  gap: 16px;
+  margin-top: 8px;
+}
+.memory-includes {
+  display: flex;
+  flex-direction: column;
+  gap: 8px;
+  padding: 10px;
+  background: var(--panel);
+  border: 1px solid var(--border);
+  border-radius: 6px;
+}
+.memory-includes-header {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+}
+.memory-includes-empty {
+  font-size: var(--fs-12);
+  color: var(--text-muted);
+  padding: 4px 0;
+}
+.memory-includes-list {
+  list-style: none;
+  margin: 0;
+  padding: 0;
+  display: flex;
+  flex-direction: column;
+  gap: 6px;
+}
+.memory-includes-item {
+  display: flex;
+  flex-direction: column;
+  gap: 4px;
+  padding: 6px 8px;
+  background: var(--panel-hover);
+  border-radius: 4px;
+  border-left: 3px solid transparent;
+}
+.memory-includes-item.ok {
+  border-left-color: var(--success, #2e7d32);
+}
+.memory-includes-item.fail {
+  border-left-color: var(--danger, #c44);
+}
+.memory-includes-row {
+  display: flex;
+  align-items: center;
+  gap: 8px;
+  flex-wrap: wrap;
+}
+.memory-includes-kind {
+  flex-shrink: 0;
+  font-size: var(--fs-11);
+  font-weight: 600;
+  padding: 1px 6px;
+  border-radius: 4px;
+  background: var(--panel);
+  border: 1px solid var(--border);
+  color: var(--text-muted);
+}
+.memory-includes-kind.kind-git_url {
+  color: var(--accent, #2563eb);
+  border-color: var(--accent, #2563eb);
+}
+.memory-includes-target {
+  flex: 1;
+  font-family: var(--font-mono, ui-monospace);
+  font-size: var(--fs-12);
+  word-break: break-all;
+}
+.memory-includes-actions {
+  display: flex;
+  gap: 4px;
+  flex-shrink: 0;
+}
+.memory-includes-detail {
+  font-size: var(--fs-11);
+  color: var(--text-muted);
+  padding-left: 6px;
+}
+.memory-includes-detail code {
+  font-size: var(--fs-11);
+  background: var(--panel);
+  padding: 1px 4px;
+  border-radius: 3px;
+}
+.memory-includes-err {
+  color: var(--danger, #c44);
+}
+.memory-includes-add {
+  display: flex;
+  gap: 8px;
+  margin-top: 4px;
+}
diff --git a/apps/jarvis-web/src/types/generated/AcceptancePolicy.ts b/apps/jarvis-web/src/types/generated/AcceptancePolicy.ts
new file mode 100644
index 0000000..b2efc3a
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/AcceptancePolicy.ts
@@ -0,0 +1,13 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+
+/**
+ * Who decides `Review → Done` for a [`Requirement`].
+ *
+ * Older JSON rows on disk that don't carry the field deserialise
+ * as the default [`AcceptancePolicy::Subagent`] — i.e. the new
+ * reviewer-subagent behaviour applies once the v1.0 subagent
+ * machinery is wired in. Until that machinery lands, the field is
+ * inert (no caller checks it), so the default is forward-looking
+ * without changing today's flow.
+ */
+export type AcceptancePolicy = "subagent" | "human";
diff --git a/apps/jarvis-web/src/types/generated/Activity.ts b/apps/jarvis-web/src/types/generated/Activity.ts
new file mode 100644
index 0000000..022f517
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/Activity.ts
@@ -0,0 +1,41 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+import type { ActivityActor } from "./ActivityActor";
+import type { ActivityKind } from "./ActivityKind";
+
+/**
+ * One audit-timeline row.
+ *
+ * `body` is intentionally an open `serde_json::Value` rather than a
+ * per-kind enum payload — different events carry different shapes
+ * (`{from, to}` for status, `{run_id, status}` for run finished,
+ * etc.) and routing every shape through a typed enum would force
+ * every consumer to know the full set. UIs that need to read a
+ * field do so on a per-kind basis; the wire format documents the
+ * expected shape per kind below.
+ */
+export type Activity = { 
+/**
+ * Stable identifier (UUID v4).
+ */
+id: string, 
+/**
+ * Requirement this activity belongs to.
+ */
+requirement_id: string, 
+/**
+ * What happened.
+ */
+kind: ActivityKind, 
+/**
+ * Who did it.
+ */
+actor: ActivityActor, 
+/**
+ * Free-form payload, shape varies by `kind`. See variant docs
+ * for the expected fields.
+ */
+body: Record<string, unknown>, 
+/**
+ * RFC-3339 / ISO-8601 timestamp.
+ */
+created_at: string, };
diff --git a/apps/jarvis-web/src/types/generated/ActivityActor.ts b/apps/jarvis-web/src/types/generated/ActivityActor.ts
new file mode 100644
index 0000000..77eabdc
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/ActivityActor.ts
@@ -0,0 +1,13 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+
+/**
+ * Who triggered an activity.
+ *
+ * `Human` is the v0 default for any REST-driven mutation (we don't
+ * have user identity yet — every authenticated REST call counts as
+ * "the human at the keyboard"). `Agent` is reserved for Phase 4
+ * when `requirement.*` tools let the model drive board state.
+ * `System` is the bucket for server-side auto-advances
+ * (e.g. `start_run` flipping `Backlog → InProgress`).
+ */
+export type ActivityActor = { "type": "human" } | { "type": "agent", profile_id: string, } | { "type": "system" };
diff --git a/apps/jarvis-web/src/types/generated/ActivityKind.ts b/apps/jarvis-web/src/types/generated/ActivityKind.ts
new file mode 100644
index 0000000..8508e2f
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/ActivityKind.ts
@@ -0,0 +1,11 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+
+/**
+ * Kind of activity. Wire form is snake_case
+ * (`"status_change"` / `"run_started"` / ...).
+ *
+ * The set is intentionally small in v0; AssigneeChange / Comment /
+ * Blocked / Unblocked are reserved for Phases 3.6 / 4 when their
+ * driving features land.
+ */
+export type ActivityKind = "status_change" | "run_started" | "run_finished" | "verification_finished" | "assignee_change" | "comment" | "blocked" | "unblocked";
diff --git a/apps/jarvis-web/src/types/generated/ChannelInstance.ts b/apps/jarvis-web/src/types/generated/ChannelInstance.ts
new file mode 100644
index 0000000..a63ff07
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/ChannelInstance.ts
@@ -0,0 +1,45 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+import type { ChannelInstanceStatus } from "./ChannelInstanceStatus";
+
+/**
+ * One configured channel — e.g. a WeCom group robot, a WeChat MP
+ * callback target, a Feishu bot. Instances are user-named (`display_name`)
+ * because a deployment may host several of the same `kind` (multiple
+ * WeCom groups = multiple `wecom_webhook` rows).
+ *
+ * `config` is left as a `serde_json::Value` so each kind owns its own
+ * schema without baking variant-specific fields into the trait
+ * surface. The current kinds and their schemas live next to the
+ * `kind`-specific senders in `harness-server`.
+ */
+export type ChannelInstance = { 
+/**
+ * Stable UUID. Frontend keys list rows by this.
+ */
+id: string, 
+/**
+ * Discriminator: "wecom_webhook" / "wechat_mp" / "feishu_bot" / …
+ * Validators in the server know which `config` shape to expect
+ * per kind; unknown kinds are rejected at the REST boundary.
+ */
+kind: string, 
+/**
+ * User-set human-readable name (e.g. "prod-alerts"). The REST
+ * layer enforces non-empty + max 64 chars; the trait stays
+ * liberal so storage doesn't need to know.
+ */
+display_name: string, status: ChannelInstanceStatus, 
+/**
+ * Kind-specific config payload. May embed `${env:NAME}` template
+ * strings — resolved at send-time, never at store-time, so a
+ * rotated env var takes effect immediately.
+ */
+config: Record<string, unknown>, 
+/**
+ * RFC-3339 timestamp set on insert.
+ */
+created_at: string, 
+/**
+ * RFC-3339 timestamp bumped on every upsert.
+ */
+updated_at: string, };
diff --git a/apps/jarvis-web/src/types/generated/ChannelInstanceStatus.ts b/apps/jarvis-web/src/types/generated/ChannelInstanceStatus.ts
new file mode 100644
index 0000000..1d00c00
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/ChannelInstanceStatus.ts
@@ -0,0 +1,11 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+
+/**
+ * User-driven enabled/disabled/unconfigured state. Distinct from
+ * "did the last send succeed" — that's surfaced via per-instance
+ * telemetry instead. `Unconfigured` is set by handlers when the
+ * validator detects required fields are missing (so the UI can show
+ * a "继续配置" CTA without the user having to remember which fields
+ * they skipped).
+ */
+export type ChannelInstanceStatus = "enabled" | "disabled" | "unconfigured";
diff --git a/apps/jarvis-web/src/types/generated/ChannelMessageFormat.ts b/apps/jarvis-web/src/types/generated/ChannelMessageFormat.ts
new file mode 100644
index 0000000..4afd287
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/ChannelMessageFormat.ts
@@ -0,0 +1,9 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+
+/**
+ * Wire format of an outbound message body. Adapters that don't
+ * support a particular format fall back to `Text` and tag the
+ * `SendOutcome` so the caller (e.g. `channel.send` tool) can
+ * surface "downgraded to text" in the agent's transcript.
+ */
+export type ChannelMessageFormat = "text" | "markdown";
diff --git a/apps/jarvis-web/src/types/generated/Comment.ts b/apps/jarvis-web/src/types/generated/Comment.ts
new file mode 100644
index 0000000..2b100d0
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/Comment.ts
@@ -0,0 +1,52 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+import type { ActivityActor } from "./ActivityActor";
+
+/**
+ * One row in the discussion thread for a Requirement.
+ *
+ * `parent_id` enables one level of threading: a top-level comment
+ * has `parent_id = None`; a reply has `parent_id = Some(top_level_id)`.
+ * We deliberately keep this flat (no nesting deeper than two levels)
+ * — multi-level reply trees are a feature trap; Linear / GitHub /
+ * Multica all flatten beyond depth 1, and so do we.
+ */
+export type Comment = { 
+/**
+ * Stable identifier (UUID v4).
+ */
+id: string, 
+/**
+ * The Requirement this comment is attached to.
+ */
+requirement_id: string, 
+/**
+ * Who wrote it. Reuses `ActivityActor` so a comment authored by
+ * an agent can carry its profile id and a human-authored one
+ * stays a flat `Human` variant. `System` is reserved for any
+ * future "the server posted this" case (release notes,
+ * auto-summaries) — humans should not write `System` comments
+ * directly.
+ */
+author: ActivityActor, 
+/**
+ * Plain markdown body. No HTML sanitisation here — the trait
+ * stays format-agnostic; the web UI renders via its existing
+ * markdown component which handles sanitisation.
+ */
+body: string, 
+/**
+ * `Some(<top_level_id>)` for a one-level reply; `None` for a
+ * top-level comment. Implementations MUST reject inserts where
+ * `parent_id` itself has a non-`None` parent — i.e. depth > 1.
+ */
+parent_id: string | null, 
+/**
+ * RFC-3339 / ISO-8601. Set on insert, never mutated.
+ */
+created_at: string, 
+/**
+ * RFC-3339 / ISO-8601. Set on insert (= `created_at`), bumped
+ * on every edit. The UI compares the two to decide whether to
+ * render an "(edited)" marker.
+ */
+updated_at: string, };
diff --git a/apps/jarvis-web/src/types/generated/KanbanColumn.ts b/apps/jarvis-web/src/types/generated/KanbanColumn.ts
new file mode 100644
index 0000000..e41d547
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/KanbanColumn.ts
@@ -0,0 +1,31 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+
+/**
+ * One user-configurable column on a project's kanban board. Stored
+ * inline on the [`Project`] (not a separate table) since the
+ * cardinality is tiny (typically 3–6 per project) and edits always go
+ * through the project's PATCH endpoint anyway.
+ */
+export type KanbanColumn = { 
+/**
+ * Stable id; what `Requirement.status` references. Validated as
+ * non-empty + ≤ 64 bytes by [`validate_column_id`]. Built-in
+ * defaults use `"backlog"` / `"in_progress"` / `"review"` /
+ * `"done"` so existing projects upgrade without a data migration.
+ */
+id: string, 
+/**
+ * Display label. Free-form, language-of-the-user. The Web UI
+ * renders this verbatim — no i18n lookup once a project has
+ * customised columns. The i18n fallback only applies when
+ * `Project.columns` is `None` and the four default ids are used.
+ */
+label: string, 
+/**
+ * Optional kind hint that drives the icon. Recognised values:
+ * `"backlog"` / `"in_progress"` / `"review"` / `"done"`. Custom
+ * columns omit this and get a neutral dot. Storing the kind
+ * lets a renamed-but-still-Backlog column keep its dashed-circle
+ * glyph.
+ */
+kind: string | null, };
diff --git a/apps/jarvis-web/src/types/generated/Label.ts b/apps/jarvis-web/src/types/generated/Label.ts
new file mode 100644
index 0000000..25a1eee
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/Label.ts
@@ -0,0 +1,43 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+
+/**
+ * One project-scoped tag.
+ */
+export type Label = { 
+/**
+ * Stable identifier (UUID v4).
+ */
+id: string, 
+/**
+ * Project this label belongs to. Labels do not cross project
+ * boundaries — two projects with a "bug" label have two
+ * independent rows.
+ */
+project_id: string, 
+/**
+ * Display name. Trimmed and required non-empty by
+ * [`validate_label_name`]. Case-preserving, but uniqueness
+ * inside a project is enforced case-insensitively (mirrors
+ * `Project.slug` and Multica's behaviour).
+ */
+name: string, 
+/**
+ * Hex colour in `#rrggbb` form (lowercase). Validated by
+ * [`validate_label_colour`]. The UI overlays text on top, so
+ * extreme contrast values (`#ffffff`, `#000000`) are allowed
+ * — the renderer picks a contrasting text colour.
+ */
+colour: string, 
+/**
+ * Optional one-line guidance: "use this when X". Markdown
+ * allowed; the kanban shows it on hover.
+ */
+description: string | null, 
+/**
+ * RFC-3339 / ISO-8601. Set on insert, never mutated.
+ */
+created_at: string, 
+/**
+ * RFC-3339 / ISO-8601. Bumped on every mutation.
+ */
+updated_at: string, };
diff --git a/apps/jarvis-web/src/types/generated/Project.ts b/apps/jarvis-web/src/types/generated/Project.ts
new file mode 100644
index 0000000..6b9f35b
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/Project.ts
@@ -0,0 +1,78 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+import type { KanbanColumn } from "./KanbanColumn";
+import type { ProjectAutomation } from "./ProjectAutomation";
+import type { ProjectWorkspace } from "./ProjectWorkspace";
+
+/**
+ * A reusable, named bundle of instructions / context that can be bound
+ * to one or more [`Conversation`](crate::Conversation)s.
+ *
+ * Stored opaquely by [`ProjectStore`](crate::store::ProjectStore)
+ * implementations; the wire shape is the JSON serialisation of this
+ * struct, so all fields must round-trip through `serde`.
+ */
+export type Project = { 
+/**
+ * Stable internal identifier (UUID v4). Conversations reference
+ * this, never the slug.
+ */
+id: string, 
+/**
+ * Human-readable, URL/CLI-friendly handle. Globally unique within
+ * a store. Renameable (with care: existing references break).
+ */
+slug: string, 
+/**
+ * Display name. Free-form, not unique.
+ */
+name: string, 
+/**
+ * Optional one-liner shown in pickers / sidebars.
+ */
+description: string | null, 
+/**
+ * The body that gets injected into the system prompt for any
+ * conversation bound to this project. Markdown-friendly.
+ */
+instructions: string, 
+/**
+ * Free-form tags; useful for UI grouping. Order is preserved.
+ */
+tags: Array<string>, 
+/**
+ * Workspace folders associated with this project. Order is
+ * preserved and is the order the UI displays them in.
+ *
+ * Empty for projects that exist purely as instruction containers.
+ * `#[serde(default)]` keeps legacy JSON rows that pre-date this
+ * field loadable.
+ */
+workspaces: Array<ProjectWorkspace>, 
+/**
+ * Soft-delete flag. Archived projects are hidden from default
+ * listings but their bound conversations keep working.
+ */
+archived: boolean, 
+/**
+ * Custom kanban columns. When `None`, clients fall back to the
+ * four built-in defaults (Backlog / In Progress / Review / Done)
+ * — see [`default_kanban_columns`]. Order is the render order
+ * on the board, left-to-right. Each column's [`KanbanColumn::id`]
+ * is what [`Requirement::status`](crate::Requirement::status)
+ * stores.
+ */
+columns: Array<KanbanColumn> | null, 
+/**
+ * Per-project automation policy. Omitted on legacy JSON rows;
+ * such rows default to auto-mode eligibility.
+ */
+automation: ProjectAutomation, 
+/**
+ * RFC-3339 / ISO-8601 timestamp of creation.
+ */
+created_at: string, 
+/**
+ * RFC-3339 / ISO-8601 timestamp of the last mutation. Bumped by
+ * the `set_*` / `with_*` helpers so callers don't have to.
+ */
+updated_at: string, };
diff --git a/apps/jarvis-web/src/types/generated/ProjectAutomation.ts b/apps/jarvis-web/src/types/generated/ProjectAutomation.ts
new file mode 100644
index 0000000..53b7f68
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/ProjectAutomation.ts
@@ -0,0 +1,12 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+
+/**
+ * Per-project automation policy.
+ *
+ * The process-level auto-mode flag remains the master switch, but
+ * each Project can now opt out independently. The default is
+ * enabled so existing deployments that turn on `JARVIS_WORK_MODE=auto`
+ * keep the historical "all approved projects are eligible" behaviour
+ * until an operator pauses a specific project.
+ */
+export type ProjectAutomation = { auto_mode_enabled: boolean, };
diff --git a/apps/jarvis-web/src/types/generated/ProjectWorkspace.ts b/apps/jarvis-web/src/types/generated/ProjectWorkspace.ts
new file mode 100644
index 0000000..a8ee2fe
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/ProjectWorkspace.ts
@@ -0,0 +1,25 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+
+/**
+ * A workspace folder a [`Project`] knows about.
+ *
+ * Projects live independently of any particular filesystem root, but
+ * many real workflows (Claude Code-style multi-repo projects) want to
+ * associate a project with one or more on-disk folders so the chat UI
+ * can offer them as candidates and surface their VCS state.
+ *
+ * Paths are stored verbatim — canonicalisation is the caller's job
+ * (the REST layer canonicalises on insert).
+ */
+export type ProjectWorkspace = { 
+/**
+ * Filesystem path. Expected to be absolute and canonical, but the
+ * type does not enforce that — see `harness-server`'s create /
+ * update handlers for the normalisation pass.
+ */
+path: string, 
+/**
+ * Optional display label. When `None`, UIs fall back to the last
+ * path segment.
+ */
+name: string | null, };
diff --git a/apps/jarvis-web/src/types/generated/Requirement.ts b/apps/jarvis-web/src/types/generated/Requirement.ts
new file mode 100644
index 0000000..7686f4e
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/Requirement.ts
@@ -0,0 +1,104 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+import type { RequirementStatus } from "./RequirementStatus";
+import type { RequirementTodo } from "./RequirementTodo";
+import type { TriageState } from "./TriageState";
+import type { VerificationPlan } from "./VerificationPlan";
+
+/**
+ * One persistent requirement scoped to a single [`Project`](crate::Project).
+ *
+ * The wire shape matches the JSON serialisation of this struct.
+ * Renderers should treat unknown statuses as
+ * [`RequirementStatus::Backlog`] for forward compat.
+ */
+export type Requirement = { 
+/**
+ * Stable identifier (UUID v4 string). Server-allocated on
+ * `POST /v1/projects/:id/requirements` so clients can't pick
+ * colliding ids.
+ */
+id: string, 
+/**
+ * Foreign key into [`Project::id`](crate::Project). Not enforced
+ * at the storage layer (no DB FK) so a project delete doesn't
+ * cascade-orphan requirements; higher layers should check.
+ */
+project_id: string, 
+/**
+ * Headline. One sentence; markdown is allowed but most UIs
+ * render it as plain text.
+ */
+title: string, 
+/**
+ * Optional longer body. `None` means no body — UI shows just the
+ * title.
+ */
+description: string | null, 
+/**
+ * Kanban column.
+ */
+status: RequirementStatus, 
+/**
+ * Conversations (by id) that have been used to work on this
+ * requirement — i.e. the "runs". Each id refers to a row in
+ * [`ConversationStore`](crate::ConversationStore). Empty by
+ * default; appended when the user opens a fresh chat from the
+ * requirement card.
+ */
+conversation_ids: Array<string>, 
+/**
+ * Phase 6 — optional pinned [`VerificationPlan`] that auto
+ * mode (and the manual "Run verification" UI when filled
+ * from a template) should fire after each
+ * [`RequirementRun`](crate::RequirementRun) finishes. `None`
+ * = "no per-requirement template; verify only when the
+ * caller passes commands explicitly". Newer field so older
+ * JSON rows without it deserialise as `None`.
+ */
+verification_plan: VerificationPlan | null, 
+/**
+ * Structured execution / verification checklist under this
+ * requirement. These are intentionally more operational than a
+ * requirement description: CI commands, deploy-preview checks,
+ * manual QA items, reviewer passes, etc. The auto loop and
+ * future CI/CD adapters can update `status` + `evidence` here
+ * so later inspection doesn't depend on reading chat history.
+ */
+todos: Array<RequirementTodo>, 
+/**
+ * Triage gate (v1.0). Distinguishes "user-approved work the
+ * auto executor may pick up" from "agent-proposed / scan-
+ * surfaced candidate that must be reviewed first". Auto loop
+ * only consumes [`TriageState::Approved`] rows. Older JSON
+ * rows without the field deserialise as `Approved` (the
+ * pre-v1.0 default behaviour).
+ */
+triage_state: TriageState, 
+/**
+ * Other requirement ids that must reach
+ * [`RequirementStatus::Done`] before this one is eligible for
+ * auto execution. Manual `Start` ignores this list — the gate
+ * is a scheduler concern, not a hard FK. Empty = no
+ * dependencies. Older JSON rows without the field deserialise
+ * as an empty `Vec`.
+ */
+depends_on: Array<string>, 
+/**
+ * Project-scoped [`Label`](crate::Label) ids attached to this
+ * row. The label rows themselves live in [`LabelStore`](crate::LabelStore)
+ * — this field only carries references so renaming / recolouring
+ * a label doesn't rewrite every Requirement that uses it.
+ * Order is preserved so the UI can render chips in the order
+ * the operator added them. Older JSON rows without the field
+ * deserialise as an empty `Vec`.
+ */
+label_ids: Array<string>, 
+/**
+ * RFC-3339 / ISO-8601 timestamp of creation.
+ */
+created_at: string, 
+/**
+ * RFC-3339 / ISO-8601 timestamp; bumped on every mutation via
+ * [`Self::touch`].
+ */
+updated_at: string, };
diff --git a/apps/jarvis-web/src/types/generated/RequirementStatus.ts b/apps/jarvis-web/src/types/generated/RequirementStatus.ts
new file mode 100644
index 0000000..a34077a
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/RequirementStatus.ts
@@ -0,0 +1,9 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+
+/**
+ * Kanban column / lifecycle state of a [`Requirement`]. Serialised
+ * snake_case (`"backlog"` / `"in_progress"` / `"review"` / `"done"`)
+ * to match the wire shape the Web UI already produces and consumes
+ * (see `apps/jarvis-web/src/types/frames.ts`).
+ */
+export type RequirementStatus = "backlog" | "in_progress" | "review" | "done";
diff --git a/apps/jarvis-web/src/types/generated/RequirementTodo.ts b/apps/jarvis-web/src/types/generated/RequirementTodo.ts
new file mode 100644
index 0000000..9de37c0
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/RequirementTodo.ts
@@ -0,0 +1,48 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+import type { RequirementTodoCreator } from "./RequirementTodoCreator";
+import type { RequirementTodoEvidence } from "./RequirementTodoEvidence";
+import type { RequirementTodoKind } from "./RequirementTodoKind";
+import type { RequirementTodoStatus } from "./RequirementTodoStatus";
+
+/**
+ * Structured TODO / check item scoped to one [`Requirement`].
+ *
+ * This is the durable execution ledger for a card. It is not a
+ * free-form chat plan: every item has a kind, status, optional
+ * command, dependencies, and evidence so automation can decide what
+ * to run next and humans can audit what happened later.
+ */
+export type RequirementTodo = { 
+/**
+ * Stable item id (UUID v4).
+ */
+id: string, 
+/**
+ * Short actionable label.
+ */
+title: string, 
+/**
+ * Operational category.
+ */
+kind: RequirementTodoKind, 
+/**
+ * Current state.
+ */
+status: RequirementTodoStatus, 
+/**
+ * Optional shell command or workflow command. Only meaningful
+ * for `ci`, `deploy`, and command-backed `check` items.
+ */
+command: string | null, 
+/**
+ * Latest machine-readable proof for this item.
+ */
+evidence: RequirementTodoEvidence | null, 
+/**
+ * Other TODO ids that must pass before this one is eligible.
+ */
+depends_on: Array<string>, 
+/**
+ * Who created the item.
+ */
+created_by: RequirementTodoCreator, created_at: string, updated_at: string, };
diff --git a/apps/jarvis-web/src/types/generated/RequirementTodoCreator.ts b/apps/jarvis-web/src/types/generated/RequirementTodoCreator.ts
new file mode 100644
index 0000000..a8ae7f5
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/RequirementTodoCreator.ts
@@ -0,0 +1,3 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+
+export type RequirementTodoCreator = "human" | "agent" | "workflow";
diff --git a/apps/jarvis-web/src/types/generated/RequirementTodoEvidence.ts b/apps/jarvis-web/src/types/generated/RequirementTodoEvidence.ts
new file mode 100644
index 0000000..edd1b96
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/RequirementTodoEvidence.ts
@@ -0,0 +1,6 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+
+/**
+ * Latest proof attached to a [`RequirementTodo`].
+ */
+export type RequirementTodoEvidence = { run_id: string | null, exit_code: number | null, stdout_excerpt: string | null, stderr_excerpt: string | null, artifact_url: string | null, note: string | null, };
diff --git a/apps/jarvis-web/src/types/generated/RequirementTodoKind.ts b/apps/jarvis-web/src/types/generated/RequirementTodoKind.ts
new file mode 100644
index 0000000..4519a14
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/RequirementTodoKind.ts
@@ -0,0 +1,3 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+
+export type RequirementTodoKind = "work" | "check" | "ci" | "deploy" | "review" | "manual";
diff --git a/apps/jarvis-web/src/types/generated/RequirementTodoStatus.ts b/apps/jarvis-web/src/types/generated/RequirementTodoStatus.ts
new file mode 100644
index 0000000..ffe499a
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/RequirementTodoStatus.ts
@@ -0,0 +1,3 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+
+export type RequirementTodoStatus = "pending" | "running" | "passed" | "failed" | "skipped" | "blocked";
diff --git a/apps/jarvis-web/src/types/generated/TriageState.ts b/apps/jarvis-web/src/types/generated/TriageState.ts
new file mode 100644
index 0000000..6eaa054
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/TriageState.ts
@@ -0,0 +1,14 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+
+/**
+ * Triage gate for a [`Requirement`]. Distinguishes
+ * **user-approved** work (default) from **agent-proposed** or
+ * **scan-surfaced** candidates that must be reviewed before any
+ * automation picks them up.
+ *
+ * Wire form is snake_case (`"approved"` / `"proposed_by_agent"` /
+ * `"proposed_by_scan"`). Older requirement rows on disk that
+ * don't carry the field deserialise as [`TriageState::Approved`]
+ * — i.e. v0 behaviour is preserved when no triage gate was set.
+ */
+export type TriageState = "approved" | "proposed_by_agent" | "proposed_by_scan";
diff --git a/apps/jarvis-web/src/types/generated/VerificationPlan.ts b/apps/jarvis-web/src/types/generated/VerificationPlan.ts
new file mode 100644
index 0000000..bd2be40
--- /dev/null
+++ b/apps/jarvis-web/src/types/generated/VerificationPlan.ts
@@ -0,0 +1,31 @@
+// This file was generated by [ts-rs](https://github.com/Aleph-Alpha/ts-rs). Do not edit this file manually.
+
+/**
+ * What success looks like for the run, expressed as commands the
+ * host should execute and policy gates the user / harness should
+ * honour.
+ */
+export type VerificationPlan = { 
+/**
+ * Shell-style commands to run after the agent finishes. Each
+ * is run via the binary's existing `shell.exec` plumbing
+ * (sandbox-rooted, approval-gated).
+ */
+commands: Array<string>, 
+/**
+ * Require the run to produce a non-empty `git diff` before
+ * passing? Useful for code-change requirements.
+ */
+require_diff: boolean, 
+/**
+ * Require the agent to declare which tests it ran (and that
+ * at least one was run)? Free-form text expectation; the
+ * harness only checks that *some* command in `commands` was
+ * recognisable as a test runner.
+ */
+require_tests: boolean, 
+/**
+ * Hold for human review before flipping the parent
+ * Requirement to `done`?
+ */
+require_human_review: boolean, };
diff --git a/apps/jarvis-web/src/utils/i18n.ts b/apps/jarvis-web/src/utils/i18n.ts
index 6a69fe5..837dc23 100644
--- a/apps/jarvis-web/src/utils/i18n.ts
+++ b/apps/jarvis-web/src/utils/i18n.ts
@@ -1144,6 +1144,15 @@ Expected workflow:
     workOverviewWindow7d: "7d",
     workOverviewWindow30d: "30d",
     workOverviewWindow90d: "90d",
+    workOverviewTabsLabel: "Project overview sections",
+    workOverviewTabOverview: "Overview",
+    workOverviewTabQuality: "Quality",
+    workOverviewTabUsage: "Usage",
+    workOverviewTabActivity: "Activity",
+    workOverviewTabObservability: "Observability",
+    healthCenterSignalsViewAll: (total: number) => `View all (${total}) →`,
+    healthCenterSignalsViewAllHint:
+      "Switch to the Quality tab to see every actionable signal.",
     workOverviewAsOf: (when: string) => `Last refreshed ${when}`,
     workOverviewError: (msg: string) => `Refresh failed: ${msg}`,
     workOverviewUnavailable:
@@ -3481,6 +3490,14 @@ ${blockedRows}
     workOverviewWindow7d: "近 7 天",
     workOverviewWindow30d: "近 30 天",
     workOverviewWindow90d: "近 90 天",
+    workOverviewTabsLabel: "总览页分组",
+    workOverviewTabOverview: "概览",
+    workOverviewTabQuality: "质量",
+    workOverviewTabUsage: "用量",
+    workOverviewTabActivity: "活动",
+    workOverviewTabObservability: "可观测",
+    healthCenterSignalsViewAll: (total: number) => `查看全部 (${total}) →`,
+    healthCenterSignalsViewAllHint: "切到「质量」Tab 查看完整的待办信号列表。",
     workOverviewAsOf: (when: string) => `数据更新于 ${when}`,
     workOverviewError: (msg: string) => `刷新失败：${msg}`,
     workOverviewUnavailable:
diff --git a/apps/jarvis/src/config.rs b/apps/jarvis/src/config.rs
index 9d6c34d..fac53e1 100644
--- a/apps/jarvis/src/config.rs
+++ b/apps/jarvis/src/config.rs
@@ -183,6 +183,39 @@ pub struct AgentSection {
     /// Env override: `JARVIS_PARALLEL_TOOL_CALLS=1`.
     #[serde(skip_serializing_if = "Option::is_none")]
     pub parallel_tool_calls: Option<bool>,
+    /// Whether to register the `enter_plan_mode` tool so the agent
+    /// can voluntarily switch the session into Plan Mode. Unset =
+    /// "default on in coding mode" (any mutation tool enabled),
+    /// "default off otherwise". Set `false` to keep Plan Mode entry
+    /// strictly operator-driven (CLI flag / WS `SetMode` frame).
+    /// Env override: `JARVIS_ENABLE_ENTER_PLAN_MODE=0|1`.
+    #[serde(skip_serializing_if = "Option::is_none")]
+    pub allow_self_plan_mode: Option<bool>,
+    /// Whether to register the agent-maintained `memory.*` tools
+    /// (M3.1). Unset = off. Set `true` to expose
+    /// `memory.list / read / write / delete` and inject MEMORY.md
+    /// into the system prompt at conversation start. Env override:
+    /// `JARVIS_ENABLE_MEMORY=1`.
+    #[serde(skip_serializing_if = "Option::is_none")]
+    pub enable_memory: Option<bool>,
+    /// Whether to register the P10 git-sync tools
+    /// (`memory.sync`, `memory.sync_status`). When `true`, the
+    /// agent can pull/push the memory tree against a remote git
+    /// repo so notes flow between machines / teammates without a
+    /// custom sync server. Off by default — opt in once you've
+    /// hooked up a remote. Env override:
+    /// `JARVIS_ENABLE_MEMORY_SYNC=1`. Requires `enable_memory` to
+    /// also be on. Treated as a shortcut for
+    /// `memory_sync_backend = "git"` when the latter is unset.
+    #[serde(skip_serializing_if = "Option::is_none")]
+    pub enable_memory_sync: Option<bool>,
+    /// P13 — which sync transport the memory tools should expose.
+    /// One of `"git"` (default when sync is enabled), `"icloud"`
+    /// (macOS-only, OS-managed), or `"none"`. Env override:
+    /// `JARVIS_MEMORY_SYNC_BACKEND`. The explicit choice wins
+    /// over the legacy `enable_memory_sync` flag.
+    #[serde(skip_serializing_if = "Option::is_none")]
+    pub memory_sync_backend: Option<String>,
 }
 
 /// Per-provider config. All fields optional; provider-specific
diff --git a/apps/jarvis/src/serve.rs b/apps/jarvis/src/serve.rs
index 8253847..7a594e8 100644
--- a/apps/jarvis/src/serve.rs
+++ b/apps/jarvis/src/serve.rs
@@ -62,6 +62,103 @@ pub async fn run(
         || bcfg.enable_fs_patch
         || bcfg.enable_shell_exec;
 
+    // `enter_plan_mode` defaults to ON in coding mode so the model
+    // can volunteer "let me draft a plan first" before risky edits.
+    // Operators who want the historical "operator-driven plan-mode
+    // entry only" can flip `JARVIS_ENABLE_ENTER_PLAN_MODE=0` or set
+    // `[agent].allow_self_plan_mode = false`. Resolution mirrors the
+    // existing `pick_bool_flag` order: env > config > default.
+    bcfg.enable_enter_plan_mode = pick_bool_flag(
+        "JARVIS_ENABLE_ENTER_PLAN_MODE",
+        cfg.agent.allow_self_plan_mode,
+        coding_mode,
+    );
+    // `memory.*` tools stay off by default but obey the same
+    // env/config override pattern so operators can flip them on
+    // without recompiling. Coding mode is *not* enough to flip
+    // these — memory is a longer-term storage primitive whose
+    // value depends on the operator actively wanting it.
+    bcfg.enable_memory = pick_bool_flag(
+        "JARVIS_ENABLE_MEMORY",
+        cfg.agent.enable_memory,
+        false,
+    );
+    // P9 — user-scope memory root. Defaults to the operator's home
+    // directory (the `.jarvis/memory/` subtree under it), so a
+    // single `~/.jarvis/memory/MEMORY.md` follows the user across
+    // workspaces. `JARVIS_MEMORY_USER_ROOT=/path` overrides it for
+    // operators who want it elsewhere (e.g. under Dropbox); an empty
+    // value disables it. If unset and home is unresolvable, user
+    // scope is off and writes to `scope:"user"` error cleanly.
+    bcfg.memory_user_root = resolve_memory_user_root();
+    // P10 — git-as-transport memory sync. Off by default; flip
+    // on when the operator has set up `git remote add origin
+    // <url>` inside their memory dirs.
+    bcfg.enable_memory_sync = pick_bool_flag(
+        "JARVIS_ENABLE_MEMORY_SYNC",
+        cfg.agent.enable_memory_sync,
+        false,
+    );
+    // P13 — explicit sync backend choice. Resolution order:
+    //   1. JARVIS_MEMORY_SYNC_BACKEND env
+    //   2. [agent].memory_sync_backend config
+    //   3. neither set, or `from_wire` rejects the value: `None` here;
+    //      register_builtins maps `None` to `Git` when `enable_memory_sync` is on
+    let backend_pick = pick_string_opt(
+        "JARVIS_MEMORY_SYNC_BACKEND",
+        cfg.agent.memory_sync_backend.as_deref(),
+    );
+    bcfg.memory_sync_backend = match backend_pick {
+        Some(s) => harness_tools::MemorySyncBackend::from_wire(&s)
+            .unwrap_or(harness_tools::MemorySyncBackend::None),
+        None => harness_tools::MemorySyncBackend::None,
+    };
+    // iCloud backend auto-resolves user_root to iCloud Drive when
+    // the operator didn't pin one explicitly. Saves them having to
+    // remember `~/Library/Mobile Documents/com~apple~CloudDocs/`.
+    if matches!(
+        bcfg.memory_sync_backend,
+        harness_tools::MemorySyncBackend::ICloud
+    ) && bcfg.memory_user_root.is_none()
+    {
+        match harness_tools::icloud_memory_root() {
+            Some(p) => {
+                info!(path = %p.display(), "iCloud backend: pinning user memory root");
+                bcfg.memory_user_root = Some(p);
+            }
+            None => {
+                warn!(
+                    "iCloud backend selected but iCloud Drive base \
+                     (`~/Library/Mobile Documents/com~apple~CloudDocs/`) not found; \
+                     iCloud sync will be unavailable. \
+                     Enable iCloud Drive in System Settings, then restart."
+                );
+            }
+        }
+    }
+    // P11.2 — background auto-sync ticker. Gated on the git backend
+    // being active (explicit `Git`, or legacy `enable_memory_sync`
+    // while the backend resolved to `None`): there's nothing to tick
+    // when the sync tools aren't registered. Default off so the
+    // explicit `memory.sync` workflow doesn't grow background network
+    // calls without opt-in. P13: the ticker is git-only — iCloud syncs
+    // at OS level, so a Jarvis-side ticker would be redundant.
+    let git_backend_active = matches!(
+        bcfg.memory_sync_backend,
+        harness_tools::MemorySyncBackend::Git
+    ) || (bcfg.enable_memory_sync
+        && matches!(
+            bcfg.memory_sync_backend,
+            harness_tools::MemorySyncBackend::None
+        ));
+    let auto_sync_enabled =
+        git_backend_active && pick_bool_flag("JARVIS_MEMORY_AUTO_SYNC", None, false);
+    let auto_sync_user_root = bcfg.memory_user_root.clone();
+    let auto_sync_interval = std::env::var("JARVIS_MEMORY_AUTO_SYNC_INTERVAL_SECS")
+        .ok()
+        .and_then(|s| s.parse::<u64>().ok())
+        .unwrap_or(harness_tools::memory_sync::DEFAULT_AUTO_SYNC_INTERVAL_SECS);
+
     // Open persistence early so the TODO store can flow into
     // [`BuiltinsConfig`] before [`register_builtins`] runs. The same
     // URL drives all three stores (conversations, projects, todos);
@@ -221,6 +318,20 @@ pub async fn run(
         info!("channel-instance store active (channel.send tool registered)");
     }
 
+    // Snapshot the few flags later code paths still need before
+    // `register_builtins` consumes `bcfg`. Avoids cloning the whole
+    // config (which holds Arc<dyn Store> handles).
+    let memory_tools_enabled = bcfg.enable_memory;
+    let memory_user_root = bcfg.memory_user_root.clone();
+    // Effective backend after the same resolution
+    // `register_builtins` applies: an explicit backend wins,
+    // otherwise the legacy `enable_memory_sync` bool maps to Git.
+    let memory_sync_backend_active = match bcfg.memory_sync_backend {
+        harness_tools::MemorySyncBackend::None if bcfg.enable_memory_sync => {
+            harness_tools::MemorySyncBackend::Git
+        }
+        other => other,
+    };
     register_builtins(&mut tools, bcfg);
     tools.register(HarnessHealthTool::new(
         observability_store.clone(),
@@ -388,7 +499,15 @@ pub async fn run(
     // opened earlier so the TODO store could flow into
     // `BuiltinsConfig`. The same handles are reused below — no
     // second connection.
-    let mut system_prompt = pick_system_prompt(&cfg, coding_mode);
+    // Assemble the system prompt via the typed slot builder. The
+    // result is byte-equivalent to the prior `push_str` flow (slots
+    // joined with `\n\n` in slot order) so the LLM prompt-cache
+    // fingerprint doesn't rotate, but the structure makes it easy
+    // for future subsystems (M3.1 Project Memory writes, sub-agent
+    // overrides) to drop their text into a known slot without
+    // touching this site.
+    let mut prompt_builder = harness_core::SystemPromptBuilder::new()
+        .with_base(pick_system_prompt(&cfg, coding_mode));
     let project_ctx_cap = project_context_max_bytes(&cfg);
     let mut project_context_loaded = false;
     if include_project_context(&cfg) {
@@ -398,11 +517,6 @@ pub async fn run(
                 cap = project_ctx_cap,
                 "loaded project instructions (AGENTS.md / JARVIS.md / CLAUDE.md / .jarvis)"
             );
-            // The loader truncates at the cap and tags the suffix. When
-            // it fired, surface a WARN so operators with larger
-            // instruction files notice and can opt back to a higher cap
-            // via `JARVIS_PROJECT_CONTEXT_BYTES` rather than silently
-            // shipping truncated guidance to the model.
             if extra.contains("project context truncated at") {
                 warn!(
                     cap = project_ctx_cap,
@@ -411,8 +525,7 @@ pub async fn run(
                      to raise (default lowered to 8 KiB to keep system prompt focused)."
                 );
             }
-            system_prompt.push_str("\n\n");
-            system_prompt.push_str(&extra);
+            prompt_builder = prompt_builder.append_runtime_inject(extra);
             project_context_loaded = true;
         }
     }
@@ -439,11 +552,73 @@ pub async fn run(
                 dir = %project_memory_dir.display(),
                 "loaded project memory prompt"
             );
-            system_prompt.push_str("\n\n");
-            system_prompt.push_str(&extra);
+            prompt_builder = prompt_builder.append_runtime_inject(extra);
             project_memory_loaded = true;
         }
     }
+    // Agent-maintained memory indices (M3.1 + P9). When the memory
+    // tools are enabled, inject both scopes' MEMORY.md files so the
+    // model wakes up with "what do I know about this project" AND
+    // "what do I know about this user" before turn 1. Each entry's
+    // body is fetched on demand via `memory.read(slug, scope?)`.
+    let user_memory_root = resolve_memory_user_root();
+    let mut memory_index_loaded = false;
+    let include_cache_root = home_dir()
+        .map(|h| h.join(".jarvis/include-cache"))
+        .unwrap_or_else(|| std::env::temp_dir().join("jarvis-include-cache"));
+    // P18.3 — optional gentle TTL refresh. `JARVIS_INCLUDE_TTL_HOURS=N`
+    // causes git+ includes whose cache is older than N hours to
+    // trigger a `git pull --ff-only` before being injected.
+    // Unset, `0`, or an unparseable value keeps the original
+    // "manual refresh only" behaviour from P16.
+    let include_ttl = std::env::var("JARVIS_INCLUDE_TTL_HOURS")
+        .ok()
+        .and_then(|s| s.parse::<u64>().ok())
+        .filter(|n| *n > 0)
+        .map(|n| std::time::Duration::from_secs(n * 3600));
+    if memory_tools_enabled {
+        // Shared dedup set spans both scope walks so a directive
+        // included from both workspace + user injects only once.
+        let mut include_seen: std::collections::HashSet<String> =
+            std::collections::HashSet::new();
+        let (next, loaded) = inject_memory_with_includes(
+            prompt_builder,
+            "project memory index",
+            "workspace",
+            &workspace_root,
+            &include_cache_root,
+            &mut include_seen,
+            include_ttl,
+        )
+        .await;
+        prompt_builder = next;
+        if loaded {
+            memory_index_loaded = true;
+        }
+        if let Some(user_root) = user_memory_root.as_deref() {
+            let (next, loaded) = inject_memory_with_includes(
+                prompt_builder,
+                "user memory index",
+                "user",
+                user_root,
+                &include_cache_root,
+                &mut include_seen,
+                include_ttl,
+            )
+            .await;
+            prompt_builder = next;
+            if loaded {
+                memory_index_loaded = true;
+            }
+        }
+    }
+    let _ = memory_index_loaded; // reserved for future telemetry
+    let system_prompt = prompt_builder.build();
+    info!(
+        slots = ?prompt_builder.trace(),
+        total_bytes = system_prompt.len(),
+        "system prompt assembled",
+    );
     // Snapshot the canonical registry as the agent template's tool
     // catalogue. `AppState::build_agent` always re-snapshots from
     // `canonical_tools` per request, so this seed is only for the
@@ -469,8 +644,10 @@ pub async fn run(
         &extras,
         &route_policy,
     );
-    if let Some(mem) = build_memory(&cfg, &llm, &model, store.as_ref(), summary_resolver)? {
-        agent_cfg = agent_cfg.with_memory(mem);
+    let mut memory_stats: Option<Arc<dyn harness_core::MemoryStatsProvider>> = None;
+    if let Some(bundle) = build_memory(&cfg, &llm, &model, store.as_ref(), summary_resolver)? {
+        agent_cfg = agent_cfg.with_memory(bundle.memory);
+        memory_stats = bundle.stats;
     }
     if let Some(approver) = build_approver(&cfg)? {
         agent_cfg = agent_cfg.with_approver(approver);
@@ -668,6 +845,20 @@ pub async fn run(
         .with_worktree_config(worktree_mode, worktree_root, worktree_allow_dirty)
         .with_route_policy(route_policy)
         .with_subagent_runs(harness_server::SubAgentRunRegistry::new());
+    if let Some(stats) = memory_stats {
+        state = state.with_memory_stats(stats);
+    }
+    // P14 — expose memory runtime metadata to the Web UI / REST.
+    // Only attached when the memory tools are actually enabled —
+    // otherwise the panel's REST endpoints respond with a clean 503
+    // so the UI knows to show an "off, enable in config" state.
+    if memory_tools_enabled {
+        state = state.with_memory_runtime(harness_server::MemoryRuntime {
+            workspace_root: workspace_root.clone(),
+            user_root: memory_user_root.clone(),
+            backend: memory_sync_backend_active,
+        });
+    }
     if let Some(pm) = project_memory_runtime.clone() {
         state = state.with_project_memory(pm);
     }
@@ -919,6 +1110,33 @@ pub async fn run(
         });
     }
 
+    // P11.2 — background memory auto-sync. Started after AppState
+    // is finalised but before `serve(...)` runs forever; the handle
+    // is bound to a local, so it outlives the `serve(...)` await.
+    // When the process exits the task drops along with it.
+    let _auto_sync_handle = if auto_sync_enabled {
+        if let Some(user_root) = auto_sync_user_root {
+            let mut roots = harness_tools::MemoryRoots::new(workspace_root.clone());
+            roots = roots.with_user_root(user_root);
+            let cfg = harness_tools::memory_sync::AutoSyncConfig {
+                roots,
+                scope: harness_tools::MemoryScope::User,
+                interval: std::time::Duration::from_secs(auto_sync_interval),
+                initial_pull: true,
+            };
+            info!(
+                interval_secs = auto_sync_interval,
+                "memory auto-sync ticker started"
+            );
+            Some(harness_tools::memory_sync::spawn_auto_sync_task(cfg))
+        } else {
+            warn!("JARVIS_MEMORY_AUTO_SYNC set but user_root is unconfigured; ticker not started");
+            None
+        }
+    } else {
+        None
+    };
+
     serve(addr, state).await?;
 
     drop(mcp_manager);
@@ -1232,6 +1450,142 @@ fn home_dir() -> Option<PathBuf> {
         .or_else(|| std::env::var_os("USERPROFILE").map(PathBuf::from))
 }
 
+/// Per-include body cap when injected into the system prompt
+/// (P18). Anything larger gets truncated with a stable marker so
+/// the model knows there's more behind it. Same value as
+/// `harness_tools::memory::MAX_INDEX_BYTES` because that's also
+/// the limit on the index file itself — keeps the prompt budget
+/// predictable when both scopes pull from sizeable upstreams.
+const INCLUDE_INJECT_MAX_BYTES: usize = 25 * 1024;
+
+/// P16/P18: read one memory scope's MEMORY.md, append it as a
+/// slot in the prompt, then walk its include directives and
+/// append each upstream MEMORY.md as its own
+/// `=== included from <label> ===` block.
+///
+/// - **Cycle-safe by construction**: depth=1 only.
+/// - **Cross-scope dedup**: `seen` accumulates directive
+///   wire-strings across workspace + user invocations, so a
+///   `git+...` URL referenced by both scopes is injected only
+///   once (whichever scope sees it first wins).
+/// - **Body cap**: each upstream body is truncated to
+///   [`INCLUDE_INJECT_MAX_BYTES`] before append, with a marker.
+/// - **Failures are warn'd**, never propagated — a broken
+///   include can't bring down startup.
+///
+/// Returns the (possibly mutated) builder + whether anything was
+/// injected for this scope.
+async fn inject_memory_with_includes(
+    mut builder: harness_core::SystemPromptBuilder,
+    label: &str,
+    scope_tag: &str,
+    root: &std::path::Path,
+    cache_root: &std::path::Path,
+    seen: &mut std::collections::HashSet<String>,
+    ttl: Option<std::time::Duration>,
+) -> (harness_core::SystemPromptBuilder, bool) {
+    let body = match harness_tools::memory::read_index(root).await {
+        Ok(Some(b)) if !b.trim().is_empty() => b,
+        Ok(_) => return (builder, false),
+        Err(e) => {
+            warn!(error = %e, scope = scope_tag, path = %root.display(),
+                  "failed to load memory index");
+            return (builder, false);
+        }
+    };
+    let block = format!("=== {label} ===\n{}", body.trim_end());
+    info!(
+        bytes = block.len(),
+        scope = scope_tag,
+        path = %root.display(),
+        "loaded memory index"
+    );
+    builder = builder.append_runtime_inject(block);
+
+    let directives = harness_tools::memory_include::parse_include_directives(&body);
+    for d in directives {
+        let key = d.as_wire();
+        if !seen.insert(key.clone()) {
+            info!(target = %d.label(), scope = scope_tag,
+                  "include skipped (already injected from another scope)");
+            continue;
+        }
+        // P18.3 — TTL-driven gentle refresh before resolve.
+        // Skipped when no TTL is configured or the directive
+        // isn't a git URL. Failures are logged inside the helper;
+        // we keep the stale cache and continue.
+        if let Some(ttl_dur) = ttl {
+            let _ = harness_tools::memory_include::maybe_refresh_git_cache(
+                &d, cache_root, ttl_dur,
+            )
+            .await;
+        }
+        let dir = match harness_tools::memory_include::resolve_include(&d, cache_root).await {
+            Ok(p) => p,
+            Err(e) => {
+                warn!(error = %e, target = %d.label(),
+                      "include resolution failed; skipping");
+                continue;
+            }
+        };
+        let path = dir.join("MEMORY.md");
+        let upstream = match tokio::fs::read_to_string(&path).await {
+            Ok(b) => b,
+            Err(e) => {
+                warn!(error = %e, target = %d.label(),
+                      "include read failed; skipping");
+                continue;
+            }
+        };
+        let trimmed = upstream.trim_end();
+        if trimmed.is_empty() {
+            continue;
+        }
+        let capped = if trimmed.len() > INCLUDE_INJECT_MAX_BYTES {
+            // Back off to a UTF-8 char boundary so the slice below
+            // can't panic, then append a fixed marker so truncated
+            // output stays byte-stable and doesn't shift the cache key.
+            let mut cut = INCLUDE_INJECT_MAX_BYTES;
+            while cut > 0 && !trimmed.is_char_boundary(cut) {
+                cut -= 1;
+            }
+            let mut s = trimmed[..cut].to_string();
+            s.push_str(
+                "\n\n[... include body truncated to fit system-prompt budget ...]",
+            );
+            s
+        } else {
+            trimmed.to_string()
+        };
+        let inc_block = format!("=== included from {} ===\n{}", d.label(), capped);
+        info!(
+            bytes = inc_block.len(),
+            target = %d.label(),
+            truncated = trimmed.len() > INCLUDE_INJECT_MAX_BYTES,
+            "loaded include"
+        );
+        builder = builder.append_runtime_inject(inc_block);
+    }
+    (builder, true)
+}
+
+/// Resolve where user-scope memory (P9) should live.
+/// Order: `JARVIS_MEMORY_USER_ROOT` > `~/.jarvis`. A blank env value
+/// disables the scope. Returns `None` when the home directory can't
+/// be resolved and no override is set — user-scope writes will then
+/// error cleanly via the tool's "user-scope not configured" message.
+fn resolve_memory_user_root() -> Option<PathBuf> {
+    if let Ok(v) = std::env::var("JARVIS_MEMORY_USER_ROOT") {
+        let trimmed = v.trim();
+        if trimmed.is_empty() {
+            // Explicitly disabled.
+            return None;
+        }
+        return Some(PathBuf::from(trimmed));
+    }
+    home_dir().map(|h| h.join(".jarvis"))
+}
+
 /// Read `JARVIS_SHELL_LIMITS=safe` to opt into the
 /// 60s/2GB/256fd/256proc preset, or set individual env vars
 /// (`JARVIS_SHELL_CPU_SECS`, `JARVIS_SHELL_AS_BYTES`,
@@ -1757,7 +2111,7 @@ fn build_memory(
     active_model: &str,
     store: Option<&Arc<dyn harness_core::ConversationStore>>,
     route_resolver: Option<Arc<harness_memory::LlmRouteResolver>>,
-) -> Result<Option<Arc<dyn Memory>>> {
+) -> Result<Option<MemoryBundle>> {
     let budget = std::env::var("JARVIS_MEMORY_TOKENS")
         .ok()
         .and_then(|s| s.parse::<usize>().ok())
@@ -1771,6 +2125,7 @@ fn build_memory(
     // reflects what the model actually counts. Cheap to ask once per
     // memory backend; the estimator is `Arc`-shared internally.
     let estimator = llm.estimator();
+    let mut stats: Option<Arc<dyn harness_core::MemoryStatsProvider>> = None;
     let mem: Arc<dyn Memory> = match mode.as_str() {
         "summary" => {
             let summary_model = pick_string_opt("JARVIS_MEMORY_MODEL", cfg.memory.model.as_deref())
@@ -1796,6 +2151,11 @@ fn build_memory(
                 routed,
                 "summarising memory enabled",
             );
+            // P8: expose the backend's compaction counters so the
+            // diagnostics endpoint can render them. SlidingWindow
+            // has no LLM-driven state worth tracking; its branch
+            // below leaves `stats` as `None`.
+            stats = Some(sm.counters() as Arc<dyn harness_core::MemoryStatsProvider>);
             Arc::new(sm)
         }
         "window" => {
@@ -1806,7 +2166,15 @@ fn build_memory(
             anyhow::bail!("memory.mode=`{other}` is not recognised; use `window` or `summary`");
         }
     };
-    Ok(Some(mem))
+    Ok(Some(MemoryBundle { memory: mem, stats }))
+}
+
+/// Memory backend + the optional telemetry handle the diagnostics
+/// surface needs. Wrapper struct so `build_memory` can return both
+/// without the caller needing to branch on memory mode.
+pub struct MemoryBundle {
+    pub memory: Arc<dyn Memory>,
+    pub stats: Option<Arc<dyn harness_core::MemoryStatsProvider>>,
 }
 
 /// Build the global [`Approver`] attached to the agent's
diff --git a/crates/harness-channel/Cargo.toml b/crates/harness-channel/Cargo.toml
index 9c292dd..5488a30 100644
--- a/crates/harness-channel/Cargo.toml
+++ b/crates/harness-channel/Cargo.toml
@@ -10,4 +10,5 @@ async-trait.workspace = true
 chrono.workspace = true
 serde.workspace = true
 serde_json.workspace = true
+ts-rs.workspace = true
 uuid.workspace = true
diff --git a/crates/harness-channel/src/instance.rs b/crates/harness-channel/src/instance.rs
index bf7ec18..d430358 100644
--- a/crates/harness-channel/src/instance.rs
+++ b/crates/harness-channel/src/instance.rs
@@ -14,6 +14,7 @@
 //! needed for the next message)`.
 
 use serde::{Deserialize, Serialize};
+use ts_rs::TS;
 
 /// User-driven enabled/disabled/unconfigured state. Distinct from
 /// "did the last send succeed" — that's surfaced via per-instance
@@ -21,8 +22,9 @@ use serde::{Deserialize, Serialize};
 /// validator detects required fields are missing (so the UI can show
 /// a "继续配置" CTA without the user having to remember which fields
 /// they skipped).
-#[derive(Debug, Clone, Copy, PartialEq, Eq, Default, Serialize, Deserialize)]
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Default, Serialize, Deserialize, TS)]
 #[serde(rename_all = "snake_case")]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub enum ChannelInstanceStatus {
     #[default]
     Enabled,
@@ -58,7 +60,8 @@ impl ChannelInstanceStatus {
 /// schema without baking variant-specific fields into the trait
 /// surface. The current kinds and their schemas live next to the
 /// `kind`-specific senders in `harness-server`.
-#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
+#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize, TS)]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub struct ChannelInstance {
     /// Stable UUID. Frontend keys list rows by this.
     pub id: String,
@@ -74,6 +77,7 @@ pub struct ChannelInstance {
     /// Kind-specific config payload. May embed `${env:NAME}` template
     /// strings — resolved at send-time, never at store-time, so a
     /// rotated env var takes effect immediately.
+    #[ts(type = "Record<string, unknown>")]
     pub config: serde_json::Value,
     /// RFC-3339 timestamp set on insert.
     pub created_at: String,
diff --git a/crates/harness-channel/src/message.rs b/crates/harness-channel/src/message.rs
index 6ae208a..f9ab6d6 100644
--- a/crates/harness-channel/src/message.rs
+++ b/crates/harness-channel/src/message.rs
@@ -7,13 +7,15 @@
 //! - normalise the result so retries are explicit ([`SendOutcome`])
 
 use serde::{Deserialize, Serialize};
+use ts_rs::TS;
 
 /// Wire format of an outbound message body. Adapters that don't
 /// support a particular format fall back to `Text` and tag the
 /// `SendOutcome` so the caller (e.g. `channel.send` tool) can
 /// surface "downgraded to text" in the agent's transcript.
-#[derive(Debug, Clone, Copy, PartialEq, Eq, Default, Serialize, Deserialize)]
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Default, Serialize, Deserialize, TS)]
 #[serde(rename_all = "snake_case")]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub enum ChannelMessageFormat {
     #[default]
     Text,
diff --git a/crates/harness-core/src/agent.rs b/crates/harness-core/src/agent.rs
index fd749e3..b8ccd58 100644
--- a/crates/harness-core/src/agent.rs
+++ b/crates/harness-core/src/agent.rs
@@ -300,6 +300,15 @@ pub enum AgentEvent {
     /// stays in Plan Mode until the user accepts via the WS frame
     /// `{type:"accept_plan", post_mode:"..."}`.
     PlanProposed { plan: String },
+    /// A tool requested a permission-mode switch via
+    /// [`crate::mode_signal::emit`]. Emitted *after* the tool's
+    /// `ToolEnd`. Transports react by updating their per-session
+    /// mode handle so the next turn's approver / tool_filter see
+    /// the new mode. Today only the `enter_plan_mode` tool emits
+    /// this — it sends [`crate::PermissionMode::Plan`] so the model
+    /// can voluntarily switch into read-only investigation mode
+    /// without the operator clicking the UI toggle.
+    ModeChanged { mode: crate::permission::PermissionMode },
     /// Provider-reported token usage for the LLM call that just
     /// finished. Optional fields — see [`crate::Usage`]. Emitted at
     /// most once per LLM iteration; transports typically aggregate
@@ -388,7 +397,16 @@ impl Agent {
         // (`run_stream`) leaves scoping to its transport callers
         // because async-stream `yield` can't traverse a
         // `LocalKey::scope` boundary.
-        crate::todo::with_turn_budget(self.run_inner(conversation)).await
+        //
+        // The working-context slot is installed at the same level so
+        // every tool call inside the loop can `note_file` and every
+        // `Memory::compact` can snapshot the latest plan + recent
+        // files. Scope is per-run: a fresh `Agent::run` invocation
+        // gets a fresh slot.
+        crate::working_context::with_working_context(
+            crate::todo::with_turn_budget(self.run_inner(conversation)),
+        )
+        .await
     }
 
     async fn run_inner(&self, conversation: &mut Conversation) -> Result<(RunOutcome, Usage)> {
@@ -425,14 +443,30 @@ impl Agent {
                     {
                         // Parallel dispatch path: when the operator opted
                         // in *and* the model emitted >1 tool call this
-                        // turn, run them concurrently and push the
-                        // resulting `Message::Tool` rows in the original
+                        // turn *and* every called tool advertises
+                        // `is_concurrency_safe() && !is_destructive()`,
+                        // run them concurrently and push the resulting
+                        // `Message::Tool` rows in the original
                         // `tool_calls` index order. Order matters
                         // because OpenAI / Anthropic require tool
-                        // replies paired with the assistant's
-                        // tool_use ids — out-of-order or missing entries
-                        // trip 400s on the next request.
-                        if self.config.parallel_tool_calls && tool_calls.len() > 1 {
+                        // replies paired with the assistant's tool_use
+                        // ids — out-of-order or missing entries trip
+                        // 400s on the next request.
+                        //
+                        // The per-tool safety gate (M2.1) keeps a
+                        // mixed turn — e.g. 3 reads + 1 write —
+                        // fully serial so a sibling read can't observe
+                        // a half-applied mutation. The model rarely
+                        // mixes write tools into a parallel-friendly
+                        // batch anyway; investigation turns vs. action
+                        // turns are usually separate.
+                        if self.config.parallel_tool_calls
+                            && tool_calls.len() > 1
+                            && crate::tool::all_calls_concurrency_safe(
+                                &self.config.tools,
+                                tool_calls,
+                            )
+                        {
                             // Resolve approvals concurrently first so
                             // `run_one` sees a `Some(Deny { reason })`
                             // and surfaces the synthetic `tool denied:`
@@ -652,8 +686,17 @@ impl Agent {
                         // sequential path is preserved verbatim so
                         // single-tool turns and small-LLM compatibility
                         // don't regress.
+                        // Parallel gate matches the blocking path: opt-in
+                        // flag AND >1 call AND every call advertises
+                        // concurrency safety. A single destructive sibling
+                        // forces the whole turn back to serial dispatch
+                        // — see [`crate::tool::all_calls_concurrency_safe`].
                         let parallel = agent.config.parallel_tool_calls
-                            && tool_calls.len() > 1;
+                            && tool_calls.len() > 1
+                            && crate::tool::all_calls_concurrency_safe(
+                                &agent.config.tools,
+                                tool_calls,
+                            );
 
                         if !parallel {
                             for call in tool_calls {
@@ -738,6 +781,8 @@ impl Agent {
                                     tokio::sync::mpsc::unbounded_channel::<Vec<crate::plan::PlanItem>>();
                                 let (sub_tx, mut sub_rx) =
                                     tokio::sync::mpsc::unbounded_channel::<crate::subagent::SubAgentFrame>();
+                                let (mode_tx, mut mode_rx) =
+                                    tokio::sync::mpsc::unbounded_channel::<crate::permission::PermissionMode>();
                                 let invoke = crate::workspace::with_session_workspace(
                                     agent.config.session_workspace.clone(),
                                     crate::progress::with_progress(
@@ -746,12 +791,15 @@ impl Agent {
                                             plan_tx,
                                             crate::subagent::with_subagent(
                                                 sub_tx,
-                                                run_one_with_optional_hitl(
-                                                    agent.config.hitl_tx.clone(),
-                                                    Self::run_one(
-                                                        &agent.config.tools,
-                                                        call,
-                                                        decision.as_ref(),
+                                                crate::mode_signal::with_mode_signal(
+                                                    mode_tx,
+                                                    run_one_with_optional_hitl(
+                                                        agent.config.hitl_tx.clone(),
+                                                        Self::run_one(
+                                                            &agent.config.tools,
+                                                            call,
+                                                            decision.as_ref(),
+                                                        ),
                                                     ),
                                                 ),
                                             ),
@@ -771,11 +819,15 @@ impl Agent {
                                             };
                                         }
                                         Some(items) = plan_rx.recv() => {
+                                            crate::working_context::note_plan(items.clone());
                                             yield AgentEvent::PlanUpdate { items };
                                         }
                                         Some(frame) = sub_rx.recv() => {
                                             yield AgentEvent::SubAgentEvent { frame };
                                         }
+                                        Some(mode) = mode_rx.recv() => {
+                                            yield AgentEvent::ModeChanged { mode };
+                                        }
                                         res = &mut invoke => {
                                             // Drain anything the tool
                                             // queued in the same wake as
@@ -790,11 +842,15 @@ impl Agent {
                                                 };
                                             }
                                             while let Ok(items) = plan_rx.try_recv() {
+                                                crate::working_context::note_plan(items.clone());
                                                 yield AgentEvent::PlanUpdate { items };
                                             }
                                             while let Ok(frame) = sub_rx.try_recv() {
                                                 yield AgentEvent::SubAgentEvent { frame };
                                             }
+                                            while let Ok(mode) = mode_rx.try_recv() {
+                                                yield AgentEvent::ModeChanged { mode };
+                                            }
                                             break res;
                                         }
                                     }
@@ -987,6 +1043,7 @@ impl Agent {
                                         let (prog_tx, mut prog_rx) = tokio::sync::mpsc::unbounded_channel::<crate::progress::ToolProgress>();
                                         let (plan_tx, mut plan_rx) = tokio::sync::mpsc::unbounded_channel::<Vec<crate::plan::PlanItem>>();
                                         let (sub_tx, mut sub_rx) = tokio::sync::mpsc::unbounded_channel::<crate::subagent::SubAgentFrame>();
+                                        let (mode_tx, mut mode_rx) = tokio::sync::mpsc::unbounded_channel::<crate::permission::PermissionMode>();
                                         let invoke = crate::workspace::with_session_workspace(
                                             agent.config.session_workspace.clone(),
                                             crate::progress::with_progress(
@@ -995,12 +1052,15 @@ impl Agent {
                                                     plan_tx,
                                                     crate::subagent::with_subagent(
                                                         sub_tx,
-                                                        run_one_with_optional_hitl(
-                                                            agent.config.hitl_tx.clone(),
-                                                            Self::run_one(
-                                                                &agent.config.tools,
-                                                                &call,
-                                                                decision.as_ref(),
+                                                        crate::mode_signal::with_mode_signal(
+                                                            mode_tx,
+                                                            run_one_with_optional_hitl(
+                                                                agent.config.hitl_tx.clone(),
+                                                                Self::run_one(
+                                                                    &agent.config.tools,
+                                                                    &call,
+                                                                    decision.as_ref(),
+                                                                ),
                                                             ),
                                                         ),
                                                     ),
@@ -1022,11 +1082,15 @@ impl Agent {
                                                     });
                                                 }
                                                 Some(items) = plan_rx.recv() => {
+                                                    crate::working_context::note_plan(items.clone());
                                                     let _ = event_tx.send(AgentEvent::PlanUpdate { items });
                                                 }
                                                 Some(frame) = sub_rx.recv() => {
                                                     let _ = event_tx.send(AgentEvent::SubAgentEvent { frame });
                                                 }
+                                                Some(mode) = mode_rx.recv() => {
+                                                    let _ = event_tx.send(AgentEvent::ModeChanged { mode });
+                                                }
                                                 res = &mut invoke => {
                                                     while let Ok(p) = prog_rx.try_recv() {
                                                         let _ = event_tx.send(AgentEvent::ToolProgress {
@@ -1037,11 +1101,15 @@ impl Agent {
                                                         });
                                                     }
                                                     while let Ok(items) = plan_rx.try_recv() {
+                                                        crate::working_context::note_plan(items.clone());
                                                         let _ = event_tx.send(AgentEvent::PlanUpdate { items });
                                                     }
                                                     while let Ok(frame) = sub_rx.try_recv() {
                                                         let _ = event_tx.send(AgentEvent::SubAgentEvent { frame });
                                                     }
+                                                    while let Ok(mode) = mode_rx.try_recv() {
+                                                        let _ = event_tx.send(AgentEvent::ModeChanged { mode });
+                                                    }
                                                     break res;
                                                 }
                                             }
@@ -1164,8 +1232,12 @@ impl Agent {
                 ),
             };
         };
+        // Wrap once for the working-context slot (per-stream, shared
+        // across all polls) and once for the tracing span. Both are
+        // shallow `poll_next` wrappers — they don't change the
+        // event sequence.
         Box::pin(SpanStream {
-            inner: Box::pin(inner),
+            inner: Box::pin(crate::working_context::scope_stream(inner)),
             span: run_span,
         })
     }
diff --git a/crates/harness-core/src/lib.rs b/crates/harness-core/src/lib.rs
index 11469c0..f97b886 100644
--- a/crates/harness-core/src/lib.rs
+++ b/crates/harness-core/src/lib.rs
@@ -15,16 +15,19 @@ pub mod hitl;
 pub mod llm;
 pub mod memory;
 pub mod message;
+pub mod mode_signal;
 pub mod permission;
 pub mod plan;
 pub mod progress;
 pub mod redact;
 pub mod store;
 pub mod subagent;
+pub mod system_prompt;
 pub mod tenant;
 pub mod todo;
 pub mod tool;
 pub mod tool_metadata;
+pub mod working_context;
 pub mod workspace;
 
 // `activity` / `comment` / `doc` / `label` / `project` / `project_memory`
@@ -52,9 +55,12 @@ pub use hitl::{
 pub use llm::{ChatRequest, ChatResponse, FinishReason, LlmChunk, LlmProvider, LlmStream, Usage};
 pub use memory::{
     cache_breakpoint_indices, default_estimator, estimate_tokens, estimate_total_tokens,
-    CharRatioEstimator, JsonAwareEstimator, Memory, TokenEstimator,
+    CharRatioEstimator, JsonAwareEstimator, Memory, MemoryStatsProvider, TokenEstimator,
 };
 pub use message::{CacheHint, Message, ToolCall};
+pub use mode_signal::{
+    emit as emit_mode_signal, is_active as mode_signal_active, with_mode_signal,
+};
 // `observability` module + all its types (Eval* / Observed* /
 // Metric* / Dashboard* / TimeWindow / *Store / *Filter) moved to
 // the `harness-observability` crate. Import via
@@ -77,6 +83,7 @@ pub use subagent::{
     active_sender as subagent_active_sender, emit as emit_subagent, is_active as subagent_active,
     with_subagent, SubAgentEvent, SubAgentFrame,
 };
+pub use system_prompt::{SystemPromptBuilder, SystemPromptSlot};
 /// Tenant (multi-tenant isolation boundary) value types and store trait.
 ///
 /// **Important distinction:** [`Tenant`](crate::tenant::Tenant) is a
@@ -85,10 +92,17 @@ pub use subagent::{
 /// directory concept lives in [`workspace`](crate::workspace).
 pub use tenant::{Tenant, TenantSettings, TenantStore};
 pub use todo::{TodoEvent, TodoItem, TodoPriority, TodoStatus};
-pub use tool::{Tool, ToolCategory, ToolRegistry, ToolSpec};
+pub use tool::{all_calls_concurrency_safe, Tool, ToolCategory, ToolRegistry, ToolSpec};
 pub use tool_metadata::{
     derive_pack, derive_risk, ToolMetadata, ToolPackCategory, ToolRisk, ToolSource,
 };
+pub use working_context::{
+    is_active as working_context_active, note_command as note_working_command,
+    note_file as note_working_file,
+    note_file_relative_to as note_working_file_relative_to, note_plan as note_working_plan,
+    snapshot as working_context_snapshot, with_working_context, with_working_context_capped,
+    WorkingContext, DEFAULT_RECENT_COMMANDS_CAP, DEFAULT_RECENT_FILES_CAP,
+};
 pub use workspace::{
     active_workspace, active_workspace_or, canonicalize_workspace, with_session_workspace,
 };
diff --git a/crates/harness-core/src/memory.rs b/crates/harness-core/src/memory.rs
index 7fe5cb5..3c8c804 100644
--- a/crates/harness-core/src/memory.rs
+++ b/crates/harness-core/src/memory.rs
@@ -202,6 +202,28 @@ pub fn default_estimator() -> Arc<dyn TokenEstimator> {
     Arc::new(CharRatioEstimator)
 }
 
+/// Diagnostics surface for memory backends — exposes a JSON snapshot
+/// of internal counters (compaction count, cache hits, circuit-breaker
+/// trips, PTL triggers, …) so a `GET /v1/diagnostics/memory` endpoint
+/// can render dashboards / tune budgets without backends having to
+/// depend on `harness-observability`.
+///
+/// Implementations should return cheap snapshots (a few atomic
+/// loads + a JSON serialization). The endpoint can be hit on every
+/// poll without affecting agent latency.
+///
+/// `harness-memory::SummarizingMemory` ships the canonical impl;
+/// future backends (e.g. an LLM-summary-with-retrieval one) can opt
+/// in by implementing the trait and getting picked up by the same
+/// surface for free.
+pub trait MemoryStatsProvider: Send + Sync {
+    /// Return a JSON object describing the backend's current
+    /// counters. Shape is backend-defined; the only contract is
+    /// that it's a JSON object (not a primitive) so the endpoint
+    /// can flatten / extend it.
+    fn snapshot(&self) -> serde_json::Value;
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;
diff --git a/crates/harness-core/src/mode_signal.rs b/crates/harness-core/src/mode_signal.rs
new file mode 100644
index 0000000..24081ed
--- /dev/null
+++ b/crates/harness-core/src/mode_signal.rs
@@ -0,0 +1,78 @@
+//! Mode-signal channel — typed "switch permission mode" stream.
+//!
+//! Companion to [`crate::plan`] / [`crate::progress`]. Lets a tool
+//! ask the host transport to change the current permission mode
+//! from inside an agent turn — e.g. the `enter_plan_mode` tool
+//! emits [`PermissionMode::Plan`] and the WS handler reacts by
+//! flipping its per-socket mode handle. Without a typed channel,
+//! transports would have to parse mode hints out of free-form tool
+//! output.
+//!
+//! Wire model mirrors `plan` / `progress`:
+//!
+//! - The agent loop installs an [`mpsc::UnboundedSender<PermissionMode>`]
+//!   in a [`tokio::task_local`] before invoking each tool, scoped via
+//!   [`with_mode_signal`].
+//! - A tool calls [`emit`] with the target mode. The mode change does
+//!   **not** take effect inside the current tool dispatch — the agent
+//!   loop forwards each request as [`crate::AgentEvent::ModeChanged`]
+//!   (while the tool runs, plus a final drain once it returns), and
+//!   transports apply the mode for subsequent turns.
+//! - Outside an agent invocation the channel is absent — emits become
+//!   no-ops, which keeps the tool's unit tests trivial.
+
+use tokio::sync::mpsc;
+
+use crate::permission::PermissionMode;
+
+tokio::task_local! {
+    /// Per-invocation mode-signal sender, scoped via [`with_mode_signal`].
+    static MODE_SIGNAL_TX: mpsc::UnboundedSender<PermissionMode>;
+}
+
+/// Publish a mode-change request. No-op when no listener is installed
+/// (e.g. the tool was invoked outside an agent loop in a unit test).
+pub fn emit(mode: PermissionMode) {
+    let _ = MODE_SIGNAL_TX.try_with(|tx| {
+        let _ = tx.send(mode);
+    });
+}
+
+/// Whether a mode-signal sender is installed for the current task.
+pub fn is_active() -> bool {
+    MODE_SIGNAL_TX.try_with(|_| ()).is_ok()
+}
+
+/// Run `fut` with `tx` installed as the active mode-signal sender.
+/// Used by the agent loop to scope a sender to a single tool
+/// invocation.
+pub async fn with_mode_signal<F, R>(tx: mpsc::UnboundedSender<PermissionMode>, fut: F) -> R
+where
+    F: std::future::Future<Output = R>,
+{
+    MODE_SIGNAL_TX.scope(tx, fut).await
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[tokio::test]
+    async fn emit_inside_with_mode_signal_reaches_receiver() {
+        let (tx, mut rx) = mpsc::unbounded_channel();
+        with_mode_signal(tx, async {
+            assert!(is_active());
+            emit(PermissionMode::Plan);
+        })
+        .await;
+        let got = rx.try_recv().unwrap();
+        assert_eq!(got, PermissionMode::Plan);
+    }
+
+    #[tokio::test]
+    async fn emit_outside_scope_is_noop() {
+        assert!(!is_active());
+        emit(PermissionMode::Plan);
+        // No panic; receiver doesn't exist.
+    }
+}
diff --git a/crates/harness-core/src/system_prompt.rs b/crates/harness-core/src/system_prompt.rs
new file mode 100644
index 0000000..1e12dbc
--- /dev/null
+++ b/crates/harness-core/src/system_prompt.rs
@@ -0,0 +1,259 @@
+//! Layered system-prompt assembly.
+//!
+//! Historically the composition root (`apps/jarvis::serve`) pushed
+//! strings into a single `String` to build the agent's system
+//! prompt: pick a base prompt, append project context, append
+//! project memory, append skill fences. That worked for the one
+//! call site but didn't compose: later subsystems (sub-agents,
+//! per-conversation overrides, M3.1 Project Memory writes) need to
+//! slot their own contributions in at predictable positions
+//! without re-implementing the string-pushing protocol.
+//!
+//! [`SystemPromptBuilder`] is the typed equivalent. Five ordered
+//! slots, each optional, joined by a stable delimiter. Empty slots
+//! contribute nothing, so callers that don't use a slot get the
+//! same bytes a hand-written push would have produced.
+//!
+//! Slot order (final prompt is the non-empty slots in this order,
+//! delimited by `\n\n`):
+//!
+//! 1. **base** — the agent's role/identity (general vs. coding
+//!    persona). Picked by the composition root from policy.
+//! 2. **role** — situational role override. Today unused at the
+//!    process level; sub-agent dispatch will set this per call
+//!    when wired up.
+//! 3. **per_agent_override** — caller-supplied override from a
+//!    persistent agent profile / WS frame. Lets a power user
+//!    swap in a custom prompt without losing the project context
+//!    that lives in `runtime_inject`.
+//! 4. **config_append** — operator's `[agent].system_prompt_append`
+//!    config value. Appended as written apart from trimming of
+//!    surrounding whitespace; the operator controls the text.
+//! 5. **runtime_inject** — context the runtime knows but the
+//!    operator didn't author: AGENTS.md / CLAUDE.md, project
+//!    memory index, active skill fences, etc. Last so the model
+//!    sees it freshly each turn.
+//!
+//! The builder is **immutable per call**: there's no in-place
+//! mutator. Callers chain `.with_*(...)` setters and call
+//! `.build()` once. [`SystemPromptBuilder::trace`] lists each
+//! populated slot's byte count so a future `--dump-system-prompt`
+//! style flag can show the build trace without re-running.
+
+use std::fmt;
+
+/// Stable separator between slots. Matches the original ad-hoc
+/// `push_str("\n\n")` pattern so existing prompt-cache fingerprints
+/// don't rotate when the assembly moves through this builder.
+const SLOT_SEPARATOR: &str = "\n\n";
+
+/// Logical slot identifier. The explicit discriminant is the build
+/// order (lowest first).
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub enum SystemPromptSlot {
+    Base = 0,
+    Role = 1,
+    PerAgentOverride = 2,
+    ConfigAppend = 3,
+    RuntimeInject = 4,
+}
+
+/// Layered system-prompt assembly. Cheap to clone (five optional
+/// strings) so a composition root can lay down a baseline and let
+/// per-request handlers fork it.
+#[derive(Debug, Clone, Default)]
+pub struct SystemPromptBuilder {
+    base: Option<String>,
+    role: Option<String>,
+    per_agent_override: Option<String>,
+    config_append: Option<String>,
+    runtime_inject: Option<String>,
+}
+
+impl SystemPromptBuilder {
+    pub fn new() -> Self {
+        Self::default()
+    }
+
+    /// Replace a slot. `None` clears it. Values are stored trimmed of
+    /// leading/trailing whitespace, and whitespace-only strings clear
+    /// the slot so callers don't have to filter their own inputs.
+    pub fn set(mut self, slot: SystemPromptSlot, value: Option<String>) -> Self {
+        let cleaned = value
+            .map(|v| v.trim().to_string())
+            .filter(|v| !v.is_empty());
+        match slot {
+            SystemPromptSlot::Base => self.base = cleaned,
+            SystemPromptSlot::Role => self.role = cleaned,
+            SystemPromptSlot::PerAgentOverride => self.per_agent_override = cleaned,
+            SystemPromptSlot::ConfigAppend => self.config_append = cleaned,
+            SystemPromptSlot::RuntimeInject => self.runtime_inject = cleaned,
+        }
+        self
+    }
+
+    pub fn with_base(self, value: impl Into<String>) -> Self {
+        self.set(SystemPromptSlot::Base, Some(value.into()))
+    }
+    pub fn with_role(self, value: impl Into<String>) -> Self {
+        self.set(SystemPromptSlot::Role, Some(value.into()))
+    }
+    pub fn with_per_agent_override(self, value: impl Into<String>) -> Self {
+        self.set(SystemPromptSlot::PerAgentOverride, Some(value.into()))
+    }
+    pub fn with_config_append(self, value: impl Into<String>) -> Self {
+        self.set(SystemPromptSlot::ConfigAppend, Some(value.into()))
+    }
+    pub fn with_runtime_inject(self, value: impl Into<String>) -> Self {
+        self.set(SystemPromptSlot::RuntimeInject, Some(value.into()))
+    }
+
+    /// Append text into the `runtime_inject` slot. Multiple calls
+    /// across the same builder collect each fragment separated by
+    /// `\n\n` so the M3.1 Project Memory injector and the existing
+    /// skill-fence injector can both contribute without overwriting
+    /// each other.
+    pub fn append_runtime_inject(mut self, value: impl Into<String>) -> Self {
+        let v = value.into();
+        let trimmed = v.trim();
+        if trimmed.is_empty() {
+            return self;
+        }
+        self.runtime_inject = Some(match self.runtime_inject.take() {
+            Some(existing) => format!("{existing}{SLOT_SEPARATOR}{trimmed}"),
+            None => trimmed.to_string(),
+        });
+        self
+    }
+
+    /// Whether a slot has a non-empty value.
+    pub fn has(&self, slot: SystemPromptSlot) -> bool {
+        match slot {
+            SystemPromptSlot::Base => self.base.is_some(),
+            SystemPromptSlot::Role => self.role.is_some(),
+            SystemPromptSlot::PerAgentOverride => self.per_agent_override.is_some(),
+            SystemPromptSlot::ConfigAppend => self.config_append.is_some(),
+            SystemPromptSlot::RuntimeInject => self.runtime_inject.is_some(),
+        }
+    }
+
+    /// Materialise the final prompt string. Non-empty slots are
+    /// joined by [`SLOT_SEPARATOR`] in slot order; an empty builder
+    /// returns the empty string.
+    pub fn build(&self) -> String {
+        let slots = [
+            self.base.as_deref(),
+            self.role.as_deref(),
+            self.per_agent_override.as_deref(),
+            self.config_append.as_deref(),
+            self.runtime_inject.as_deref(),
+        ];
+        let mut out = String::new();
+        let mut first = true;
+        for slot in slots.iter().flatten() {
+            if !first {
+                out.push_str(SLOT_SEPARATOR);
+            }
+            out.push_str(slot);
+            first = false;
+        }
+        out
+    }
+
+    /// Build trace: `[(name, bytes), ...]` for every populated slot.
+    /// Lets observability surfaces log a one-line "system prompt
+    /// assembled (base=NNN, runtime_inject=NNN)" without exposing
+    /// the prompt text itself.
+    pub fn trace(&self) -> Vec<(&'static str, usize)> {
+        let entries: [(&'static str, Option<&String>); 5] = [
+            ("base", self.base.as_ref()),
+            ("role", self.role.as_ref()),
+            ("per_agent_override", self.per_agent_override.as_ref()),
+            ("config_append", self.config_append.as_ref()),
+            ("runtime_inject", self.runtime_inject.as_ref()),
+        ];
+        entries
+            .into_iter()
+            .filter_map(|(n, s)| s.map(|v| (n, v.len())))
+            .collect()
+    }
+}
+
+impl fmt::Display for SystemPromptBuilder {
+    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+        f.write_str(&self.build())
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn empty_builder_returns_empty_string() {
+        assert_eq!(SystemPromptBuilder::new().build(), "");
+    }
+
+    #[test]
+    fn single_slot_is_verbatim() {
+        let s = SystemPromptBuilder::new().with_base("hello").build();
+        assert_eq!(s, "hello");
+    }
+
+    #[test]
+    fn multiple_slots_joined_in_order_with_double_newline() {
+        let s = SystemPromptBuilder::new()
+            .with_base("BASE")
+            .with_runtime_inject("RUNTIME")
+            .with_config_append("CFG")
+            .build();
+        // Order is base → config_append → runtime_inject regardless
+        // of caller call order.
+        assert_eq!(s, "BASE\n\nCFG\n\nRUNTIME");
+    }
+
+    #[test]
+    fn whitespace_only_slot_is_treated_as_empty() {
+        let s = SystemPromptBuilder::new()
+            .with_base("BASE")
+            .with_runtime_inject("   ")
+            .build();
+        assert_eq!(s, "BASE");
+        assert!(!SystemPromptBuilder::new()
+            .with_runtime_inject("   ")
+            .has(SystemPromptSlot::RuntimeInject));
+    }
+
+    #[test]
+    fn append_runtime_inject_concatenates() {
+        let s = SystemPromptBuilder::new()
+            .with_base("BASE")
+            .append_runtime_inject("=== project context ===\nfoo")
+            .append_runtime_inject("=== skill ===\nbar")
+            .build();
+        assert_eq!(
+            s,
+            "BASE\n\n=== project context ===\nfoo\n\n=== skill ===\nbar"
+        );
+    }
+
+    #[test]
+    fn trace_lists_only_populated_slots_in_build_order() {
+        let b = SystemPromptBuilder::new()
+            .with_base("hi")
+            .with_runtime_inject("ctx");
+        let trace = b.trace();
+        assert_eq!(trace.len(), 2);
+        assert_eq!(trace[0].0, "base");
+        assert_eq!(trace[1].0, "runtime_inject");
+    }
+
+    #[test]
+    fn clearing_slot_via_set_none() {
+        let b = SystemPromptBuilder::new()
+            .with_base("BASE")
+            .set(SystemPromptSlot::Base, None);
+        assert!(!b.has(SystemPromptSlot::Base));
+        assert_eq!(b.build(), "");
+    }
+}
diff --git a/crates/harness-core/src/tool.rs b/crates/harness-core/src/tool.rs
index b792359..6e948e4 100644
--- a/crates/harness-core/src/tool.rs
+++ b/crates/harness-core/src/tool.rs
@@ -96,6 +96,34 @@ pub trait Tool: Send + Sync {
     fn is_terminal(&self) -> bool {
         false
     }
+
+    /// Safe to invoke concurrently with sibling tool calls in the
+    /// same assistant turn. Default: `true` for [`ToolCategory::Read`]
+    /// tools (pure observation), `false` for everything else.
+    ///
+    /// The agent loop consults this when partitioning a turn's
+    /// `tool_calls` for parallel dispatch — see
+    /// [`crate::AgentConfig::parallel_tool_calls`]. Tools that look
+    /// safe by category but actually mutate hidden state (e.g. write
+    /// to a shared in-memory queue) should override to `false`.
+    fn is_concurrency_safe(&self) -> bool {
+        matches!(self.category(), ToolCategory::Read)
+    }
+
+    /// Whether the tool mutates user data or state outside the
+    /// workspace, or otherwise needs explicit "commit" semantics.
+    /// Defaults to `true` for [`ToolCategory::Write`] and
+    /// [`ToolCategory::Exec`] tools, `false` for any other category.
+    ///
+    /// Combined with [`Tool::is_concurrency_safe`] this lets the agent
+    /// loop reason about which calls can interleave with siblings: a
+    /// destructive call is *always* dispatched in isolation so a
+    /// sibling read can't see a half-applied mutation.
+    /// `requires_approval` is a related-but-distinct concern (user
+    /// permission); `is_destructive` is about scheduling.
+    fn is_destructive(&self) -> bool {
+        matches!(self.category(), ToolCategory::Write | ToolCategory::Exec)
+    }
 }
 
 /// Provider-agnostic description of a tool, suitable for serialising into a
@@ -296,6 +324,24 @@ impl ToolRegistry {
     }
 }
 
+/// Decide whether every tool referenced by `calls` is safe to run
+/// concurrently with its siblings in the same batch. The agent loop
+/// uses this as a precondition for parallel dispatch: if any call
+/// resolves to a destructive or not-concurrency-safe tool, it falls
+/// back to strict serial execution.
+///
+/// Unknown / muted tools count as unsafe so the loop never parallelises
+/// a call it can't classify. An empty `calls` slice yields `true`.
+pub fn all_calls_concurrency_safe(
+    registry: &ToolRegistry,
+    calls: &[crate::message::ToolCall],
+) -> bool {
+    calls.iter().all(|call| match registry.resolve(&call.name) {
+        Some(tool) => tool.is_concurrency_safe() && !tool.is_destructive(),
+        None => false,
+    })
+}
+
 pub async fn invoke_tool(registry: &ToolRegistry, name: &str, args: Value) -> Result<String> {
     let tool = registry
         .resolve(name)
@@ -509,6 +555,129 @@ mod tests {
         );
     }
 
+    // --- M2.1: concurrency-safety helpers ---
+
+    struct CategorisedTool {
+        name: &'static str,
+        category: ToolCategory,
+    }
+    #[async_trait]
+    impl Tool for CategorisedTool {
+        fn name(&self) -> &str {
+            self.name
+        }
+        fn description(&self) -> &str {
+            "test"
+        }
+        fn parameters(&self) -> Value {
+            json!({"type":"object"})
+        }
+        fn category(&self) -> ToolCategory {
+            self.category
+        }
+        async fn invoke(&self, _args: Value) -> std::result::Result<String, BoxError> {
+            Ok(String::new())
+        }
+    }
+
+    #[test]
+    fn default_concurrency_flags_match_category() {
+        let read = CategorisedTool {
+            name: "fs.read",
+            category: ToolCategory::Read,
+        };
+        assert!(read.is_concurrency_safe());
+        assert!(!read.is_destructive());
+
+        let write = CategorisedTool {
+            name: "fs.write",
+            category: ToolCategory::Write,
+        };
+        assert!(!write.is_concurrency_safe());
+        assert!(write.is_destructive());
+
+        let exec = CategorisedTool {
+            name: "shell.exec",
+            category: ToolCategory::Exec,
+        };
+        assert!(!exec.is_concurrency_safe());
+        assert!(exec.is_destructive());
+
+        let net = CategorisedTool {
+            name: "http.fetch",
+            category: ToolCategory::Network,
+        };
+        // Network defaults: concurrency-safe=false (don't pound external
+        // services in parallel without explicit opt-in), destructive=false.
+        assert!(!net.is_concurrency_safe());
+        assert!(!net.is_destructive());
+    }
+
+    #[test]
+    fn all_calls_concurrency_safe_with_only_reads() {
+        let mut registry = ToolRegistry::new();
+        registry.register(CategorisedTool {
+            name: "fs.read",
+            category: ToolCategory::Read,
+        });
+        registry.register(CategorisedTool {
+            name: "code.grep",
+            category: ToolCategory::Read,
+        });
+        let calls = vec![
+            crate::message::ToolCall {
+                id: "1".into(),
+                name: "fs.read".into(),
+                arguments: json!({}),
+            },
+            crate::message::ToolCall {
+                id: "2".into(),
+                name: "code.grep".into(),
+                arguments: json!({}),
+            },
+        ];
+        assert!(all_calls_concurrency_safe(&registry, &calls));
+    }
+
+    #[test]
+    fn all_calls_concurrency_safe_rejects_mixed_batch() {
+        let mut registry = ToolRegistry::new();
+        registry.register(CategorisedTool {
+            name: "fs.read",
+            category: ToolCategory::Read,
+        });
+        registry.register(CategorisedTool {
+            name: "fs.write",
+            category: ToolCategory::Write,
+        });
+        let calls = vec![
+            crate::message::ToolCall {
+                id: "1".into(),
+                name: "fs.read".into(),
+                arguments: json!({}),
+            },
+            crate::message::ToolCall {
+                id: "2".into(),
+                name: "fs.write".into(),
+                arguments: json!({}),
+            },
+        ];
+        assert!(!all_calls_concurrency_safe(&registry, &calls));
+    }
+
+    #[test]
+    fn all_calls_concurrency_safe_rejects_unknown_tool() {
+        // An unknown / muted tool name forces the safe path: we
+        // can't classify what we can't resolve.
+        let registry = ToolRegistry::new();
+        let calls = vec![crate::message::ToolCall {
+            id: "1".into(),
+            name: "missing".into(),
+            arguments: json!({}),
+        }];
+        assert!(!all_calls_concurrency_safe(&registry, &calls));
+    }
+
     #[test]
     fn toolspec_serialises_cacheable_true() {
         let s = ToolSpec {
diff --git a/crates/harness-core/src/working_context.rs b/crates/harness-core/src/working_context.rs
new file mode 100644
index 0000000..efcde9d
--- /dev/null
+++ b/crates/harness-core/src/working_context.rs
@@ -0,0 +1,486 @@
+//! Working-context channel — "what the agent has its hands on right now".
+//!
+//! Long-running agent loops compact older turns out of the prompt as
+//! the context window fills. Plain truncation / summarisation throws
+//! away the *operational* state that the recent turns carried: which
+//! files the agent had been reading, which plan it was working
+//! against, etc. After compaction the assistant looks at a clean slate
+//! and re-greps files it already knew about, or forgets that it had
+//! a plan in progress.
+//!
+//! `WorkingContext` is the smallest amount of state we can reinject
+//! after compaction to keep that situational awareness. It's *not* a
+//! second memory — it's a tiny, bounded, latest-only snapshot of:
+//!
+//! - **Recent files** the agent has touched (FIFO, capped). Tools that
+//!   read or write a file call [`note_file`]; the snapshot lists each
+//!   path at most once with the most-recent access at the head.
+//! - **Latest plan snapshot** — whatever the most recent
+//!   `plan.update` carried. Forwarded by the agent loop from the
+//!   `plan` task-local channel; tools don't have to do anything new.
+//!
+//! ## Wire model
+//!
+//! - The agent loop installs a per-run [`Arc<Mutex<WorkingContext>>`]
+//!   in a [`tokio::task_local`] via [`with_working_context`] **once
+//!   per `Agent::run` / `Agent::run_stream` invocation**, not per
+//!   tool — every tool dispatch and every memory `compact` call sees
+//!   the same accumulating snapshot.
+//! - Memory backends read the latest snapshot via [`snapshot`] inside
+//!   their `compact` implementation and append a `System` block
+//!   `=== working context ===` to the returned slice. The block is
+//!   appended only at the wire stage (`build_request`); the
+//!   canonical [`crate::Conversation`] is never mutated, mirroring
+//!   how compacted summaries already work.
+//! - Outside an agent invocation (e.g. tool unit tests) the channel
+//!   is absent and all mutators are no-ops, so callers can use these
+//!   helpers freely without standing up a harness.
+
+use std::collections::VecDeque;
+use std::path::{Path, PathBuf};
+use std::pin::Pin;
+use std::sync::{Arc, Mutex};
+use std::task::{Context, Poll};
+
+use futures::Stream;
+use serde::Serialize;
+
+use crate::plan::PlanItem;
+
+/// How many distinct recently-touched files we surface to the model
+/// after compaction. The list is the FIFO tail; older entries fall
+/// off as new ones land. 20 paths fit in ~1 KiB of system message
+/// even with long workspace-relative paths, which is well within the
+/// SUMMARY_RESERVE_TOKENS budget that `harness-memory` carves out.
+pub const DEFAULT_RECENT_FILES_CAP: usize = 20;
+
+/// How many distinct recently-issued commands / search patterns we
+/// surface alongside the files. Smaller cap than files because each
+/// entry is a free-form string the model has to read in full; 8 is
+/// enough to capture the relevant "I just ran `cargo test`,
+/// `grep foo`, ..." trail without crowding the prompt.
+pub const DEFAULT_RECENT_COMMANDS_CAP: usize = 8;
+/// Max length per recorded command. Long shell pipelines get
+/// truncated with an ellipsis so a runaway `find ... -exec ...` line
+/// doesn't blow the budget.
+pub const MAX_COMMAND_LENGTH: usize = 200;
+
+/// A bounded snapshot of the agent's current operational state. Clone
+/// copies both deques and the plan — call it once per `compact` call.
+/// NOTE: the derived `Default` zeroes both caps; use [`Self::new`].
+#[derive(Debug, Clone, Default, Serialize)]
+pub struct WorkingContext {
+    /// Most-recently-touched files, head = newest, tail = oldest. Each
+    /// path appears at most once; a fresh touch moves the path back
+    /// to the head rather than duplicating it.
+    pub recent_files: VecDeque<PathBuf>,
+    /// Latest plan snapshot the agent published via `plan.update`.
+    /// `None` until the first emission this run.
+    pub latest_plan: Option<Vec<PlanItem>>,
+    /// Max entries kept in `recent_files`; 0 retains nothing. Stored
+    /// on the struct so tests can override it without globals.
+    pub files_cap: usize,
+    /// Most-recently-issued shell commands / search patterns, same
+    /// dedup + move-to-head policy as `recent_files`. Truncated to
+    /// [`MAX_COMMAND_LENGTH`] chars before storage so any single
+    /// entry stays readable in the system-prompt block.
+    pub recent_commands: VecDeque<String>,
+    /// Max entries kept in `recent_commands`; 0 retains nothing.
+    pub commands_cap: usize,
+}
+
+impl WorkingContext {
+    pub fn new(files_cap: usize) -> Self {
+        Self {
+            recent_files: VecDeque::with_capacity(files_cap),
+            latest_plan: None,
+            files_cap,
+            recent_commands: VecDeque::with_capacity(DEFAULT_RECENT_COMMANDS_CAP),
+            commands_cap: DEFAULT_RECENT_COMMANDS_CAP,
+        }
+    }
+
+    /// Promote `path` to the head of `recent_files`, deduping and
+    /// trimming to `files_cap`. Empty paths are ignored.
+    pub fn note_file(&mut self, path: PathBuf) {
+        if path.as_os_str().is_empty() {
+            return;
+        }
+        // Dedup: remove any prior entry equal to this path so the
+        // newest occurrence wins.
+        if let Some(pos) = self.recent_files.iter().position(|p| p == &path) {
+            self.recent_files.remove(pos);
+        }
+        self.recent_files.push_front(path);
+        while self.recent_files.len() > self.files_cap {
+            self.recent_files.pop_back();
+        }
+    }
+
+    /// Promote `cmd` to the head of `recent_commands`. Empty inputs
+    /// are ignored; over-long commands are truncated with an
+    /// ellipsis. Same dedup-and-front-promotion policy as
+    /// `recent_files` so the trail reflects "most-recent first".
+    pub fn note_command(&mut self, cmd: String) {
+        let trimmed = cmd.trim();
+        if trimmed.is_empty() {
+            return;
+        }
+        let value = if trimmed.chars().count() > MAX_COMMAND_LENGTH {
+            // Truncate on char boundary so we don't slice mid-UTF-8.
+            let mut s: String = trimmed.chars().take(MAX_COMMAND_LENGTH - 1).collect();
+            s.push('…');
+            s
+        } else {
+            trimmed.to_string()
+        };
+        if let Some(pos) = self.recent_commands.iter().position(|c| c == &value) {
+            self.recent_commands.remove(pos);
+        }
+        self.recent_commands.push_front(value);
+        while self.recent_commands.len() > self.commands_cap {
+            self.recent_commands.pop_back();
+        }
+    }
+
+    /// Replace the plan snapshot wholesale.
+    pub fn note_plan(&mut self, items: Vec<PlanItem>) {
+        self.latest_plan = Some(items);
+    }
+
+    /// Whether there's nothing worth rendering; an empty plan list
+    /// counts as no plan. Memory backends skip the injected block when
+    /// this returns true so they don't spend tokens on a bare header.
+    pub fn is_empty(&self) -> bool {
+        self.recent_files.is_empty()
+            && self.recent_commands.is_empty()
+            && self.latest_plan.as_deref().unwrap_or_default().is_empty()
+    }
+
+    /// Render to the wire-shape `System` message body. The format is
+    /// stable so other tools / tests can grep for the header.
+    /// Returns `None` when the context is empty.
+    pub fn render(&self) -> Option<String> {
+        if self.is_empty() {
+            return None;
+        }
+        let mut buf = String::from("=== working context ===\n");
+        if !self.recent_files.is_empty() {
+            buf.push_str("recent files (most recent first):\n");
+            for p in &self.recent_files {
+                buf.push_str("- ");
+                buf.push_str(&p.display().to_string());
+                buf.push('\n');
+            }
+        }
+        if !self.recent_commands.is_empty() {
+            buf.push_str("\nrecent commands (most recent first):\n");
+            for c in &self.recent_commands {
+                buf.push_str("- ");
+                buf.push_str(c);
+                buf.push('\n');
+            }
+        }
+        if let Some(items) = self.latest_plan.as_ref() {
+            if !items.is_empty() {
+                buf.push_str("\ncurrent plan:\n");
+                for item in items {
+                    let status = match item.status {
+                        crate::plan::PlanStatus::Pending => "[ ]",
+                        crate::plan::PlanStatus::InProgress => "[~]",
+                        crate::plan::PlanStatus::Completed => "[x]",
+                        crate::plan::PlanStatus::Cancelled => "[-]",
+                    };
+                    buf.push_str(status);
+                    buf.push(' ');
+                    buf.push_str(&item.title);
+                    if let Some(note) = item.note.as_deref() {
+                        buf.push_str(" (");
+                        buf.push_str(note);
+                        buf.push(')');
+                    }
+                    buf.push('\n');
+                }
+            }
+        }
+        Some(buf)
+    }
+}
+
+tokio::task_local! {
+    /// Per-run working-context slot. Scoped by [`with_working_context`]
+    /// at the top of `Agent::run` and `Agent::run_stream`.
+    static WORKING_CTX: Arc<Mutex<WorkingContext>>;
+}
+
+/// Note that the current task touched a file. No-op when no
+/// listener is installed (unit tests, etc.).
+pub fn note_file(path: impl Into<PathBuf>) {
+    let path = path.into();
+    let _ = WORKING_CTX.try_with(|wc| {
+        if let Ok(mut wc) = wc.lock() {
+            wc.note_file(path);
+        }
+    });
+}
+
+/// Forward a `plan.update` snapshot into the working context. Called
+/// by the agent loop after relaying a `PlanUpdate` event, so tools
+/// don't need to do anything extra.
+pub fn note_plan(items: Vec<PlanItem>) {
+    let _ = WORKING_CTX.try_with(|wc| {
+        if let Ok(mut wc) = wc.lock() {
+            wc.note_plan(items);
+        }
+    });
+}
+
+/// Record a shell command / search pattern in the current task's
+/// working context. Called by tools that issue meaningful "what
+/// did the agent just do" actions — today `shell.exec` and
+/// `code.grep`. No-op when no listener is installed.
+pub fn note_command(cmd: impl Into<String>) {
+    let cmd = cmd.into();
+    let _ = WORKING_CTX.try_with(|wc| {
+        if let Ok(mut wc) = wc.lock() {
+            wc.note_command(cmd);
+        }
+    });
+}
+
+/// Read-only snapshot of the current working context. `None` when
+/// no listener is installed. Returns a clone — the lock is held only
+/// for the duration of the clone.
+pub fn snapshot() -> Option<WorkingContext> {
+    WORKING_CTX
+        .try_with(|wc| wc.lock().ok().map(|guard| guard.clone()))
+        .ok()
+        .flatten()
+}
+
+/// Whether a working-context slot is installed for the current task.
+pub fn is_active() -> bool {
+    WORKING_CTX.try_with(|_| ()).is_ok()
+}
+
+/// Run `fut` with a fresh `WorkingContext` installed as the active
+/// slot. Used by the agent loop to scope context accumulation to a
+/// single `run` / `run_stream` invocation; the slot is cleared when
+/// `fut` completes.
+pub async fn with_working_context<F, R>(fut: F) -> R
+where
+    F: std::future::Future<Output = R>,
+{
+    with_working_context_capped(DEFAULT_RECENT_FILES_CAP, fut).await
+}
+
+/// Same as [`with_working_context`] but lets the caller pin the
+/// recent-files cap. Used by tests; production callers should prefer
+/// the default.
+pub async fn with_working_context_capped<F, R>(files_cap: usize, fut: F) -> R
+where
+    F: std::future::Future<Output = R>,
+{
+    let slot = Arc::new(Mutex::new(WorkingContext::new(files_cap)));
+    WORKING_CTX.scope(slot, fut).await
+}
+
+/// Wrap a `Stream` so each `poll_next` runs with a per-stream
+/// [`WorkingContext`] installed as the active task-local slot. Use
+/// this for streaming entry points (like `Agent::run_stream`) whose
+/// body can't be wrapped in [`with_working_context`] because
+/// `async_stream::yield` cannot traverse a `tokio::task_local`
+/// async scope.
+pub fn scope_stream<S: Stream + 'static>(stream: S) -> WorkingContextStream<S> {
+    WorkingContextStream::new(stream, DEFAULT_RECENT_FILES_CAP)
+}
+
+/// Same as [`scope_stream`] but lets callers (typically tests) pin
+/// the `recent_files` cap.
+pub fn scope_stream_capped<S: Stream + 'static>(
+    stream: S,
+    files_cap: usize,
+) -> WorkingContextStream<S> {
+    WorkingContextStream::new(stream, files_cap)
+}
+
+/// Stream adapter created by [`scope_stream`]: every `poll_next`
+/// borrows the per-stream slot synchronously via `sync_scope` so the
+/// task_local is visible inside the inner stream's body for that
+/// poll.
+pub struct WorkingContextStream<S> {
+    inner: Pin<Box<S>>,
+    ctx: Arc<Mutex<WorkingContext>>,
+}
+
+impl<S> WorkingContextStream<S> {
+    fn new(inner: S, files_cap: usize) -> Self {
+        Self {
+            inner: Box::pin(inner),
+            ctx: Arc::new(Mutex::new(WorkingContext::new(files_cap))),
+        }
+    }
+}
+
+impl<S: Stream> Stream for WorkingContextStream<S> {
+    type Item = S::Item;
+    fn poll_next(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Option<Self::Item>> {
+        let ctx = self.ctx.clone();
+        WORKING_CTX.sync_scope(ctx, || self.inner.as_mut().poll_next(cx))
+    }
+}
+
+/// Convenience wrapper for tools that already canonicalised a path
+/// against a sandbox root: pass the absolute path the tool resolved
+/// (not the model's input). Strips a workspace root prefix when
+/// available so the recorded path is portable across machines.
+pub fn note_file_relative_to<P: AsRef<Path>>(path: P, workspace_root: Option<&Path>) {
+    let path = path.as_ref();
+    let to_record = match workspace_root.and_then(|root| path.strip_prefix(root).ok()) {
+        Some(rel) => rel.to_path_buf(),
+        None => path.to_path_buf(),
+    };
+    note_file(to_record);
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::plan::{PlanItem, PlanStatus};
+
+    #[tokio::test]
+    async fn note_file_dedupes_and_caps() {
+        with_working_context_capped(3, async {
+            note_file("a");
+            note_file("b");
+            note_file("c");
+            note_file("a"); // promotes a back to head
+            note_file("d"); // evicts the oldest (b)
+            let snap = snapshot().unwrap();
+            let paths: Vec<_> = snap
+                .recent_files
+                .iter()
+                .map(|p| p.display().to_string())
+                .collect();
+            assert_eq!(paths, vec!["d", "a", "c"]);
+        })
+        .await;
+    }
+
+    #[tokio::test]
+    async fn note_plan_replaces() {
+        with_working_context(async {
+            note_plan(vec![PlanItem {
+                id: "1".into(),
+                title: "first".into(),
+                status: PlanStatus::InProgress,
+                note: None,
+            }]);
+            note_plan(vec![
+                PlanItem {
+                    id: "1".into(),
+                    title: "first".into(),
+                    status: PlanStatus::Completed,
+                    note: None,
+                },
+                PlanItem {
+                    id: "2".into(),
+                    title: "second".into(),
+                    status: PlanStatus::InProgress,
+                    note: None,
+                },
+            ]);
+            let snap = snapshot().unwrap();
+            let plan = snap.latest_plan.unwrap();
+            assert_eq!(plan.len(), 2);
+            assert_eq!(plan[0].status, PlanStatus::Completed);
+        })
+        .await;
+    }
+
+    #[tokio::test]
+    async fn snapshot_outside_scope_is_none() {
+        assert!(!is_active());
+        assert!(snapshot().is_none());
+        // The point: no panic.
+        note_file("ignored");
+        note_plan(vec![]);
+    }
+
+    #[tokio::test]
+    async fn render_emits_header_with_files_and_plan() {
+        with_working_context(async {
+            note_file("src/lib.rs");
+            note_plan(vec![PlanItem {
+                id: "x".into(),
+                title: "do thing".into(),
+                status: PlanStatus::InProgress,
+                note: Some("waiting on review".into()),
+            }]);
+            let body = snapshot().unwrap().render().unwrap();
+            assert!(body.starts_with("=== working context ==="), "got: {body}");
+            assert!(body.contains("- src/lib.rs"));
+            assert!(body.contains("[~] do thing (waiting on review)"));
+        })
+        .await;
+    }
+
+    #[tokio::test]
+    async fn render_empty_returns_none() {
+        with_working_context(async {
+            let snap = snapshot().unwrap();
+            assert!(snap.is_empty());
+            assert!(snap.render().is_none());
+        })
+        .await;
+    }
+
+    #[tokio::test]
+    async fn note_command_dedupes_truncates_and_renders() {
+        with_working_context(async {
+            super::note_command("cargo test");
+            super::note_command("cargo clippy");
+            super::note_command("cargo test"); // dedup, promotes
+            let huge = "x".repeat(MAX_COMMAND_LENGTH * 2);
+            super::note_command(huge);
+            let snap = snapshot().unwrap();
+            let cmds: Vec<_> = snap.recent_commands.iter().cloned().collect();
+            // 3 distinct entries, newest at head.
+            assert_eq!(cmds.len(), 3);
+            assert_eq!(cmds[1], "cargo test"); // promoted on dedup
+            assert_eq!(cmds[2], "cargo clippy");
+            // The huge entry was truncated with an ellipsis.
+            assert!(cmds[0].ends_with('…'));
+            assert!(cmds[0].chars().count() <= MAX_COMMAND_LENGTH);
+
+            let rendered = snap.render().unwrap();
+            assert!(rendered.contains("recent commands"));
+            assert!(rendered.contains("- cargo test"));
+        })
+        .await;
+    }
+
+    #[tokio::test]
+    async fn note_file_relative_to_strips_workspace_root() {
+        let root = std::path::PathBuf::from("/workspace/proj");
+        with_working_context(async {
+            note_file_relative_to(root.join("src/lib.rs"), Some(&root));
+            note_file_relative_to("/elsewhere/a.txt", Some(&root)); // absolute kept
+            let snap = snapshot().unwrap();
+            let paths: Vec<_> = snap
+                .recent_files
+                .iter()
+                .map(|p| p.display().to_string())
+                .collect();
+            assert!(
+                paths.iter().any(|p| p == "src/lib.rs"),
+                "expected stripped path, got: {paths:?}"
+            );
+            assert!(
+                paths.iter().any(|p| p == "/elsewhere/a.txt"),
+                "expected absolute kept, got: {paths:?}"
+            );
+        })
+        .await;
+    }
+}
diff --git a/crates/harness-memory/src/lib.rs b/crates/harness-memory/src/lib.rs
index 61dfeeb..68771cc 100644
--- a/crates/harness-memory/src/lib.rs
+++ b/crates/harness-memory/src/lib.rs
@@ -27,4 +27,6 @@ mod summarizing;
 mod turns;
 
 pub use sliding::SlidingWindowMemory;
-pub use summarizing::{LlmRouteResolver, SummarizingMemory, DEFAULT_SUMMARY_PROMPT};
+pub use summarizing::{
+    CompactionCounters, LlmRouteResolver, SummarizingMemory, DEFAULT_SUMMARY_PROMPT,
+};
diff --git a/crates/harness-memory/src/sliding.rs b/crates/harness-memory/src/sliding.rs
index cc2493a..f5d95cf 100644
--- a/crates/harness-memory/src/sliding.rs
+++ b/crates/harness-memory/src/sliding.rs
@@ -135,9 +135,27 @@ fn compact(
             out.push(messages[i].clone());
         }
     }
+    // Append the agent's working-context snapshot (recent files,
+    // commands + plan). Empty snapshots render `None` and contribute
+    // nothing. Outside an agent run (e.g. memory unit tests without
+    // `with_working_context`) the snapshot is also `None`, so this
+    // is a no-op in tests that don't opt in.
+    append_working_context(&mut out);
     out
 }
 
+/// Append the current `WorkingContext` snapshot as a trailing
+/// `System` message. No-op when no snapshot is installed or the
+/// snapshot has nothing worth rendering. Pulled out so the same
+/// behaviour lives in `SummarizingMemory` without copy/paste.
+pub(crate) fn append_working_context(out: &mut Vec<Message>) {
+    if let Some(wc) = harness_core::working_context_snapshot() {
+        if let Some(body) = wc.render() {
+            out.push(Message::system(body));
+        }
+    }
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;
@@ -476,6 +494,67 @@ mod tests {
         }
     }
 
+    #[tokio::test]
+    async fn appends_working_context_block_when_active() {
+        use harness_core::{
+            note_working_file, note_working_plan, with_working_context, PlanItem, PlanStatus,
+        };
+        let msgs = vec![system("sys"), user("hi"), assistant("hello")];
+        with_working_context(async {
+            note_working_file("src/lib.rs");
+            note_working_plan(vec![PlanItem {
+                id: "1".into(),
+                title: "do thing".into(),
+                status: PlanStatus::InProgress,
+                note: None,
+            }]);
+            let mem = SlidingWindowMemory::new(10_000);
+            let out = mem.compact(&msgs).await.unwrap();
+            // Last message should be the working-context block.
+            let last = out.last().unwrap();
+            match last {
+                Message::System { content, .. } => {
+                    assert!(
+                        content.starts_with("=== working context ==="),
+                        "expected working-context block at tail, got: {content}"
+                    );
+                    assert!(content.contains("src/lib.rs"));
+                    assert!(content.contains("do thing"));
+                }
+                _ => panic!("expected trailing System message, got {last:?}"),
+            }
+        })
+        .await;
+    }
+
+    #[tokio::test]
+    async fn no_block_when_working_context_inactive() {
+        // No `with_working_context` scope: snapshot returns None and
+        // the trailing block is skipped entirely.
+        let msgs = vec![system("sys"), user("hi"), assistant("hello")];
+        let mem = SlidingWindowMemory::new(10_000);
+        let out = mem.compact(&msgs).await.unwrap();
+        let has_block = out.iter().any(
+            |m| matches!(m, Message::System { content, .. } if content.starts_with("=== working context ===")),
+        );
+        assert!(!has_block, "should not inject without a working-context scope");
+    }
+
+    #[tokio::test]
+    async fn no_block_when_snapshot_is_empty() {
+        use harness_core::with_working_context;
+        let msgs = vec![system("sys"), user("hi"), assistant("hello")];
+        with_working_context(async {
+            let mem = SlidingWindowMemory::new(10_000);
+            let out = mem.compact(&msgs).await.unwrap();
+            let has_block = out.iter().any(
+                |m| matches!(m, Message::System { content, .. } if content.starts_with("=== working context ===")),
+            );
+            assert!(!has_block, "empty context should not inject a block");
+        })
+        .await;
+    }
+
     #[tokio::test]
     async fn custom_estimator_halves_effective_budget() {
         let msgs = vec![
diff --git a/crates/harness-memory/src/summarizing.rs b/crates/harness-memory/src/summarizing.rs
index 63a90f1..a80f798 100644
--- a/crates/harness-memory/src/summarizing.rs
+++ b/crates/harness-memory/src/summarizing.rs
@@ -40,12 +40,15 @@
 //! endpoints so internal rows never leak into client conversation
 //! lists.
 
+use std::sync::atomic::{AtomicU64, Ordering};
 use std::sync::{Arc, Mutex};
+use std::time::{Duration, Instant};
 
 use async_trait::async_trait;
 use harness_core::{
     cache_breakpoint_indices, default_estimator, BoxError, ChatRequest, Conversation,
-    ConversationStore, Error as CoreError, LlmProvider, Memory, Message, TokenEstimator,
+    ConversationStore, Error as CoreError, LlmProvider, Memory, MemoryStatsProvider, Message,
+    TokenEstimator,
 };
 use tracing::{debug, warn};
 
@@ -82,6 +85,18 @@ const SUMMARY_RESERVE_TOKENS: usize = 256;
 /// Cap on how many tokens the summarisation call is allowed to emit.
 const DEFAULT_SUMMARY_MAX_TOKENS: u32 = 400;
 
+/// Consecutive summary-call failures that flip the circuit breaker
+/// to "open". While open, [`SummarizingMemory::compact`] skips the
+/// LLM entirely and falls through to the existing placeholder note
+/// path, so a wedged summariser stops burning quota.
+const CIRCUIT_FAILURE_THRESHOLD: u32 = 3;
+
+/// How long the circuit stays open before the next request is
+/// allowed through. Aggressively short — most "real" outages
+/// (provider 5xx storm, quota hit) clear within seconds, and we
+/// want to recover quickly when the upstream comes back.
+const CIRCUIT_OPEN_DURATION: Duration = Duration::from_secs(60);
+
 /// Optional resolver consulted before each summarisation call. When
 /// it returns `Some((llm, model))`, that pair overrides the
 /// constructor-time `(llm, model)` for this call only — useful when
@@ -94,6 +109,72 @@ const DEFAULT_SUMMARY_MAX_TOKENS: u32 = 400;
 /// holds the policy + provider registry.
 pub type LlmRouteResolver = dyn Fn() -> Option<(Arc<dyn LlmProvider>, String)> + Send + Sync;
 
+/// Process-wide counters for [`SummarizingMemory`]'s compaction
+/// path. Updated lock-free on the hot path, snapshotted to JSON via
+/// [`MemoryStatsProvider`] for the
+/// `GET /v1/diagnostics/memory` endpoint.
+///
+/// Counters are monotonic since process start — there's no "reset"
+/// API on purpose. Operators tuning `JARVIS_MEMORY_TOKENS` care
+/// about ratios (cache hit rate, LLM failure rate, how often PTL
+/// kicks in) which work fine with running totals.
+#[derive(Debug, Default)]
+pub struct CompactionCounters {
+    /// Total `compact()` calls — incremented every entry regardless
+    /// of whether any turns were dropped.
+    pub compactions_total: AtomicU64,
+    /// Calls that actually had something to summarise (i.e.
+    /// `dropped_msgs` was non-empty). The complement of this and
+    /// `compactions_total` is the "fits in budget, no work" path.
+    pub summary_required: AtomicU64,
+    /// In-memory single-slot cache hits.
+    pub cache_hits_memory: AtomicU64,
+    /// Persistent `ConversationStore` cache hits.
+    pub cache_hits_store: AtomicU64,
+    /// Times the LLM was actually called for a summary.
+    pub llm_calls: AtomicU64,
+    /// Times the LLM call returned `Err` (after the internal
+    /// transport retry).
+    pub llm_failures: AtomicU64,
+    /// Times the circuit breaker was found open and the LLM call
+    /// was skipped.
+    pub circuit_skips: AtomicU64,
+    /// Times the circuit breaker tripped (failure-threshold hit).
+    pub circuit_opens: AtomicU64,
+    /// Times the PTL fallback round 1 (drop 20%) was executed.
+    pub ptl_round_one: AtomicU64,
+    /// Times the PTL fallback round 2 (hard-prune to latest turn)
+    /// was executed.
+    pub ptl_round_two: AtomicU64,
+}
+
+impl CompactionCounters {
+    fn inc(&self, c: &AtomicU64) {
+        c.fetch_add(1, Ordering::Relaxed);
+    }
+    fn load(c: &AtomicU64) -> u64 {
+        c.load(Ordering::Relaxed)
+    }
+}
+
+impl MemoryStatsProvider for CompactionCounters {
+    fn snapshot(&self) -> serde_json::Value {
+        serde_json::json!({
+            "backend": "summarizing",
+            "compactions_total": Self::load(&self.compactions_total),
+            "summary_required": Self::load(&self.summary_required),
+            "cache_hits_memory": Self::load(&self.cache_hits_memory),
+            "cache_hits_store": Self::load(&self.cache_hits_store),
+            "llm_calls": Self::load(&self.llm_calls),
+            "llm_failures": Self::load(&self.llm_failures),
+            "circuit_skips": Self::load(&self.circuit_skips),
+            "circuit_opens": Self::load(&self.circuit_opens),
+            "ptl_round_one": Self::load(&self.ptl_round_one),
+            "ptl_round_two": Self::load(&self.ptl_round_two),
+        })
+    }
+}
+
 /// Compact a conversation by summarising the oldest turns.
 pub struct SummarizingMemory {
     llm: Arc<dyn LlmProvider>,
@@ -110,6 +191,22 @@ pub struct SummarizingMemory {
     /// Optional `(llm, model)` override resolved on every
     /// summarisation call. See [`LlmRouteResolver`].
     route_resolver: Option<Arc<LlmRouteResolver>>,
+    /// Consecutive summariser failures (cache hits don't count —
+    /// `summarise` returns `Ok` early on hit). Reset to zero on the
+    /// first success after a streak.
+    failure_streak: Arc<Mutex<u32>>,
+    /// When `Some(t)`, every `compact` call skips the LLM until
+    /// `Instant::now() >= t` and falls through to the existing
+    /// placeholder-note path. Reset to `None` when the deadline is
+    /// reached and the next call walks past
+    /// [`SummarizingMemory::circuit_open`].
+    circuit_until: Arc<Mutex<Option<Instant>>>,
+    /// Telemetry counters surfaced via
+    /// [`SummarizingMemory::counters`]. Composition roots clone the
+    /// `Arc` once and stash it on `AppState` so the diagnostics
+    /// endpoint can read snapshots without taking a reference back
+    /// into the memory backend.
+    counters: Arc<CompactionCounters>,
 }
 
 struct CachedSummary {
@@ -129,9 +226,25 @@ impl SummarizingMemory {
             persistence: None,
             estimator: default_estimator(),
             route_resolver: None,
+            failure_streak: Arc::new(Mutex::new(0)),
+            circuit_until: Arc::new(Mutex::new(None)),
+            counters: Arc::new(CompactionCounters::default()),
         }
     }
 
+    /// Clone-able handle to the telemetry counters. Composition
+    /// roots typically stash this on `AppState` so the diagnostics
+    /// surface can read snapshots:
+    ///
+    /// ```ignore
+    /// let mem = SummarizingMemory::new(llm, model, max_tokens);
+    /// let counters = mem.counters();
+    /// state.memory_stats = Some(counters as Arc<dyn MemoryStatsProvider>);
+    /// ```
+    pub fn counters(&self) -> Arc<CompactionCounters> {
+        self.counters.clone()
+    }
+
     /// Install a per-call route override. The resolver fires before
     /// each summarisation call; when it returns `Some((llm, model))`,
     /// that pair is used instead of the constructor-time default.
@@ -174,6 +287,7 @@ impl SummarizingMemory {
 #[async_trait]
 impl Memory for SummarizingMemory {
     async fn compact(&self, messages: &[Message]) -> Result<Vec<Message>, BoxError> {
+        self.counters.inc(&self.counters.compactions_total);
         let (system_idxs, turns) = split_into_turns(messages);
 
         let estimator = self.estimator.as_ref();
@@ -233,15 +347,36 @@ impl Memory for SummarizingMemory {
         // `SlidingWindowMemory`'s "[N earlier turn(s) omitted ...]"
         // so the model still sees a clear gap marker. The error is
         // logged so it's not invisible.
+        //
+        // Circuit breaker: if the upstream summariser has failed
+        // CIRCUIT_FAILURE_THRESHOLD times in a row, we treat the
+        // circuit as "open" and skip the LLM entirely for
+        // CIRCUIT_OPEN_DURATION. A long, slowly-degrading provider
+        // would otherwise burn quota on every compaction. The
+        // circuit auto-resets on time-out, so we recover without
+        // operator intervention.
         let summary = if dropped_msgs.is_empty() {
             None
         } else {
-            match self.summarise(&dropped_msgs).await {
-                Ok(s) => Some(s),
-                Err(e) => {
-                    warn!(error = %e, dropped = dropped_count,
-                          "summary failed; falling back to placeholder note");
-                    None
+            self.counters.inc(&self.counters.summary_required);
+            if self.circuit_open() {
+                self.counters.inc(&self.counters.circuit_skips);
+                debug!(dropped = dropped_count,
+                       "summary circuit open; skipping LLM call");
+                None
+            } else {
+                match self.summarise(&dropped_msgs).await {
+                    Ok(s) => {
+                        self.record_summary_success();
+                        Some(s)
+                    }
+                    Err(e) => {
+                        self.counters.inc(&self.counters.llm_failures);
+                        self.record_summary_failure();
+                        warn!(error = %e, dropped = dropped_count,
+                              "summary failed; falling back to placeholder note");
+                        None
+                    }
                 }
             }
         };
@@ -268,16 +403,97 @@ impl Memory for SummarizingMemory {
                 out.push(messages[i].clone());
             }
         }
+        // Append the agent's working-context snapshot. Same helper
+        // as `SlidingWindowMemory` so the two backends produce the
+        // same trailing block.
+        crate::sliding::append_working_context(&mut out);
+        // PTL safety net: if the summary itself ran long or the
+        // working-context block tipped us over, drop oldest turns
+        // until the estimate fits. Never returns `Err` — the entire
+        // point is to absorb pathological cases without bringing the
+        // user's turn down.
+        let (pruned, outcome) = enforce_token_budget(out, self.max_tokens, estimator);
+        out = pruned;
+        match outcome {
+            PtlOutcome::None => {}
+            PtlOutcome::RoundOne => self.counters.inc(&self.counters.ptl_round_one),
+            PtlOutcome::RoundTwo => {
+                self.counters.inc(&self.counters.ptl_round_one);
+                self.counters.inc(&self.counters.ptl_round_two);
+            }
+        }
         Ok(out)
     }
 }
 
 impl SummarizingMemory {
+    /// Whether the circuit is currently open. Side effect: once the
+    /// deadline has passed, clears the latch and zeroes the failure
+    /// streak, so the caller may try the LLM again.
+    fn circuit_open(&self) -> bool {
+        let mut guard = self
+            .circuit_until
+            .lock()
+            .expect("circuit_until mutex poisoned");
+        match *guard {
+            Some(t) if Instant::now() < t => true,
+            Some(_) => {
+                // Deadline reached — re-arm both pieces of state so
+                // a single failure post-cooldown doesn't immediately
+                // re-trip the breaker.
+                *guard = None;
+                drop(guard);
+                *self
+                    .failure_streak
+                    .lock()
+                    .expect("failure_streak mutex poisoned") = 0;
+                false
+            }
+            None => false,
+        }
+    }
+
+    /// Reset the failure-streak after any `Ok` from `summarise` (cache hits included).
+    fn record_summary_success(&self) {
+        let mut streak = self
+            .failure_streak
+            .lock()
+            .expect("failure_streak mutex poisoned");
+        if *streak > 0 {
+            debug!(prior_streak = *streak, "summary success — resetting streak");
+        }
+        *streak = 0;
+    }
+
+    /// Increment the failure-streak; trip the breaker once the
+    /// threshold is reached.
+    fn record_summary_failure(&self) {
+        let mut streak = self
+            .failure_streak
+            .lock()
+            .expect("failure_streak mutex poisoned");
+        *streak += 1;
+        if *streak >= CIRCUIT_FAILURE_THRESHOLD {
+            *self
+                .circuit_until
+                .lock()
+                .expect("circuit_until mutex poisoned") =
+                Some(Instant::now() + CIRCUIT_OPEN_DURATION);
+            self.counters.inc(&self.counters.circuit_opens);
+            warn!(
+                streak = *streak,
+                cooldown_secs = CIRCUIT_OPEN_DURATION.as_secs(),
+                "summary circuit opened — skipping LLM for cooldown",
+            );
+        }
+    }
+
     async fn summarise(&self, dropped: &[Message]) -> Result<String, BoxError> {
         let fp = fingerprint(dropped);
 
         // Tier 1: in-memory single-slot cache.
         if let Some(text) = self.cache_lookup(&fp) {
+            self.counters.inc(&self.counters.cache_hits_memory);
             debug!(fingerprint = %fp, "summary cache hit (memory)");
             return Ok(text);
         }
@@ -287,6 +503,7 @@ impl SummarizingMemory {
             match store.load(&persist_key(&fp)).await {
                 Ok(Some(conv)) => {
                     if let Some(text) = extract_summary(&conv) {
+                        self.counters.inc(&self.counters.cache_hits_store);
                         debug!(fingerprint = %fp, "summary cache hit (store)");
                         self.cache_set(&fp, &text);
                         return Ok(text);
@@ -336,6 +553,11 @@ impl SummarizingMemory {
             parallel_tool_calls: None,
         };
 
+        // Mark that we're actually going to the LLM. Counted once
+        // per `summarise()` even when the inner retry runs — that's
+        // intentional, the second attempt isn't a "fresh call" to
+        // the operator, it's the same logical attempt that retried.
+        self.counters.inc(&self.counters.llm_calls);
         // One retry on transient transport errors — the summariser
         // shares a connection pool with the foreground agent and
         // sometimes hits a half-closed keep-alive on first send.
@@ -567,6 +789,111 @@ fn compact_args(v: &serde_json::Value) -> String {
     serde_json::to_string(v).unwrap_or_else(|_| "{}".to_string())
 }
 
+/// Which (if any) PTL round fired in [`enforce_token_budget`].
+/// Returned alongside the pruned vector so the caller can
+/// increment the right counters without re-running heuristics.
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+enum PtlOutcome {
+    /// Already under budget — no pruning needed.
+    None,
+    /// Round-1 drop (oldest 20% of non-latest turns) was enough.
+    RoundOne,
+    /// Round-1 wasn't enough, so the round-2 hard-prune (keep only
+    /// the latest turn) ran. The caller counts both rounds.
+    RoundTwo,
+}
+
+/// Best-effort enforcement: if the compacted output still exceeds
+/// `max_tokens`, drop turns from the oldest end (preserving the
+/// leading System prefix, the optional trailing working-context
+/// block, and the most recent turn). Two rounds — oldest 20% of
+/// non-latest turns, then all but the latest — each leaving a gap
+/// marker after the prefix. Never errors; the input is returned
+/// as-is if it fits, if `max_tokens` is 0, or with under 2 turns.
+fn enforce_token_budget(
+    out: Vec<Message>,
+    max_tokens: usize,
+    est: &dyn TokenEstimator,
+) -> (Vec<Message>, PtlOutcome) {
+    if max_tokens == 0 || est.estimate_messages(&out) <= max_tokens {
+        return (out, PtlOutcome::None);
+    }
+
+    // Region 1: leading contiguous System messages (kept verbatim,
+    // including any compaction summary we just inserted).
+    let prefix_end = out
+        .iter()
+        .take_while(|m| matches!(m, Message::System { .. }))
+        .count();
+
+    // Region 3 (trailing): the working-context block, if present.
+    // Recognise it by header so we don't accidentally count a
+    // user-emitted System reply.
+    let trailing = matches!(
+        out.last(),
+        Some(Message::System { content, .. }) if content.starts_with("=== working context ===")
+    ) as usize;
+
+    // Region 2: body messages where the conversation turns live.
+    let body_start = prefix_end;
+    let body_end = out.len().saturating_sub(trailing);
+    if body_end <= body_start {
+        return (out, PtlOutcome::None);
+    }
+
+    let turn_starts: Vec<usize> = (body_start..body_end)
+        .filter(|&i| matches!(out[i], Message::User { .. }))
+        .collect();
+
+    if turn_starts.len() <= 1 {
+        // Only the latest turn is droppable, but the spec keeps it.
+        // Nothing we can safely prune.
+        return (out, PtlOutcome::None);
+    }
+
+    // Round 1: drop the oldest 20% of non-latest turns (round up).
+    let droppable_turns = turn_starts.len() - 1;
+    let mut drop_n = droppable_turns.div_ceil(5).max(1); // 20% rounded up, min 1
+    if drop_n >= droppable_turns {
+        drop_n = droppable_turns; // never include the latest turn
+    }
+    let cut_at = turn_starts[drop_n];
+
+    let mut pruned: Vec<Message> = Vec::with_capacity(out.len());
+    pruned.extend_from_slice(&out[..prefix_end]);
+    pruned.push(ptl_marker_message(drop_n));
+    pruned.extend_from_slice(&out[cut_at..body_end]);
+    pruned.extend_from_slice(&out[body_end..]); // trailing working context
+
+    if est.estimate_messages(&pruned) <= max_tokens {
+        return (pruned, PtlOutcome::RoundOne);
+    }
+
+    // Round 2: hard-prune to the latest turn only. Even this may
+    // not be enough if the latest turn alone is oversized — but the
+    // spec says preserve the latest turn rather than send nothing.
+    // Over-budget is preferable to truncating the turn the user is
+    // actively interacting with.
+    let last_turn_start = *turn_starts.last().unwrap_or(&body_start);
+    let dropped_turns_total = turn_starts.len() - 1;
+    let mut hard: Vec<Message> = Vec::with_capacity(out.len());
+    hard.extend_from_slice(&out[..prefix_end]);
+    hard.push(ptl_marker_message(dropped_turns_total));
+    hard.extend_from_slice(&out[last_turn_start..body_end]);
+    hard.extend_from_slice(&out[body_end..]);
+    (hard, PtlOutcome::RoundTwo)
+}
+
+/// Marker inserted by [`enforce_token_budget`] so the model knows a
+/// gap exists. The count is part of the text because the caller
+/// asked us to maintain a hard token cap, and that matters more
+/// than the marker being byte-stable across drop counts.
+fn ptl_marker_message(dropped: usize) -> Message {
+    Message::system(format!(
+        "[{dropped} earlier turn(s) truncated to fit token budget]"
+    ))
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;
@@ -994,6 +1321,276 @@ mod tests {
         ));
     }
 
+    // --- M1.2: circuit breaker + PTL fallback ---
+
+    /// Counts every LLM call regardless of outcome — used by
+    /// circuit-breaker tests to assert "no more LLM calls were
+    /// made after the breaker tripped".
+    struct CountingFailingLlmCb {
+        calls: Arc<AtomicUsize>,
+    }
+    #[async_trait]
+    impl LlmProvider for CountingFailingLlmCb {
+        async fn complete(&self, _req: ChatRequest) -> CoreResult<ChatResponse> {
+            self.calls.fetch_add(1, Ordering::SeqCst);
+            // Non-transport error so the inner retry doesn't double-count.
+            Err(CoreError::Provider("status 500: server".into()))
+        }
+        async fn complete_stream(&self, _req: ChatRequest) -> CoreResult<LlmStream> {
+            unimplemented!()
+        }
+    }
+
+    #[tokio::test]
+    async fn circuit_breaker_trips_after_three_failures() {
+        let calls = Arc::new(AtomicUsize::new(0));
+        let llm = Arc::new(CountingFailingLlmCb {
+            calls: calls.clone(),
+        });
+        let mem = SummarizingMemory::new(llm, "test-model", 64);
+
+        // Each compact call needs a *different* dropped prefix so the
+        // in-memory cache doesn't short-circuit and skip the LLM.
+        for i in 0..5 {
+            let msgs = vec![
+                system("sys"),
+                user(&format!("old-{i}")),
+                assistant("old reply"),
+                user("recent"),
+                assistant("recent reply"),
+            ];
+            let _ = mem.compact(&msgs).await.unwrap();
+        }
+
+        // 3 attempts trip the breaker; the next 2 are circuit-skipped.
+        assert_eq!(
+            calls.load(Ordering::SeqCst),
+            3,
+            "expected exactly 3 LLM attempts before circuit opened",
+        );
+    }
+
+    #[tokio::test]
+    async fn circuit_breaker_resets_on_successful_summary() {
+        // FlakyLlm with succeeds_after=1 yields: fail, success, success, ...
+        // The transport-error retry inside `summarise` burns 2 LLM calls
+        // but ends in Ok, so `record_summary_success` runs. NOTE(review):
+        // only the call count is asserted; the streak reset itself is not.
+        let llm = Arc::new(FlakyLlm {
+            succeeds_after: 1,
+            calls: AtomicUsize::new(0),
+        });
+        let mem = SummarizingMemory::new(llm.clone(), "test-model", 64);
+
+        let msgs = vec![
+            system("sys"),
+            user("old-a"),
+            assistant("old reply"),
+            user("recent"),
+            assistant("recent reply"),
+        ];
+        let _ = mem.compact(&msgs).await.unwrap();
+        assert_eq!(llm.calls.load(Ordering::SeqCst), 2);
+    }
+
+    #[tokio::test]
+    async fn ptl_drops_oldest_turns_when_summary_pushes_over_budget() {
+        // Budget of 300: after the system prompt and the 256-token
+        // reserve, the visible budget is only ~40 tokens, so
+        // `select_recent_turns` drops the oldest turns and triggers
+        // summarisation, while the body still keeps >=2 turns. The
+        // oversized (2000-char) summary then pushes the output back
+        // over budget, which forces PTL to prune the remaining
+        // oldest turns.
+        let llm = FakeLlm::new("X".repeat(2000));
+        let mem = SummarizingMemory::new(llm.clone(), "test-model", 300);
+
+        let msgs = vec![
+            system("sys"),
+            user("turn 1"),
+            assistant("reply 1 with some longer text"),
+            user("turn 2"),
+            assistant("reply 2 with some longer text"),
+            user("turn 3"),
+            assistant("reply 3 with some longer text"),
+            user("turn 4 most recent"),
+            assistant("reply 4"),
+        ];
+        let out = mem.compact(&msgs).await.unwrap();
+
+        assert!(
+            out.iter().any(|m| matches!(m,
+                Message::User { content, .. } if content == "turn 4 most recent"
+            )),
+            "latest turn must survive PTL"
+        );
+        assert!(
+            out.iter().any(|m| matches!(m,
+                Message::System { content, .. } if content.contains("truncated to fit token budget")
+            )),
+            "expected PTL marker in: {out:?}"
+        );
+        // Oldest turn must be gone (PTL second round hard-prunes
+        // because round-1's 20% wasn't enough).
+        assert!(
+            !out.iter().any(|m| matches!(m,
+                Message::User { content, .. } if content == "turn 1"
+            )),
+            "oldest turn should have been dropped, got: {out:?}"
+        );
+    }
+
+    #[tokio::test]
+    async fn ptl_noop_when_already_under_budget() {
+        let llm = FakeLlm::new("short");
+        let mem = SummarizingMemory::new(llm.clone(), "test-model", 10_000);
+
+        let msgs = vec![
+            system("sys"),
+            user("hi"),
+            assistant("hello"),
+            user("how are you"),
+            assistant("good"),
+        ];
+        let out = mem.compact(&msgs).await.unwrap();
+        assert!(
+            !out.iter().any(|m| matches!(m,
+                Message::System { content, .. } if content.contains("truncated to fit token budget")
+            )),
+            "PTL marker should not appear under-budget; out: {out:?}"
+        );
+    }
+
+    #[tokio::test]
+    async fn counters_track_compactions_llm_and_cache_paths() {
+        let llm = FakeLlm::new("SUMMARY");
+        let mem = SummarizingMemory::new(llm.clone(), "test-model", 256);
+        let counters = mem.counters();
+
+        // Under-budget: no summary required, no LLM call.
+        let small = vec![system("sys"), user("hi"), assistant("hello")];
+        let _ = mem.compact(&small).await.unwrap();
+
+        // Over-budget run 1: summary required, LLM call, cache miss.
+        let big = vec![
+            system("sys"),
+            user("turn 1"),
+            assistant("reply 1"),
+            user("turn 2"),
+            assistant("reply 2"),
+            user("turn 3 most recent"),
+            assistant("reply 3"),
+        ];
+        let _ = mem.compact(&big).await.unwrap();
+
+        // Run 2 with the same dropped prefix → in-memory cache hit.
+        let _ = mem.compact(&big).await.unwrap();
+
+        assert_eq!(
+            counters.compactions_total.load(Ordering::Relaxed),
+            3,
+            "every compact() counted"
+        );
+        assert_eq!(
+            counters.summary_required.load(Ordering::Relaxed),
+            2,
+            "only the over-budget runs needed a summary"
+        );
+        assert_eq!(
+            counters.llm_calls.load(Ordering::Relaxed),
+            1,
+            "second over-budget run hit the cache, no extra LLM call"
+        );
+        assert_eq!(
+            counters.cache_hits_memory.load(Ordering::Relaxed),
+            1,
+            "second over-budget run was an in-memory cache hit"
+        );
+        assert_eq!(counters.llm_failures.load(Ordering::Relaxed), 0);
+        assert_eq!(counters.circuit_opens.load(Ordering::Relaxed), 0);
+    }
+
+    #[tokio::test]
+    async fn counters_track_circuit_opens_and_skips() {
+        let calls = Arc::new(AtomicUsize::new(0));
+        let llm = Arc::new(CountingFailingLlmCb {
+            calls: calls.clone(),
+        });
+        let mem = SummarizingMemory::new(llm, "test-model", 64);
+        let counters = mem.counters();
+
+        for i in 0..5 {
+            let msgs = vec![
+                system("sys"),
+                user(&format!("old-{i}")),
+                assistant("old reply"),
+                user("recent"),
+                assistant("recent reply"),
+            ];
+            let _ = mem.compact(&msgs).await.unwrap();
+        }
+        // 3 attempts trip the breaker; the next 2 are circuit-skipped.
+        assert_eq!(counters.llm_calls.load(Ordering::Relaxed), 3);
+        assert_eq!(counters.llm_failures.load(Ordering::Relaxed), 3);
+        assert_eq!(counters.circuit_opens.load(Ordering::Relaxed), 1);
+        assert_eq!(counters.circuit_skips.load(Ordering::Relaxed), 2);
+    }
+
+    #[tokio::test]
+    async fn counters_track_ptl_rounds() {
+        let llm = FakeLlm::new("X".repeat(2000));
+        let mem = SummarizingMemory::new(llm, "test-model", 300);
+        let counters = mem.counters();
+        let msgs = vec![
+            system("sys"),
+            user("turn 1"),
+            assistant("reply 1 with some longer text"),
+            user("turn 2"),
+            assistant("reply 2 with some longer text"),
+            user("turn 3"),
+            assistant("reply 3 with some longer text"),
+            user("turn 4 most recent"),
+            assistant("reply 4"),
+        ];
+        let _ = mem.compact(&msgs).await.unwrap();
+        // Either round-one alone or both rounds fired — both counted.
+        assert!(counters.ptl_round_one.load(Ordering::Relaxed) >= 1);
+    }
+
+    #[tokio::test]
+    async fn enforce_token_budget_keeps_trailing_working_context_block() {
+        // Direct test of the helper: build a small conversation,
+        // append a working-context block, set a tight budget. The
+        // trailing System block must survive the prune.
+        use harness_core::CharRatioEstimator;
+        let est = CharRatioEstimator;
+        let msgs = vec![
+            system("sys"),
+            user("turn 1 something long enough"),
+            assistant("reply 1 also reasonably long here"),
+            user("turn 2 another long user message"),
+            assistant("reply 2 with extra padding text"),
+            user("turn 3 most recent here"),
+            assistant("reply 3 short"),
+            // Trailing working-context block (the marker pattern
+            // `enforce_token_budget` recognises).
+            system("=== working context ===\nrecent files:\n- src/lib.rs\n"),
+        ];
+        let (pruned, _outcome) = enforce_token_budget(msgs.clone(), 50, &est);
+        // Working-context block must remain at the tail.
+        assert!(
+            matches!(pruned.last(), Some(Message::System { content, .. }) if content.starts_with("=== working context ===")),
+            "trailing working-context block was lost"
+        );
+        // The latest turn must remain.
+        assert!(
+            pruned.iter().any(|m| matches!(m,
+                Message::User { content, .. } if content == "turn 3 most recent here"
+            )),
+            "latest user turn must remain"
+        );
+    }
+
     #[tokio::test]
     async fn persistence_save_failure_does_not_break_compact() {
         // We don't have an "always-fails" store; instead use a working
diff --git a/crates/harness-plugin/src/manager.rs b/crates/harness-plugin/src/manager.rs
index 5999bff..8ee53cb 100644
--- a/crates/harness-plugin/src/manager.rs
+++ b/crates/harness-plugin/src/manager.rs
@@ -599,6 +599,7 @@ mod tests {
                 activation: harness_skill::SkillActivation::Both,
                 keywords: vec![],
                 version: None,
+                paths: vec![],
             },
             body: "x".into(),
             path: PathBuf::from("/dev/null"),
diff --git a/crates/harness-project/Cargo.toml b/crates/harness-project/Cargo.toml
index 4be9e72..eb6f87c 100644
--- a/crates/harness-project/Cargo.toml
+++ b/crates/harness-project/Cargo.toml
@@ -17,4 +17,5 @@ chrono.workspace = true
 serde.workspace = true
 serde_json.workspace = true
 tokio = { workspace = true, features = ["sync"] }
+ts-rs.workspace = true
 uuid.workspace = true
diff --git a/crates/harness-project/src/activity.rs b/crates/harness-project/src/activity.rs
index b465a7a..275285f 100644
--- a/crates/harness-project/src/activity.rs
+++ b/crates/harness-project/src/activity.rs
@@ -29,7 +29,8 @@ use serde::{Deserialize, Serialize};
 /// every consumer to know the full set. UIs that need to read a
 /// field do so on a per-kind basis; the wire format documents the
 /// expected shape per kind below.
-#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
+#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize, ts_rs::TS)]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub struct Activity {
     /// Stable identifier (UUID v4).
     pub id: String,
@@ -41,6 +42,7 @@ pub struct Activity {
     pub actor: ActivityActor,
     /// Free-form payload, shape varies by `kind`. See variant docs
     /// for the expected fields.
+    #[ts(type = "Record<string, unknown>")]
     pub body: serde_json::Value,
     /// RFC-3339 / ISO-8601 timestamp.
     pub created_at: String,
@@ -72,8 +74,9 @@ impl Activity {
 /// The set is intentionally small in v0; AssigneeChange / Comment /
 /// Blocked / Unblocked are reserved for Phases 3.6 / 4 when their
 /// driving features land.
-#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize)]
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize, ts_rs::TS)]
 #[serde(rename_all = "snake_case")]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub enum ActivityKind {
     /// Status flipped.
     /// Body: `{"from": "<wire>", "to": "<wire>"}`.
@@ -105,8 +108,9 @@ pub enum ActivityKind {
 /// when `requirement.*` tools let the model drive board state.
 /// `System` is the bucket for server-side auto-advances
 /// (e.g. `start_run` flipping `Backlog → InProgress`).
-#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
+#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize, ts_rs::TS)]
 #[serde(tag = "type", rename_all = "snake_case")]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub enum ActivityActor {
     Human,
     Agent { profile_id: String },
diff --git a/crates/harness-project/src/comment.rs b/crates/harness-project/src/comment.rs
index 7339794..9efec11 100644
--- a/crates/harness-project/src/comment.rs
+++ b/crates/harness-project/src/comment.rs
@@ -39,7 +39,8 @@ use crate::ActivityActor;
 /// We deliberately keep this flat (no nesting deeper than two levels)
 /// — multi-level reply trees are a feature trap; Linear / GitHub /
 /// Multica all flatten beyond depth 1, and so do we.
-#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
+#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize, ts_rs::TS)]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub struct Comment {
     /// Stable identifier (UUID v4).
     pub id: String,
diff --git a/crates/harness-project/src/label.rs b/crates/harness-project/src/label.rs
index 8979f88..38dec21 100644
--- a/crates/harness-project/src/label.rs
+++ b/crates/harness-project/src/label.rs
@@ -29,7 +29,8 @@ use serde::{Deserialize, Serialize};
 pub const MAX_LABEL_NAME_LEN: usize = 32;
 
 /// One project-scoped tag.
-#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
+#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize, ts_rs::TS)]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub struct Label {
     /// Stable identifier (UUID v4).
     pub id: String,
diff --git a/crates/harness-project/src/project.rs b/crates/harness-project/src/project.rs
index 96170ce..14002e2 100644
--- a/crates/harness-project/src/project.rs
+++ b/crates/harness-project/src/project.rs
@@ -33,7 +33,8 @@ use serde::{Deserialize, Serialize};
 ///
 /// Paths are stored verbatim — canonicalisation is the caller's job
 /// (the REST layer canonicalises on insert).
-#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq, ts_rs::TS)]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub struct ProjectWorkspace {
     /// Filesystem path. Expected to be absolute and canonical, but the
     /// type does not enforce that — see `harness-server`'s create /
@@ -62,7 +63,8 @@ impl ProjectWorkspace {
 /// enabled so existing deployments that turn on `JARVIS_WORK_MODE=auto`
 /// keep the historical "all approved projects are eligible" behaviour
 /// until an operator pauses a specific project.
-#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq, ts_rs::TS)]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub struct ProjectAutomation {
     #[serde(default = "default_auto_mode_enabled")]
     pub auto_mode_enabled: bool,
@@ -90,7 +92,8 @@ fn is_default_automation(value: &ProjectAutomation) -> bool {
 /// Stored opaquely by [`ProjectStore`](crate::store::ProjectStore)
 /// implementations; the wire shape is the JSON serialisation of this
 /// struct, so all fields must round-trip through `serde`.
-#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq, ts_rs::TS)]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub struct Project {
     /// Stable internal identifier (UUID v4). Conversations reference
     /// this, never the slug.
@@ -144,7 +147,8 @@ pub struct Project {
 /// inline on the [`Project`] (not a separate table) since the
 /// cardinality is tiny (typically 3–6 per project) and edits always go
 /// through the project's PATCH endpoint anyway.
-#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq, ts_rs::TS)]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub struct KanbanColumn {
     /// Stable id; what `Requirement.status` references. Validated as
     /// non-empty + ≤ 64 bytes by [`validate_column_id`]. Built-in
diff --git a/crates/harness-project/src/requirement.rs b/crates/harness-project/src/requirement.rs
index 549c21c..e9b8b54 100644
--- a/crates/harness-project/src/requirement.rs
+++ b/crates/harness-project/src/requirement.rs
@@ -37,7 +37,8 @@ use crate::requirement_run::VerificationPlan;
 /// The wire shape matches the JSON serialisation of this struct.
 /// Renderers should treat unknown statuses as
 /// [`RequirementStatus::Backlog`] for forward compat.
-#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
+#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize, ts_rs::TS)]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub struct Requirement {
     /// Stable identifier (UUID v4 string). Server-allocated on
     /// `POST /v1/projects/:id/requirements` so clients can't pick
@@ -127,8 +128,9 @@ pub struct Requirement {
 /// snake_case (`"backlog"` / `"in_progress"` / `"review"` / `"done"`)
 /// to match the wire shape the Web UI already produces and consumes
 /// (see `apps/jarvis-web/src/types/frames.ts`).
-#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize)]
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize, ts_rs::TS)]
 #[serde(rename_all = "snake_case")]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub enum RequirementStatus {
     /// Not yet picked up.
     Backlog,
@@ -146,7 +148,8 @@ pub enum RequirementStatus {
 /// free-form chat plan: every item has a kind, status, optional
 /// command, dependencies, and evidence so automation can decide what
 /// to run next and humans can audit what happened later.
-#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
+#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize, ts_rs::TS)]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub struct RequirementTodo {
     /// Stable item id (UUID v4).
     pub id: String,
@@ -194,8 +197,9 @@ impl RequirementTodo {
     }
 }
 
-#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize)]
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize, ts_rs::TS)]
 #[serde(rename_all = "snake_case")]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub enum RequirementTodoKind {
     Work,
     Check,
@@ -230,8 +234,9 @@ impl RequirementTodoKind {
     }
 }
 
-#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize)]
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize, ts_rs::TS)]
 #[serde(rename_all = "snake_case")]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub enum RequirementTodoStatus {
     Pending,
     Running,
@@ -266,8 +271,9 @@ impl RequirementTodoStatus {
     }
 }
 
-#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize)]
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize, ts_rs::TS)]
 #[serde(rename_all = "snake_case")]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub enum RequirementTodoCreator {
     Human,
     Agent,
@@ -294,7 +300,8 @@ impl RequirementTodoCreator {
 }
 
 /// Latest proof attached to a [`RequirementTodo`].
-#[derive(Debug, Clone, Default, PartialEq, Eq, Serialize, Deserialize)]
+#[derive(Debug, Clone, Default, PartialEq, Eq, Serialize, Deserialize, ts_rs::TS)]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub struct RequirementTodoEvidence {
     #[serde(default, skip_serializing_if = "Option::is_none")]
     pub run_id: Option<String>,
@@ -343,8 +350,9 @@ impl RequirementStatus {
 /// `"proposed_by_scan"`). Older requirement rows on disk that
 /// don't carry the field deserialise as [`TriageState::Approved`]
 /// — i.e. v0 behaviour is preserved when no triage gate was set.
-#[derive(Debug, Clone, Copy, Default, PartialEq, Eq, Serialize, Deserialize)]
+#[derive(Debug, Clone, Copy, Default, PartialEq, Eq, Serialize, Deserialize, ts_rs::TS)]
 #[serde(rename_all = "snake_case")]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub enum TriageState {
     /// User has approved the work. The auto executor may pick it
     /// up subject to the usual `assignee_id` / `depends_on` /
@@ -405,8 +413,9 @@ impl TriageState {
 /// machinery is wired in. Until that machinery lands, the field is
 /// inert (no caller checks it), so the default is forward-looking
 /// without changing today's flow.
-#[derive(Debug, Clone, Copy, Default, PartialEq, Eq, Serialize, Deserialize)]
+#[derive(Debug, Clone, Copy, Default, PartialEq, Eq, Serialize, Deserialize, ts_rs::TS)]
 #[serde(rename_all = "snake_case")]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub enum AcceptancePolicy {
     /// Default. Once the work agent flips the requirement to
     /// `Review`, the auto loop dispatches a reviewer subagent that
diff --git a/crates/harness-project/src/requirement_run.rs b/crates/harness-project/src/requirement_run.rs
index a7237b5..33f68cb 100644
--- a/crates/harness-project/src/requirement_run.rs
+++ b/crates/harness-project/src/requirement_run.rs
@@ -279,7 +279,8 @@ impl RequirementRunStatus {
 /// What success looks like for the run, expressed as commands the
 /// host should execute and policy gates the user / harness should
 /// honour.
-#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
+#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize, ts_rs::TS)]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
 pub struct VerificationPlan {
     /// Shell-style commands to run after the agent finishes. Each
     /// is run via the binary's existing `shell.exec` plumbing
diff --git a/crates/harness-server/src/auto_mode_routes.rs b/crates/harness-server/src/auto_mode_routes.rs
index abd9af0..0727b1e 100644
--- a/crates/harness-server/src/auto_mode_routes.rs
+++ b/crates/harness-server/src/auto_mode_routes.rs
@@ -25,13 +25,14 @@ use serde::Deserialize;
 use serde_json::{json, Map, Value};
 
 use crate::state::AppState;
+use crate::state_layers::AutoModeLayer;
 
 pub(crate) fn router() -> Router<AppState> {
     Router::new().route("/v1/auto-mode", get(get_auto_mode).post(set_auto_mode))
 }
 
-async fn get_auto_mode(State(state): State<AppState>) -> Response {
-    let runtime = state.auto_mode_runtime.as_ref();
+async fn get_auto_mode(State(auto): State<AutoModeLayer>) -> Response {
+    let runtime = auto.runtime.as_ref();
     let mut body = Map::new();
     let configured = runtime.is_some();
     let enabled = runtime.map(|r| r.is_enabled()).unwrap_or(false);
@@ -62,7 +63,7 @@ async fn get_auto_mode(State(state): State<AppState>) -> Response {
             rt.last_tick_at().map(Value::from).unwrap_or(Value::Null),
         );
     }
-    if let Some(cfg) = state.auto_mode_config.as_ref() {
+    if let Some(cfg) = auto.config.as_ref() {
         body.insert("mode".into(), Value::from(cfg.mode.as_wire()));
         body.insert("tick_seconds".into(), Value::from(cfg.tick_seconds));
         body.insert(
@@ -113,8 +114,8 @@ struct SetBody {
     max_retries: Option<usize>,
 }
 
-async fn set_auto_mode(State(state): State<AppState>, Json(body): Json<SetBody>) -> Response {
-    let Some(runtime) = state.auto_mode_runtime.as_ref() else {
+async fn set_auto_mode(State(auto): State<AutoModeLayer>, Json(body): Json<SetBody>) -> Response {
+    let Some(runtime) = auto.runtime.as_ref() else {
         return (
             StatusCode::SERVICE_UNAVAILABLE,
             Json(json!({ "error": "auto-mode runtime not configured" })),
@@ -135,7 +136,7 @@ async fn set_auto_mode(State(state): State<AppState>, Json(body): Json<SetBody>)
     let mut response = serde_json::Map::new();
     response.insert("configured".into(), Value::Bool(true));
     response.insert("enabled".into(), Value::Bool(runtime.is_enabled()));
-    if let Some(cfg) = state.auto_mode_config.as_ref() {
+    if let Some(cfg) = auto.config.as_ref() {
         response.insert(
             "effective_max_retries".into(),
             Value::from(runtime.effective_max_retries(cfg)),
diff --git a/crates/harness-server/src/channels_wecom_app/crypto.rs b/crates/harness-server/src/channels_wecom_app/crypto.rs
new file mode 100644
index 0000000..cc6e7f2
--- /dev/null
+++ b/crates/harness-server/src/channels_wecom_app/crypto.rs
@@ -0,0 +1,291 @@
+//! Crypto primitives for the inbound callback verify path —
+//! signature, constant-time eq, XML tag extractor, and the
+//! AES-256-CBC payload decryptor.
+//!
+//! All four functions are pure (no I/O, no state) so they live in
+//! one place and stay easily testable. The `synth_encrypt` test
+//! helper underneath is the symmetric counterpart of
+//! [`decrypt_aes_payload`] that lets the round-trip tests build
+//! their own ciphertext without depending on a real WeCom fixture.
+
+/// Computes the WeCom callback signature: the four inputs are sorted
+/// lexicographically, concatenated without a separator, hashed with
+/// SHA-1, and rendered as 40 lowercase hex characters. The GET
+/// handshake passes `echostr` as `payload`; POST verification passes
+/// the body's `<Encrypt>` field.
+pub(super) fn wecom_signature(
+    token: &str,
+    timestamp: &str,
+    nonce: &str,
+    payload: &str,
+) -> String {
+    use sha1::{Digest, Sha1};
+    use std::fmt::Write;
+
+    let mut fields = [token, timestamp, nonce, payload];
+    fields.sort_unstable();
+    let digest = Sha1::digest(fields.concat());
+    let mut hex = String::with_capacity(digest.len() * 2);
+    for byte in digest {
+        let _ = write!(hex, "{byte:02x}");
+    }
+    hex
+}
+
+/// Byte-slice equality without a data-dependent early exit: all
+/// byte pairs are XOR-ed and OR-accumulated before the verdict, so
+/// a mismatching signature is not meant to leak how long its
+/// matching prefix was. Slices of unequal length are never equal.
+pub(super) fn constant_time_eq(a: &[u8], b: &[u8]) -> bool {
+    let same_len = a.len() == b.len();
+    let mut diff = 0u8;
+    a.iter().zip(b).for_each(|(x, y)| diff |= x ^ y);
+    same_len && diff == 0
+}
+
+/// Find the first `<Tag>...</Tag>` in `xml` and return the inner
+/// content, stripping a `<![CDATA[...]]>` wrapper if present.
+/// Hand-rolled because the inbound XML shape is rigid (5 message
+/// kinds, all flat) — `quick-xml` would be more complexity than the
+/// parsing demands.
+///
+/// Returns `None` when either tag is missing; an empty element
+/// yields `Some("")`. No nesting — WeCom's inbound XML never does.
+pub(super) fn extract_tag(xml: &str, tag: &str) -> Option<String> {
+    let open = format!("<{tag}>");
+    let close = format!("</{tag}>");
+    let start = xml.find(&open)? + open.len();
+    let end = xml[start..].find(&close)? + start;
+    let raw = &xml[start..end];
+    let stripped = raw
+        .strip_prefix("<![CDATA[")
+        .and_then(|s| s.strip_suffix("]]>"))
+        .unwrap_or(raw);
+    Some(stripped.to_string())
+}
+
+/// AES-256-CBC decrypt the WeCom callback payload + extract the
+/// real plaintext. WeCom's encryption envelope:
+/// ```text
+/// base64-decoded ciphertext = AES-256-CBC encrypted bytes
+///   key = base64-decode(EncodingAESKey + "=")  // 32 bytes
+///   iv  = key[..16]                            // first 16 bytes of key
+/// plaintext = random_16 || msg_len_be_u32 || msg || receive_id
+/// ```
+/// We extract `msg`, validate `receive_id == corp_id`, and return
+/// `msg`; any failure comes back as `Err` with a description. The
+/// PKCS#7-style padding is stripped from the decrypted tail first.
+pub(super) fn decrypt_aes_payload(
+    encoding_aes_key: &str,
+    ciphertext_b64: &str,
+    expected_corp_id: &str,
+) -> Result<String, String> {
+    use aes::cipher::{block_padding::NoPadding, BlockDecryptMut, KeyIvInit};
+    use base64::engine::general_purpose::{GeneralPurpose, PAD, STANDARD};
+    use base64::Engine;
+    type Aes256CbcDec = cbc::Decryptor<aes::Aes256>;
+
+    // EncodingAESKey is 43 base64 chars; append `=` to get a padded
+    // 44-char string → 32 bytes. The spare bits of the 43rd char are
+    // often non-zero in real keys, so decoding must tolerate them.
+    const KEY_ENGINE: GeneralPurpose =
+        GeneralPurpose::new(&base64::alphabet::STANDARD, PAD.with_decode_allow_trailing_bits(true));
+    let aes_key = KEY_ENGINE
+        .decode(format!("{encoding_aes_key}="))
+        .map_err(|e| format!("encoding_aes_key not valid base64: {e}"))?;
+    if aes_key.len() != 32 {
+        return Err(format!(
+            "encoding_aes_key decoded to {} bytes; expected 32",
+            aes_key.len()
+        ));
+    }
+    let iv = &aes_key[..16];
+
+    let mut buf = STANDARD
+        .decode(ciphertext_b64.trim())
+        .map_err(|e| format!("ciphertext not valid base64: {e}"))?;
+    if buf.is_empty() || buf.len() % 16 != 0 {
+        return Err(format!("ciphertext length {} is not a multiple of 16", buf.len()));
+    }
+
+    let cipher = Aes256CbcDec::new_from_slices(&aes_key, iv)
+        .map_err(|e| format!("AES init failed: {e}"))?;
+    cipher
+        .decrypt_padded_mut::<NoPadding>(&mut buf)
+        .map_err(|e| format!("AES decrypt failed: {e}"))?;
+
+    // Strip WeCom's custom PKCS#7-style padding. The last byte
+    // tells you how many trailing bytes are padding; valid range
+    // 1..=32. Anything else means key/iv/payload corruption.
+    let pad = *buf.last().ok_or("decrypted buffer is empty")? as usize;
+    if pad == 0 || pad > 32 || pad > buf.len() {
+        return Err(format!("invalid padding length: {pad}"));
+    }
+    let stripped_len = buf.len() - pad;
+    let plain = &buf[..stripped_len];
+
+    // Layout: `random_16 || msg_len_4_be || msg || receive_id`
+    if plain.len() < 16 + 4 {
+        return Err(format!("plaintext too short: {} bytes", plain.len()));
+    }
+    let msg_len = u32::from_be_bytes(plain[16..20].try_into().unwrap()) as usize;
+    if msg_len > plain.len() - 20 {
+        return Err(format!(
+            "msg_len {} exceeds plaintext length {}",
+            msg_len,
+            plain.len() - 20
+        ));
+    }
+    let msg_bytes = &plain[20..20 + msg_len];
+    let receive_id = &plain[20 + msg_len..];
+    let receive_id = std::str::from_utf8(receive_id)
+        .map_err(|e| format!("receive_id is not utf-8: {e}"))?;
+
+    if receive_id != expected_corp_id {
+        return Err(format!(
+            "receive_id mismatch: expected {expected_corp_id}, got {receive_id}"
+        ));
+    }
+    let msg = std::str::from_utf8(msg_bytes)
+        .map_err(|e| format!("msg is not utf-8: {e}"))?;
+    Ok(msg.to_string())
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn extract_tag_handles_plain_and_cdata() {
+        let xml = "<root><A>plain</A><B><![CDATA[in cdata]]></B></root>";
+        assert_eq!(extract_tag(xml, "A").as_deref(), Some("plain"));
+        assert_eq!(extract_tag(xml, "B").as_deref(), Some("in cdata"));
+        assert_eq!(extract_tag(xml, "Missing"), None);
+    }
+
+    #[test]
+    fn signature_is_lowercase_hex_and_matches_spec_example() {
+        // Sort + concat + sha1, e.g. `(token=ABC, ts=1, nonce=N,
+        // payload=PL)` sorts to ["1","ABC","N","PL"] and hashes
+        // "1ABCNPL". No digest is pinned here (despite the test
+        // name): we only check the output is 40 lowercase hex chars
+        // and that it changes when an input changes.
+        let s1 = wecom_signature("ABC", "1", "N", "PL");
+        assert_eq!(s1.len(), 40);
+        assert!(s1.chars().all(|c| c.is_ascii_hexdigit() && !c.is_ascii_uppercase()));
+        let s2 = wecom_signature("ABC", "2", "N", "PL");
+        assert_ne!(s1, s2);
+        // Reordering identical inputs yields the same signature
+        // (sort makes parameter order irrelevant — that's the
+        // protocol).
+        let s_same = wecom_signature("PL", "ABC", "1", "N");
+        assert_eq!(s_same, s1);
+    }
+
+    #[test]
+    fn constant_time_eq_is_correct_for_basics() {
+        assert!(constant_time_eq(b"abc", b"abc"));
+        assert!(!constant_time_eq(b"abc", b"abd"));
+        assert!(!constant_time_eq(b"abc", b"abcd"));
+        assert!(constant_time_eq(b"", b""));
+    }
+
+    /// Test-only inverse of `decrypt_aes_payload`: lays out
+    /// `random_16 || msg_len_be_u32 || msg || corp_id` (with an
+    /// all-zero "random" prefix), pads it to a 32-byte multiple,
+    /// encrypts with AES-256-CBC using `iv = key[..16]`, and
+    /// returns the ciphertext base64-encoded. Lets the round-trip
+    /// tests run without a captured WeCom fixture.
+    fn synth_encrypt(msg: &str, corp_id: &str, key: &[u8; 32]) -> String {
+        use aes::cipher::{block_padding::NoPadding, BlockEncryptMut, KeyIvInit};
+        use base64::Engine;
+        type Aes256CbcEnc = cbc::Encryptor<aes::Aes256>;
+
+        let iv = &key[..16];
+        let mut payload = Vec::new();
+        payload.extend_from_slice(&[0u8; 16]); // random_16
+        payload.extend_from_slice(&(msg.len() as u32).to_be_bytes());
+        payload.extend_from_slice(msg.as_bytes());
+        payload.extend_from_slice(corp_id.as_bytes());
+        // PKCS#7 with a 32-byte block: 1..=32 pad bytes, each equal to pad_len.
+        let pad_len = 32 - (payload.len() % 32);
+        payload.extend_from_slice(&vec![pad_len as u8; pad_len]);
+        // Already block-aligned, so encrypt in place with `NoPadding`.
+        let mut buf = payload.clone();
+        let cipher = Aes256CbcEnc::new_from_slices(key, iv).unwrap();
+        let n = cipher
+            .encrypt_padded_mut::<NoPadding>(&mut buf, payload.len())
+            .unwrap()
+            .len();
+        base64::engine::general_purpose::STANDARD.encode(&buf[..n])
+    }
+
+    fn synth_aes_key_b64(key: &[u8; 32]) -> String {
+        use base64::Engine;
+        // EncodingAESKey = first 43 chars of base64(key). The
+        // production decoder appends `=` itself.
+        let full = base64::engine::general_purpose::STANDARD.encode(key);
+        full.chars().take(43).collect()
+    }
+
+    #[test]
+    fn decrypt_round_trip_extracts_msg_and_validates_corpid() {
+        let key = [7u8; 32];
+        let aes_key_b64 = synth_aes_key_b64(&key);
+        let cipher = synth_encrypt("hello world", "ww-good-corp", &key);
+        let plain = decrypt_aes_payload(&aes_key_b64, &cipher, "ww-good-corp").unwrap();
+        assert_eq!(plain, "hello world");
+    }
+
+    #[test]
+    fn decrypt_rejects_wrong_corp_id() {
+        let key = [7u8; 32];
+        let aes_key_b64 = synth_aes_key_b64(&key);
+        let cipher = synth_encrypt("hi", "ww-actual", &key);
+        let err = decrypt_aes_payload(&aes_key_b64, &cipher, "ww-different").unwrap_err();
+        assert!(err.contains("receive_id mismatch"), "got: {err}");
+    }
+
+    #[test]
+    fn decrypt_rejects_invalid_base64() {
+        // Use a valid AES key first (so we reach the ciphertext
+        // decode), then feed garbage that base64 can't parse.
+        let key = [11u8; 32];
+        let aes_key_b64 = synth_aes_key_b64(&key);
+        let err = decrypt_aes_payload(&aes_key_b64, "@@@not-base64@@@", "ww").unwrap_err();
+        assert!(err.contains("ciphertext not valid base64"), "got: {err}");
+    }
+
+    #[test]
+    fn decrypt_rejects_short_aes_key() {
+        // A 30-char key can't produce 32 bytes; either rejection path is fine.
+        let err = decrypt_aes_payload(&"a".repeat(30), "AAAA", "ww").unwrap_err();
+        assert!(err.contains("expected 32") || err.contains("not valid base64"));
+    }
+
+    #[test]
+    fn decrypt_rejects_truncated_plaintext() {
+        // A ciphertext that decrypts to fewer than 20 bytes (the
+        // header alone) should be rejected.
+        use aes::cipher::{block_padding::NoPadding, BlockEncryptMut, KeyIvInit};
+        use base64::Engine;
+        type Aes256CbcEnc = cbc::Encryptor<aes::Aes256>;
+        let key = [9u8; 32];
+        let iv = &key[..16];
+        // 16 bytes total: just one block padded with PKCS#7. After
+        // strip we'd have <20 bytes, triggering the length check.
+        let payload = b"123456789012345"; // 15 bytes; pad to 16 with 1 byte of pad
+        let mut padded = payload.to_vec();
+        padded.push(1u8); // 1 byte of pad
+        let mut buf = padded.clone();
+        let cipher = Aes256CbcEnc::new_from_slices(&key, iv).unwrap();
+        let n = cipher
+            .encrypt_padded_mut::<NoPadding>(&mut buf, padded.len())
+            .unwrap()
+            .len();
+        let cipher_b64 = base64::engine::general_purpose::STANDARD.encode(&buf[..n]);
+        let err =
+            decrypt_aes_payload(&synth_aes_key_b64(&key), &cipher_b64, "ww").unwrap_err();
+        assert!(err.contains("plaintext too short"), "got: {err}");
+    }
+}
diff --git a/crates/harness-server/src/channels_wecom_app.rs b/crates/harness-server/src/channels_wecom_app/mod.rs
similarity index 54%
rename from crates/harness-server/src/channels_wecom_app.rs
rename to crates/harness-server/src/channels_wecom_app/mod.rs
index 35eceee..f86976d 100644
--- a/crates/harness-server/src/channels_wecom_app.rs
+++ b/crates/harness-server/src/channels_wecom_app/mod.rs
@@ -35,86 +35,30 @@ use harness_channel::{
 };
 use serde::Deserialize;
 use serde_json::{json, Value};
-use std::collections::HashMap;
-use std::sync::{Arc, RwLock};
-use std::time::{Duration, Instant};
+use std::sync::Arc;
+use std::time::Duration;
+
+// Submodules — each owns a concern that was previously inlined in
+// this 1900-line file. mod.rs keeps the trait impls (the public
+// surface) plus codec / outbound HTTP helpers that are tightly
+// coupled to them; primitives that have a clean boundary moved out.
+mod crypto;
+mod oauth;
+mod token;
+
+use crypto::{constant_time_eq, decrypt_aes_payload, extract_tag, wecom_signature};
+use oauth::{
+    exchange_code_for_userid, make_oauth_state, oauth_authorize_url, verify_oauth_state, OAuthScope,
+};
+use token::{ensure_token, token_cache};
 
-const WECOM_API_BASE: &str = "https://qyapi.weixin.qq.com";
+pub(super) const WECOM_API_BASE: &str = "https://qyapi.weixin.qq.com";
 
 /// WeCom caps text body at ~2000 chars; markdown card body at ~4096.
 /// Use the more permissive bound and let the platform truncate
 /// anything above (it doesn't error, just clips).
 const WECOM_APP_MAX_BYTES: usize = 4096;
 
-/// How early to refresh `access_token` before its declared
-/// `expires_in`. WeCom hands out 7200-second tokens; refreshing 5
-/// minutes before keeps every send well clear of the boundary.
-const TOKEN_REFRESH_LEAD_SECS: u64 = 300;
-
-#[derive(Debug, Clone)]
-struct CachedToken {
-    token: String,
-    expires_at: Instant,
-}
-
-/// Process-level cache, keyed by `corp_id`. A separate
-/// `RwLock<HashMap>` per binary (not per-instance) because access
-/// tokens are corp-scoped, not app-scoped — multiple
-/// `ChannelInstance` rows for the same `corp_id` share one token to
-/// stay under WeCom's 2000-call/day refresh quota.
-#[derive(Default)]
-struct AccessTokenCache {
-    inner: RwLock<HashMap<String, CachedToken>>,
-}
-
-impl AccessTokenCache {
-    fn get(&self, corp_id: &str) -> Option<String> {
-        let g = self.inner.read().ok()?;
-        let cached = g.get(corp_id)?;
-        if Instant::now() < cached.expires_at {
-            Some(cached.token.clone())
-        } else {
-            None
-        }
-    }
-
-    fn set(&self, corp_id: &str, token: String, ttl_secs: u64) {
-        let safe_ttl = ttl_secs.saturating_sub(TOKEN_REFRESH_LEAD_SECS);
-        let expires_at = Instant::now() + Duration::from_secs(safe_ttl);
-        if let Ok(mut g) = self.inner.write() {
-            g.insert(
-                corp_id.to_string(),
-                CachedToken {
-                    token,
-                    expires_at,
-                },
-            );
-        }
-    }
-
-    fn invalidate(&self, corp_id: &str) {
-        if let Ok(mut g) = self.inner.write() {
-            g.remove(corp_id);
-        }
-    }
-}
-
-/// Singleton — every `WeComAppAdapter` invocation hits the same
-/// cache so deployments with multiple instances behind one
-/// `corp_id` share tokens. Lazy-init via `OnceLock`.
-fn token_cache() -> &'static AccessTokenCache {
-    static CACHE: std::sync::OnceLock<AccessTokenCache> = std::sync::OnceLock::new();
-    CACHE.get_or_init(AccessTokenCache::default)
-}
-
-/// Reset helper for tests — never called from production code.
-#[cfg(test)]
-fn reset_token_cache() {
-    if let Ok(mut g) = token_cache().inner.write() {
-        g.clear();
-    }
-}
-
 pub struct WeComAppAdapter;
 
 #[async_trait]
@@ -509,145 +453,6 @@ fn require_inbound_field(config: &Value, field: &str) -> Result<String, String>
 /// hex-encoded lowercase. Same scheme used for the GET handshake
 /// (where `payload = echostr`) and POST verify (where `payload =
 /// <Encrypt>` field from the body).
-fn wecom_signature(token: &str, timestamp: &str, nonce: &str, payload: &str) -> String {
-    use sha1::{Digest, Sha1};
-    let mut parts = [token, timestamp, nonce, payload];
-    parts.sort();
-    let joined = parts.concat();
-    let digest = Sha1::digest(joined.as_bytes());
-    const HEX: &[u8; 16] = b"0123456789abcdef";
-    let mut out = String::with_capacity(40);
-    for b in digest {
-        out.push(HEX[(b >> 4) as usize] as char);
-        out.push(HEX[(b & 0x0f) as usize] as char);
-    }
-    out
-}
-
-/// Compare two byte slices in constant time so a mismatched
-/// signature doesn't leak prefix-length info via timing. Stdlib has
-/// no constant-time eq; this 4-line version is the hot-path-cheap
-/// equivalent everyone copy-pastes.
-fn constant_time_eq(a: &[u8], b: &[u8]) -> bool {
-    if a.len() != b.len() {
-        return false;
-    }
-    a.iter().zip(b).fold(0u8, |acc, (x, y)| acc | (x ^ y)) == 0
-}
-
-/// Find `<Tag>...</Tag>` in `xml` and return the inner content,
-/// stripping a `<![CDATA[...]]>` wrapper if present. Hand-rolled
-/// because the inbound XML shape is rigid (5 message kinds, all
-/// flat) — pulling in `quick-xml` for this would be way more
-/// complexity than the parsing demands.
-///
-/// Returns `None` for missing or empty tags. Doesn't handle
-/// nesting — WeCom's inbound XML never does.
-fn extract_tag(xml: &str, tag: &str) -> Option<String> {
-    let open = format!("<{tag}>");
-    let close = format!("</{tag}>");
-    let start = xml.find(&open)? + open.len();
-    let end = xml[start..].find(&close)? + start;
-    let raw = &xml[start..end];
-    let stripped = raw
-        .strip_prefix("<![CDATA[")
-        .and_then(|s| s.strip_suffix("]]>"))
-        .unwrap_or(raw);
-    Some(stripped.to_string())
-}
-
-/// AES-256-CBC decrypt the WeCom callback payload + extract the
-/// real plaintext. WeCom's encryption envelope:
-/// ```text
-/// base64-decoded ciphertext = AES-256-CBC encrypted bytes
-///   key = base64-decode(EncodingAESKey + "=")  // 32 bytes
-///   iv  = key[..16]                            // first 16 bytes of key
-/// plaintext = random_16 || msg_len_be_u32 || msg || receive_id
-/// ```
-/// We extract `msg`, validate `receive_id == corp_id`, and return
-/// `msg`. PKCS#7 padding is stripped from the tail of the ciphertext
-/// before slicing.
-fn decrypt_aes_payload(
-    encoding_aes_key: &str,
-    ciphertext_b64: &str,
-    expected_corp_id: &str,
-) -> Result<String, String> {
-    use aes::cipher::{block_padding::NoPadding, BlockDecryptMut, KeyIvInit};
-    use base64::Engine;
-    type Aes256CbcDec = cbc::Decryptor<aes::Aes256>;
-
-    // EncodingAESKey is 43 chars of base64 — append `=` to make it
-    // a valid 44-char padded base64 → 32 bytes.
-    let aes_key = base64::engine::general_purpose::STANDARD
-        .decode(format!("{encoding_aes_key}="))
-        .map_err(|e| format!("encoding_aes_key not valid base64: {e}"))?;
-    if aes_key.len() != 32 {
-        return Err(format!(
-            "encoding_aes_key decoded to {} bytes; expected 32",
-            aes_key.len()
-        ));
-    }
-    let iv = &aes_key[..16];
-
-    let ciphertext = base64::engine::general_purpose::STANDARD
-        .decode(ciphertext_b64.trim())
-        .map_err(|e| format!("ciphertext not valid base64: {e}"))?;
-    if ciphertext.is_empty() || ciphertext.len() % 16 != 0 {
-        return Err(format!(
-            "ciphertext length {} is not a multiple of 16",
-            ciphertext.len()
-        ));
-    }
-
-    let mut buf = ciphertext.clone();
-    let cipher = Aes256CbcDec::new_from_slices(&aes_key, iv)
-        .map_err(|e| format!("AES init failed: {e}"))?;
-    cipher
-        .decrypt_padded_mut::<NoPadding>(&mut buf)
-        .map_err(|e| format!("AES decrypt failed: {e}"))?;
-
-    // Strip WeCom's custom PKCS#7-style padding. The last byte
-    // tells you how many trailing bytes are padding; valid range
-    // 1..=32. Anything else means key/iv/payload corruption.
-    let pad = *buf.last().ok_or("decrypted buffer is empty")? as usize;
-    if pad == 0 || pad > 32 || pad > buf.len() {
-        return Err(format!("invalid padding length: {pad}"));
-    }
-    let stripped_len = buf.len() - pad;
-    let plain = &buf[..stripped_len];
-
-    // Layout: `random_16 || msg_len_4_be || msg || receive_id`
-    if plain.len() < 16 + 4 {
-        return Err(format!("plaintext too short: {} bytes", plain.len()));
-    }
-    let msg_len = u32::from_be_bytes(plain[16..20].try_into().unwrap()) as usize;
-    if 16 + 4 + msg_len > plain.len() {
-        return Err(format!(
-            "msg_len {} exceeds plaintext length {}",
-            msg_len,
-            plain.len() - 20
-        ));
-    }
-    let msg_bytes = &plain[20..20 + msg_len];
-    let receive_id = &plain[20 + msg_len..];
-    let receive_id = std::str::from_utf8(receive_id)
-        .map_err(|e| format!("receive_id is not utf-8: {e}"))?;
-
-    if receive_id != expected_corp_id {
-        return Err(format!(
-            "receive_id mismatch: expected {expected_corp_id}, got {receive_id}"
-        ));
-    }
-    let msg = std::str::from_utf8(msg_bytes)
-        .map_err(|e| format!("msg is not utf-8: {e}"))?;
-    Ok(msg.to_string())
-}
-
-/// Parse decrypted inbound XML into a normalised
-/// [`ChannelInboundEvent`]. WeCom's 5 inbound message types we
-/// actually care about (text, image, voice, event/subscribe,
-/// event/unsubscribe). Anything else folds into `ChannelInboundKind
-/// ::Event(...)` so the caller still sees the message even if we
 /// don't have a dedicated branch.
 fn parse_inbound_xml(xml: &str) -> Result<ChannelInboundEvent, String> {
     let msg_type = extract_tag(xml, "MsgType")
@@ -848,100 +653,6 @@ async fn send_once(
     SendOutcome::sent()
 }
 
-/// Return a token from the cache, fetching one when missing /
-/// expired / `force_refresh = true`.
-pub(crate) async fn ensure_token(
-    corp_id: &str,
-    corp_secret: &str,
-    force_refresh: bool,
-) -> Result<String, SendOutcome> {
-    if !force_refresh {
-        if let Some(t) = token_cache().get(corp_id) {
-            return Ok(t);
-        }
-    }
-    fetch_token(corp_id, corp_secret).await
-}
-
-#[derive(Debug, Deserialize)]
-struct GetTokenReply {
-    errcode: i64,
-    #[serde(default)]
-    errmsg: String,
-    #[serde(default)]
-    access_token: String,
-    #[serde(default)]
-    expires_in: u64,
-}
-
-/// Fetch a fresh access_token. Cache populated on success.
-async fn fetch_token(corp_id: &str, corp_secret: &str) -> Result<String, SendOutcome> {
-    let url = format!(
-        "{WECOM_API_BASE}/cgi-bin/gettoken?corpid={}&corpsecret={}",
-        urlencoding_minimal(corp_id),
-        urlencoding_minimal(corp_secret),
-    );
-    let client = match reqwest::Client::builder()
-        .timeout(Duration::from_secs(10))
-        .build()
-    {
-        Ok(c) => c,
-        Err(e) => {
-            return Err(SendOutcome::fail_retryable(format!(
-                "HTTP client init: {e}"
-            )))
-        }
-    };
-    let resp = match client.get(&url).send().await {
-        Ok(r) => r,
-        Err(e) => {
-            return Err(SendOutcome::fail_retryable(format!(
-                "gettoken transport: {e}"
-            )))
-        }
-    };
-    let status = resp.status();
-    let raw = match resp.text().await {
-        Ok(t) => t,
-        Err(e) => {
-            return Err(SendOutcome::Failed {
-                message: format!("gettoken reply unreadable: {e}"),
-                code: Some("wecom_app:gettoken_reply_unreadable".into()),
-                retryable: false,
-            });
-        }
-    };
-    if !status.is_success() {
-        return Err(SendOutcome::Failed {
-            message: format!("gettoken HTTP {}: {raw}", status.as_u16()),
-            code: Some(format!("wecom_app:gettoken_http_{}", status.as_u16())),
-            retryable: status.is_server_error(),
-        });
-    }
-    let parsed: GetTokenReply = match serde_json::from_str(&raw) {
-        Ok(p) => p,
-        Err(e) => {
-            return Err(SendOutcome::Failed {
-                message: format!("gettoken parse: {e}: {raw}"),
-                code: Some("wecom_app:gettoken_reply_parse".into()),
-                retryable: false,
-            });
-        }
-    };
-    if parsed.errcode != 0 || parsed.access_token.is_empty() {
-        return Err(SendOutcome::Failed {
-            message: format!(
-                "gettoken errcode {}: {}",
-                parsed.errcode, parsed.errmsg
-            ),
-            code: Some(format!("wecom_app:gettoken_errcode_{}", parsed.errcode)),
-            retryable: false,
-        });
-    }
-    token_cache().set(corp_id, parsed.access_token.clone(), parsed.expires_in);
-    Ok(parsed.access_token)
-}
-
 #[derive(Debug, Deserialize)]
 struct WeComReply {
     errcode: i64,
@@ -953,7 +664,7 @@ struct WeComReply {
 /// secret can contain `+` / `/` / `=` from base64 in some configs
 /// (rare but documented), so we treat it like the DingTalk sign:
 /// percent-encode anything not in the unreserved set.
-fn urlencoding_minimal(s: &str) -> String {
+pub(super) fn urlencoding_minimal(s: &str) -> String {
     let mut out = String::with_capacity(s.len());
     for b in s.bytes() {
         match b {
@@ -966,260 +677,6 @@ fn urlencoding_minimal(s: &str) -> String {
     out
 }
 
-// ---------------------------------------------------------------------------
-// OAuth2 免登 (snsapi_base) — terminal-user identity verification.
-//
-// WeCom's snsapi_base scope returns a `userid` after a silent in-client
-// authorisation. We use it for "click here to verify who you are" links
-// the bot can post into a chat, or for the `/v1/channels/:id/oauth/start`
-// + `/oauth/callback` redirect pair.
-//
-// State is HMAC-SHA1 signed against the instance's `token` field — same
-// secret the inbound verify uses — so we don't need a server-side state
-// store. The signed payload carries `instance_id`, an expiry timestamp,
-// and a random nonce. Verification checks the signature, parses the
-// payload, validates the instance binding + expiry, all in constant time.
-//
-// Reference: https://developer.work.weixin.qq.com/document/path/91022
-//   ?appid=<corp_id> & redirect_uri=<urlencoded> & response_type=code
-//   & scope=snsapi_base | snsapi_privateinfo & agentid=<agent_id>
-//   & state=<our_csrf_state> #wechat_redirect
-// ---------------------------------------------------------------------------
-
-/// `snsapi_base` returns just the `userid` silently — no popup in the
-/// WeCom client when the user is already logged in. `snsapi_privateinfo`
-/// additionally surfaces name / avatar / mobile via a `user_ticket`, but
-/// it triggers a confirmation prompt and requires extra app permissions.
-/// v1 ships only `Base` — it's the minimum that proves identity.
-#[derive(Debug, Clone, Copy, PartialEq, Eq)]
-pub(crate) enum OAuthScope {
-    Base,
-}
-
-impl OAuthScope {
-    fn as_wire(self) -> &'static str {
-        match self {
-            Self::Base => "snsapi_base",
-        }
-    }
-}
-
-/// Build the WeCom OAuth2 authorize URL. `redirect_uri` is treated as
-/// opaque and URL-encoded verbatim — the operator is responsible for
-/// whitelisting its domain in the WeCom admin's "可信域名".
-///
-/// `#wechat_redirect` is mandatory per WeCom's docs; without it the
-/// authorize page renders blank inside the WeCom client.
-pub(crate) fn oauth_authorize_url(
-    corp_id: &str,
-    agent_id: u64,
-    redirect_uri: &str,
-    state: &str,
-    scope: OAuthScope,
-) -> String {
-    format!(
-        "https://open.weixin.qq.com/connect/oauth2/authorize\
-         ?appid={appid}\
-         &redirect_uri={redirect}\
-         &response_type=code\
-         &scope={scope}\
-         &state={state}\
-         &agentid={agentid}#wechat_redirect",
-        appid = urlencoding_minimal(corp_id),
-        redirect = urlencoding_minimal(redirect_uri),
-        scope = scope.as_wire(),
-        state = urlencoding_minimal(state),
-        agentid = agent_id,
-    )
-}
-
-/// Decoded state payload after signature verification. The fields are
-/// the contract between `make_oauth_state` and `verify_oauth_state` —
-/// keep them additive-only or version the payload.
-#[derive(Debug, Clone, serde::Serialize, serde::Deserialize, PartialEq, Eq)]
-pub(crate) struct OAuthStateClaims {
-    /// Channel-instance id this state belongs to. The callback route
-    /// uses this to cross-check the `:id` path parameter.
-    pub(crate) instance_id: String,
-    /// Unix seconds after which the state is invalid. Typically now +
-    /// 10 minutes — long enough for a slow tap, short enough that a
-    /// stolen state ages out before being useful.
-    pub(crate) exp: u64,
-    /// 16-byte hex random — guards against replay of the same state
-    /// (combined with `exp`) and makes the signed blob look opaque.
-    pub(crate) nonce: String,
-    /// Optional caller-supplied opaque field. Often a Jarvis session
-    /// id, a `next=` URL hint, or a pairing token — the callback
-    /// surfaces this verbatim so the originator can correlate.
-    #[serde(default, skip_serializing_if = "Option::is_none")]
-    pub(crate) ctx: Option<String>,
-}
-
-/// Sign a fresh state token. The `token` argument is the same value
-/// configured on the `ChannelInstance` for inbound verify (`config.token`
-/// — operator-chosen, kept secret) so we don't need a dedicated
-/// signing key.
-pub(crate) fn make_oauth_state(
-    instance_id: &str,
-    instance_token: &str,
-    ttl_secs: u64,
-    ctx: Option<&str>,
-    nonce_hex: &str,
-    now_unix: u64,
-) -> Result<String, String> {
-    use base64::Engine;
-    if instance_token.is_empty() {
-        return Err("instance token is empty — cannot sign OAuth state".to_string());
-    }
-    let claims = OAuthStateClaims {
-        instance_id: instance_id.to_string(),
-        exp: now_unix.saturating_add(ttl_secs),
-        nonce: nonce_hex.to_string(),
-        ctx: ctx.map(str::to_string),
-    };
-    let json = serde_json::to_vec(&claims).map_err(|e| format!("state encode: {e}"))?;
-    let b64 = base64::engine::general_purpose::URL_SAFE_NO_PAD.encode(&json);
-    let sig = oauth_state_sig(&b64, instance_token);
-    Ok(format!("{b64}.{sig}"))
-}
-
-/// Verify + decode a state token. Returns the claims (CSRF passed and
-/// not expired) or an operator-readable error.
-///
-/// Step order matters:
-/// 1. Split on `.`  (cheap, doesn't leak anything)
-/// 2. Recompute sig + constant-time compare — catches tampering early
-/// 3. Decode payload, parse JSON
-/// 4. Cross-check `instance_id` against the route's `:id`
-/// 5. Check expiry against the caller-supplied `now_unix`
-pub(crate) fn verify_oauth_state(
-    state: &str,
-    expected_instance: &str,
-    instance_token: &str,
-    now_unix: u64,
-) -> Result<OAuthStateClaims, String> {
-    use base64::Engine;
-    let (b64, sig) = state.split_once('.').ok_or("state missing signature")?;
-    if b64.is_empty() || sig.is_empty() {
-        return Err("state malformed".to_string());
-    }
-    let expected_sig = oauth_state_sig(b64, instance_token);
-    if !constant_time_eq(sig.as_bytes(), expected_sig.as_bytes()) {
-        return Err("state signature mismatch".to_string());
-    }
-    let raw = base64::engine::general_purpose::URL_SAFE_NO_PAD
-        .decode(b64)
-        .map_err(|e| format!("state base64: {e}"))?;
-    let claims: OAuthStateClaims =
-        serde_json::from_slice(&raw).map_err(|e| format!("state json: {e}"))?;
-    if claims.instance_id != expected_instance {
-        return Err("state instance_id mismatch".to_string());
-    }
-    if claims.exp < now_unix {
-        return Err("state expired".to_string());
-    }
-    Ok(claims)
-}
-
-/// HMAC-SHA1 of the state payload keyed by the instance token. Output
-/// is the 40-char lowercase hex digest. WeCom signatures elsewhere in
-/// this file are plain `sha1(concat)` — we use HMAC here because the
-/// token is a true secret (operator-chosen) and HMAC is the standard
-/// CSRF-token construction; plain SHA1 of `token + payload` is
-/// vulnerable to length-extension on hypothetical inputs we don't
-/// fully control.
-fn oauth_state_sig(payload_b64: &str, instance_token: &str) -> String {
-    use hmac::{Hmac, Mac};
-    use sha1::Sha1;
-    type HmacSha1 = Hmac<Sha1>;
-    let mut mac =
-        HmacSha1::new_from_slice(instance_token.as_bytes()).expect("HMAC accepts any key length");
-    mac.update(payload_b64.as_bytes());
-    let bytes = mac.finalize().into_bytes();
-    const HEX: &[u8; 16] = b"0123456789abcdef";
-    let mut out = String::with_capacity(40);
-    for b in bytes {
-        out.push(HEX[(b >> 4) as usize] as char);
-        out.push(HEX[(b & 0x0f) as usize] as char);
-    }
-    out
-}
-
-/// Exchange the `code` returned by WeCom for the user's `userid` via
-/// `cgi-bin/auth/getuserinfo`. The `access_token` argument is the
-/// app-level access_token from [`ensure_token`].
-///
-/// WeCom returns `{errcode:0, errmsg:"ok", userid:"..."}` on success.
-/// `external_userid` (for non-corp users) and `user_ticket` (only with
-/// `snsapi_privateinfo` scope) are surfaced when present — callers
-/// that only need `userid` ignore them.
-pub(crate) async fn exchange_code_for_userid(
-    access_token: &str,
-    code: &str,
-) -> Result<OAuthUserInfo, String> {
-    let url = format!(
-        "{WECOM_API_BASE}/cgi-bin/auth/getuserinfo?access_token={}&code={}",
-        urlencoding_minimal(access_token),
-        urlencoding_minimal(code),
-    );
-    let resp = reqwest::Client::new()
-        .get(&url)
-        .send()
-        .await
-        .map_err(|e| format!("getuserinfo http: {e}"))?;
-    let parsed: GetUserInfoReply = resp
-        .json()
-        .await
-        .map_err(|e| format!("getuserinfo json: {e}"))?;
-    if parsed.errcode != 0 {
-        return Err(format!(
-            "wecom getuserinfo failed: errcode={} errmsg={}",
-            parsed.errcode, parsed.errmsg
-        ));
-    }
-    // A corp member returns `userid`; a non-corp visitor returns
-    // `openid` + `external_userid` instead. v1 only supports corp
-    // members — surface the visitor case as a clear error rather than
-    // silently dropping them.
-    let userid = parsed
-        .userid
-        .filter(|s| !s.is_empty())
-        .ok_or_else(|| "wecom oauth: not a corp member (no userid)".to_string())?;
-    Ok(OAuthUserInfo {
-        userid,
-        external_userid: parsed.external_userid.filter(|s| !s.is_empty()),
-        user_ticket: parsed.user_ticket.filter(|s| !s.is_empty()),
-    })
-}
-
-/// Subset of the `getuserinfo` reply we care about. The other fields
-/// (`openid`, `device_id`) we ignore — see WeCom's docs if a future
-/// feature needs them.
-#[derive(Debug, Deserialize)]
-struct GetUserInfoReply {
-    errcode: i64,
-    #[serde(default)]
-    errmsg: String,
-    #[serde(default)]
-    userid: Option<String>,
-    #[serde(default)]
-    external_userid: Option<String>,
-    #[serde(default)]
-    user_ticket: Option<String>,
-}
-
-#[derive(Debug, Clone, PartialEq, Eq)]
-pub(crate) struct OAuthUserInfo {
-    pub(crate) userid: String,
-    /// Set when the authenticator is a non-corp visitor. v1 routes
-    /// reject these; recording the field anyway so future "external
-    /// contact" features can pick it up without a wire change.
-    pub(crate) external_userid: Option<String>,
-    /// Set only with `snsapi_privateinfo` scope. Used to call
-    /// `cgi-bin/auth/getuserdetail` for name / mobile. `None` for
-    /// snsapi_base.
-    pub(crate) user_ticket: Option<String>,
-}
 
 /// Same UTF-8-safe truncation pattern as the other adapters. Kept
 /// inline rather than extracted — each kind's max-bytes is platform
@@ -1238,7 +695,42 @@ fn truncate_utf8(s: &str, max_bytes: usize) -> (String, bool) {
 #[cfg(test)]
 mod tests {
     use super::*;
-    use crate::channel_adapter::ChannelAdapter;
+    use crate::channel_adapter::{ChannelAdapter, ChannelInboundHandler};
+    use std::collections::HashMap;
+
+    /// Mirror of `crypto::tests::synth_encrypt`, returning the standard-
+    /// base64 AES-256-CBC ciphertext. Duplicated because integration-shape
+    /// tests (handler_post_round_trip) live in mod.rs but need to fabricate
+    /// ciphertext, and `#[cfg(test)]` items inside a sibling submodule's
+    /// `mod tests` aren't reachable from this module. Keep them in sync —
+    /// the unit tests in crypto.rs cover the round-trip semantics.
+    fn synth_encrypt(msg: &str, corp_id: &str, key: &[u8; 32]) -> String {
+        use aes::cipher::{block_padding::NoPadding, BlockEncryptMut, KeyIvInit};
+        use base64::Engine;
+        type Aes256CbcEnc = cbc::Encryptor<aes::Aes256>;
+
+        let iv = &key[..16]; // IV is the first 16 bytes of the key
+        let mut payload = Vec::new();
+        payload.extend_from_slice(&[0u8; 16]); // 16-byte prefix, zeroed so output is deterministic
+        payload.extend_from_slice(&(msg.len() as u32).to_be_bytes()); // 4-byte big-endian msg length
+        payload.extend_from_slice(msg.as_bytes()); // message body
+        payload.extend_from_slice(corp_id.as_bytes()); // corp id trailer
+        let pad_len = 32 - (payload.len() % 32); // PKCS#7-style: always 1..=32 bytes of padding
+        payload.extend_from_slice(&vec![pad_len as u8; pad_len]); // each pad byte holds pad_len
+        let mut buf = payload.clone(); // padded by hand above, hence `NoPadding` below
+        let cipher = Aes256CbcEnc::new_from_slices(key, iv).unwrap();
+        let n = cipher
+            .encrypt_padded_mut::<NoPadding>(&mut buf, payload.len())
+            .unwrap()
+            .len();
+        base64::engine::general_purpose::STANDARD.encode(&buf[..n])
+    }
+
+    fn synth_aes_key_b64(key: &[u8; 32]) -> String {
+        use base64::Engine;
+        let full = base64::engine::general_purpose::STANDARD.encode(key); // 32 bytes -> 44 chars, last one is `=`
+        full.chars().take(43).collect() // EncodingAESKey form: the 43 chars before the padding
+    }
 
     fn full_config() -> Value {
         json!({
@@ -1399,333 +891,6 @@ mod tests {
         assert_eq!(out, "你");
     }
 
-    // ----------------------- OAuth2 helpers --------------------------
-
-    #[test]
-    fn oauth_authorize_url_has_required_params_and_hash() {
-        let url = oauth_authorize_url(
-            "ww-corp",
-            1_000_002,
-            "https://abc.example/v1/channels/xyz/oauth/callback",
-            "state-token-abc",
-            OAuthScope::Base,
-        );
-        // All of WeCom's required parameters present.
-        assert!(url.contains("appid=ww-corp"));
-        assert!(url.contains(
-            "redirect_uri=https%3A%2F%2Fabc.example%2Fv1%2Fchannels%2Fxyz%2Foauth%2Fcallback"
-        ));
-        assert!(url.contains("response_type=code"));
-        assert!(url.contains("scope=snsapi_base"));
-        assert!(url.contains("state=state-token-abc"));
-        assert!(url.contains("agentid=1000002"));
-        // The `#wechat_redirect` fragment is mandatory — without it
-        // WeCom client renders blank.
-        assert!(url.ends_with("#wechat_redirect"));
-        // No accidental newlines / whitespace from the format string.
-        assert!(!url.contains(' '));
-        assert!(!url.contains('\n'));
-    }
-
-    #[test]
-    fn oauth_state_round_trip_decodes_claims() {
-        let state = make_oauth_state(
-            "inst-1",
-            "token-secret",
-            600,
-            Some("session=abc"),
-            "deadbeefcafebabe",
-            1_700_000_000,
-        )
-        .expect("sign ok");
-        let claims = verify_oauth_state(&state, "inst-1", "token-secret", 1_700_000_100)
-            .expect("verify ok");
-        assert_eq!(claims.instance_id, "inst-1");
-        assert_eq!(claims.exp, 1_700_000_600);
-        assert_eq!(claims.nonce, "deadbeefcafebabe");
-        assert_eq!(claims.ctx.as_deref(), Some("session=abc"));
-    }
-
-    #[test]
-    fn oauth_state_rejects_tampered_payload() {
-        let state = make_oauth_state(
-            "inst-1",
-            "token-secret",
-            600,
-            None,
-            "nonce123",
-            1_700_000_000,
-        )
-        .unwrap();
-        // Flip a payload byte (but keep the signature) → signature
-        // mismatch.
-        let (payload, sig) = state.split_once('.').unwrap();
-        let mut bad_payload = payload.to_string();
-        let last = bad_payload.pop().unwrap();
-        // Replace last char with something different.
-        bad_payload.push(if last == 'A' { 'B' } else { 'A' });
-        let tampered = format!("{bad_payload}.{sig}");
-        let err = verify_oauth_state(&tampered, "inst-1", "token-secret", 1_700_000_100)
-            .expect_err("must reject");
-        assert!(err.contains("signature"));
-    }
-
-    #[test]
-    fn oauth_state_rejects_wrong_instance_id() {
-        let state = make_oauth_state(
-            "inst-A",
-            "token-secret",
-            600,
-            None,
-            "nonce123",
-            1_700_000_000,
-        )
-        .unwrap();
-        let err = verify_oauth_state(&state, "inst-B", "token-secret", 1_700_000_100)
-            .expect_err("must reject");
-        assert!(err.contains("instance_id"));
-    }
-
-    #[test]
-    fn oauth_state_rejects_expired() {
-        let state = make_oauth_state(
-            "inst-1",
-            "token-secret",
-            60,
-            None,
-            "nonce123",
-            1_700_000_000,
-        )
-        .unwrap();
-        // 70 seconds later — exp = 1_700_000_060, now = 1_700_000_070.
-        let err = verify_oauth_state(&state, "inst-1", "token-secret", 1_700_000_070)
-            .expect_err("must reject");
-        assert!(err.contains("expired"));
-    }
-
-    #[test]
-    fn oauth_state_rejects_missing_signature() {
-        // No period at all.
-        let err = verify_oauth_state("aGVsbG8", "inst-1", "token-secret", 1_700_000_000)
-            .expect_err("must reject");
-        assert!(err.contains("missing signature"));
-        // Empty signature segment.
-        let err = verify_oauth_state("aGVsbG8.", "inst-1", "token-secret", 1_700_000_000)
-            .expect_err("must reject");
-        assert!(err.contains("malformed"));
-    }
-
-    #[test]
-    fn oauth_state_refuses_empty_token() {
-        let err = make_oauth_state("inst-1", "", 600, None, "nonce", 1_700_000_000)
-            .expect_err("must reject");
-        assert!(err.contains("token"));
-    }
-
-    #[test]
-    fn oauth_state_sig_differs_per_token_value() {
-        // Two distinct tokens MUST produce distinct signatures over
-        // the same payload, otherwise the CSRF gate is decorative.
-        let s1 = oauth_state_sig("payload", "token-A");
-        let s2 = oauth_state_sig("payload", "token-B");
-        assert_ne!(s1, s2);
-        // And the same input is deterministic.
-        assert_eq!(s1, oauth_state_sig("payload", "token-A"));
-    }
-
-    // ----------------------- token cache ----------------------------
-    //
-    // All four cache tests touch the same process-level
-    // `token_cache()` singleton. Cargo runs tests in parallel by
-    // default, so we serialise just this group with a local mutex —
-    // simpler than dragging `serial_test` into the workspace deps
-    // and the cost is negligible (4 tests, each <2 ms).
-
-    fn cache_test_lock() -> &'static std::sync::Mutex<()> {
-        static LOCK: std::sync::OnceLock<std::sync::Mutex<()>> = std::sync::OnceLock::new();
-        LOCK.get_or_init(|| std::sync::Mutex::new(()))
-    }
-
-    #[test]
-    fn token_cache_stores_and_returns_within_ttl() {
-        let _g = cache_test_lock().lock().unwrap();
-        reset_token_cache();
-        let cache = token_cache();
-        cache.set("corp-A", "tok-1".into(), 7200);
-        assert_eq!(cache.get("corp-A"), Some("tok-1".into()));
-    }
-
-    #[test]
-    fn token_cache_treats_short_ttl_as_expired_via_lead() {
-        let _g = cache_test_lock().lock().unwrap();
-        reset_token_cache();
-        let cache = token_cache();
-        cache.set("corp-B", "tok-2".into(), 30); // shorter than 300s lead
-        // Cache stores expires_at = now() + 0s (saturating sub),
-        // already in the past by the time `get` runs.
-        std::thread::sleep(std::time::Duration::from_millis(2));
-        assert_eq!(cache.get("corp-B"), None);
-    }
-
-    #[test]
-    fn token_cache_invalidate_drops_entry() {
-        let _g = cache_test_lock().lock().unwrap();
-        reset_token_cache();
-        let cache = token_cache();
-        cache.set("corp-C", "tok-3".into(), 7200);
-        cache.invalidate("corp-C");
-        assert_eq!(cache.get("corp-C"), None);
-    }
-
-    #[test]
-    fn token_cache_keys_by_corp_id() {
-        let _g = cache_test_lock().lock().unwrap();
-        reset_token_cache();
-        let cache = token_cache();
-        cache.set("corp-D", "tok-D".into(), 7200);
-        cache.set("corp-E", "tok-E".into(), 7200);
-        assert_eq!(cache.get("corp-D").as_deref(), Some("tok-D"));
-        assert_eq!(cache.get("corp-E").as_deref(), Some("tok-E"));
-    }
-
-    // ----------------------- inbound (C.2) --------------------------
-
-    use crate::channel_adapter::ChannelInboundHandler;
-    use harness_channel::ChannelInboundKind;
-
-    #[test]
-    fn extract_tag_handles_plain_and_cdata() {
-        let xml = "<root><A>plain</A><B><![CDATA[in cdata]]></B></root>";
-        assert_eq!(extract_tag(xml, "A").as_deref(), Some("plain"));
-        assert_eq!(extract_tag(xml, "B").as_deref(), Some("in cdata"));
-        assert_eq!(extract_tag(xml, "Missing"), None);
-    }
-
-    #[test]
-    fn signature_is_lowercase_hex_and_matches_spec_example() {
-        // Sort + concat + sha1. Spot-check a known case computed
-        // off-line: `(token=ABC, ts=1, nonce=N, payload=PL)`.
-        // Sort → ["1","ABC","N","PL"] → concat → "1ABCNPL"
-        // sha1 of that string is deterministic; just check it's
-        // 40 lowercase hex chars and changes when an input changes.
-        let s1 = wecom_signature("ABC", "1", "N", "PL");
-        assert_eq!(s1.len(), 40);
-        assert!(s1.chars().all(|c| c.is_ascii_hexdigit() && !c.is_ascii_uppercase()));
-        let s2 = wecom_signature("ABC", "2", "N", "PL");
-        assert_ne!(s1, s2);
-        // Reordering identical inputs yields the same signature
-        // (sort makes parameter order irrelevant — that's the
-        // protocol).
-        let s_same = wecom_signature("PL", "ABC", "1", "N");
-        assert_eq!(s_same, s1);
-    }
-
-    #[test]
-    fn constant_time_eq_is_correct_for_basics() {
-        assert!(constant_time_eq(b"abc", b"abc"));
-        assert!(!constant_time_eq(b"abc", b"abd"));
-        assert!(!constant_time_eq(b"abc", b"abcd"));
-        assert!(constant_time_eq(b"", b""));
-    }
-
-    /// Build a plaintext that the WeCom AES envelope wraps, then
-    /// encrypt it ourselves and round-trip through
-    /// `decrypt_aes_payload`. We don't depend on a known WeCom
-    /// fixture; instead we use the same `aes` + `cbc` crates the
-    /// production decrypt does, on a synthetic key, and assert the
-    /// shape comes back out cleanly.
-    fn synth_encrypt(msg: &str, corp_id: &str, key: &[u8; 32]) -> String {
-        use aes::cipher::{block_padding::NoPadding, BlockEncryptMut, KeyIvInit};
-        use base64::Engine;
-        type Aes256CbcEnc = cbc::Encryptor<aes::Aes256>;
-
-        let iv = &key[..16];
-        let mut payload = Vec::new();
-        payload.extend_from_slice(&[0u8; 16]); // random_16
-        payload.extend_from_slice(&(msg.len() as u32).to_be_bytes());
-        payload.extend_from_slice(msg.as_bytes());
-        payload.extend_from_slice(corp_id.as_bytes());
-        // Pad to 32 (PKCS#7 amounts to (32 - len%32) % 32 minimum 1).
-        let pad_len = 32 - (payload.len() % 32);
-        payload.extend_from_slice(&vec![pad_len as u8; pad_len]);
-        // Pre-allocate the buffer for `encrypt_padded_mut`.
-        let mut buf = payload.clone();
-        let cipher = Aes256CbcEnc::new_from_slices(key, iv).unwrap();
-        let n = cipher
-            .encrypt_padded_mut::<NoPadding>(&mut buf, payload.len())
-            .unwrap()
-            .len();
-        base64::engine::general_purpose::STANDARD.encode(&buf[..n])
-    }
-
-    fn synth_aes_key_b64(key: &[u8; 32]) -> String {
-        use base64::Engine;
-        // EncodingAESKey = first 43 chars of base64(key). The
-        // production decoder appends `=` itself.
-        let full = base64::engine::general_purpose::STANDARD.encode(key);
-        full.chars().take(43).collect()
-    }
-
-    #[test]
-    fn decrypt_round_trip_extracts_msg_and_validates_corpid() {
-        let key = [7u8; 32];
-        let aes_key_b64 = synth_aes_key_b64(&key);
-        let cipher = synth_encrypt("hello world", "ww-good-corp", &key);
-        let plain = decrypt_aes_payload(&aes_key_b64, &cipher, "ww-good-corp").unwrap();
-        assert_eq!(plain, "hello world");
-    }
-
-    #[test]
-    fn decrypt_rejects_wrong_corp_id() {
-        let key = [7u8; 32];
-        let aes_key_b64 = synth_aes_key_b64(&key);
-        let cipher = synth_encrypt("hi", "ww-actual", &key);
-        let err = decrypt_aes_payload(&aes_key_b64, &cipher, "ww-different").unwrap_err();
-        assert!(err.contains("receive_id mismatch"), "got: {err}");
-    }
-
-    #[test]
-    fn decrypt_rejects_invalid_base64() {
-        // Use a valid AES key first (so we reach the ciphertext
-        // decode), then feed garbage that base64 can't parse.
-        let key = [11u8; 32];
-        let aes_key_b64 = synth_aes_key_b64(&key);
-        let err = decrypt_aes_payload(&aes_key_b64, "@@@not-base64@@@", "ww").unwrap_err();
-        assert!(err.contains("ciphertext not valid base64"), "got: {err}");
-    }
-
-    #[test]
-    fn decrypt_rejects_short_aes_key() {
-        // EncodingAESKey of 30 chars decodes to ~22 bytes, not 32.
-        let err = decrypt_aes_payload(&"a".repeat(30), "AAAA", "ww").unwrap_err();
-        assert!(err.contains("expected 32") || err.contains("not valid base64"));
-    }
-
-    #[test]
-    fn decrypt_rejects_truncated_plaintext() {
-        // A ciphertext that decrypts to fewer than 20 bytes (the
-        // header alone) should be rejected.
-        use aes::cipher::{block_padding::NoPadding, BlockEncryptMut, KeyIvInit};
-        use base64::Engine;
-        type Aes256CbcEnc = cbc::Encryptor<aes::Aes256>;
-        let key = [9u8; 32];
-        let iv = &key[..16];
-        // 16 bytes total: just one block padded with PKCS#7. After
-        // strip we'd have <20 bytes, triggering the length check.
-        let payload = b"123456789012345"; // 15 bytes; pad to 16 with 1 byte of pad
-        let mut padded = payload.to_vec();
-        padded.push(1u8); // 1 byte of pad
-        let mut buf = padded.clone();
-        let cipher = Aes256CbcEnc::new_from_slices(&key, iv).unwrap();
-        let n = cipher
-            .encrypt_padded_mut::<NoPadding>(&mut buf, padded.len())
-            .unwrap()
-            .len();
-        let cipher_b64 = base64::engine::general_purpose::STANDARD.encode(&buf[..n]);
-        let err =
-            decrypt_aes_payload(&synth_aes_key_b64(&key), &cipher_b64, "ww").unwrap_err();
-        assert!(err.contains("plaintext too short"), "got: {err}");
-    }
 
     #[test]
     fn parse_inbound_xml_text_message() {
diff --git a/crates/harness-server/src/channels_wecom_app/oauth.rs b/crates/harness-server/src/channels_wecom_app/oauth.rs
new file mode 100644
index 0000000..66b889c
--- /dev/null
+++ b/crates/harness-server/src/channels_wecom_app/oauth.rs
@@ -0,0 +1,391 @@
+//! OAuth2 免登 (snsapi_base) — terminal-user identity verification.
+//!
+//! WeCom's snsapi_base scope returns a `userid` after a silent in-client
+//! authorisation. We use it for "click here to verify who you are" links
+//! the bot can post into a chat, or for the `/v1/channels/:id/oauth/start`
+//! + `/oauth/callback` redirect pair.
+//!
+//! State is HMAC-SHA1 signed against the instance's `token` field — same
+//! secret the inbound verify uses — so we don't need a server-side state
+//! store. The signed payload carries `instance_id`, an expiry timestamp,
+//! and a random nonce. Verification compares the signature in constant
+//! time, then parses the payload and validates instance binding + expiry.
+//!
+//! Reference: <https://developer.work.weixin.qq.com/document/path/91022>
+
+use serde::Deserialize;
+
+use super::crypto::constant_time_eq;
+use super::{urlencoding_minimal, WECOM_API_BASE};
+
+/// `snsapi_base` returns just the `userid` silently — no popup in the
+/// WeCom client when the user is already logged in. `snsapi_privateinfo`
+/// additionally surfaces name / avatar / mobile via a `user_ticket`, but
+/// it triggers a confirmation prompt and requires extra app permissions.
+/// v1 ships only `Base` — it's the minimum that proves identity.
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub(crate) enum OAuthScope {
+    Base,
+}
+
+impl OAuthScope {
+    fn as_wire(self) -> &'static str {
+        match self {
+            Self::Base => "snsapi_base",
+        }
+    }
+}
+
+/// Build the WeCom OAuth2 authorize URL. `redirect_uri` is treated as
+/// opaque and URL-encoded verbatim — the operator is responsible for
+/// whitelisting its domain in the WeCom admin's "可信域名".
+///
+/// `#wechat_redirect` is mandatory per WeCom's docs; without it the
+/// authorize page renders blank inside the WeCom client.
+pub(crate) fn oauth_authorize_url(
+    corp_id: &str,
+    agent_id: u64,
+    redirect_uri: &str,
+    state: &str,
+    scope: OAuthScope,
+) -> String {
+    format!(
+        "https://open.weixin.qq.com/connect/oauth2/authorize\
+         ?appid={appid}\
+         &redirect_uri={redirect}\
+         &response_type=code\
+         &scope={scope}\
+         &state={state}\
+         &agentid={agentid}#wechat_redirect",
+        appid = urlencoding_minimal(corp_id),
+        redirect = urlencoding_minimal(redirect_uri),
+        scope = scope.as_wire(),
+        state = urlencoding_minimal(state),
+        agentid = agent_id,
+    )
+}
+
+/// Decoded state payload after signature verification. The fields are
+/// the contract between `make_oauth_state` and `verify_oauth_state` —
+/// keep them additive-only or version the payload.
+#[derive(Debug, Clone, serde::Serialize, serde::Deserialize, PartialEq, Eq)]
+pub(crate) struct OAuthStateClaims {
+    /// Channel-instance id this state belongs to. The callback route
+    /// uses this to cross-check the `:id` path parameter.
+    pub(crate) instance_id: String,
+    /// Unix seconds after which the state is invalid. Typically now +
+    /// 10 minutes — long enough for a slow tap, short enough that a
+    /// stolen state ages out before being useful.
+    pub(crate) exp: u64,
+    /// 16-byte hex random — makes each signed blob unique and opaque.
+    /// Nothing in this file records used nonces: replay is bounded by `exp`.
+    pub(crate) nonce: String,
+    /// Optional caller-supplied opaque field. Often a Jarvis session
+    /// id, a `next=` URL hint, or a pairing token — the callback
+    /// surfaces this verbatim so the originator can correlate.
+    #[serde(default, skip_serializing_if = "Option::is_none")]
+    pub(crate) ctx: Option<String>,
+}
+
+/// Sign a fresh state token. The `token` argument is the same value
+/// configured on the `ChannelInstance` for inbound verify (`config.token`
+/// — operator-chosen, kept secret) so we don't need a dedicated
+/// signing key.
+pub(crate) fn make_oauth_state(
+    instance_id: &str,
+    instance_token: &str,
+    ttl_secs: u64,
+    ctx: Option<&str>,
+    nonce_hex: &str,
+    now_unix: u64,
+) -> Result<String, String> {
+    use base64::Engine;
+    if instance_token.is_empty() {
+        return Err("instance token is empty — cannot sign OAuth state".to_string());
+    }
+    let claims = OAuthStateClaims {
+        instance_id: instance_id.to_string(),
+        exp: now_unix.saturating_add(ttl_secs),
+        nonce: nonce_hex.to_string(),
+        ctx: ctx.map(str::to_string),
+    };
+    let json = serde_json::to_vec(&claims).map_err(|e| format!("state encode: {e}"))?;
+    let b64 = base64::engine::general_purpose::URL_SAFE_NO_PAD.encode(&json);
+    let sig = oauth_state_sig(&b64, instance_token);
+    Ok(format!("{b64}.{sig}"))
+}
+
+/// Verify + decode a state token. Returns the claims (CSRF passed and
+/// not expired) or an operator-readable error.
+///
+/// Step order matters:
+/// 1. Refuse an empty `instance_token` — that HMAC is publicly computable
+/// 2. Split on `.`, recompute sig, constant-time compare — catches tampering
+/// 3. Decode payload, parse JSON, cross-check `instance_id` vs the route `:id`
+/// 4. Check expiry against the caller-supplied `now_unix`
+pub(crate) fn verify_oauth_state(
+    state: &str,
+    expected_instance: &str,
+    instance_token: &str,
+    now_unix: u64,
+) -> Result<OAuthStateClaims, String> {
+    use base64::{engine::general_purpose::URL_SAFE_NO_PAD, Engine};
+    if instance_token.is_empty() {
+        return Err("instance token is empty — cannot verify OAuth state".to_string());
+    }
+    let (b64, sig) = state.split_once('.').ok_or("state missing signature")?;
+    if b64.is_empty() || sig.is_empty() {
+        return Err("state malformed".to_string());
+    }
+    let expected_sig = oauth_state_sig(b64, instance_token);
+    if !constant_time_eq(sig.as_bytes(), expected_sig.as_bytes()) {
+        return Err("state signature mismatch".to_string());
+    }
+    let raw = URL_SAFE_NO_PAD.decode(b64).map_err(|e| format!("state base64: {e}"))?;
+    let claims: OAuthStateClaims =
+        serde_json::from_slice(&raw).map_err(|e| format!("state json: {e}"))?;
+    if claims.instance_id != expected_instance {
+        return Err("state instance_id mismatch".to_string());
+    }
+    if claims.exp < now_unix {
+        return Err("state expired".to_string());
+    }
+    Ok(claims)
+}
+
+/// HMAC-SHA1 of the state payload keyed by the instance token. Output
+/// is the 40-char lowercase hex digest. WeCom's own callback signatures
+/// (handled outside this file) are plain `sha1(concat)` — we use HMAC
+/// here because the token is a true secret (operator-chosen) and HMAC
+/// is the standard CSRF-token construction; plain SHA1 of
+/// `token + payload` is vulnerable to length-extension on hypothetical
+/// inputs we don't fully control.
+fn oauth_state_sig(payload_b64: &str, instance_token: &str) -> String {
+    use hmac::{Hmac, Mac};
+    use sha1::Sha1;
+    type HmacSha1 = Hmac<Sha1>;
+    let mut mac =
+        HmacSha1::new_from_slice(instance_token.as_bytes()).expect("HMAC accepts any key length");
+    mac.update(payload_b64.as_bytes());
+    let bytes = mac.finalize().into_bytes();
+    const HEX: &[u8; 16] = b"0123456789abcdef"; // nibble → lowercase hex digit
+    let mut out = String::with_capacity(40); // 20-byte SHA-1 digest → 40 hex chars
+    for b in bytes {
+        out.push(HEX[(b >> 4) as usize] as char);
+        out.push(HEX[(b & 0x0f) as usize] as char);
+    }
+    out
+}
+
+/// Exchange the `code` returned by WeCom for the user's `userid` via
+/// `cgi-bin/auth/getuserinfo`, authorised by the app-level `access_token`
+/// from [`super::token::ensure_token`]. The request is capped at 10 s.
+///
+/// WeCom returns `{errcode:0, errmsg:"ok", userid:"..."}` on success.
+/// `external_userid` and `user_ticket` are surfaced when non-empty. Errors
+/// are operator-readable strings that never embed the request URL.
+pub(crate) async fn exchange_code_for_userid(
+    access_token: &str,
+    code: &str,
+) -> Result<OAuthUserInfo, String> {
+    let url = format!(
+        "{WECOM_API_BASE}/cgi-bin/auth/getuserinfo?access_token={}&code={}",
+        urlencoding_minimal(access_token),
+        urlencoding_minimal(code),
+    );
+    // reqwest errors print the URL (token + code) by default — strip it.
+    let resp = reqwest::Client::new()
+        .get(&url)
+        .timeout(std::time::Duration::from_secs(10))
+        .send()
+        .await
+        .map_err(|e| format!("getuserinfo http: {}", e.without_url()))?;
+    let parsed: GetUserInfoReply = resp
+        .json()
+        .await
+        .map_err(|e| format!("getuserinfo json: {}", e.without_url()))?;
+    if parsed.errcode != 0 {
+        return Err(format!(
+            "wecom getuserinfo failed: errcode={} errmsg={}",
+            parsed.errcode, parsed.errmsg
+        ));
+    }
+    // A corp member returns `userid`; a non-corp visitor returns `openid` +
+    // `external_userid` instead. v1 only supports corp members — surface the
+    // visitor case as a clear error rather than silently dropping them.
+    let userid = parsed
+        .userid
+        .filter(|s| !s.is_empty())
+        .ok_or_else(|| "wecom oauth: not a corp member (no userid)".to_string())?;
+    Ok(OAuthUserInfo {
+        userid,
+        external_userid: parsed.external_userid.filter(|s| !s.is_empty()),
+        user_ticket: parsed.user_ticket.filter(|s| !s.is_empty()),
+    })
+}
+
+/// Subset of the `getuserinfo` reply we care about. The other fields
+/// (`openid`, `device_id`) we ignore — see WeCom's docs if a future
+/// feature needs them.
+#[derive(Debug, Deserialize)]
+struct GetUserInfoReply {
+    errcode: i64,
+    #[serde(default)]
+    errmsg: String,
+    #[serde(default)]
+    userid: Option<String>,
+    #[serde(default)]
+    external_userid: Option<String>,
+    #[serde(default)]
+    user_ticket: Option<String>,
+}
+
+#[derive(Debug, Clone, PartialEq, Eq)]
+pub(crate) struct OAuthUserInfo {
+    pub(crate) userid: String, // never empty: the exchange rejects replies without it
+    /// External-contact id, kept when the reply carries a non-empty one.
+    /// Replies without `userid` are rejected before this struct is built;
+    /// the field exists so future features need no wire change.
+    pub(crate) external_userid: Option<String>,
+    /// Set only with `snsapi_privateinfo` scope. Used to call
+    /// `cgi-bin/auth/getuserdetail` for name / mobile. `None` for
+    /// snsapi_base.
+    pub(crate) user_ticket: Option<String>,
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn oauth_authorize_url_has_required_params_and_hash() {
+        let url = oauth_authorize_url(
+            "ww-corp",
+            1_000_002,
+            "https://abc.example/v1/channels/xyz/oauth/callback",
+            "state-token-abc",
+            OAuthScope::Base,
+        );
+        // All of WeCom's required parameters present.
+        assert!(url.contains("appid=ww-corp"));
+        assert!(url.contains(
+            "redirect_uri=https%3A%2F%2Fabc.example%2Fv1%2Fchannels%2Fxyz%2Foauth%2Fcallback"
+        ));
+        assert!(url.contains("response_type=code"));
+        assert!(url.contains("scope=snsapi_base"));
+        assert!(url.contains("state=state-token-abc"));
+        assert!(url.contains("agentid=1000002"));
+        // The `#wechat_redirect` fragment is mandatory — without it
+        // WeCom client renders blank.
+        assert!(url.ends_with("#wechat_redirect"));
+        // No accidental newlines / whitespace from the format string.
+        assert!(!url.contains(' '));
+        assert!(!url.contains('\n'));
+    }
+
+    #[test]
+    fn oauth_state_round_trip_decodes_claims() {
+        let state = make_oauth_state(
+            "inst-1",
+            "token-secret",
+            600,
+            Some("session=abc"),
+            "deadbeefcafebabe",
+            1_700_000_000,
+        )
+        .expect("sign ok");
+        let claims = verify_oauth_state(&state, "inst-1", "token-secret", 1_700_000_100)
+            .expect("verify ok");
+        assert_eq!(claims.instance_id, "inst-1");
+        assert_eq!(claims.exp, 1_700_000_600);
+        assert_eq!(claims.nonce, "deadbeefcafebabe");
+        assert_eq!(claims.ctx.as_deref(), Some("session=abc"));
+    }
+
+    #[test]
+    fn oauth_state_rejects_tampered_payload() {
+        let state = make_oauth_state(
+            "inst-1",
+            "token-secret",
+            600,
+            None,
+            "nonce123",
+            1_700_000_000,
+        )
+        .unwrap();
+        // Flip a payload byte (but keep the signature) → signature
+        // mismatch.
+        let (payload, sig) = state.split_once('.').unwrap();
+        let mut bad_payload = payload.to_string();
+        let last = bad_payload.pop().unwrap();
+        // Replace last char with something different.
+        bad_payload.push(if last == 'A' { 'B' } else { 'A' });
+        let tampered = format!("{bad_payload}.{sig}");
+        let err = verify_oauth_state(&tampered, "inst-1", "token-secret", 1_700_000_100)
+            .expect_err("must reject");
+        assert!(err.contains("signature"));
+    }
+
+    #[test]
+    fn oauth_state_rejects_wrong_instance_id() {
+        let state = make_oauth_state(
+            "inst-A",
+            "token-secret",
+            600,
+            None,
+            "nonce123",
+            1_700_000_000,
+        )
+        .unwrap();
+        let err = verify_oauth_state(&state, "inst-B", "token-secret", 1_700_000_100)
+            .expect_err("must reject");
+        assert!(err.contains("instance_id"));
+    }
+
+    #[test]
+    fn oauth_state_rejects_expired() {
+        let state = make_oauth_state(
+            "inst-1",
+            "token-secret",
+            60,
+            None,
+            "nonce123",
+            1_700_000_000,
+        )
+        .unwrap();
+        // 70 seconds later — exp = 1_700_000_060, now = 1_700_000_070.
+        let err = verify_oauth_state(&state, "inst-1", "token-secret", 1_700_000_070)
+            .expect_err("must reject");
+        assert!(err.contains("expired"));
+    }
+
+    #[test]
+    fn oauth_state_rejects_missing_signature() {
+        // No period at all.
+        let err = verify_oauth_state("aGVsbG8", "inst-1", "token-secret", 1_700_000_000)
+            .expect_err("must reject");
+        assert!(err.contains("missing signature"));
+        // Empty signature segment.
+        let err = verify_oauth_state("aGVsbG8.", "inst-1", "token-secret", 1_700_000_000)
+            .expect_err("must reject");
+        assert!(err.contains("malformed"));
+    }
+
+    #[test]
+    fn oauth_state_refuses_empty_token() {
+        let err = make_oauth_state("inst-1", "", 600, None, "nonce", 1_700_000_000)
+            .expect_err("must reject");
+        assert!(err.contains("token"));
+    }
+
+    #[test]
+    fn oauth_state_sig_differs_per_token_value() {
+        // Two distinct tokens MUST produce distinct signatures over
+        // the same payload, otherwise the CSRF gate is decorative.
+        let s1 = oauth_state_sig("payload", "token-A");
+        let s2 = oauth_state_sig("payload", "token-B");
+        assert_ne!(s1, s2);
+        // And the same input is deterministic.
+        assert_eq!(s1, oauth_state_sig("payload", "token-A"));
+    }
+}
diff --git a/crates/harness-server/src/channels_wecom_app/token.rs b/crates/harness-server/src/channels_wecom_app/token.rs
new file mode 100644
index 0000000..66f3173
--- /dev/null
+++ b/crates/harness-server/src/channels_wecom_app/token.rs
@@ -0,0 +1,250 @@
+//! Access-token cache and fetch — the credentials half of WeCom
+//! 自建应用 outbound.
+//!
+//! WeCom's self-built apps authenticate every API call with a short-
+//! lived `access_token` derived from `corp_id + corp_secret`:
+//!
+//! ```text
+//! GET /cgi-bin/gettoken?corpid=...&corpsecret=...
+//!   → { errcode:0, access_token:"...", expires_in:7200 }
+//! ```
+//!
+//! A token is good for ~2h. The cache here is a process-level
+//! `HashMap<corp_id, CachedToken>` so multiple `ChannelInstance` rows
+//! sharing the same corp don't each burn an `expires_in` budget
+//! (WeCom enforces ~2000 gettoken calls/day per corp).
+//!
+//! `ensure_token` is the single externally-visible entry point —
+//! also called by the OAuth callback handler in
+//! [`super::oauth`](super::oauth) to authorise its `getuserinfo`
+//! exchange.
+
+use harness_channel::SendOutcome;
+use serde::Deserialize;
+use std::collections::HashMap;
+use std::sync::RwLock;
+use std::time::{Duration, Instant};
+
+use super::{urlencoding_minimal, WECOM_API_BASE};
+
+/// How early to refresh `access_token` before its declared
+/// `expires_in`. WeCom hands out 7200-second tokens; refreshing 5
+/// minutes before keeps every send well clear of the boundary.
+const TOKEN_REFRESH_LEAD_SECS: u64 = 300;
+
+#[derive(Debug, Clone)]
+struct CachedToken {
+    token: String,
+    expires_at: Instant,
+}
+
+/// Process-level cache, keyed by `corp_id`: one `RwLock<HashMap>` per
+/// binary so `ChannelInstance` rows with the same `corp_id` share a
+/// token and stay under WeCom's gettoken quota. NOTE(review): WeCom
+/// docs describe `access_token` as per-app (corpid + that app's secret);
+/// two apps in one corp would collide on this key — confirm the keying.
+#[derive(Default)]
+pub(super) struct AccessTokenCache {
+    inner: RwLock<HashMap<String, CachedToken>>,
+}
+
+impl AccessTokenCache {
+    pub(super) fn get(&self, corp_id: &str) -> Option<String> {
+        let g = self.inner.read().ok()?;
+        let cached = g.get(corp_id)?;
+        if Instant::now() < cached.expires_at {
+            Some(cached.token.clone())
+        } else {
+            None
+        }
+    }
+
+    pub(super) fn set(&self, corp_id: &str, token: String, ttl_secs: u64) {
+        let safe_ttl = ttl_secs.saturating_sub(TOKEN_REFRESH_LEAD_SECS);
+        let expires_at = Instant::now() + Duration::from_secs(safe_ttl);
+        if let Ok(mut g) = self.inner.write() {
+            g.insert(
+                corp_id.to_string(),
+                CachedToken {
+                    token,
+                    expires_at,
+                },
+            );
+        }
+    }
+
+    pub(super) fn invalidate(&self, corp_id: &str) {
+        if let Ok(mut g) = self.inner.write() {
+            g.remove(corp_id);
+        }
+    }
+}
+
+/// Singleton — every `WeComAppAdapter` invocation hits the same
+/// cache so deployments with multiple instances behind one
+/// `corp_id` share tokens. Lazy-init via `OnceLock`.
+pub(super) fn token_cache() -> &'static AccessTokenCache {
+    static CACHE: std::sync::OnceLock<AccessTokenCache> = std::sync::OnceLock::new();
+    CACHE.get_or_init(AccessTokenCache::default)
+}
+
+/// Reset helper for tests — never called from production code.
+#[cfg(test)]
+pub(super) fn reset_token_cache() {
+    if let Ok(mut g) = token_cache().inner.write() {
+        g.clear();
+    }
+}
+
+/// Return a token from the cache, fetching one when missing /
+/// expired / `force_refresh = true`. Externally reachable
+/// (`pub(crate)`) because [`super::oauth`](super::oauth) needs it
+/// for the OAuth code exchange.
+pub(crate) async fn ensure_token(
+    corp_id: &str,
+    corp_secret: &str,
+    force_refresh: bool,
+) -> Result<String, SendOutcome> {
+    if !force_refresh {
+        if let Some(t) = token_cache().get(corp_id) {
+            return Ok(t);
+        }
+    }
+    fetch_token(corp_id, corp_secret).await
+}
+
+#[derive(Debug, Deserialize)]
+struct GetTokenReply {
+    errcode: i64,
+    #[serde(default)]
+    errmsg: String,
+    #[serde(default)]
+    access_token: String,
+    #[serde(default)]
+    expires_in: u64,
+}
+
+/// Fetch a fresh access_token. Cache populated on success. reqwest
+/// errors are stripped of their URL first — it embeds `corpsecret`.
+async fn fetch_token(corp_id: &str, corp_secret: &str) -> Result<String, SendOutcome> {
+    let url = format!(
+        "{WECOM_API_BASE}/cgi-bin/gettoken?corpid={}&corpsecret={}",
+        urlencoding_minimal(corp_id),
+        urlencoding_minimal(corp_secret),
+    );
+    let client = match reqwest::Client::builder()
+        .timeout(Duration::from_secs(10))
+        .build()
+    {
+        Ok(c) => c,
+        Err(e) => {
+            return Err(SendOutcome::fail_retryable(format!(
+                "HTTP client init: {e}"
+            )))
+        }
+    };
+    let resp = match client.get(&url).send().await {
+        Ok(r) => r,
+        Err(e) => {
+            let e = e.without_url();
+            return Err(SendOutcome::fail_retryable(format!("gettoken transport: {e}")));
+        }
+    };
+    let status = resp.status();
+    let raw = match resp.text().await {
+        Ok(t) => t,
+        Err(e) => {
+            return Err(SendOutcome::Failed {
+                message: format!("gettoken reply unreadable: {}", e.without_url()),
+                code: Some("wecom_app:gettoken_reply_unreadable".into()),
+                retryable: false,
+            });
+        }
+    };
+    if !status.is_success() {
+        return Err(SendOutcome::Failed {
+            message: format!("gettoken HTTP {}: {raw}", status.as_u16()),
+            code: Some(format!("wecom_app:gettoken_http_{}", status.as_u16())),
+            retryable: status.is_server_error(),
+        });
+    }
+    let parsed: GetTokenReply = match serde_json::from_str(&raw) {
+        Ok(p) => p,
+        Err(e) => {
+            return Err(SendOutcome::Failed {
+                message: format!("gettoken parse: {e}: {raw}"),
+                code: Some("wecom_app:gettoken_reply_parse".into()),
+                retryable: false,
+            });
+        }
+    };
+    if parsed.errcode != 0 || parsed.access_token.is_empty() {
+        return Err(SendOutcome::Failed {
+            message: format!(
+                "gettoken errcode {}: {}",
+                parsed.errcode, parsed.errmsg
+            ),
+            code: Some(format!("wecom_app:gettoken_errcode_{}", parsed.errcode)),
+            retryable: false,
+        });
+    }
+    token_cache().set(corp_id, parsed.access_token.clone(), parsed.expires_in);
+    Ok(parsed.access_token)
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    // All four cache tests touch the same process-level
+    // `token_cache()` singleton. Cargo runs tests in parallel by
+    // default, so we serialise just this group with a local mutex —
+    // simpler than dragging `serial_test` into the workspace deps
+    // and the cost is negligible (4 tests, each <2 ms).
+    fn cache_test_lock() -> &'static std::sync::Mutex<()> {
+        static LOCK: std::sync::OnceLock<std::sync::Mutex<()>> = std::sync::OnceLock::new();
+        LOCK.get_or_init(|| std::sync::Mutex::new(()))
+    }
+
+    #[test]
+    fn token_cache_stores_and_returns_within_ttl() {
+        let _g = cache_test_lock().lock().unwrap();
+        reset_token_cache();
+        let cache = token_cache();
+        cache.set("corp-A", "tok-1".into(), 7200);
+        assert_eq!(cache.get("corp-A"), Some("tok-1".into()));
+    }
+
+    #[test]
+    fn token_cache_treats_short_ttl_as_expired_via_lead() {
+        let _g = cache_test_lock().lock().unwrap();
+        reset_token_cache();
+        let cache = token_cache();
+        cache.set("corp-B", "tok-2".into(), 30); // shorter than 300s lead
+        // Cache stores expires_at = now() + 0s (saturating sub),
+        // already in the past by the time `get` runs.
+        std::thread::sleep(std::time::Duration::from_millis(2));
+        assert_eq!(cache.get("corp-B"), None);
+    }
+
+    #[test]
+    fn token_cache_invalidate_drops_entry() {
+        let _g = cache_test_lock().lock().unwrap();
+        reset_token_cache();
+        let cache = token_cache();
+        cache.set("corp-C", "tok-3".into(), 7200);
+        cache.invalidate("corp-C");
+        assert_eq!(cache.get("corp-C"), None);
+    }
+
+    #[test]
+    fn token_cache_keys_by_corp_id() {
+        let _g = cache_test_lock().lock().unwrap();
+        reset_token_cache();
+        let cache = token_cache();
+        cache.set("corp-D", "tok-D".into(), 7200);
+        cache.set("corp-E", "tok-E".into(), 7200);
+        assert_eq!(cache.get("corp-D").as_deref(), Some("tok-D"));
+        assert_eq!(cache.get("corp-E").as_deref(), Some("tok-E"));
+    }
+}
diff --git a/crates/harness-server/src/diagnostics_routes.rs b/crates/harness-server/src/diagnostics_routes.rs
index deed263..cea265b 100644
--- a/crates/harness-server/src/diagnostics_routes.rs
+++ b/crates/harness-server/src/diagnostics_routes.rs
@@ -36,6 +36,87 @@ pub(crate) fn router() -> Router<AppState> {
         .route("/v1/diagnostics/runs/stuck", get(list_stuck_runs))
         .route("/v1/diagnostics/runs/failed", get(list_failed_runs))
         .route("/v1/diagnostics/runs/recent", get(list_recent_runs))
+        .route("/v1/diagnostics/memory", get(get_memory_stats))
+}
+
+/// P8 — `GET /v1/diagnostics/memory`. Returns the active memory
+/// backend's telemetry counters (compaction count, cache hits,
+/// circuit-breaker trips, PTL frequency) as a JSON object. 503
+/// when no stats provider is configured — typically because the
+/// binary is running with `SlidingWindowMemory` (no internal
+/// counters) or memory was disabled entirely.
+async fn get_memory_stats(
+    axum::extract::State(state): axum::extract::State<AppState>,
+) -> Response {
+    match state.memory_stats.as_ref() {
+        Some(provider) => Json(provider.snapshot()).into_response(),
+        None => (
+            StatusCode::SERVICE_UNAVAILABLE,
+            Json(json!({ "error": "memory stats provider not configured" })),
+        )
+            .into_response(),
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use harness_core::MemoryStatsProvider;
+    use std::sync::Arc;
+
+    struct StubLlm;
+    #[async_trait::async_trait]
+    impl harness_core::LlmProvider for StubLlm {
+        async fn complete(
+            &self,
+            _: harness_core::ChatRequest,
+        ) -> Result<harness_core::ChatResponse, harness_core::Error> {
+            Err(harness_core::Error::Provider("stub".into()))
+        }
+    }
+
+    fn stub_state() -> AppState {
+        use harness_core::{Agent, AgentConfig};
+        let cfg = AgentConfig::new("stub-model");
+        let agent = Arc::new(Agent::new(Arc::new(StubLlm) as _, cfg));
+        AppState::new(agent)
+    }
+
+    async fn read_json(resp: Response) -> serde_json::Value {
+        let bytes = axum::body::to_bytes(resp.into_body(), 64 * 1024)
+            .await
+            .unwrap();
+        serde_json::from_slice(&bytes).unwrap()
+    }
+
+    struct StaticProvider(serde_json::Value);
+    impl MemoryStatsProvider for StaticProvider {
+        fn snapshot(&self) -> serde_json::Value {
+            self.0.clone()
+        }
+    }
+
+    #[tokio::test]
+    async fn memory_stats_returns_503_when_unconfigured() {
+        let state = stub_state();
+        let resp = get_memory_stats(axum::extract::State(state)).await;
+        assert_eq!(resp.status(), StatusCode::SERVICE_UNAVAILABLE);
+        let body = read_json(resp).await;
+        assert!(body["error"].as_str().unwrap().contains("not configured"));
+    }
+
+    #[tokio::test]
+    async fn memory_stats_returns_snapshot_when_configured() {
+        let provider: Arc<dyn MemoryStatsProvider> = Arc::new(StaticProvider(json!({
+            "backend": "summarizing",
+            "compactions_total": 42,
+        })));
+        let state = stub_state().with_memory_stats(provider);
+        let resp = get_memory_stats(axum::extract::State(state)).await;
+        let body = read_json(resp).await;
+        assert_eq!(body["backend"], "summarizing");
+        assert_eq!(body["compactions_total"], 42);
+    }
 }
 
 #[allow(clippy::result_large_err)]
diff --git a/crates/harness-server/src/lib.rs b/crates/harness-server/src/lib.rs
index 3f7a439..6c5db59 100644
--- a/crates/harness-server/src/lib.rs
+++ b/crates/harness-server/src/lib.rs
@@ -58,7 +58,9 @@ mod state;
 pub mod state_layers;
 mod subagent_runs;
 mod subagent_runs_routes;
+mod memory_sync_routes;
 mod subagents_routes;
+mod tasks_routes;
 mod todo_binder;
 mod todos_routes;
 mod ui;
@@ -80,7 +82,7 @@ pub use requirements_routes::sweep_orphan_requirements_on_startup;
 pub use route_policy::{ModelRoutePolicy, ModelTarget, RouteSlot};
 pub use routes::router;
 pub use subagent_runs::{SubAgentRunRecord, SubAgentRunRegistry, SubAgentRunStatus};
-pub use state::{AppState, ServerInfo, TelemetryStatus};
+pub use state::{AppState, MemoryRuntime, ServerInfo, TelemetryStatus};
 
 // Re-export so binaries can construct stores / modes without depending
 // on harness-core directly when they only need the permission types.
diff --git a/crates/harness-server/src/market_routes.rs b/crates/harness-server/src/market_routes.rs
index 6377e5a..374ee66 100644
--- a/crates/harness-server/src/market_routes.rs
+++ b/crates/harness-server/src/market_routes.rs
@@ -21,6 +21,7 @@ use serde::{Deserialize, Serialize};
 use serde_json::{json, Value};
 
 use crate::state::AppState;
+use crate::state_layers::SkillsLayer;
 
 const MCP_REGISTRY_URL: &str = "https://registry.modelcontextprotocol.io/v0.1/servers";
 const SKILLS_SH_URL: &str = "https://skills.sh";
@@ -89,8 +90,8 @@ struct InstallSkillRequest {
 }
 
 #[allow(clippy::result_large_err)]
-fn require_catalog(state: &AppState) -> Result<Arc<RwLock<SkillCatalog>>, Response> {
-    state.skills.clone().ok_or_else(|| {
+fn require_catalog(skills: &SkillsLayer) -> Result<Arc<RwLock<SkillCatalog>>, Response> {
+    skills.catalog.clone().ok_or_else(|| {
         (
             StatusCode::SERVICE_UNAVAILABLE,
             Json(json!({ "error": "skill catalogue not configured" })),
@@ -100,8 +101,8 @@ fn require_catalog(state: &AppState) -> Result<Arc<RwLock<SkillCatalog>>, Respon
 }
 
 #[allow(clippy::result_large_err)]
-fn require_user_skill_dir(state: &AppState) -> Result<PathBuf, Response> {
-    state.user_skills_dir.clone().ok_or_else(|| {
+fn require_user_skill_dir(skills: &SkillsLayer) -> Result<PathBuf, Response> {
+    skills.user_dir.clone().ok_or_else(|| {
         (
             StatusCode::SERVICE_UNAVAILABLE,
             Json(json!({ "error": "user skill directory not configured" })),
@@ -172,14 +173,14 @@ async fn search_skills(Query(q): Query<MarketQuery>) -> Response {
 }
 
 async fn install_skill(
-    State(state): State<AppState>,
+    State(skills): State<SkillsLayer>,
     Json(req): Json<InstallSkillRequest>,
 ) -> Response {
-    let catalog = match require_catalog(&state) {
+    let catalog = match require_catalog(&skills) {
         Ok(c) => c,
         Err(r) => return r,
     };
-    let user_dir = match require_user_skill_dir(&state) {
+    let user_dir = match require_user_skill_dir(&skills) {
         Ok(d) => d,
         Err(r) => return r,
     };
diff --git a/crates/harness-server/src/mcp_routes.rs b/crates/harness-server/src/mcp_routes.rs
index 5092468..89dd75c 100644
--- a/crates/harness-server/src/mcp_routes.rs
+++ b/crates/harness-server/src/mcp_routes.rs
@@ -23,6 +23,7 @@ use serde_json::json;
 use std::sync::Arc;
 
 use crate::state::AppState;
+use crate::state_layers::McpLayer;
 
 pub fn router() -> Router<AppState> {
     Router::new()
@@ -36,8 +37,8 @@ pub fn router() -> Router<AppState> {
 }
 
 #[allow(clippy::result_large_err)]
-fn require_mcp(state: &AppState) -> Result<Arc<McpManager>, Response> {
-    state.mcp.clone().ok_or_else(|| {
+fn require_mcp(mcp: &McpLayer) -> Result<Arc<McpManager>, Response> {
+    mcp.manager.clone().ok_or_else(|| {
         (
             StatusCode::SERVICE_UNAVAILABLE,
             Json(json!({ "error": "mcp manager not configured" })),
@@ -46,8 +47,8 @@ fn require_mcp(state: &AppState) -> Result<Arc<McpManager>, Response> {
     })
 }
 
-async fn list(State(state): State<AppState>) -> Response {
-    let mcp = match require_mcp(&state) {
+async fn list(State(mcp): State<McpLayer>) -> Response {
+    let mcp = match require_mcp(&mcp) {
         Ok(m) => m,
         Err(r) => return r,
     };
@@ -55,8 +56,8 @@ async fn list(State(state): State<AppState>) -> Response {
     (StatusCode::OK, Json(json!({ "servers": servers }))).into_response()
 }
 
-async fn get_one(State(state): State<AppState>, Path(prefix): Path<String>) -> Response {
-    let mcp = match require_mcp(&state) {
+async fn get_one(State(mcp): State<McpLayer>, Path(prefix): Path<String>) -> Response {
+    let mcp = match require_mcp(&mcp) {
         Ok(m) => m,
         Err(r) => return r,
     };
@@ -70,8 +71,8 @@ async fn get_one(State(state): State<AppState>, Path(prefix): Path<String>) -> R
     }
 }
 
-async fn add(State(state): State<AppState>, Json(cfg): Json<McpClientConfig>) -> Response {
-    let mcp = match require_mcp(&state) {
+async fn add(State(mcp): State<McpLayer>, Json(cfg): Json<McpClientConfig>) -> Response {
+    let mcp = match require_mcp(&mcp) {
         Ok(m) => m,
         Err(r) => return r,
     };
@@ -94,11 +95,11 @@ async fn add(State(state): State<AppState>, Json(cfg): Json<McpClientConfig>) ->
 }
 
 async fn replace(
-    State(state): State<AppState>,
+    State(mcp): State<McpLayer>,
     Path(prefix): Path<String>,
     Json(mut cfg): Json<McpClientConfig>,
 ) -> Response {
-    let mcp = match require_mcp(&state) {
+    let mcp = match require_mcp(&mcp) {
         Ok(m) => m,
         Err(r) => return r,
     };
@@ -127,8 +128,8 @@ async fn replace(
     }
 }
 
-async fn remove(State(state): State<AppState>, Path(prefix): Path<String>) -> Response {
-    let mcp = match require_mcp(&state) {
+async fn remove(State(mcp): State<McpLayer>, Path(prefix): Path<String>) -> Response {
+    let mcp = match require_mcp(&mcp) {
         Ok(m) => m,
         Err(r) => return r,
     };
@@ -147,8 +148,8 @@ async fn remove(State(state): State<AppState>, Path(prefix): Path<String>) -> Re
     }
 }
 
-async fn health(State(state): State<AppState>, Path(prefix): Path<String>) -> Response {
-    let mcp = match require_mcp(&state) {
+async fn health(State(mcp): State<McpLayer>, Path(prefix): Path<String>) -> Response {
+    let mcp = match require_mcp(&mcp) {
         Ok(m) => m,
         Err(r) => return r,
     };
@@ -178,8 +179,8 @@ async fn health(State(state): State<AppState>, Path(prefix): Path<String>) -> Re
 /// server stalls or its child process crashed and the slot fell
 /// to `Unhealthy` / `Stopped`. Idempotent: hitting an already-
 /// running server is just a quick teardown + reconnect.
-async fn reload(State(state): State<AppState>, Path(prefix): Path<String>) -> Response {
-    let mcp = match require_mcp(&state) {
+async fn reload(State(mcp): State<McpLayer>, Path(prefix): Path<String>) -> Response {
+    let mcp = match require_mcp(&mcp) {
         Ok(m) => m,
         Err(r) => return r,
     };
diff --git a/crates/harness-server/src/memory_sync_routes.rs b/crates/harness-server/src/memory_sync_routes.rs
new file mode 100644
index 0000000..3c85e00
--- /dev/null
+++ b/crates/harness-server/src/memory_sync_routes.rs
@@ -0,0 +1,502 @@
+//! P14 — REST surface for the Settings → Memory Sync panel.
+//!
+//! The agent-side already has `memory.sync` / `memory.sync_setup` /
+//! `memory.sync_status` (P10/P11/P13). These REST endpoints expose
+//! the same operations to the Web UI so the operator can configure
+//! sync without going through the chat. They reuse the same tool
+//! impls under the hood — no duplicate logic.
+//!
+//! 503 is returned when:
+//! - `enable_memory` is off (no memory runtime, so no tree to sync)
+//! - the backend doesn't match the endpoint: `/sync` and `/sync_setup`
+//!   require `git`, `/sync_setup_icloud` requires `icloud`
+//! - NOTE(review): a missing `user_root` is not rejected anywhere in
+//!   this module — confirm the underlying tools handle it
+//!
+//! All write endpoints (`/sync`, `/sync_setup`) are intentionally
+//! NOT approval-gated at the REST layer — the operator is the one
+//! clicking, which is already an approval. The underlying tool
+//! invocations bypass the agent's approver because we're not in
+//! an agent run.
+
+use axum::{
+    extract::State,
+    http::StatusCode,
+    response::{IntoResponse, Response},
+    routing::{get, post},
+    Json, Router,
+};
+use axum::extract::Query;
+use harness_core::Tool;
+use harness_tools::{
+    memory_include_tools::{
+        MemoryIncludeAddTool, MemoryIncludeListTool, MemoryIncludeRefreshTool,
+        MemoryIncludeRemoveTool,
+    },
+    memory_sync::{MemoryICloudSetupTool, MemorySyncSetupTool, MemorySyncStatusTool, MemorySyncTool},
+    MemoryRoots, MemorySyncBackend,
+};
+use serde::Deserialize;
+use serde_json::{json, Value};
+
+use crate::state::AppState;
+
+/// Routes for the Settings → Memory Sync panel; merged into the main router.
+pub(crate) fn router() -> Router<AppState> {
+    // `/v1/memory/includes` serves three verbs: list, add and remove.
+    let includes = get(get_includes)
+        .post(post_include_add)
+        .delete(delete_include);
+    Router::new()
+        .route("/v1/memory/sync_status", get(get_status))
+        .route("/v1/memory/sync", post(post_sync))
+        .route("/v1/memory/sync_setup", post(post_setup_git))
+        .route("/v1/memory/sync_setup_icloud", post(post_setup_icloud))
+        .route("/v1/memory/includes", includes)
+        .route("/v1/memory/includes/refresh", post(post_include_refresh))
+}
+
+/// Assemble the [`MemoryRoots`] for one request from the runtime metadata
+/// in `state.memory_runtime`. Handlers call this per request and hand the
+/// result to a freshly constructed tool, so no per-tool handle has to live
+/// on `AppState`.
+///
+/// Returns a ready-made 503 response when no memory runtime is configured.
+#[allow(clippy::result_large_err)]
+fn roots_from_state(state: &AppState) -> Result<MemoryRoots, Response> {
+    let Some(runtime) = state.memory_runtime.as_ref() else {
+        let disabled = json!({
+            "error": "memory tools are not enabled — set JARVIS_ENABLE_MEMORY=1 and restart",
+        });
+        return Err((StatusCode::SERVICE_UNAVAILABLE, Json(disabled)).into_response());
+    };
+    let workspace_only = MemoryRoots::new(runtime.workspace_root.clone());
+    // The user root is optional; attach it only when one is configured.
+    Ok(match runtime.user_root.clone() {
+        Some(user) => workspace_only.with_user_root(user),
+        None => workspace_only,
+    })
+}
+
+/// Configured sync backend, or `MemorySyncBackend::None` when no runtime is set.
+fn backend(state: &AppState) -> MemorySyncBackend {
+    match state.memory_runtime.as_ref() {
+        Some(rt) => rt.backend,
+        None => MemorySyncBackend::None,
+    }
+}
+
+/// `GET /v1/memory/sync_status` — describe the current sync configuration.
+///
+/// Responds 503 (from `roots_from_state`) when no memory runtime is set.
+/// Otherwise replies with a JSON object holding `backend`, `user_root` and
+/// `workspace_root`, plus `user_scope` when the backend is Git or iCloud.
+/// `user_scope` is the status tool's output: its parsed JSON, `{ "raw": … }`
+/// if the output isn't JSON, or `{ "error": … }` if the tool call failed.
+async fn get_status(State(state): State<AppState>) -> Response {
+    let roots = match roots_from_state(&state) {
+        Ok(roots) => roots,
+        Err(unavailable) => return unavailable,
+    };
+    // `roots_from_state` succeeded, so the runtime is present from here
+    // on; the `Option` plumbing below just mirrors the field's type.
+    let runtime = state.memory_runtime.as_ref();
+    let active = backend(&state);
+    let user_root = runtime
+        .and_then(|rt| rt.user_root.as_ref())
+        .map(|path| path.display().to_string());
+    let workspace_root = runtime.map(|rt| rt.workspace_root.display().to_string());
+
+    let mut envelope = serde_json::Map::new();
+    envelope.insert("backend".into(), json!(active.as_wire()));
+    envelope.insert("user_root".into(), json!(user_root));
+    envelope.insert("workspace_root".into(), json!(workspace_root));
+
+    // Git and iCloud expose live per-scope details through the
+    // sync_status tool. It is invoked directly, not via the agent's
+    // tool registry, so the panel can read this with no agent run
+    // active. The match is kept exhaustive so that a new backend
+    // variant has to be handled here explicitly.
+    match active {
+        MemorySyncBackend::None => {}
+        MemorySyncBackend::Git | MemorySyncBackend::ICloud => {
+            let outcome = MemorySyncStatusTool::new(roots)
+                .invoke(json!({ "scope": "user" }))
+                .await;
+            let user_scope = match outcome {
+                Ok(body) => match serde_json::from_str::<Value>(&body) {
+                    Ok(parsed) => parsed,
+                    Err(_) => json!({ "raw": body }),
+                },
+                Err(e) => json!({ "error": e.to_string() }),
+            };
+            envelope.insert("user_scope".into(), user_scope);
+        }
+    }
+
+    Json(Value::Object(envelope)).into_response()
+}
+
+/// Optional JSON body for `POST /v1/memory/sync`. Each field that is
+/// present is forwarded to the sync tool under the same key; absent
+/// fields are simply not passed.
+#[derive(Debug, Deserialize)]
+struct SyncBody {
+    #[serde(default)]
+    scope: Option<String>,
+    #[serde(default)]
+    remote: Option<String>,
+    #[serde(default)]
+    branch: Option<String>,
+    #[serde(default)]
+    timeout_ms: Option<u64>,
+}
+
+/// `POST /v1/memory/sync` — run the sync tool directly for the operator.
+///
+/// Responds 503 when the configured backend is not `git` (the reply
+/// echoes the active backend) or when no memory runtime is set.
+/// Otherwise the tool result is mapped by `invoke_tool_to_response`,
+/// the same helper the `/v1/memory/includes` handlers use.
+async fn post_sync(
+    State(state): State<AppState>,
+    body: Option<Json<SyncBody>>,
+) -> Response {
+    let active = backend(&state);
+    if !matches!(active, MemorySyncBackend::Git) {
+        return (
+            StatusCode::SERVICE_UNAVAILABLE,
+            Json(json!({
+                "error": "memory.sync only applies to the `git` backend — current backend is not git",
+                "backend": active.as_wire(),
+            })),
+        )
+            .into_response();
+    }
+    let roots = match roots_from_state(&state) {
+        Ok(r) => r,
+        Err(resp) => return resp,
+    };
+    // Forward only the fields the caller actually supplied.
+    let mut args = serde_json::Map::new();
+    if let Some(Json(b)) = body {
+        if let Some(scope) = b.scope {
+            args.insert("scope".into(), json!(scope));
+        }
+        if let Some(remote) = b.remote {
+            args.insert("remote".into(), json!(remote));
+        }
+        if let Some(branch) = b.branch {
+            args.insert("branch".into(), json!(branch));
+        }
+        if let Some(timeout_ms) = b.timeout_ms {
+            args.insert("timeout_ms".into(), json!(timeout_ms));
+        }
+    }
+    invoke_tool_to_response(MemorySyncTool::new(roots), Value::Object(args)).await
+}
+
+/// JSON body for `POST /v1/memory/sync_setup`. `remote_url` is required;
+/// each optional field is forwarded to the setup tool only when present.
+#[derive(Debug, Deserialize)]
+struct GitSetupBody {
+    remote_url: String,
+    #[serde(default)]
+    scope: Option<String>,
+    #[serde(default)]
+    branch: Option<String>,
+    #[serde(default)]
+    push: Option<bool>,
+    #[serde(default)]
+    force: Option<bool>,
+}
+
+/// `POST /v1/memory/sync_setup` — run the git sync-setup tool directly.
+///
+/// Responds 503 when the configured backend is not `git` (the reply
+/// echoes the active backend) or when no memory runtime is set.
+/// Otherwise the tool result is mapped by `invoke_tool_to_response`,
+/// the same helper the `/v1/memory/includes` handlers use.
+async fn post_setup_git(
+    State(state): State<AppState>,
+    Json(body): Json<GitSetupBody>,
+) -> Response {
+    let active = backend(&state);
+    if !matches!(active, MemorySyncBackend::Git) {
+        return (
+            StatusCode::SERVICE_UNAVAILABLE,
+            Json(json!({
+                "error": "git sync setup only applies to the `git` backend",
+                "backend": active.as_wire(),
+            })),
+        )
+            .into_response();
+    }
+    let roots = match roots_from_state(&state) {
+        Ok(r) => r,
+        Err(resp) => return resp,
+    };
+    // `remote_url` always goes through; the optional fields are
+    // forwarded only when the caller supplied them.
+    let mut args = serde_json::Map::new();
+    args.insert("remote_url".into(), json!(body.remote_url));
+    if let Some(scope) = body.scope {
+        args.insert("scope".into(), json!(scope));
+    }
+    if let Some(branch) = body.branch {
+        args.insert("branch".into(), json!(branch));
+    }
+    if let Some(push) = body.push {
+        args.insert("push".into(), json!(push));
+    }
+    if let Some(force) = body.force {
+        args.insert("force".into(), json!(force));
+    }
+    invoke_tool_to_response(MemorySyncSetupTool::new(roots), Value::Object(args)).await
+}
+
+/// `POST /v1/memory/sync_setup_icloud` — run the iCloud setup tool directly.
+///
+/// Takes no request body; the tool is invoked with an empty JSON object.
+/// Responds 503 when the configured backend is not `icloud` (the reply
+/// echoes the active backend) or when no memory runtime is set.
+/// Otherwise the tool result is mapped by `invoke_tool_to_response`,
+/// the same helper the `/v1/memory/includes` handlers use.
+///
+/// Like the other write endpoints here it is not approval-gated (see module docs).
+async fn post_setup_icloud(State(state): State<AppState>) -> Response {
+    // Read the backend once; it drives both the guard and the error payload.
+    let active = backend(&state);
+    if !matches!(active, MemorySyncBackend::ICloud) {
+        return (
+            StatusCode::SERVICE_UNAVAILABLE,
+            Json(json!({
+                "error": "iCloud sync setup only applies to the `icloud` backend",
+                "backend": active.as_wire(),
+            })),
+        )
+            .into_response();
+    }
+    let roots = match roots_from_state(&state) {
+        Ok(r) => r,
+        Err(resp) => return resp,
+    };
+    invoke_tool_to_response(MemoryICloudSetupTool::new(roots), json!({})).await
+}
+
+// -------- /v1/memory/includes --------
+
+/// Query string for `GET /v1/memory/includes`; `scope` is optional.
+#[derive(Debug, Deserialize)]
+struct IncludesQuery {
+    #[serde(default)]
+    scope: Option<String>,
+}
+
+/// JSON body shared by the include add (`POST`) and remove (`DELETE`) handlers.
+#[derive(Debug, Deserialize)]
+struct IncludeBody {
+    target: String,
+    #[serde(default)]
+    scope: Option<String>,
+}
+
+/// JSON body for `POST /v1/memory/includes/refresh`.
+#[derive(Debug, Deserialize)]
+struct IncludeRefreshBody {
+    target: String,
+}
+
+/// Invoke `tool` with `args`. A tool error becomes 400 `{ "error": … }`; output
+/// that parses as JSON is returned as-is, anything else as `{ "raw": … }`.
+async fn invoke_tool_to_response(tool: impl Tool, args: Value) -> Response {
+    let body = match tool.invoke(args).await {
+        Ok(body) => body,
+        Err(e) => {
+            let failure = json!({ "error": e.to_string() });
+            return (StatusCode::BAD_REQUEST, Json(failure)).into_response();
+        }
+    };
+    let payload = serde_json::from_str::<Value>(&body).unwrap_or_else(|_| json!({ "raw": body }));
+    Json(payload).into_response()
+}
+
+/// `GET /v1/memory/includes` — list includes via `MemoryIncludeListTool`.
+///
+/// Responds 503 when no memory runtime is set. The optional `scope`
+/// query parameter is passed to the tool only when supplied.
+async fn get_includes(State(state): State<AppState>, Query(q): Query<IncludesQuery>) -> Response {
+    let roots = match roots_from_state(&state) {
+        Ok(roots) => roots,
+        Err(unavailable) => return unavailable,
+    };
+    // An `Option` iterates as zero or one item, so `scope` is added only if given.
+    let mut args = serde_json::Map::new();
+    args.extend(q.scope.map(|scope| ("scope".to_string(), json!(scope))));
+    invoke_tool_to_response(MemoryIncludeListTool::new(roots), Value::Object(args)).await
+}
+
+/// `POST /v1/memory/includes` — add an include via `MemoryIncludeAddTool`.
+/// Responds 503 when no memory runtime is set; `scope` is forwarded only if given.
+async fn post_include_add(
+    State(state): State<AppState>,
+    Json(body): Json<IncludeBody>,
+) -> Response {
+    let roots = match roots_from_state(&state) {
+        Ok(roots) => roots,
+        Err(unavailable) => return unavailable,
+    };
+    let mut args = serde_json::Map::new();
+    args.insert("target".into(), json!(body.target));
+    args.extend(body.scope.map(|scope| ("scope".to_string(), json!(scope))));
+    invoke_tool_to_response(MemoryIncludeAddTool::new(roots), Value::Object(args)).await
+}
+
+/// `DELETE /v1/memory/includes` — remove an include via `MemoryIncludeRemoveTool`.
+/// NOTE(review): reads a JSON body on DELETE — confirm clients/proxies forward it.
+async fn delete_include(
+    State(state): State<AppState>,
+    Json(body): Json<IncludeBody>,
+) -> Response {
+    let roots = match roots_from_state(&state) {
+        Ok(roots) => roots,
+        Err(unavailable) => return unavailable,
+    };
+    let mut args = serde_json::Map::new();
+    args.insert("target".into(), json!(body.target));
+    args.extend(body.scope.map(|scope| ("scope".to_string(), json!(scope))));
+    invoke_tool_to_response(MemoryIncludeRemoveTool::new(roots), Value::Object(args)).await
+}
+
+/// `POST /v1/memory/includes/refresh` — run `MemoryIncludeRefreshTool` on
+/// `target`. The state extractor is unused: the tool takes no roots, so
+/// no memory-runtime check (and no 503) happens in this handler.
+async fn post_include_refresh(
+    _state: State<AppState>,
+    Json(body): Json<IncludeRefreshBody>,
+) -> Response {
+    let args = json!({ "target": body.target });
+    invoke_tool_to_response(MemoryIncludeRefreshTool, args).await
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::state::{AppState, MemoryRuntime};
+    use std::sync::Arc;
+
+    struct StubLlm; // provider stub: every `complete` call returns an error
+    #[async_trait::async_trait]
+    impl harness_core::LlmProvider for StubLlm {
+        async fn complete(
+            &self,
+            _: harness_core::ChatRequest,
+        ) -> Result<harness_core::ChatResponse, harness_core::Error> {
+            Err(harness_core::Error::Provider("stub".into()))
+        }
+    }
+
+    fn stub_state() -> AppState {
+        use harness_core::{Agent, AgentConfig};
+        let cfg = AgentConfig::new("stub-model");
+        let agent = Arc::new(Agent::new(Arc::new(StubLlm) as _, cfg));
+        AppState::new(agent) // no memory runtime attached (the 503 tests rely on this)
+    }
+
+    async fn read_json(resp: Response) -> Value {
+        let bytes = axum::body::to_bytes(resp.into_body(), 1024 * 1024) // 1 MiB body cap
+            .await
+            .unwrap();
+        serde_json::from_slice(&bytes).unwrap()
+    }
+
+    #[tokio::test]
+    async fn status_503_when_runtime_unconfigured() {
+        let state = stub_state(); // no memory runtime, so the handler must 503
+        let resp = get_status(State(state)).await;
+        assert_eq!(resp.status(), StatusCode::SERVICE_UNAVAILABLE);
+        let body = read_json(resp).await;
+        assert!(body["error"]
+            .as_str()
+            .unwrap()
+            .contains("memory tools are not enabled"));
+    }
+
+    #[tokio::test]
+    async fn status_reports_backend_none_when_runtime_present_but_off() {
+        let state = stub_state().with_memory_runtime(MemoryRuntime {
+            workspace_root: std::path::PathBuf::from("/tmp/ws"),
+            user_root: None,
+            backend: MemorySyncBackend::None,
+        });
+        let resp = get_status(State(state)).await;
+        let body = read_json(resp).await;
+        assert_eq!(body["backend"], "none");
+        assert!(body.get("user_scope").is_none()); // status tool is skipped for `none`
+    }
+
+    #[tokio::test]
+    async fn sync_503_when_backend_is_not_git() {
+        let state = stub_state().with_memory_runtime(MemoryRuntime {
+            workspace_root: std::path::PathBuf::from("/tmp/ws"),
+            user_root: Some(std::path::PathBuf::from("/tmp/user")),
+            backend: MemorySyncBackend::ICloud,
+        });
+        let resp = post_sync(State(state), None).await; // `None`: no request body
+        assert_eq!(resp.status(), StatusCode::SERVICE_UNAVAILABLE);
+        let body = read_json(resp).await;
+        assert!(body["error"]
+            .as_str()
+            .unwrap()
+            .contains("only applies to the `git` backend"));
+        assert_eq!(body["backend"], "icloud");
+    }
+
+    #[tokio::test]
+    async fn includes_get_503_when_runtime_unconfigured() {
+        let state = stub_state();
+        let resp = get_includes(State(state), Query(IncludesQuery { scope: None })).await;
+        assert_eq!(resp.status(), StatusCode::SERVICE_UNAVAILABLE);
+    }
+
+    #[tokio::test]
+    async fn includes_get_returns_items_array_when_runtime_present() {
+        let workspace = tempfile::tempdir().unwrap();
+        let state = stub_state().with_memory_runtime(MemoryRuntime {
+            workspace_root: workspace.path().to_path_buf(),
+            user_root: None,
+            backend: MemorySyncBackend::None,
+        });
+        let resp = get_includes(State(state), Query(IncludesQuery { scope: None })).await;
+        let body = read_json(resp).await;
+        // Deliberately loose: passes on either an `items` or an `error` key.
+        // NOTE(review): a fresh workspace reportedly yields `items: []` — tighten?
+        assert!(body.get("items").is_some() || body.get("error").is_some());
+    }
+
+    #[tokio::test]
+    async fn include_refresh_rejects_local_path() {
+        let state = stub_state(); // no runtime needed: refresh never builds roots
+        let resp = post_include_refresh(
+            State(state),
+            Json(IncludeRefreshBody {
+                target: "/some/local/path".into(),
+            }),
+        )
+        .await;
+        assert_eq!(resp.status(), StatusCode::BAD_REQUEST);
+        let body = read_json(resp).await;
+        assert!(body["error"].as_str().unwrap().contains("only applies"));
+    }
+
+    #[tokio::test]
+    async fn setup_icloud_503_when_backend_is_git() {
+        let state = stub_state().with_memory_runtime(MemoryRuntime {
+            workspace_root: std::path::PathBuf::from("/tmp/ws"),
+            user_root: Some(std::path::PathBuf::from("/tmp/user")),
+            backend: MemorySyncBackend::Git,
+        });
+        let resp = post_setup_icloud(State(state)).await;
+        assert_eq!(resp.status(), StatusCode::SERVICE_UNAVAILABLE);
+    }
+}
diff --git a/crates/harness-server/src/plugin_routes.rs b/crates/harness-server/src/plugin_routes.rs
index fe77a0f..28621e9 100644
--- a/crates/harness-server/src/plugin_routes.rs
+++ b/crates/harness-server/src/plugin_routes.rs
@@ -24,6 +24,7 @@ use serde::Deserialize;
 use serde_json::{json, Value};
 
 use crate::state::AppState;
+use crate::state_layers::PluginsLayer;
 
 pub fn router() -> Router<AppState> {
     Router::new()
@@ -34,8 +35,8 @@ pub fn router() -> Router<AppState> {
 }
 
 #[allow(clippy::result_large_err)]
-fn require_manager(state: &AppState) -> Result<Arc<PluginManager>, Response> {
-    state.plugins.clone().ok_or_else(|| {
+fn require_manager(plugins: &PluginsLayer) -> Result<Arc<PluginManager>, Response> {
+    plugins.manager.clone().ok_or_else(|| {
         (
             StatusCode::SERVICE_UNAVAILABLE,
             Json(json!({ "error": "plugin manager not configured" })),
@@ -44,8 +45,8 @@ fn require_manager(state: &AppState) -> Result<Arc<PluginManager>, Response> {
     })
 }
 
-async fn list(State(state): State<AppState>) -> Response {
-    let mgr = match require_manager(&state) {
+async fn list(State(plugins): State<PluginsLayer>) -> Response {
+    let mgr = match require_manager(&plugins) {
         Ok(m) => m,
         Err(r) => return r,
     };
@@ -53,8 +54,8 @@ async fn list(State(state): State<AppState>) -> Response {
     (StatusCode::OK, Json(json!({ "plugins": entries }))).into_response()
 }
 
-async fn get_one(State(state): State<AppState>, Path(name): Path<String>) -> Response {
-    let mgr = match require_manager(&state) {
+async fn get_one(State(plugins): State<PluginsLayer>, Path(name): Path<String>) -> Response {
+    let mgr = match require_manager(&plugins) {
         Ok(m) => m,
         Err(r) => return r,
     };
@@ -76,8 +77,8 @@ enum InstallRequest {
     // Reserved for future flavours: Git { url, ref?: String }.
 }
 
-async fn install(State(state): State<AppState>, Json(req): Json<InstallRequest>) -> Response {
-    let mgr = match require_manager(&state) {
+async fn install(State(plugins): State<PluginsLayer>, Json(req): Json<InstallRequest>) -> Response {
+    let mgr = match require_manager(&plugins) {
         Ok(m) => m,
         Err(r) => return r,
     };
@@ -89,8 +90,8 @@ async fn install(State(state): State<AppState>, Json(req): Json<InstallRequest>)
     }
 }
 
-async fn remove(State(state): State<AppState>, Path(name): Path<String>) -> Response {
-    let mgr = match require_manager(&state) {
+async fn remove(State(plugins): State<PluginsLayer>, Path(name): Path<String>) -> Response {
+    let mgr = match require_manager(&plugins) {
         Ok(m) => m,
         Err(r) => return r,
     };
@@ -104,11 +105,13 @@ async fn remove(State(state): State<AppState>, Path(name): Path<String>) -> Resp
     }
 }
 
-async fn marketplace(State(_state): State<AppState>) -> Response {
+async fn marketplace() -> Response {
     // Hard-coded built-in list. Each entry points at a path that
     // ships in-repo (under `examples/plugins/`) so a clean clone
     // can install one with a single click. Phase 4 swaps this for
-    // a remote JSON index.
+    // a remote JSON index, at which point this handler would grow
+    // a state extractor (HTTP client / cached fetch). For now,
+    // pure function.
     let entries: Vec<Value> = vec![
         json!({
             "name": "code-review-pack",
diff --git a/crates/harness-server/src/routes.rs b/crates/harness-server/src/routes.rs
index ce3ee37..194fa50 100644
--- a/crates/harness-server/src/routes.rs
+++ b/crates/harness-server/src/routes.rs
@@ -83,6 +83,8 @@ pub fn router(state: AppState) -> Router {
         .merge(crate::agent_profiles_routes::router())
         .merge(crate::subagents_routes::router())
         .merge(crate::subagent_runs_routes::router())
+        .merge(crate::tasks_routes::router())
+        .merge(crate::memory_sync_routes::router())
         .merge(crate::diagnostics_routes::router())
         .merge(crate::auto_mode_routes::router())
         .merge(crate::channels_routes::router())
@@ -2020,6 +2022,7 @@ async fn begin_user_turn(
     sticky_provider: &mut Option<String>,
     sticky_model: &mut Option<String>,
     active_skills: &[String],
+    recent_touched_files: &[String],
     socket_workspace: &Option<std::path::PathBuf>,
     hitl_tx: &mpsc::Sender<PendingHitl>,
 ) -> bool {
@@ -2042,7 +2045,12 @@ async fn begin_user_turn(
     let hitl = hitl_tx.clone();
     let active_mode = *mode_handle.read().await;
     let skills_catalog = state.skills.as_ref().cloned();
-    let skills_snapshot = merged_skills_for_turn(skills_catalog.as_ref(), active_skills, &content);
+    let skills_snapshot = merged_skills_for_turn(
+        skills_catalog.as_ref(),
+        active_skills,
+        &content,
+        recent_touched_files,
+    );
     let workspace_for_turn = socket_workspace.clone();
     let agent = match state.build_agent_with(provider_pick, model_pick, |cfg| {
         cfg.approver = Some(approver);
@@ -2183,6 +2191,7 @@ fn merged_skills_for_turn(
     catalog: Option<&Arc<std::sync::RwLock<harness_skill::SkillCatalog>>>,
     manual_active: &[String],
     user_content: &str,
+    recent_paths: &[String],
 ) -> Vec<String> {
     let mut merged: Vec<String> = manual_active.to_vec();
     let Some(cat_arc) = catalog else {
@@ -2198,9 +2207,98 @@ fn merged_skills_for_turn(
             merged.push(n);
         }
     }
+    // M3.3: file-path auto-activation. Skills with a non-empty
+    // `paths` glob list that hit any of the agent's recently-
+    // touched files this socket get added on top of the keyword
+    // matches. Capped at AUTO_SKILL_TOP_K so a single edit can't
+    // pile on indefinitely.
+    if !recent_paths.is_empty() {
+        let path_picks = harness_skill::pick_path_match_skills(
+            &guard,
+            recent_paths,
+            AUTO_SKILL_TOP_K,
+            &merged,
+        );
+        for n in path_picks {
+            if !merged.iter().any(|m| m == &n) {
+                merged.push(n);
+            }
+        }
+    }
     merged
 }
 
+/// Upper bound on the per-WS session's "recently-touched files"
+/// list that feeds M3.3 skill path-based auto-activation.
+/// `push_recent_touched_file` enforces it: the list is deduped,
+/// the most recent path sits at the head, and entries past this
+/// cap fall off the tail, so a long session can't grow the list
+/// without limit.
+const RECENT_TOUCHED_FILES_CAP: usize = 32;
+
+/// Send a fresh `tasks_snapshot` frame down `ws_tx`. Fan-out helper for
+/// the BackgroundTasksPanel's WS-push path (P7): the frontend listens
+/// for these frames and replaces its local task list, so it doesn't
+/// need to poll `/v1/tasks` on a tight interval.
+///
+/// The frame carries `items` (from `tasks_routes::collect_tasks`) and
+/// `generated_at`, milliseconds since the Unix epoch — 0 if the system
+/// clock reads earlier than the epoch.
+async fn push_tasks_snapshot(ws_tx: &mut SplitSink<WebSocket, WsMessage>, state: &AppState) {
+    let items = crate::tasks_routes::collect_tasks(state).await;
+    // `as_millis` yields a u128; the cast narrows it to u64 for the wire.
+    let generated_at = std::time::SystemTime::now()
+        .duration_since(std::time::UNIX_EPOCH)
+        .map_or(0, |since_epoch| since_epoch.as_millis() as u64);
+    let frame = json!({
+        "type": "tasks_snapshot",
+        "items": items,
+        "generated_at": generated_at,
+    });
+    // Best effort: a failed send is deliberately ignored rather than
+    // surfaced to the caller.
+    let _ = ws_tx.send(WsMessage::Text(frame.to_string())).await;
+}
+
+/// Preview which skills the M3.3 path-match rule would auto-activate on
+/// the next user turn. `manual_active` (the skills the user already
+/// sees selected) is passed to `pick_path_match_skills` so the returned
+/// names are deduped against it; `recent_touched_files` is the set of
+/// paths to match. Powers the Composer's "next turn auto-activated"
+/// preview chip.
+///
+/// Returns an empty list when there is no catalog or its lock is poisoned.
+fn predict_skill_auto_activation(
+    catalog: Option<&Arc<std::sync::RwLock<harness_skill::SkillCatalog>>>,
+    manual_active: &[String],
+    recent_touched_files: &[String],
+) -> Vec<String> {
+    match catalog.map(|shared| shared.read()) {
+        Some(Ok(guard)) => harness_skill::pick_path_match_skills(
+            &guard,
+            recent_touched_files,
+            AUTO_SKILL_TOP_K,
+            manual_active,
+        ),
+        // Missing catalog or poisoned lock: nothing to preview.
+        Some(Err(_)) | None => Vec::new(),
+    }
+}
+
+/// Move-to-front insert for the recently-touched-files list. An empty
+/// `path` is ignored; a path already present moves to the head; the
+/// list is then trimmed to `RECENT_TOUCHED_FILES_CAP`, oldest first.
+fn push_recent_touched_file(files: &mut Vec<String>, path: &str) {
+    if path.is_empty() {
+        return;
+    }
+    if let Some(existing) = files.iter().position(|entry| entry.as_str() == path) {
+        files.remove(existing);
+    }
+    files.insert(0, path.to_owned());
+    files.truncate(RECENT_TOUCHED_FILES_CAP);
+}
+
 fn compose_with_skills(
     template: Option<&str>,
     catalog: Option<&Arc<std::sync::RwLock<harness_skill::SkillCatalog>>>,
@@ -2338,6 +2436,13 @@ async fn handle_ws(socket: WebSocket, state: AppState) {
     // system prompt. Order is insertion order so the model sees
     // them in the same order the user activated them.
     let mut active_skills: Vec<String> = Vec::new();
+    // M3.3: workspace-relative paths the agent has touched in this
+    // socket's lifetime. Sniffed from `ToolStart` events for fs.*
+    // tools below; consulted by `merged_skills_for_turn` so a
+    // skill with `paths: ["**/*.rs"]` auto-activates after the
+    // agent reads/edits a `.rs` file. Bounded so a long session
+    // can't grow this unbounded.
+    let mut recent_touched_files: Vec<String> = Vec::new();
     // Per-socket workspace override. `None` means "use the binary's
     // startup workspace" (the historical behaviour). When `Some`,
     // the path is installed as a `crate::workspace::with_session_workspace`
@@ -2409,6 +2514,7 @@ async fn handle_ws(socket: WebSocket, state: AppState) {
                     &mut sticky_provider,
                     &mut sticky_model,
                     &mut active_skills,
+                    &recent_touched_files,
                     &mut socket_workspace,
                     &hitl_tx,
                 )
@@ -2684,6 +2790,56 @@ async fn handle_ws(socket: WebSocket, state: AppState) {
                 // the client. The client never sees it; the persisted
                 // history never stores it.
                 let mut ev_to_send = ev;
+                // Tool-initiated mode change (M2.3 `enter_plan_mode`).
+                // Flip the per-socket mode handle so the next turn's
+                // approver / tool_filter see the new mode. The
+                // current turn finishes under the old mode — that's
+                // intentional, see [`mode_signal`] doc.
+                // M3.3 skill auto-activation: track every fs.* path
+                // the agent touches so the next turn's
+                // `merged_skills_for_turn` can pick up skills whose
+                // `paths` glob hits the recent set. Bounded FIFO so a
+                // long session doesn't accumulate forever; sniffed at
+                // ToolStart rather than ToolEnd because Start lands
+                // first and successful starts are followed by a body
+                // event anyway — we don't gate on success because the
+                // glob only cares "did the agent intend to touch X".
+                if let AgentEvent::ToolStart { name, arguments, .. } = &ev_to_send {
+                    if matches!(
+                        name.as_str(),
+                        "fs.read" | "fs.list" | "fs.write" | "fs.edit"
+                    ) {
+                        if let Some(p) = arguments.get("path").and_then(|v| v.as_str()) {
+                            push_recent_touched_file(&mut recent_touched_files, p);
+                        }
+                    } else if name == "fs.patch" {
+                        if let Some(diff) = arguments.get("diff").and_then(|v| v.as_str()) {
+                            for line in diff.lines() {
+                                if let Some(rest) = line.strip_prefix("+++ b/") {
+                                    push_recent_touched_file(&mut recent_touched_files, rest);
+                                }
+                            }
+                        }
+                    }
+                }
+                if let AgentEvent::ModeChanged { mode } = &ev_to_send {
+                    let new_mode = *mode;
+                    *mode_handle.write().await = new_mode;
+                    // Mirror via the existing `permission_mode` UI
+                    // frame so banners / mode badges update in step
+                    // with the change, same shape as the `SetMode`
+                    // / `AcceptPlan` paths.
+                    let _ = ws_tx
+                        .send(WsMessage::Text(
+                            json!({
+                                "type": "permission_mode",
+                                "mode": new_mode,
+                                "via": "tool",
+                            })
+                            .to_string(),
+                        ))
+                        .await;
+                }
                 if let AgentEvent::Done { conversation, .. } = &mut ev_to_send {
                     if let Some(prepared) = last_injection.as_ref() {
                         *conversation = strip_turn_injections(conversation.clone(), prepared);
@@ -2717,6 +2873,31 @@ async fn handle_ws(socket: WebSocket, state: AppState) {
                     // stopped so nothing is waiting on them anyway.
                     pending.clear();
                     pending_hitl.clear();
+                    // M3.3 UX patch: after a turn ends, predict which
+                    // skills *would* auto-activate next turn given
+                    // the files the agent touched. The Composer shows
+                    // a chip ("auto-activated next turn: foo") so the
+                    // user can see in advance — and decide whether to
+                    // proceed or pivot. Empty payload still emitted
+                    // so the Composer can clear any stale chip.
+                    let preview = predict_skill_auto_activation(
+                        state.skills.as_ref(),
+                        &active_skills,
+                        &recent_touched_files,
+                    );
+                    let _ = ws_tx
+                        .send(WsMessage::Text(
+                            json!({
+                                "type": "skill_auto_activated_for_next_turn",
+                                "skills": preview,
+                            })
+                            .to_string(),
+                        ))
+                        .await;
+                    // P7: push the BackgroundTasksPanel's task list
+                    // at the natural state-change moment (turn just
+                    // finished) so the panel can drop its 3s poll.
+                    push_tasks_snapshot(&mut ws_tx, &state).await;
                 }
             }
             // ---- tailed run → server ----
@@ -2814,6 +2995,7 @@ async fn handle_client_frame(
     sticky_provider: &mut Option<String>,
     sticky_model: &mut Option<String>,
     active_skills: &mut Vec<String>,
+    recent_touched_files: &[String],
     socket_workspace: &mut Option<std::path::PathBuf>,
     hitl_tx: &mpsc::Sender<PendingHitl>,
 ) -> bool {
@@ -3136,6 +3318,7 @@ async fn handle_client_frame(
                 sticky_provider,
                 sticky_model,
                 active_skills,
+                recent_touched_files,
                 socket_workspace,
                 hitl_tx,
             )
@@ -3165,6 +3348,7 @@ async fn handle_client_frame(
                 sticky_provider,
                 sticky_model,
                 active_skills,
+                recent_touched_files,
                 socket_workspace,
                 hitl_tx,
             )
@@ -3570,7 +3754,12 @@ async fn handle_client_frame(
             let active_mode = *mode_handle.read().await;
             let skills_catalog = state.skills.as_ref().cloned();
             let skills_snapshot =
-                merged_skills_for_turn(skills_catalog.as_ref(), active_skills, &content);
+                merged_skills_for_turn(
+                    skills_catalog.as_ref(),
+                    active_skills,
+                    &content,
+                    recent_touched_files,
+                );
             let workspace_for_turn = socket_workspace.clone();
             let agent = match state.build_agent_with(provider_pick, model_pick, |cfg| {
                 cfg.approver = Some(approver);
@@ -3759,7 +3948,12 @@ async fn handle_client_frame(
             let active_mode = *mode_handle.read().await;
             let skills_catalog = state.skills.as_ref().cloned();
             let skills_snapshot =
-                merged_skills_for_turn(skills_catalog.as_ref(), active_skills, proceed_message);
+                merged_skills_for_turn(
+                    skills_catalog.as_ref(),
+                    active_skills,
+                    proceed_message,
+                    recent_touched_files,
+                );
             let workspace_for_turn = socket_workspace.clone();
             let agent = match state.build_agent_with(provider_pick, model_pick, |cfg| {
                 cfg.approver = Some(approver);
@@ -3881,7 +4075,12 @@ async fn handle_client_frame(
             let active_mode = *mode_handle.read().await;
             let skills_catalog = state.skills.as_ref().cloned();
             let skills_snapshot =
-                merged_skills_for_turn(skills_catalog.as_ref(), active_skills, &feedback);
+                merged_skills_for_turn(
+                    skills_catalog.as_ref(),
+                    active_skills,
+                    &feedback,
+                    recent_touched_files,
+                );
             let workspace_for_turn = socket_workspace.clone();
             let agent = match state.build_agent_with(provider_pick, model_pick, |cfg| {
                 cfg.approver = Some(approver);
diff --git a/crates/harness-server/src/skill_routes.rs b/crates/harness-server/src/skill_routes.rs
index 10fe4ab..d7699cf 100644
--- a/crates/harness-server/src/skill_routes.rs
+++ b/crates/harness-server/src/skill_routes.rs
@@ -23,6 +23,7 @@ use serde_json::json;
 use tracing::info;
 
 use crate::state::AppState;
+use crate::state_layers::SkillsLayer;
 
 pub fn router() -> Router<AppState> {
     Router::new()
@@ -32,8 +33,8 @@ pub fn router() -> Router<AppState> {
 }
 
 #[allow(clippy::result_large_err)]
-fn require_catalog(state: &AppState) -> Result<Arc<RwLock<SkillCatalog>>, Response> {
-    state.skills.clone().ok_or_else(|| {
+fn require_catalog(skills: &SkillsLayer) -> Result<Arc<RwLock<SkillCatalog>>, Response> {
+    skills.catalog.clone().ok_or_else(|| {
         (
             StatusCode::SERVICE_UNAVAILABLE,
             Json(json!({ "error": "skill catalogue not configured" })),
@@ -42,8 +43,8 @@ fn require_catalog(state: &AppState) -> Result<Arc<RwLock<SkillCatalog>>, Respon
     })
 }
 
-async fn list(State(state): State<AppState>) -> Response {
-    let cat = match require_catalog(&state) {
+async fn list(State(skills): State<SkillsLayer>) -> Response {
+    let cat = match require_catalog(&skills) {
         Ok(c) => c,
         Err(r) => return r,
     };
@@ -76,8 +77,8 @@ async fn list(State(state): State<AppState>) -> Response {
     (StatusCode::OK, Json(json!({ "skills": entries }))).into_response()
 }
 
-async fn get_one(State(state): State<AppState>, Path(name): Path<String>) -> Response {
-    let cat = match require_catalog(&state) {
+async fn get_one(State(skills): State<SkillsLayer>, Path(name): Path<String>) -> Response {
+    let cat = match require_catalog(&skills) {
         Ok(c) => c,
         Err(r) => return r,
     };
@@ -116,8 +117,8 @@ async fn get_one(State(state): State<AppState>, Path(name): Path<String>) -> Res
     }
 }
 
-async fn reload(State(state): State<AppState>) -> Response {
-    let cat = match require_catalog(&state) {
+async fn reload(State(skills): State<SkillsLayer>) -> Response {
+    let cat = match require_catalog(&skills) {
         Ok(c) => c,
         Err(r) => return r,
     };
diff --git a/crates/harness-server/src/state.rs b/crates/harness-server/src/state.rs
index 73b935b..1b92137 100644
--- a/crates/harness-server/src/state.rs
+++ b/crates/harness-server/src/state.rs
@@ -321,6 +321,31 @@ pub struct AppState {
     /// that case so callers can distinguish "not configured" from
     /// "really broken".
     pub subagent_runs: Option<Arc<crate::subagent_runs::SubAgentRunRegistry>>,
+    /// P8: optional handle to the active memory backend's
+    /// telemetry counters. Surfaced via
+    /// `GET /v1/diagnostics/memory` so operators tuning
+    /// `JARVIS_MEMORY_TOKENS` can see compact_count / cache hits /
+    /// circuit-open / PTL frequency without restarting. `None`
+    /// when the memory backend has no stats (sliding window) or the
+    /// binary didn't wire it; the endpoint returns 503 in that case.
+    pub memory_stats: Option<Arc<dyn harness_core::MemoryStatsProvider>>,
+    /// P14: memory metadata for the Settings → Memory Sync panel.
+    /// `None` when the agent-maintained memory tools aren't
+    /// enabled — the REST endpoints return 503 in that case so
+    /// the panel can render an "off, enable in config" hint
+    /// instead of pretending to have a state.
+    pub memory_runtime: Option<MemoryRuntime>,
+}
+
+/// Snapshot of the memory + sync configuration the binary
+/// resolved at startup. Cloned cheaply (PathBuf + enum) onto
+/// every AppState clone; the actual `MemoryRoots` instances the
+/// memory tools see are rebuilt per request from these fields.
+#[derive(Debug, Clone)]
+pub struct MemoryRuntime {
+    pub workspace_root: PathBuf,
+    pub user_root: Option<PathBuf>,
+    pub backend: harness_tools::MemorySyncBackend,
 }
 
 impl AppState {
@@ -369,6 +394,8 @@ impl AppState {
             chat_runs: crate::chat_runs::ChatRunRegistry::new(),
             route_policy: Arc::new(RwLock::new(ModelRoutePolicy::default())),
             subagent_runs: None,
+            memory_stats: None,
+            memory_runtime: None,
         }
     }
 
@@ -422,6 +449,8 @@ impl AppState {
             chat_runs: crate::chat_runs::ChatRunRegistry::new(),
             route_policy: Arc::new(RwLock::new(ModelRoutePolicy::default())),
             subagent_runs: None,
+            memory_stats: None,
+            memory_runtime: None,
         }
     }
 
@@ -739,6 +768,29 @@ impl AppState {
         self
     }
 
+    /// Install a memory-stats handle so
+    /// `GET /v1/diagnostics/memory` returns the active backend's
+    /// counters. Composition root passes
+    /// `SummarizingMemory::counters()` cast to
+    /// `Arc<dyn MemoryStatsProvider>` here.
+    pub fn with_memory_stats(
+        mut self,
+        provider: Arc<dyn harness_core::MemoryStatsProvider>,
+    ) -> Self {
+        self.memory_stats = Some(provider);
+        self
+    }
+
+    /// Install memory + sync runtime metadata. Only the binary
+    /// composition root has the full picture (which backend the
+    /// operator picked, where the user_root resolves to), so this
+    /// has to be a setter rather than something AppState
+    /// reconstructs.
+    pub fn with_memory_runtime(mut self, rt: MemoryRuntime) -> Self {
+        self.memory_runtime = Some(rt);
+        self
+    }
+
     /// Build a fresh `Agent` for one request, routed via the
     /// registry. The returned agent shares the template's tools /
     /// memory / approver / system_prompt / max_iterations.
diff --git a/crates/harness-server/src/state_layers.rs b/crates/harness-server/src/state_layers.rs
index 74bfd80..7fb47e5 100644
--- a/crates/harness-server/src/state_layers.rs
+++ b/crates/harness-server/src/state_layers.rs
@@ -212,6 +212,99 @@ impl FromRef<AppState> for WorkspaceLayer {
     }
 }
 
+/// Runtime MCP manager slice. The manager owns spawned external
+/// MCP processes and the tools they project into the shared
+/// `ToolRegistry`. Consumed by `mcp_routes.rs` (the `/v1/mcp/*`
+/// runtime add / remove / health probes).
+#[derive(Clone)]
+pub struct McpLayer {
+    pub manager: Option<Arc<harness_mcp::McpManager>>,
+}
+
+impl FromRef<AppState> for McpLayer {
+    fn from_ref(s: &AppState) -> Self {
+        Self {
+            manager: s.mcp.clone(),
+        }
+    }
+}
+
+/// Plugin manager slice. The manager owns installed plugin
+/// processes / their skill + MCP registrations. Consumed by
+/// `plugin_routes.rs` (install / uninstall / list).
+#[derive(Clone)]
+pub struct PluginsLayer {
+    pub manager: Option<Arc<harness_plugin::PluginManager>>,
+}
+
+impl FromRef<AppState> for PluginsLayer {
+    fn from_ref(s: &AppState) -> Self {
+        Self {
+            manager: s.plugins.clone(),
+        }
+    }
+}
+
+/// SubAgent runs registry — the in-process ledger of recent
+/// SubAgent invocations the WS handler appends frames to.
+/// Consumed by `subagent_runs_routes.rs` (the `/v1/subagents/runs*`
+/// surface).
+#[derive(Clone)]
+pub struct SubAgentRunsLayer {
+    pub registry: Option<Arc<crate::subagent_runs::SubAgentRunRegistry>>,
+}
+
+impl FromRef<AppState> for SubAgentRunsLayer {
+    fn from_ref(s: &AppState) -> Self {
+        Self {
+            registry: s.subagent_runs.clone(),
+        }
+    }
+}
+
+/// Skill-catalogue slice — the in-memory parsed catalogue + the
+/// user-writable root that online skill-market installs land in.
+/// Consumed by `market_routes.rs` (install / uninstall) and
+/// `skill_routes.rs` (list / get / reload). The catalogue itself is
+/// `Arc<RwLock<…>>` so concurrent reads don't block each other.
+#[derive(Clone)]
+pub struct SkillsLayer {
+    pub catalog: Option<Arc<std::sync::RwLock<harness_skill::SkillCatalog>>>,
+    pub user_dir: Option<std::path::PathBuf>,
+}
+
+impl FromRef<AppState> for SkillsLayer {
+    fn from_ref(s: &AppState) -> Self {
+        Self {
+            catalog: s.skills.clone(),
+            user_dir: s.user_skills_dir.clone(),
+        }
+    }
+}
+
+/// Auto-mode slice — the runtime claim ledger + the per-tick
+/// config the picker reads. Consumed only by
+/// `auto_mode_routes.rs`; nothing else should touch these because
+/// they're a control plane, not a data store.
+///
+/// Both are `Option` — auto mode is opt-in via
+/// `JARVIS_WORK_MODE=auto` and the binary leaves them `None` for
+/// off / unconfigured deployments. Handlers return 503 then.
+#[derive(Clone)]
+pub struct AutoModeLayer {
+    pub runtime: Option<crate::auto_mode::AutoModeRuntime>,
+    pub config: Option<Arc<crate::auto_mode::AutoModeConfig>>,
+}
+
+impl FromRef<AppState> for AutoModeLayer {
+    fn from_ref(s: &AppState) -> Self {
+        Self {
+            runtime: s.auto_mode_runtime.clone(),
+            config: s.auto_mode_config.clone(),
+        }
+    }
+}
+
 /// TODO-board slice. Tiny — the store plus the "prepend recent
 /// TODOs to the agent's system prompt?" flag the agent loop reads
 /// at build time. Consumed by `todos_routes.rs` plus the agent
diff --git a/crates/harness-server/src/subagent_runs_routes.rs b/crates/harness-server/src/subagent_runs_routes.rs
index eba1f53..b6df4d2 100644
--- a/crates/harness-server/src/subagent_runs_routes.rs
+++ b/crates/harness-server/src/subagent_runs_routes.rs
@@ -21,6 +21,7 @@ use axum::{
 use serde_json::json;
 
 use crate::state::AppState;
+use crate::state_layers::SubAgentRunsLayer;
 
 pub(crate) fn router() -> Router<AppState> {
     Router::new()
@@ -29,16 +30,16 @@ pub(crate) fn router() -> Router<AppState> {
         .route("/v1/subagents/runs/:id/cancel", post(cancel_run))
 }
 
-async fn list_runs(State(state): State<AppState>) -> Response {
-    let Some(reg) = state.subagent_runs.as_ref() else {
+async fn list_runs(State(runs): State<SubAgentRunsLayer>) -> Response {
+    let Some(reg) = runs.registry.as_ref() else {
         return service_unavailable();
     };
     let items = reg.list();
     Json(json!({ "items": items })).into_response()
 }
 
-async fn get_run(State(state): State<AppState>, Path(id): Path<String>) -> Response {
-    let Some(reg) = state.subagent_runs.as_ref() else {
+async fn get_run(State(runs): State<SubAgentRunsLayer>, Path(id): Path<String>) -> Response {
+    let Some(reg) = runs.registry.as_ref() else {
         return service_unavailable();
     };
     match reg.get(&id) {
@@ -54,8 +55,8 @@ async fn get_run(State(state): State<AppState>, Path(id): Path<String>) -> Respo
     }
 }
 
-async fn cancel_run(State(state): State<AppState>, Path(id): Path<String>) -> Response {
-    let Some(reg) = state.subagent_runs.as_ref() else {
+async fn cancel_run(State(runs): State<SubAgentRunsLayer>, Path(id): Path<String>) -> Response {
+    let Some(reg) = runs.registry.as_ref() else {
         return service_unavailable();
     };
     let ok = reg.cancel(&id);
diff --git a/crates/harness-server/src/tasks_routes.rs b/crates/harness-server/src/tasks_routes.rs
new file mode 100644
index 0000000..da640cd
--- /dev/null
+++ b/crates/harness-server/src/tasks_routes.rs
@@ -0,0 +1,325 @@
+//! `GET /v1/tasks` — unified background-tasks panel feed.
+//!
+//! The UI's BackgroundTasksPanel needs one place to see *every*
+//! kind of long-running work the server is currently handling: chat
+//! turns mid-stream, subagent runs in flight, auto-mode requirement
+//! picks, future shell/MCP entries. Rather than have the UI call
+//! three endpoints and reconcile them, this route normalises each
+//! source into a single `TaskEntry` shape sorted newest-first.
+//!
+//! v1 sources (each entry's `kind` discriminator lets the UI render new
+//! types progressively, so more can be added without breaking the wire shape):
+//!
+//! - `chat_run`        — from [`crate::chat_runs::ChatRunRegistry`]
+//! - `subagent_run`    — from [`crate::subagent_runs::SubAgentRunRegistry`]
+//! - `requirement_run` — pending / running rows from the requirement-run store
+//! - `mcp_server`      — MCP servers whose status is not `Running`
+//!
+//! Filtering: only still-active runs appear (pending / running / waiting_*);
+//! completed / failed / cancelled runs are surfaced through their dedicated
+//! detail endpoints. The panel is "what's in flight right now", not a history view.
+
+use axum::{extract::State, response::IntoResponse, routing::get, Json, Router};
+use harness_project::RequirementRunStatus;
+use serde::Serialize;
+use serde_json::Value;
+
+use crate::chat_runs::ChatRunStatus;
+use crate::state::AppState;
+use crate::subagent_runs::SubAgentRunStatus;
+
+pub(crate) fn router() -> Router<AppState> {
+    Router::new().route("/v1/tasks", get(list_tasks))
+}
+
+/// One normalised entry across kinds. `kind` is the source
+/// discriminator and `id` is unique within that kind. `label` is
+/// the one-line UI string; `detail` carries the raw record so a
+/// click-into-detail UI can pivot without a second fetch.
+#[derive(Debug, Serialize)]
+pub struct TaskEntry {
+    pub kind: TaskKind,
+    pub id: String,
+    pub label: String,
+    pub status: String,
+    pub started_at: u64,
+    pub updated_at: u64,
+    pub detail: Value,
+}
+
+#[derive(Debug, Serialize)]
+#[serde(rename_all = "snake_case")]
+pub enum TaskKind {
+    ChatRun,
+    SubagentRun,
+    RequirementRun,
+    McpServer,
+}
+
+#[derive(Debug, Serialize)]
+struct TasksResponse {
+    items: Vec<TaskEntry>,
+    /// Server clock at snapshot time (ms since epoch). Lets the UI
+    /// render relative "started 30s ago" without trusting the
+    /// client wall clock.
+    generated_at: u64,
+}
+
+async fn list_tasks(State(state): State<AppState>) -> impl IntoResponse {
+    let items = collect_tasks(&state).await;
+    Json(TasksResponse {
+        items,
+        generated_at: now_ms(),
+    })
+}
+
+/// Build a snapshot of the current `TaskEntry` set from every
+/// configured source (chat runs, subagent runs, requirement runs,
+/// non-running MCP servers), sorted newest-first. Kept separate from
+/// [`list_tasks`] so non-HTTP callers (e.g. a WS push) can reuse it.
+pub(crate) async fn collect_tasks(state: &AppState) -> Vec<TaskEntry> {
+    let mut items: Vec<TaskEntry> = Vec::new();
+
+    // Chat runs — always available; filter to active states.
+    let chat_runs = state.chat_runs.list(/* active_only */ true);
+    for r in chat_runs {
+        let active = matches!(
+            r.status,
+            ChatRunStatus::Running | ChatRunStatus::WaitingApproval | ChatRunStatus::WaitingHitl
+        );
+        if !active {
+            continue;
+        }
+        let status = match r.status {
+            ChatRunStatus::Running => "running",
+            ChatRunStatus::WaitingApproval => "waiting_approval",
+            ChatRunStatus::WaitingHitl => "waiting_hitl",
+            ChatRunStatus::Completed => "completed",
+            ChatRunStatus::Failed => "failed",
+            ChatRunStatus::Cancelled => "cancelled",
+        };
+        let label = match r.current_tool.as_deref() {
+            Some(tool) => format!("Chat · running {tool}"),
+            None => "Chat turn".to_string(),
+        };
+        items.push(TaskEntry {
+            kind: TaskKind::ChatRun,
+            id: r.conversation_id.clone(),
+            label,
+            status: status.to_string(),
+            started_at: r.started_at,
+            updated_at: r.updated_at,
+            detail: serde_json::to_value(&r).unwrap_or(Value::Null),
+        });
+    }
+
+    // Subagent runs — optional registry.
+    if let Some(reg) = state.subagent_runs.as_ref() {
+        for r in reg.list() {
+            if !matches!(r.status, SubAgentRunStatus::Running) {
+                continue;
+            }
+            // "<name>: <task-head>"; the cut backs up to a char boundary so it can't panic.
+            let task_head = r.task.as_deref().unwrap_or("");
+            let task_short = if task_head.len() > 48 {
+                let cut = (0..=47).rev().find(|&i| task_head.is_char_boundary(i));
+                format!("{}…", &task_head[..cut.unwrap_or(0)])
+            } else {
+                task_head.to_string()
+            };
+            let label = if task_short.is_empty() {
+                r.name.clone()
+            } else {
+                format!("{}: {}", r.name, task_short)
+            };
+            items.push(TaskEntry {
+                kind: TaskKind::SubagentRun,
+                id: r.id.clone(),
+                label,
+                status: "running".into(),
+                started_at: r.started_at,
+                updated_at: r.updated_at,
+                detail: serde_json::to_value(&r).unwrap_or(Value::Null),
+            });
+        }
+    }
+
+    // Requirement runs (auto-mode picks + manual `start_run`).
+    // We only surface still-in-flight rows. Listing through the
+    // store is bounded (the trait caps `list_all` at ~200), so
+    // even a noisy run history doesn't bloat the panel.
+    if let Some(store) = state.requirement_runs.as_ref() {
+        if let Ok(rows) = store.list_all(200).await {
+            for r in rows {
+                if !matches!(
+                    r.status,
+                    RequirementRunStatus::Pending | RequirementRunStatus::Running
+                ) {
+                    continue;
+                }
+                let status = match r.status {
+                    RequirementRunStatus::Pending => "pending",
+                    RequirementRunStatus::Running => "running",
+                    RequirementRunStatus::Completed => "completed",
+                    RequirementRunStatus::Failed => "failed",
+                    RequirementRunStatus::Cancelled => "cancelled",
+                };
+                let label = format!("Requirement {} · {}", r.requirement_id, status);
+                // `RequirementRun.started_at` is an RFC-3339 string
+                // (the row gets persisted across processes); parse to
+                // millis for the panel sort. Fall back to now() when
+                // a row predates the timestamp convention.
+                let started_ms = parse_rfc3339_ms(&r.started_at).unwrap_or_else(now_ms);
+                let updated_ms = r
+                    .finished_at
+                    .as_deref()
+                    .and_then(parse_rfc3339_ms)
+                    .unwrap_or(started_ms);
+                items.push(TaskEntry {
+                    kind: TaskKind::RequirementRun,
+                    id: r.id.clone(),
+                    label,
+                    status: status.to_string(),
+                    started_at: started_ms,
+                    updated_at: updated_ms,
+                    detail: serde_json::to_value(&r).unwrap_or(Value::Null),
+                });
+            }
+        }
+    }
+
+    // MCP server health — surface unhealthy / stopped servers as
+    // "tasks" so the operator can spot a wedged tool source. We
+    // omit cleanly-running servers from the panel: they aren't
+    // pending work, they're idle infrastructure.
+    if let Some(mgr) = state.mcp.as_ref() {
+        for s in mgr.list().await {
+            use harness_mcp::manager::McpServerStatus;
+            if matches!(s.status, McpServerStatus::Running) {
+                continue;
+            }
+            let (status, label) = match s.status {
+                McpServerStatus::Stopped => (
+                    "stopped",
+                    format!("MCP {} · stopped", s.prefix),
+                ),
+                McpServerStatus::Unhealthy => (
+                    "unhealthy",
+                    format!("MCP {} · unhealthy", s.prefix),
+                ),
+                McpServerStatus::Running => unreachable!(),
+            };
+            // MCP servers don't have a meaningful timestamp on
+            // McpServerInfo today; pin to now(), which makes them
+            // sort to the head of every snapshot. We may extend
+            // McpServerInfo later with a last_status_at field.
+            let now = now_ms();
+            items.push(TaskEntry {
+                kind: TaskKind::McpServer,
+                id: s.prefix.clone(),
+                label,
+                status: status.to_string(),
+                started_at: now,
+                updated_at: now,
+                detail: serde_json::to_value(&s).unwrap_or(Value::Null),
+            });
+        }
+    }
+
+    // Newest first across kinds so a fresh task lands at the top
+    // regardless of where it came from.
+    items.sort_by_key(|t| std::cmp::Reverse(t.started_at));
+    items
+}
+
+fn now_ms() -> u64 {
+    use std::time::{SystemTime, UNIX_EPOCH};
+    SystemTime::now()
+        .duration_since(UNIX_EPOCH)
+        .map(|d| d.as_millis() as u64)
+        .unwrap_or(0)
+}
+
+/// Parse an RFC-3339 / ISO-8601 timestamp into ms since epoch.
+/// Returns `None` on any parse failure so callers can fall back
+/// cleanly. Used to normalise persisted run-store timestamps onto
+/// the same axis as the in-memory chat / subagent registries.
+fn parse_rfc3339_ms(s: &str) -> Option<u64> {
+    chrono::DateTime::parse_from_rfc3339(s)
+        .ok()
+        .map(|dt| dt.timestamp_millis().max(0) as u64)
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::state::AppState;
+    use std::sync::Arc;
+
+    /// Minimal stub provider; the tasks endpoint never reaches the
+    /// agent so any never-call provider works here.
+    struct StubLlm;
+    #[async_trait::async_trait]
+    impl harness_core::LlmProvider for StubLlm {
+        async fn complete(
+            &self,
+            _: harness_core::ChatRequest,
+        ) -> Result<harness_core::ChatResponse, harness_core::Error> {
+            Err(harness_core::Error::Provider("stub".into()))
+        }
+    }
+
+    fn mk_state() -> AppState {
+        use harness_core::{Agent, AgentConfig};
+        let cfg = AgentConfig::new("stub-model");
+        let agent = Arc::new(Agent::new(Arc::new(StubLlm) as _, cfg));
+        AppState::new(agent)
+    }
+
+    async fn read_json(resp: axum::response::Response) -> serde_json::Value {
+        let bytes = axum::body::to_bytes(resp.into_body(), 1024 * 1024)
+            .await
+            .unwrap();
+        serde_json::from_slice(&bytes).unwrap()
+    }
+
+    #[tokio::test]
+    async fn empty_state_returns_empty_items() {
+        let state = mk_state();
+        let resp = list_tasks(State(state)).await.into_response();
+        let body = read_json(resp).await;
+        assert!(body["items"].as_array().unwrap().is_empty());
+        assert!(body["generated_at"].as_u64().is_some());
+    }
+
+    #[tokio::test]
+    async fn active_chat_run_surfaces() {
+        let state = mk_state();
+        state.chat_runs.start("conv-123");
+        let resp = list_tasks(State(state)).await.into_response();
+        let body = read_json(resp).await;
+        let items = body["items"].as_array().unwrap();
+        assert_eq!(items.len(), 1, "expected 1 task, got: {items:?}");
+        assert_eq!(items[0]["kind"], "chat_run");
+        assert_eq!(items[0]["id"], "conv-123");
+        assert_eq!(items[0]["status"], "running");
+    }
+
+    #[tokio::test]
+    async fn completed_chat_run_does_not_surface() {
+        let state = mk_state();
+        state.chat_runs.start("conv-done");
+        // `event` with a Done event flips to completed.
+        let done = harness_core::AgentEvent::Done {
+            outcome: harness_core::RunOutcome::Stopped { iterations: 1 },
+            conversation: harness_core::Conversation::new(),
+        };
+        state.chat_runs.event(Some("conv-done"), &done);
+        let resp = list_tasks(State(state)).await.into_response();
+        let body = read_json(resp).await;
+        assert!(
+            body["items"].as_array().unwrap().is_empty(),
+            "completed run leaked into tasks: {body}"
+        );
+    }
+}
diff --git a/crates/harness-server/src/work_overview_routes.rs b/crates/harness-server/src/work_overview_routes.rs
index 46836f0..e49c1e1 100644
--- a/crates/harness-server/src/work_overview_routes.rs
+++ b/crates/harness-server/src/work_overview_routes.rs
@@ -33,6 +33,7 @@ use serde_json::{json, Value};
 use tracing::error;
 
 use crate::state::AppState;
+use crate::state_layers::ProjectLayer;
 
 /// Default time window when neither `since` nor `window_days` is set.
 const DEFAULT_WINDOW_DAYS: i64 = 7;
@@ -103,8 +104,8 @@ fn resolve_window(q: &OverviewQuery) -> Result<ResolvedWindow, Response> {
 // --------------------------- Helpers -------------------------------------
 
 #[allow(clippy::result_large_err)]
-fn require_run_store(state: &AppState) -> Result<Arc<dyn RequirementRunStore>, Response> {
-    state.requirement_runs.clone().ok_or_else(|| {
+fn require_run_store(project: &ProjectLayer) -> Result<Arc<dyn RequirementRunStore>, Response> {
+    project.requirement_runs.clone().ok_or_else(|| {
         (
             StatusCode::SERVICE_UNAVAILABLE,
             Json(json!({ "error": "requirement run store not configured" })),
@@ -146,12 +147,12 @@ fn normalise_command(cmd: &str) -> String {
 
 // --------------------------- Overview handler ----------------------------
 
-async fn get_overview(State(state): State<AppState>, Query(q): Query<OverviewQuery>) -> Response {
+async fn get_overview(State(project): State<ProjectLayer>, Query(q): Query<OverviewQuery>) -> Response {
     let window = match resolve_window(&q) {
         Ok(w) => w,
         Err(resp) => return resp,
     };
-    let runs_store = match require_run_store(&state) {
+    let runs_store = match require_run_store(&project) {
         Ok(r) => r,
         Err(resp) => return resp,
     };
@@ -165,7 +166,7 @@ async fn get_overview(State(state): State<AppState>, Query(q): Query<OverviewQue
     };
     let truncated = runs.len() as u32 >= RUN_SCAN_LIMIT;
 
-    let projects: Option<Vec<Project>> = match state.projects.as_ref() {
+    let projects: Option<Vec<Project>> = match project.projects.as_ref() {
         Some(s) => match s.list(false, 500).await {
             Ok(rows) => Some(rows),
             Err(e) => return internal_error(e),
@@ -176,7 +177,7 @@ async fn get_overview(State(state): State<AppState>, Query(q): Query<OverviewQue
         }
     };
 
-    let requirements: Option<Vec<Requirement>> = match (state.requirements.as_ref(), &projects) {
+    let requirements: Option<Vec<Requirement>> = match (project.requirements.as_ref(), &projects) {
         (Some(req_store), Some(projs)) => {
             let mut all = Vec::new();
             for p in projs {
@@ -409,7 +410,7 @@ async fn get_overview(State(state): State<AppState>, Query(q): Query<OverviewQue
 
     // ---- blocked_requirements ------------------------------------------
     let (blocked_requirements, blocked_truncated) = match (
-        state.activities.as_ref(),
+        project.activities.as_ref(),
         requirements.as_ref(),
         projects.as_ref(),
     ) {
@@ -473,7 +474,7 @@ async fn get_overview(State(state): State<AppState>, Query(q): Query<OverviewQue
             (Some(blocked), truncated)
         }
         _ => {
-            if state.activities.is_none() {
+            if project.activities.is_none() {
                 missing_stores.push("activities");
             }
             (None, false)
@@ -506,12 +507,12 @@ async fn get_overview(State(state): State<AppState>, Query(q): Query<OverviewQue
 
 // --------------------------- Quality handler -----------------------------
 
-async fn get_quality(State(state): State<AppState>, Query(q): Query<OverviewQuery>) -> Response {
+async fn get_quality(State(project): State<ProjectLayer>, Query(q): Query<OverviewQuery>) -> Response {
     let window = match resolve_window(&q) {
         Ok(w) => w,
         Err(resp) => return resp,
     };
-    let runs_store = match require_run_store(&state) {
+    let runs_store = match require_run_store(&project) {
         Ok(r) => r,
         Err(resp) => return resp,
     };
diff --git a/crates/harness-server/src/workspace_diff.rs b/crates/harness-server/src/workspace_diff.rs
index 8a3c854..22c7aed 100644
--- a/crates/harness-server/src/workspace_diff.rs
+++ b/crates/harness-server/src/workspace_diff.rs
@@ -36,6 +36,7 @@ use serde_json::{json, Value};
 use tokio::process::Command;
 
 use crate::state::AppState;
+use crate::state_layers::WorkspaceLayer;
 
 /// Default base branch when the client doesn't pin one. Most of our
 /// codebases use `main`; a future enhancement could probe
@@ -183,7 +184,7 @@ fn safe_relative_path(path: &str) -> Result<&str, &'static str> {
 /// be absolute, NUL/newline-free, and resolve via `canonicalize` to an
 /// existing directory; anything else returns `400`.
 #[allow(clippy::result_large_err)]
-fn resolve_workspace(state: &AppState, override_root: Option<&str>) -> Result<PathBuf, Response> {
+fn resolve_workspace(ws: &WorkspaceLayer, override_root: Option<&str>) -> Result<PathBuf, Response> {
     if let Some(raw) = override_root {
         let trimmed = raw.trim();
         if trimmed.is_empty() {
@@ -202,7 +203,7 @@ fn resolve_workspace(state: &AppState, override_root: Option<&str>) -> Result<Pa
         }
         return Ok(canonical);
     }
-    state.workspace_root.clone().ok_or_else(|| {
+    ws.root.clone().ok_or_else(|| {
         (
             StatusCode::SERVICE_UNAVAILABLE,
             Json(json!({ "error": "workspace root not configured" })),
@@ -272,8 +273,8 @@ async fn base_exists(root: &std::path::Path, base: &str) -> bool {
 // GET /v1/workspace/diff
 // ----------------------------------------------------------------------
 
-async fn get_workspace_diff(State(state): State<AppState>, Query(q): Query<DiffQuery>) -> Response {
-    let root = match resolve_workspace(&state, q.root.as_deref()) {
+async fn get_workspace_diff(State(ws): State<WorkspaceLayer>, Query(q): Query<DiffQuery>) -> Response {
+    let root = match resolve_workspace(&ws, q.root.as_deref()) {
         Ok(r) => r,
         Err(r) => return r,
     };
@@ -552,10 +553,10 @@ async fn uncommitted_summary(root: &std::path::Path) -> Value {
 // ----------------------------------------------------------------------
 
 async fn get_workspace_diff_file(
-    State(state): State<AppState>,
+    State(ws): State<WorkspaceLayer>,
     Query(q): Query<FileDiffQuery>,
 ) -> Response {
-    let root = match resolve_workspace(&state, q.root.as_deref()) {
+    let root = match resolve_workspace(&ws, q.root.as_deref()) {
         Ok(r) => r,
         Err(r) => return r,
     };
@@ -634,10 +635,10 @@ struct CommitBody {
 }
 
 async fn post_workspace_commit(
-    State(state): State<AppState>,
+    State(ws): State<WorkspaceLayer>,
     Json(body): Json<CommitBody>,
 ) -> Response {
-    let root = match resolve_workspace(&state, body.root.as_deref()) {
+    let root = match resolve_workspace(&ws, body.root.as_deref()) {
         Ok(r) => r,
         Err(r) => return r,
     };
@@ -738,8 +739,8 @@ async fn post_workspace_commit(
 // GET /v1/workspace/pr/preview
 // ----------------------------------------------------------------------
 
-async fn get_pr_preview(State(state): State<AppState>, Query(q): Query<DiffQuery>) -> Response {
-    let root = match resolve_workspace(&state, q.root.as_deref()) {
+async fn get_pr_preview(State(ws): State<WorkspaceLayer>, Query(q): Query<DiffQuery>) -> Response {
+    let root = match resolve_workspace(&ws, q.root.as_deref()) {
         Ok(r) => r,
         Err(r) => return r,
     };
@@ -877,8 +878,8 @@ fn default_true() -> bool {
     true
 }
 
-async fn post_create_pr(State(state): State<AppState>, Json(body): Json<CreatePrBody>) -> Response {
-    let root = match resolve_workspace(&state, body.root.as_deref()) {
+async fn post_create_pr(State(ws): State<WorkspaceLayer>, Json(body): Json<CreatePrBody>) -> Response {
+    let root = match resolve_workspace(&ws, body.root.as_deref()) {
         Ok(r) => r,
         Err(r) => return r,
     };
diff --git a/crates/harness-server/src/workspace_files.rs b/crates/harness-server/src/workspace_files.rs
index b077fef..ff56c09 100644
--- a/crates/harness-server/src/workspace_files.rs
+++ b/crates/harness-server/src/workspace_files.rs
@@ -32,6 +32,7 @@ use serde_json::json;
 use tokio::fs;
 
 use crate::state::AppState;
+use crate::state_layers::WorkspaceLayer;
 
 /// Hard cap on a single file read. Anything bigger gets truncated
 /// (with a sentinel) so the client doesn't OOM rendering a huge
@@ -101,7 +102,7 @@ fn server_error(msg: impl std::fmt::Display) -> Response {
 /// so this module doesn't reach into a sibling module's privates.
 /// Keeps the security policy explicit at each entry point.
 #[allow(clippy::result_large_err)]
-fn resolve_workspace(state: &AppState, override_root: Option<&str>) -> Result<PathBuf, Response> {
+fn resolve_workspace(ws: &WorkspaceLayer, override_root: Option<&str>) -> Result<PathBuf, Response> {
     if let Some(raw) = override_root {
         let trimmed = raw.trim();
         if trimmed.is_empty() {
@@ -120,7 +121,7 @@ fn resolve_workspace(state: &AppState, override_root: Option<&str>) -> Result<Pa
         }
         return Ok(canonical);
     }
-    state.workspace_root.clone().ok_or_else(|| {
+    ws.root.clone().ok_or_else(|| {
         (
             StatusCode::SERVICE_UNAVAILABLE,
             Json(json!({ "error": "workspace root not configured" })),
@@ -156,8 +157,8 @@ fn safe_relative(rel: &str) -> Result<&str, &'static str> {
 // GET /v1/workspace/list
 // ----------------------------------------------------------------------
 
-async fn list_dir(State(state): State<AppState>, Query(q): Query<ListQuery>) -> Response {
-    let root = match resolve_workspace(&state, q.root.as_deref()) {
+async fn list_dir(State(ws): State<WorkspaceLayer>, Query(q): Query<ListQuery>) -> Response {
+    let root = match resolve_workspace(&ws, q.root.as_deref()) {
         Ok(r) => r,
         Err(r) => return r,
     };
@@ -256,8 +257,8 @@ async fn list_dir(State(state): State<AppState>, Query(q): Query<ListQuery>) ->
 // GET /v1/workspace/read
 // ----------------------------------------------------------------------
 
-async fn read_file(State(state): State<AppState>, Query(q): Query<ReadQuery>) -> Response {
-    let root = match resolve_workspace(&state, q.root.as_deref()) {
+async fn read_file(State(ws): State<WorkspaceLayer>, Query(q): Query<ReadQuery>) -> Response {
+    let root = match resolve_workspace(&ws, q.root.as_deref()) {
         Ok(r) => r,
         Err(r) => return r,
     };
diff --git a/crates/harness-server/src/workspace_find.rs b/crates/harness-server/src/workspace_find.rs
index ae4ef02..2e84064 100644
--- a/crates/harness-server/src/workspace_find.rs
+++ b/crates/harness-server/src/workspace_find.rs
@@ -32,6 +32,7 @@ use serde::Deserialize;
 use serde_json::json;
 
 use crate::state::AppState;
+use crate::state_layers::ConversationLayer;
 
 /// Maximum depth (relative to a search root) the walker explores.
 /// 2 catches `~/Documents/GitHub/<repo>` (depth 1 from the root)
@@ -83,7 +84,7 @@ struct FindQuery {
     name: String,
 }
 
-async fn find_workspace(State(state): State<AppState>, Query(q): Query<FindQuery>) -> Response {
+async fn find_workspace(State(conv): State<ConversationLayer>, Query(q): Query<FindQuery>) -> Response {
     let needle = q.name.trim();
     if needle.is_empty() {
         return bad_request("name parameter is required");
@@ -130,7 +131,7 @@ async fn find_workspace(State(state): State<AppState>, Query(q): Query<FindQuery
     // opened are by definition canonical, so they rank highest.
     let mut seen: HashSet<String> = HashSet::new();
     let mut out: Vec<String> = Vec::new();
-    if let Some(ws) = state.workspaces.as_ref() {
+    if let Some(ws) = conv.workspaces.as_ref() {
         for entry in ws.list_recent() {
             if basename_eq(&entry.path, needle) && seen.insert(entry.path.clone()) {
                 out.push(entry.path);
diff --git a/crates/harness-server/src/workspace_terminal.rs b/crates/harness-server/src/workspace_terminal.rs
index 77b3128..7579d31 100644
--- a/crates/harness-server/src/workspace_terminal.rs
+++ b/crates/harness-server/src/workspace_terminal.rs
@@ -44,6 +44,7 @@ use serde_json::json;
 use tokio::sync::Mutex;
 
 use crate::state::AppState;
+use crate::state_layers::WorkspaceLayer;
 
 pub(crate) fn router() -> Router<AppState> {
     Router::new()
@@ -57,8 +58,8 @@ pub(crate) fn router() -> Router<AppState> {
 /// network error. `available: false` only if no workspace root
 /// resolves; the actual PTY spawn errors are surfaced through the
 /// open WS as a closing frame with a reason byte.
-async fn status(State(state): State<AppState>) -> Response {
-    let available = state.workspace_root.is_some();
+async fn status(State(workspace): State<WorkspaceLayer>) -> Response {
+    let available = workspace.root.is_some();
     Json(json!({
         "available": available,
         "shell": pick_shell(),
@@ -83,7 +84,10 @@ fn bad_request(msg: &str) -> Response {
 }
 
 #[allow(clippy::result_large_err)]
-fn resolve_workspace(state: &AppState, override_root: Option<&str>) -> Result<PathBuf, Response> {
+fn resolve_workspace(
+    workspace: &WorkspaceLayer,
+    override_root: Option<&str>,
+) -> Result<PathBuf, Response> {
     if let Some(raw) = override_root {
         let trimmed = raw.trim();
         if trimmed.is_empty() {
@@ -102,7 +106,7 @@ fn resolve_workspace(state: &AppState, override_root: Option<&str>) -> Result<Pa
         }
         return Ok(canonical);
     }
-    state.workspace_root.clone().ok_or_else(|| {
+    workspace.root.clone().ok_or_else(|| {
         (
             StatusCode::SERVICE_UNAVAILABLE,
             Json(json!({ "error": "workspace root not configured" })),
@@ -113,10 +117,10 @@ fn resolve_workspace(state: &AppState, override_root: Option<&str>) -> Result<Pa
 
 async fn terminal_ws(
     ws: WebSocketUpgrade,
-    State(state): State<AppState>,
+    State(workspace): State<WorkspaceLayer>,
     Query(q): Query<TerminalQuery>,
 ) -> Response {
-    let root = match resolve_workspace(&state, q.root.as_deref()) {
+    let root = match resolve_workspace(&workspace, q.root.as_deref()) {
         Ok(r) => r,
         Err(r) => return r,
     };
diff --git a/crates/harness-skill/src/lib.rs b/crates/harness-skill/src/lib.rs
index 1aea1cd..34a8f05 100644
--- a/crates/harness-skill/src/lib.rs
+++ b/crates/harness-skill/src/lib.rs
@@ -20,11 +20,15 @@
 
 pub mod catalog;
 pub mod manifest;
+pub mod path_match;
 pub mod selector;
 
 pub use catalog::{SkillCatalog, SkillEntry, SkillSource};
 pub use manifest::{parse_skill, SkillActivation, SkillError, SkillManifest};
-pub use selector::{pick_auto_skills, query_token_set, score_skill};
+pub use path_match::{any_glob_matches, glob_matches};
+pub use selector::{
+    pick_auto_skills, pick_path_match_skills, query_token_set, score_skill,
+};
 
 /// Default skills shipped with the binary (`assets/defaults/<name>/SKILL.md`).
 /// Embedded at compile time via [`include_dir!`]. Pass to
diff --git a/crates/harness-skill/src/manifest.rs b/crates/harness-skill/src/manifest.rs
index 7390366..e5623bc 100644
--- a/crates/harness-skill/src/manifest.rs
+++ b/crates/harness-skill/src/manifest.rs
@@ -91,6 +91,22 @@ pub struct SkillManifest {
     /// Free-form version string. Display-only.
     #[serde(default, skip_serializing_if = "Option::is_none")]
     pub version: Option<String>,
+    /// File-path globs that auto-activate this skill when the agent
+    /// touches a matching file in the current session (M3.3). Empty
+    /// / absent disables the path-based trigger. Pattern semantics:
+    ///
+    /// - `*` matches any run of non-`/` characters within one path
+    ///   segment.
+    /// - `**` matches across segments (including zero).
+    /// - `?` matches one non-`/` character.
+    /// - everything else is literal.
+    ///
+    /// Example: `["**/*.tsx", "Cargo.toml"]` triggers when the
+    /// agent edits any `.tsx` anywhere in the workspace or the
+    /// root `Cargo.toml`. Matching is case-sensitive and runs
+    /// against the workspace-relative path.
+    #[serde(default, skip_serializing_if = "Vec::is_empty")]
+    pub paths: Vec<String>,
 }
 
 /// Outcome of parsing a SKILL.md text: structured manifest + the
diff --git a/crates/harness-skill/src/path_match.rs b/crates/harness-skill/src/path_match.rs
new file mode 100644
index 0000000..90c9351
--- /dev/null
+++ b/crates/harness-skill/src/path_match.rs
@@ -0,0 +1,162 @@
+//! Path-glob matcher for the M3.3 skill auto-activation rule.
+//!
+//! Self-contained and dependency-free (no `glob` / `globset` crate
+//! pull-in). The grammar is intentionally tiny — only the patterns
+//! a SKILL.md author would reasonably write:
+//!
+//! - `?`  — one non-`/` character
+//! - `*`  — any run of non-`/` characters within one segment
+//! - `**` — any path fragment, crossing segment boundaries (incl.
+//!   zero segments)
+//! - any other character — literal match (case-sensitive)
+//!
+//! Backslashes in input paths are normalised to forward slashes so
+//! the same pattern works on Windows without authors having to
+//! double-escape.
+//!
+//! Implementation is a small recursive backtracking match over
+//! byte slices; pattern length and path length are both small
+//! (paths bounded by filesystem limits, patterns are user-written
+//! and rarely exceed a few dozen chars), so the worst-case cost of
+//! retrying after each wildcard is noise.
+
+/// Reports whether the glob `pattern` matches `path`. Every `\`
+/// in `path` is rewritten to `/` before matching, so callers can
+/// pass Windows-style paths unchanged. An empty pattern matches
+/// only the empty path; an empty path matches only patterns that
+/// can match nothing (e.g. `**`).
+pub fn glob_matches(pattern: &str, path: &str) -> bool {
+    // Separators are unified up front; the matcher only knows `/`.
+    let normalised = path.replace('\\', "/");
+    matches_at(pattern.as_bytes(), 0, normalised.as_bytes(), 0)
+}
+
+/// Reports whether at least one glob in `patterns` matches `path`.
+/// An empty `patterns` slice never matches.
+pub fn any_glob_matches<S: AsRef<str>>(patterns: &[S], path: &str) -> bool {
+    patterns.iter().map(S::as_ref).any(|glob| glob_matches(glob, path))
+}
+
+/// Recursive backtracking matcher: true when `pat[pi..]` matches all
+/// of `txt[ti..]`. Wildcards retry the rest of the pattern at later
+/// text offsets until one attempt succeeds or the text runs out.
+fn matches_at(pat: &[u8], mut pi: usize, txt: &[u8], mut ti: usize) -> bool {
+    while pi < pat.len() {
+        match pat[pi] {
+            b'*' if pat.get(pi + 1) == Some(&b'*') => {
+                // `**` spans segments and also eats a following `/`, so `**/foo`
+                // matches `foo` and `a/b/foo`. When more pattern follows `**/` it
+                // must resume at a segment start, which rejects `barfoo`.
+                let slash = pat.get(pi + 2) == Some(&b'/');
+                let next = pi + 2 + usize::from(slash);
+                let anchored = slash && next < pat.len();
+                if matches_at(pat, next, txt, ti) {
+                    return true;
+                }
+                while ti < txt.len() {
+                    ti += 1;
+                    if (!anchored || txt[ti - 1] == b'/') && matches_at(pat, next, txt, ti) {
+                        return true;
+                    }
+                }
+                return false;
+            }
+            b'*' => {
+                // `*` — match any run of non-`/` within one segment.
+                let next = pi + 1;
+                loop {
+                    if matches_at(pat, next, txt, ti) {
+                        return true;
+                    }
+                    if ti >= txt.len() || txt[ti] == b'/' {
+                        return false;
+                    }
+                    ti += 1;
+                }
+            }
+            c => {
+                // `?` accepts any one non-`/` byte; all else is literal.
+                let accepted = match txt.get(ti) {
+                    Some(&b) if c == b'?' => b != b'/',
+                    Some(&b) => b == c,
+                    None => false,
+                };
+                if !accepted {
+                    return false;
+                }
+                pi += 1;
+                ti += 1;
+            }
+        }
+    }
+    ti == txt.len()
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn literal_matches() {
+        assert!(glob_matches("Cargo.toml", "Cargo.toml"));
+        assert!(!glob_matches("Cargo.toml", "Cargo.lock"));
+    }
+
+    #[test]
+    fn star_matches_within_segment() {
+        assert!(glob_matches("*.rs", "lib.rs"));
+        assert!(!glob_matches("*.rs", "lib.rs.bak"));
+        assert!(!glob_matches("*.rs", "src/lib.rs"));
+    }
+
+    #[test]
+    fn double_star_crosses_segments() {
+        assert!(glob_matches("**/*.tsx", "App.tsx"));
+        assert!(glob_matches("**/*.tsx", "src/components/App.tsx"));
+        assert!(!glob_matches("**/*.tsx", "App.ts"));
+    }
+
+    #[test]
+    fn double_star_matches_zero_segments() {
+        assert!(glob_matches("**/foo", "foo"));
+        assert!(glob_matches("**/foo", "a/b/foo"));
+        assert!(!glob_matches("**/foo", "foobar"));
+    }
+
+    #[test]
+    fn question_mark_matches_one_char() {
+        assert!(glob_matches("a?c", "abc"));
+        assert!(!glob_matches("a?c", "ac"));
+        assert!(!glob_matches("a?c", "abbc"));
+        // Doesn't cross `/`.
+        assert!(!glob_matches("a?c", "a/c"));
+    }
+
+    #[test]
+    fn segment_in_middle_with_double_star() {
+        assert!(glob_matches("src/**/*.rs", "src/lib.rs"));
+        assert!(glob_matches("src/**/*.rs", "src/a/b/c.rs"));
+        assert!(!glob_matches("src/**/*.rs", "tests/a.rs"));
+    }
+
+    #[test]
+    fn backslashes_are_normalised() {
+        // Author writes the pattern with `/`; matcher accepts a
+        // Windows-style path with `\`.
+        assert!(glob_matches("src/**/*.rs", "src\\foo\\bar.rs"));
+    }
+
+    #[test]
+    fn empty_pattern_matches_only_empty() {
+        assert!(glob_matches("", ""));
+        assert!(!glob_matches("", "x"));
+    }
+
+    #[test]
+    fn any_glob_matches_short_circuits() {
+        let pats = vec!["*.lock".to_string(), "**/*.tsx".to_string()];
+        assert!(any_glob_matches(&pats, "src/App.tsx"));
+        assert!(any_glob_matches(&pats, "Cargo.lock"));
+        assert!(!any_glob_matches(&pats, "src/lib.rs"));
+    }
+}
diff --git a/crates/harness-skill/src/selector.rs b/crates/harness-skill/src/selector.rs
index d97ce72..ad0db17 100644
--- a/crates/harness-skill/src/selector.rs
+++ b/crates/harness-skill/src/selector.rs
@@ -120,6 +120,53 @@ pub fn pick_auto_skills(
     scored.into_iter().take(top_k).map(|(_, n)| n).collect()
 }
 
+/// M3.3 — select skills whose `paths` globs match a recently
+/// touched file.
+///
+/// Complements [`pick_auto_skills`]: that selector scores the
+/// user's message text, while this one looks only at
+/// `recent_paths`, the workspace-relative files the agent has
+/// touched. The caller (typically the WS handler) keeps that list
+/// small and bounded and passes it in at the top of each turn.
+///
+/// Skills named in `manual_active` are skipped so the caller never
+/// gets back a name it is already including. At most `top_k`
+/// names are returned, in catalog iteration order, so one file
+/// edit cannot flood the system prompt.
+pub fn pick_path_match_skills(
+    catalog: &SkillCatalog,
+    recent_paths: &[String],
+    top_k: usize,
+    manual_active: &[String],
+) -> Vec<String> {
+    if top_k == 0 || recent_paths.is_empty() {
+        return Vec::new();
+    }
+    let already_on: HashSet<&str> = manual_active.iter().map(String::as_str).collect();
+    let mut selected = Vec::new();
+    for entry in catalog.entries() {
+        let manifest = &entry.manifest;
+        // Manual-only skills, skills without globs, and skills the
+        // caller already activated are never path-triggered.
+        let eligible = !matches!(manifest.activation, SkillActivation::Manual)
+            && !manifest.paths.is_empty()
+            && !already_on.contains(manifest.name.as_str());
+        if !eligible {
+            continue;
+        }
+        let touched = recent_paths
+            .iter()
+            .any(|path| crate::path_match::any_glob_matches(&manifest.paths, path));
+        if touched {
+            selected.push(manifest.name.clone());
+            if selected.len() >= top_k {
+                break;
+            }
+        }
+    }
+    selected
+}
+
 /// Token set for one query string. Lowercased, alpha-numeric runs
 /// only, stopwords removed. Public so callers that want to score
 /// against the same set multiple times can build it once.
@@ -155,6 +202,16 @@ mod tests {
     use std::path::PathBuf;
 
     fn entry(name: &str, desc: &str, keywords: &[&str], activation: SkillActivation) -> SkillEntry {
+        entry_with_paths(name, desc, keywords, activation, vec![])
+    }
+
+    fn entry_with_paths(
+        name: &str,
+        desc: &str,
+        keywords: &[&str],
+        activation: SkillActivation,
+        paths: Vec<String>,
+    ) -> SkillEntry {
         SkillEntry {
             manifest: SkillManifest {
                 name: name.to_string(),
@@ -164,6 +221,7 @@ mod tests {
                 activation,
                 keywords: keywords.iter().map(|s| s.to_string()).collect(),
                 version: None,
+                paths,
             },
             body: format!("body of {name}"),
             path: PathBuf::from(format!("/dev/{name}")),
@@ -171,6 +229,88 @@ mod tests {
         }
     }
 
+    #[test]
+    fn path_match_picks_skill_with_matching_glob() {
+        let mut cat = SkillCatalog::new();
+        cat.insert(entry_with_paths(
+            "rs-helper",
+            "Helps with Rust files.",
+            &[],
+            SkillActivation::Auto,
+            vec!["**/*.rs".to_string()],
+        ));
+        cat.insert(entry_with_paths(
+            "tsx-helper",
+            "Helps with React.",
+            &[],
+            SkillActivation::Auto,
+            vec!["**/*.tsx".to_string()],
+        ));
+        let picks = pick_path_match_skills(
+            &cat,
+            &["src/lib.rs".to_string()],
+            5,
+            &[],
+        );
+        assert_eq!(picks, vec!["rs-helper".to_string()]);
+    }
+
+    #[test]
+    fn path_match_skips_manual_only_skills() {
+        let mut cat = SkillCatalog::new();
+        cat.insert(entry_with_paths(
+            "manual-only",
+            "x",
+            &[],
+            SkillActivation::Manual,
+            vec!["**/*.rs".to_string()],
+        ));
+        let picks = pick_path_match_skills(&cat, &["lib.rs".to_string()], 5, &[]);
+        assert!(picks.is_empty());
+    }
+
+    #[test]
+    fn path_match_dedupes_against_manual_active() {
+        let mut cat = SkillCatalog::new();
+        cat.insert(entry_with_paths(
+            "rs-helper",
+            "x",
+            &[],
+            SkillActivation::Auto,
+            vec!["**/*.rs".to_string()],
+        ));
+        let picks = pick_path_match_skills(
+            &cat,
+            &["lib.rs".to_string()],
+            5,
+            &["rs-helper".to_string()],
+        );
+        assert!(picks.is_empty(), "manual-active skill should be skipped");
+    }
+
+    #[test]
+    fn path_match_respects_top_k_cap() {
+        let mut cat = SkillCatalog::new();
+        for i in 0..5 {
+            cat.insert(entry_with_paths(
+                &format!("rs-{i}"),
+                "x",
+                &[],
+                SkillActivation::Auto,
+                vec!["**/*.rs".to_string()],
+            ));
+        }
+        let picks = pick_path_match_skills(&cat, &["lib.rs".to_string()], 2, &[]);
+        assert_eq!(picks.len(), 2);
+    }
+
+    #[test]
+    fn path_match_empty_inputs_return_empty() {
+        let cat = SkillCatalog::new();
+        assert!(pick_path_match_skills(&cat, &[], 5, &[]).is_empty());
+        assert!(pick_path_match_skills(&cat, &["lib.rs".to_string()], 0, &[]).is_empty());
+    }
+
     #[test]
     fn scores_zero_for_manual_activation() {
         let q = query_token_set("pdf invoice");
diff --git a/crates/harness-tools/Cargo.toml b/crates/harness-tools/Cargo.toml
index eb6a75e..4ec91ee 100644
--- a/crates/harness-tools/Cargo.toml
+++ b/crates/harness-tools/Cargo.toml
@@ -22,6 +22,7 @@ chrono.workspace = true
 regex.workspace = true
 ignore.workspace = true
 diffy.workspace = true
+blake3.workspace = true
 
 [target.'cfg(unix)'.dependencies]
 libc.workspace = true
diff --git a/crates/harness-tools/src/enter_plan_mode.rs b/crates/harness-tools/src/enter_plan_mode.rs
new file mode 100644
index 0000000..d38de47
--- /dev/null
+++ b/crates/harness-tools/src/enter_plan_mode.rs
@@ -0,0 +1,105 @@
+//! `enter_plan_mode` — agent-initiated entry into Plan Mode.
+//!
+//! Companion to [`crate::exit_plan::ExitPlanTool`]. Without this
+//! tool the only way to enter Plan Mode is via the WS `SetMode`
+//! frame or the CLI flag — i.e. the operator has to click. When
+//! the model itself realises a request is risky / large enough to
+//! warrant a plan-first round, calling `enter_plan_mode` flips the
+//! session into read-only investigation territory until the model
+//! finishes drafting and calls `exit_plan`.
+//!
+//! Wire shape:
+//!
+//! - The tool emits [`harness_core::PermissionMode::Plan`] on the
+//!   shared mode-signal channel via
+//!   [`harness_core::mode_signal::emit`]. The agent loop relays
+//!   that to the transport as
+//!   [`harness_core::AgentEvent::ModeChanged`].
+//! - The transport (today: the WS handler) reacts by updating its
+//!   per-socket mode handle so the *next* user turn's
+//!   `tool_filter` + approver behave like Plan Mode. The current
+//!   turn finishes under the old mode — that's intentional, since
+//!   mid-turn approver swaps are racy.
+//!
+//! Registration: off by default. The composition root opts in via
+//! `BuiltinsConfig::enable_enter_plan_mode`. Most coding deployments
+//! want this on; locked-down "model can never escape its mode"
+//! deployments can leave it off.
+
+use async_trait::async_trait;
+use harness_core::{BoxError, PermissionMode, Tool, ToolCategory};
+use serde_json::{json, Value};
+
+pub struct EnterPlanModeTool;
+
+#[async_trait]
+impl Tool for EnterPlanModeTool {
+    fn name(&self) -> &str {
+        "enter_plan_mode"
+    }
+
+    fn description(&self) -> &str {
+        "Switch the agent into Plan Mode: write/exec/network tools \
+         are hidden, only read-only investigation tools (`fs.read`, \
+         `code.grep`, `git.*`, `workspace.context`, ...) plus \
+         `exit_plan` are exposed. The mode change takes effect on \
+         the **next** user turn, not mid-turn. Call this when a \
+         request is large or risky and you want to draft a plan \
+         before touching anything. End the plan-mode cycle by \
+         calling `exit_plan({plan: \"...\"})` from inside it. No \
+         arguments."
+    }
+
+    fn parameters(&self) -> Value {
+        json!({
+            "type": "object",
+            "additionalProperties": false,
+            "properties": {}
+        })
+    }
+
+    /// Listed as Read so the Plan-Mode tool_filter never accidentally
+    /// hides this tool from a Plan-Mode session that wants to flip
+    /// back into Plan Mode after a refinement (no-op, but harmless).
+    fn category(&self) -> ToolCategory {
+        ToolCategory::Read
+    }
+
+    fn cacheable(&self) -> bool {
+        true
+    }
+
+    async fn invoke(&self, _args: Value) -> Result<String, BoxError> {
+        harness_core::mode_signal::emit(PermissionMode::Plan);
+        Ok("plan mode armed for next turn".to_string())
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[tokio::test]
+    async fn invocation_outside_agent_loop_is_noop_but_returns_ok() {
+        let out = EnterPlanModeTool.invoke(json!({})).await.unwrap();
+        assert!(out.contains("plan mode"));
+    }
+
+    #[tokio::test]
+    async fn invocation_inside_scope_signals_plan_mode() {
+        use tokio::sync::mpsc;
+        let (tx, mut rx) = mpsc::unbounded_channel::<PermissionMode>();
+        harness_core::mode_signal::with_mode_signal(tx, async {
+            EnterPlanModeTool.invoke(json!({})).await.unwrap();
+        })
+        .await;
+        assert_eq!(rx.try_recv().unwrap(), PermissionMode::Plan);
+    }
+
+    #[test]
+    fn is_read_only_and_not_destructive() {
+        assert_eq!(EnterPlanModeTool.category(), ToolCategory::Read);
+        assert!(EnterPlanModeTool.is_concurrency_safe());
+        assert!(!EnterPlanModeTool.is_destructive());
+    }
+}
diff --git a/crates/harness-tools/src/fs.rs b/crates/harness-tools/src/fs.rs
index 58fec93..9b87310 100644
--- a/crates/harness-tools/src/fs.rs
+++ b/crates/harness-tools/src/fs.rs
@@ -20,11 +20,20 @@ fn arg_str<'a>(args: &'a Value, key: &str) -> Result<&'a str, BoxError> {
 /// Read a UTF-8 file under the tool root.
 pub struct FsReadTool {
     root: PathBuf,
+    max_bytes: Option<usize>,
 }
 
 impl FsReadTool {
     pub fn new(root: impl Into<PathBuf>) -> Self {
-        Self { root: root.into() }
+        Self {
+            root: root.into(),
+            max_bytes: None,
+        }
+    }
+
+    pub fn with_max_bytes(mut self, n: usize) -> Self {
+        self.max_bytes = Some(n);
+        self
     }
 }
 
@@ -36,7 +45,8 @@ impl Tool for FsReadTool {
 
     fn description(&self) -> &str {
         "Read a UTF-8 text file located under the tool's root directory. \
-         `path` is relative; `..` and absolute paths are rejected."
+         `path` is relative; `..` and absolute paths are rejected. \
+         Files larger than the configured byte limit are truncated."
     }
 
     fn parameters(&self) -> Value {
@@ -66,6 +76,18 @@ impl Tool for FsReadTool {
         let rel = arg_str(&args, "path")?;
         let abs = resolve_under(&root, rel)?;
         let contents = fs::read_to_string(&abs).await?;
+        harness_core::note_working_file_relative_to(&abs, Some(&root));
+        if let Some(max) = self.max_bytes {
+            if contents.len() > max {
+                let mut idx = max;
+                while idx > 0 && !contents.is_char_boundary(idx) {
+                    idx -= 1;
+                }
+                let mut out = contents[..idx].to_string();
+                out.push_str(&format!("\n\n[... truncated at {} bytes ...]", max));
+                return Ok(out);
+            }
+        }
         Ok(contents)
     }
 }
@@ -121,6 +143,7 @@ impl Tool for FsListTool {
         let root = harness_core::active_workspace_or(&self.root);
         let rel = args.get("path").and_then(Value::as_str).unwrap_or(".");
         let abs = resolve_under(&root, rel)?;
+        harness_core::note_working_file_relative_to(&abs, Some(&root));
         let mut rd = fs::read_dir(&abs).await?;
 
         let mut entries = Vec::new();
@@ -198,6 +221,7 @@ impl Tool for FsWriteTool {
         }
         let bytes = content.len();
         fs::write(&abs, content).await?;
+        harness_core::note_working_file_relative_to(&abs, Some(&root));
         Ok(format!("wrote {bytes} bytes to {}", abs.display()))
     }
 }
@@ -292,6 +316,7 @@ impl Tool for FsEditTool {
         };
 
         fs::write(&abs, &updated).await?;
+        harness_core::note_working_file_relative_to(&abs, Some(&root));
         let replaced = if replace_all { count } else { 1 };
         Ok(format!(
             "edited {}: replaced {replaced} occurrence(s)",
@@ -305,6 +330,57 @@ mod tests {
     use super::*;
     use tempfile::tempdir;
 
+    /// Runs write → read → edit → list inside a working-context scope and
+    /// checks that the touched paths show up in the snapshot's
+    /// `recent_files`.
+    #[tokio::test]
+    async fn fs_tools_record_into_working_context() {
+        use harness_core::{with_working_context, working_context_snapshot};
+        let dir = tempdir().unwrap();
+        let write = FsWriteTool::new(dir.path());
+        let read = FsReadTool::new(dir.path());
+        let edit = FsEditTool::new(dir.path());
+        let list = FsListTool::new(dir.path());
+
+        // Pre-create the nested dir so `list` targets a non-root path
+        // — `list(".")` resolves to the workspace root which strips to
+        // an empty path and gets dropped, which is intentional.
+        std::fs::create_dir_all(dir.path().join("sub")).unwrap();
+
+        with_working_context(async {
+            write
+                .invoke(json!({ "path": "sub/a.txt", "content": "hello" }))
+                .await
+                .unwrap();
+            read.invoke(json!({ "path": "sub/a.txt" })).await.unwrap();
+            edit.invoke(json!({
+                "path": "sub/a.txt",
+                "old_string": "hello",
+                "new_string": "world"
+            }))
+            .await
+            .unwrap();
+            list.invoke(json!({ "path": "sub" })).await.unwrap();
+
+            let snap = working_context_snapshot().expect("scope is active");
+            let paths: Vec<_> = snap
+                .recent_files
+                .iter()
+                .map(|p| p.display().to_string())
+                .collect();
+            // Intended tracker state: `sub/a.txt` once (write/read/edit
+            // collapse to one entry) and `sub` once (from list), with
+            // `sub` newest. NOTE(review): the assertions below only
+            // check presence — dedup and ordering are not verified here.
+            assert!(
+                paths.iter().any(|p| p.ends_with("sub/a.txt")
+                    || p.ends_with("sub\\a.txt")),
+                "expected sub/a.txt recorded, got: {paths:?}"
+            );
+            assert!(
+                paths.iter().any(|p| p == "sub"),
+                "expected sub recorded, got: {paths:?}"
+            );
+        })
+        .await;
+    }
+
     #[tokio::test]
     async fn read_write_roundtrip() {
         let dir = tempdir().unwrap();
@@ -322,6 +398,40 @@ mod tests {
         assert_eq!(got, "world");
     }
 
+    /// A 100-byte ASCII file read through a 10-byte cap must come back as
+    /// exactly the first 10 bytes followed by the truncation marker.
+    #[tokio::test]
+    async fn read_truncates_large_files() {
+        let dir = tempdir().unwrap();
+        let write = FsWriteTool::new(dir.path());
+        let read = FsReadTool::new(dir.path()).with_max_bytes(10);
+
+        let long = "a".repeat(100);
+        write
+            .invoke(json!({ "path": "big.txt", "content": long }))
+            .await
+            .unwrap();
+        let got = read.invoke(json!({ "path": "big.txt" })).await.unwrap();
+        // Compare the whole string: a prefix + `contains` check would
+        // still pass if more than 10 bytes survived ahead of the marker.
+        let expected = format!("{}\n\n[... truncated at 10 bytes ...]", "a".repeat(10));
+        assert_eq!(got, expected, "should keep exactly the first 10 bytes");
+    }
+
+    /// A byte cap that lands inside a multi-byte character must back up
+    /// to the previous char boundary instead of slicing mid-character.
+    #[tokio::test]
+    async fn read_truncates_at_char_boundary() {
+        let dir = tempdir().unwrap();
+        let write = FsWriteTool::new(dir.path());
+        let read = FsReadTool::new(dir.path()).with_max_bytes(6);
+
+        // "hello世界" — '世' occupies bytes 5..8, so a cap of 6 falls inside
+        // it and truncation must back up to byte 5. (A cap of 5 would
+        // already sit on a boundary and never exercise the back-up loop.)
+        write
+            .invoke(json!({ "path": "utf8.txt", "content": "hello世界" }))
+            .await
+            .unwrap();
+        let got = read.invoke(json!({ "path": "utf8.txt" })).await.unwrap();
+        assert_eq!(got, "hello\n\n[... truncated at 6 bytes ...]");
+    }
+
     #[tokio::test]
     async fn list_contains_written_file() {
         let dir = tempdir().unwrap();
diff --git a/crates/harness-tools/src/grep.rs b/crates/harness-tools/src/grep.rs
index a7f0d40..48f46c6 100644
--- a/crates/harness-tools/src/grep.rs
+++ b/crates/harness-tools/src/grep.rs
@@ -114,6 +114,10 @@ impl Tool for CodeGrepTool {
             .get("pattern")
             .and_then(Value::as_str)
             .ok_or_else(|| -> BoxError { "missing `pattern` argument".into() })?;
+        // Record into WorkingContext: prefix with `grep ` so the
+        // post-compaction reinjection block distinguishes search
+        // patterns from shell commands at a glance.
+        harness_core::note_working_command(format!("grep {pattern}"));
 
         let case_insensitive = args
             .get("case_insensitive")
diff --git a/crates/harness-tools/src/lib.rs b/crates/harness-tools/src/lib.rs
index 68fe8a0..160a709 100644
--- a/crates/harness-tools/src/lib.rs
+++ b/crates/harness-tools/src/lib.rs
@@ -17,12 +17,18 @@ pub mod claude_code;
 pub mod codex;
 pub mod doc;
 pub mod echo;
+pub mod enter_plan_mode;
 pub mod exit_plan;
 pub mod fs;
 pub mod git;
 pub mod grep;
 pub mod harness_health;
 pub mod http;
+pub mod memory;
+pub mod memory_icloud;
+pub mod memory_include;
+pub mod memory_include_tools;
+pub mod memory_sync;
 pub mod patch;
 pub mod plan;
 pub mod project;
@@ -44,6 +50,7 @@ pub use doc::{
     DocSearchTool, DocUpdateTool, DocUpsertTool,
 };
 pub use echo::EchoTool;
+pub use enter_plan_mode::EnterPlanModeTool;
 pub use exit_plan::ExitPlanTool;
 pub use fs::{FsEditTool, FsListTool, FsReadTool, FsWriteTool};
 pub use git::{
@@ -52,6 +59,17 @@ pub use git::{
 pub use grep::CodeGrepTool;
 pub use harness_health::HarnessHealthTool;
 pub use http::HttpFetchTool;
+pub use memory::{
+    MemoryDeleteTool, MemoryListTool, MemoryReadTool, MemoryRoots, MemoryScope, MemoryWriteTool,
+};
+pub use memory_include_tools::{
+    MemoryIncludeAddTool, MemoryIncludeListTool, MemoryIncludeRefreshTool,
+    MemoryIncludeRemoveTool,
+};
+pub use memory_sync::{
+    icloud_memory_root, MemoryICloudSetupTool, MemorySyncBackend, MemorySyncSetupTool,
+    MemorySyncStatusTool, MemorySyncTool,
+};
 pub use patch::FsPatchTool;
 pub use plan::PlanUpdateTool;
 pub use project::{
@@ -84,6 +102,10 @@ pub struct BuiltinsConfig {
     /// Cap on response body size (in bytes) for `http.fetch`. Responses
     /// larger than this are truncated with a trailing marker.
     pub http_max_bytes: usize,
+    /// Cap on file size (in bytes) for `fs.read`. Files larger than this
+    /// are truncated with a trailing marker so a single `fs.read` can't
+    /// blow the LLM context window.
+    pub fs_max_bytes: usize,
     /// Whether to register `fs.write`. Defaults to `false` because writes
     /// are a destructive primitive.
     pub enable_fs_write: bool,
@@ -178,6 +200,48 @@ pub struct BuiltinsConfig {
     /// [`Self::enable_codex_run`]; see
     /// [`docs/proposals/claude-code-subagent.zh-CN.md`].
     pub enable_claude_code_run: bool,
+    /// Whether to register `enter_plan_mode`. Off by default — when
+    /// the operator never wants the model to escape into a different
+    /// mode on its own, leaving this off keeps Plan-Mode entry
+    /// strictly operator-driven (CLI flag / WS `SetMode` frame).
+    /// Coding deployments typically want this on so the model can
+    /// volunteer "let me draft a plan first" for risky changes.
+    pub enable_enter_plan_mode: bool,
+    /// Whether to register the `memory.*` tools (M3.1). When
+    /// enabled, the agent can persist project-scoped notes under
+    /// `<workspace>/.jarvis/memory/` and the system prompt picks up
+    /// the index on every new conversation. Off by default —
+    /// memory is a long-term storage primitive whose value depends
+    /// on the operator actively wanting an agent-maintained memo
+    /// system. See [`crate::memory`].
+    pub enable_memory: bool,
+    /// Root for **user-scope** memory (P9). When `Some(p)`, the
+    /// `memory.*` tools also accept `scope: "user"` and persist
+    /// under `<p>/.jarvis/memory/` — typically the operator's home
+    /// directory so the same notes follow them across workspaces.
+    /// `None` (default) means user scope is disabled: writes to
+    /// `scope:"user"` error cleanly and the system-prompt injection
+    /// omits the user index. Has no effect unless `enable_memory`
+    /// is also set: the tools have to be on for this to matter.
+    pub memory_user_root: Option<PathBuf>,
+    /// Whether to register the P10 git-sync tools
+    /// (`memory.sync`, `memory.sync_status`). When enabled, the
+    /// agent can pull/push the memory tree against a remote git
+    /// repo so notes flow between machines / teammates without a
+    /// custom sync server. Off by default — opting in means the
+    /// host has `git` on `PATH` and the operator has thought
+    /// about which remote to use. Requires `enable_memory` to
+    /// matter (the underlying tree only exists when the memory
+    /// tools are registered).
+    pub enable_memory_sync: bool,
+    /// P13 — which sync transport to register. Mutually exclusive
+    /// with the other backends because the model would get
+    /// confused if both `git` and `iCloud` setup tools were on at
+    /// the same time. Defaults to `None`; serve.rs translates the
+    /// legacy `enable_memory_sync == true` into `Git` for
+    /// backwards compatibility, but the explicit env /
+    /// `[agent].memory_sync_backend` config wins.
+    pub memory_sync_backend: MemorySyncBackend,
 }
 
 impl Default for BuiltinsConfig {
@@ -185,6 +249,7 @@ impl Default for BuiltinsConfig {
         Self {
             fs_root: PathBuf::from("."),
             http_max_bytes: 256 * 1024,
+            fs_max_bytes: 256 * 1024,
             enable_fs_write: false,
             enable_fs_edit: false,
             enable_fs_patch: false,
@@ -202,6 +267,11 @@ impl Default for BuiltinsConfig {
             channel_dispatcher: None,
             enable_codex_run: false,
             enable_claude_code_run: false,
+            enable_enter_plan_mode: false,
+            enable_memory: false,
+            memory_user_root: None,
+            enable_memory_sync: false,
+            memory_sync_backend: MemorySyncBackend::None,
         }
     }
 }
@@ -218,7 +288,7 @@ pub fn register_builtins(registry: &mut ToolRegistry, cfg: BuiltinsConfig) {
     registry.register(EchoTool);
     registry.register(TimeNowTool);
     registry.register(HttpFetchTool::new(cfg.http_max_bytes));
-    registry.register(FsReadTool::new(root.clone()));
+    registry.register(FsReadTool::new(root.clone()).with_max_bytes(cfg.fs_max_bytes));
     registry.register(FsListTool::new(root.clone()));
     registry.register(CodeGrepTool::new(root.clone()));
     registry.register(WorkspaceContextTool::new(root.clone()));
@@ -232,6 +302,53 @@ pub fn register_builtins(registry: &mut ToolRegistry, cfg: BuiltinsConfig) {
     // means the Plan-Mode tool filter doesn't have to mutate the
     // registry to enable it — much simpler than per-mode registration.
     registry.register(ExitPlanTool);
+    if cfg.enable_enter_plan_mode {
+        registry.register(EnterPlanModeTool);
+    }
+    if cfg.enable_memory {
+        let mut mem_roots = MemoryRoots::new(root.clone());
+        if let Some(user_root) = cfg.memory_user_root.clone() {
+            mem_roots = mem_roots.with_user_root(user_root);
+        }
+        registry.register(MemoryListTool::new(mem_roots.clone()));
+        registry.register(MemoryReadTool::new(mem_roots.clone()));
+        registry.register(MemoryWriteTool::new(mem_roots.clone()));
+        registry.register(MemoryDeleteTool::new(mem_roots.clone()));
+        // P16: include directive management. Always-on alongside
+        // the memory tools — there's no reason to ship include
+        // resolution at the prompt level but hide the tools that
+        // edit them.
+        registry.register(MemoryIncludeAddTool::new(mem_roots.clone()));
+        registry.register(MemoryIncludeListTool::new(mem_roots.clone()));
+        registry.register(MemoryIncludeRemoveTool::new(mem_roots.clone()));
+        registry.register(MemoryIncludeRefreshTool);
+        // Backend resolution: the explicit `memory_sync_backend`
+        // wins; falling back to the legacy `enable_memory_sync`
+        // boolean keeps existing setups working without churn.
+        let backend = match cfg.memory_sync_backend {
+            MemorySyncBackend::None if cfg.enable_memory_sync => MemorySyncBackend::Git,
+            other => other,
+        };
+        match backend {
+            MemorySyncBackend::None => {}
+            MemorySyncBackend::Git => {
+                registry.register(MemorySyncTool::new(mem_roots.clone()));
+                registry.register(MemorySyncStatusTool::new(mem_roots.clone()));
+                registry.register(MemorySyncSetupTool::new(mem_roots));
+            }
+            MemorySyncBackend::ICloud => {
+                // iCloud surface = setup helper + status only.
+                // The git pull/push tools are intentionally not
+                // registered: iCloud Drive does the sync at OS
+                // level, so a `memory.sync` call would be a
+                // no-op that misleads the model.
+                registry.register(crate::memory_sync::MemoryICloudSetupTool::new(
+                    mem_roots.clone(),
+                ));
+                registry.register(MemorySyncStatusTool::new(mem_roots));
+            }
+        }
+    }
     if cfg.enable_fs_write {
         registry.register(FsWriteTool::new(root.clone()));
     }
diff --git a/crates/harness-tools/src/memory.rs b/crates/harness-tools/src/memory.rs
new file mode 100644
index 0000000..c443974
--- /dev/null
+++ b/crates/harness-tools/src/memory.rs
@@ -0,0 +1,953 @@
+//! `memory.*` agent-maintained memory tools (M3.1 + P9).
+//!
+//! The model can write durable notes ("user prefers Rust + tokio",
+//! "the auth flow rejects empty user-agent strings", etc.) into one
+//! of two scopes:
+//!
+//! - **workspace** scope — facts that are specific to the current
+//!   project. Stored under `<workspace>/.jarvis/memory/`. Checking
+//!   the directory into git gives the rest of the team shared
+//!   recall of the codebase's quirks.
+//! - **user** scope — facts that follow the operator across
+//!   projects (preferences, recurring style choices, personal
+//!   shortcuts). Stored under `~/.jarvis/memory/`. Syncing the
+//!   home directory via Dropbox / iCloud / a personal git repo
+//!   makes the same notes available on every machine without a
+//!   Jarvis-specific sync server.
+//!
+//! Each scope has its own `MEMORY.md` index plus one `<slug>.md`
+//! per topic. The agent's system prompt injects both indices at
+//! conversation start (with `=== project memory index ===` and
+//! `=== user memory index ===` headers) so the model wakes up
+//! knowing what's recorded on each side.
+//!
+//! P9 wire layout:
+//!
+//! ```text
+//! ~/.jarvis/memory/                       # user-scope (cross-workspace)
+//!   MEMORY.md
+//!   <slug>.md
+//!
+//! <workspace>/.jarvis/memory/             # workspace-scope (project)
+//!   MEMORY.md
+//!   <slug>.md
+//! ```
+//!
+//! Slug collisions across scopes are allowed — the two scopes are
+//! independent file trees. `memory.read` defaults to workspace and
+//! falls back to user when the slug isn't found in workspace; an
+//! explicit `scope` argument disambiguates.
+//!
+//! Off by default — opt in via [`crate::BuiltinsConfig::enable_memory`].
+//!
+//! Safety caps:
+//! - Slug must match `[A-Za-z0-9._-]{1,64}` with no leading `.` — no
+//!   path separators or shell metacharacters; the slug `memory` (any
+//!   case) is reserved so writes can't clobber `MEMORY.md`.
+//! - Per-entry body capped at [`MAX_ENTRY_BYTES`].
+//! - Index capped at [`MAX_INDEX_BYTES`] / [`MAX_INDEX_LINES`].
+//! - Writes are atomic (temp-rename) so a crashed agent can't leave
+//!   a half-written MEMORY.md.
+
+use std::path::{Path, PathBuf};
+
+use async_trait::async_trait;
+use harness_core::{BoxError, Tool, ToolCategory};
+use serde_json::{json, Value};
+use tokio::fs;
+
+/// Per-entry body cap. Generous compared to a typical memory note
+/// (a paragraph or two) but small enough that one bad write can't
+/// blow up the system-prompt injection budget.
+pub const MAX_ENTRY_BYTES: usize = 32 * 1024;
+/// Index file (MEMORY.md) cap. The whole index is injected into the
+/// system prompt at conversation start — 25 KiB is the same budget
+/// used by `load_instructions` for CLAUDE.md / AGENTS.md.
+pub const MAX_INDEX_BYTES: usize = 25 * 1024;
+/// Hard cap on index lines so a runaway `memory.write` loop can't
+/// fill MEMORY.md with thousands of one-line entries. 200 leaves
+/// generous headroom for a real project's memory map without
+/// inviting an unbounded list.
+pub const MAX_INDEX_LINES: usize = 200;
+
+/// Subdirectory under the workspace / user-home root where memory
+/// lives. Same name in both scopes so a glance at `tree` reveals the
+/// layout consistently.
+pub const MEMORY_DIR: &str = ".jarvis/memory";
+/// File name of the per-scope index; [`index_path`] joins it under
+/// [`MEMORY_DIR`].
+const INDEX_FILE: &str = "MEMORY.md";
+
+/// Selects which of the two memory trees an operation addresses.
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub enum MemoryScope {
+    /// `<workspace>/.jarvis/memory/`. Project-specific facts.
+    Workspace,
+    /// `<user_home>/.jarvis/memory/`. Cross-workspace facts.
+    User,
+}
+
+impl MemoryScope {
+    /// Every scope, in declaration order; [`Self::from_wire`] searches it.
+    const ALL: [MemoryScope; 2] = [MemoryScope::Workspace, MemoryScope::User];
+
+    /// The lowercase string used for this scope in tool arguments.
+    pub fn as_wire(&self) -> &'static str {
+        match *self {
+            Self::Workspace => "workspace",
+            Self::User => "user",
+        }
+    }
+
+    /// Inverse of [`Self::as_wire`]. Matching is exact (case-sensitive);
+    /// any other input yields `None`.
+    pub fn from_wire(s: &str) -> Option<Self> {
+        Self::ALL.iter().copied().find(|scope| scope.as_wire() == s)
+    }
+}
+
+/// Parent directories for the two memory scopes. Each root is the
+/// directory that *contains* `.jarvis/memory/`. `user_root` is
+/// optional: when it is `None`, [`MemoryRoots::root_for`] reports
+/// user scope as not configured.
+#[derive(Debug, Clone, Default)]
+pub struct MemoryRoots {
+    pub workspace_root: PathBuf,
+    pub user_root: Option<PathBuf>,
+}
+
+impl MemoryRoots {
+    /// Start with a workspace root only; user scope stays disabled.
+    pub fn new(workspace_root: impl Into<PathBuf>) -> Self {
+        let workspace_root = workspace_root.into();
+        Self {
+            workspace_root,
+            user_root: None,
+        }
+    }
+
+    /// Builder-style setter that enables user scope under `root`.
+    pub fn with_user_root(self, root: impl Into<PathBuf>) -> Self {
+        Self {
+            user_root: Some(root.into()),
+            ..self
+        }
+    }
+
+    /// Borrow the parent path configured for `scope`.
+    ///
+    /// # Errors
+    /// Returns a user-facing error when `scope` is
+    /// [`MemoryScope::User`] and no user root was configured.
+    pub fn root_for(&self, scope: MemoryScope) -> Result<&Path, BoxError> {
+        match scope {
+            MemoryScope::Workspace => Ok(&self.workspace_root),
+            MemoryScope::User => match &self.user_root {
+                Some(user_root) => Ok(user_root.as_path()),
+                None => Err("user-scope memory is not configured".into()),
+            },
+        }
+    }
+}
+
+/// Path of the `MEMORY.md` index for the memory tree under `root`.
+pub fn index_path(root: &Path) -> PathBuf {
+    let mut path = root.join(MEMORY_DIR);
+    path.push(INDEX_FILE);
+    path
+}
+
+/// Path of the `<slug>.md` body file for the memory tree under
+/// `root`. Performs no validation — run `validate_slug` on the slug
+/// before calling this.
+fn entry_path(root: &Path, slug: &str) -> PathBuf {
+    let file_name = format!("{slug}.md");
+    let mut path = root.join(MEMORY_DIR);
+    path.push(file_name);
+    path
+}
+
+/// Check that `slug` is safe to use as a file stem and index anchor.
+///
+/// Rules, checked in this order: non-empty; at most 64 bytes; not the
+/// reserved word `memory` (ASCII case-insensitive); no leading `.`;
+/// every character in `A-Za-z0-9._-`.
+///
+/// # Errors
+/// Returns a user-facing message naming the first rule that failed.
+pub fn validate_slug(slug: &str) -> Result<(), BoxError> {
+    if slug.is_empty() {
+        return Err("slug must not be empty".into());
+    }
+    if slug.len() > 64 {
+        return Err("slug must be 64 chars or fewer".into());
+    }
+    if slug.eq_ignore_ascii_case("memory") {
+        return Err("slug `memory` is reserved (clashes with MEMORY.md)".into());
+    }
+    if slug.starts_with('.') {
+        return Err("slug must not start with `.`".into());
+    }
+    let allowed = |c: char| c.is_ascii_alphanumeric() || matches!(c, '-' | '_' | '.');
+    match slug.chars().find(|&c| !allowed(c)) {
+        Some(c) => {
+            Err(format!("slug contains invalid char `{c}` (allowed: A-Za-z0-9._-)").into())
+        }
+        None => Ok(()),
+    }
+}
+
+/// Load `MEMORY.md` for the memory tree under `root`.
+///
+/// Returns `Ok(None)` when the file does not exist, so "nothing
+/// written yet" is not reported as an error. Any other I/O failure
+/// becomes an `Err` that names the path.
+///
+/// Before reading, the memory directory is handed to
+/// `memory_icloud::ensure_materialised`; its result is deliberately
+/// ignored (best-effort), so a failure there only surfaces if the
+/// subsequent read fails too.
+pub async fn read_index(root: &Path) -> Result<Option<String>, BoxError> {
+    let memory_dir = root.join(MEMORY_DIR);
+    let _ = crate::memory_icloud::ensure_materialised(memory_dir.as_path()).await;
+    let path = memory_dir.join(INDEX_FILE);
+    match fs::read_to_string(&path).await {
+        Ok(text) => Ok(Some(text)),
+        Err(err) => {
+            if err.kind() == std::io::ErrorKind::NotFound {
+                Ok(None)
+            } else {
+                Err(format!("read {}: {err}", path.display()).into())
+            }
+        }
+    }
+}
+
+/// True when the *last* markdown link on `line` points at `<slug>.md`.
+///
+/// Index lines have the shape `- [<summary>](<slug>.md)`. Only the
+/// final `](`…`)` is inspected, so a link that merely appears inside
+/// another entry's summary (e.g. `- [see [x](foo.md)](bar.md)`) is
+/// not mistaken for the `foo` entry. Text after the link is tolerated.
+fn index_line_targets(line: &str, slug: &str) -> bool {
+    line.rfind("](")
+        // `](` is two ASCII bytes, so `at + 2` is always a char boundary.
+        .and_then(|at| line[at + 2..].strip_prefix(slug))
+        .map_or(false, |rest| rest.starts_with(".md)"))
+}
+
+/// Append-or-update one entry's line in MEMORY.md. The line shape
+/// is `- [<summary>](<slug>.md)` — a normal markdown list link the
+/// model can read back.
+///
+/// If `slug` already has a line, the first one is replaced in place
+/// and any further duplicates are dropped, so re-writing a topic
+/// never grows the index. Otherwise the new line is appended. Empty
+/// leading/trailing lines are trimmed and the result always ends with
+/// exactly one `\n`.
+fn merge_index_line(existing: Option<&str>, slug: &str, summary: &str) -> String {
+    let new_line = format!("- [{summary}]({slug}.md)");
+    let mut out: Vec<&str> = Vec::new();
+    let mut replaced = false;
+    for line in existing.unwrap_or_default().lines() {
+        if index_line_targets(line, slug) {
+            // Keep the entry at its original position; collapse duplicates.
+            if !replaced {
+                out.push(new_line.as_str());
+                replaced = true;
+            }
+        } else {
+            out.push(line);
+        }
+    }
+    if !replaced {
+        out.push(new_line.as_str());
+    }
+    // `out` always holds `new_line`, which is non-empty, so both bounds
+    // exist; the fallbacks only keep the slice arithmetic total.
+    let start = out.iter().position(|l| !l.is_empty()).unwrap_or(out.len());
+    let end = out
+        .iter()
+        .rposition(|l| !l.is_empty())
+        .map_or(start, |last| last + 1);
+    out[start..end].join("\n") + "\n"
+}
+
+/// Remove every index line whose link target is `<slug>.md`.
+///
+/// Returns the remaining index text and `true` when at least one line
+/// was removed (i.e. the slug had an entry). A non-empty result always
+/// ends with `\n`.
+fn remove_index_line(existing: &str, slug: &str) -> (String, bool) {
+    let kept: Vec<&str> = existing
+        .lines()
+        .filter(|line| !index_line_targets(line, slug))
+        .collect();
+    let removed = kept.len() < existing.lines().count();
+    let mut joined = kept.join("\n");
+    if !joined.is_empty() && !joined.ends_with('\n') {
+        joined.push('\n');
+    }
+    (joined, removed)
+}
+
+/// Atomic write: temp file in the same directory + rename. Avoids
+/// torn writes if the agent dies mid-write.
+///
+/// The parent directory is created if missing. The temp file name is
+/// `path` with its extension swapped for `tmp`, so two concurrent
+/// writers targeting the same `path` share one temp name.
+///
+/// # Errors
+/// Returns a message naming the failing step (`mkdir`, `write`,
+/// `rename`) and path. If the write or rename fails, the temp file is
+/// removed on a best-effort basis so failed attempts don't litter the
+/// memory directory.
+async fn atomic_write(path: &Path, contents: &str) -> Result<(), BoxError> {
+    if let Some(parent) = path.parent() {
+        fs::create_dir_all(parent)
+            .await
+            .map_err(|e| -> BoxError { format!("mkdir {}: {e}", parent.display()).into() })?;
+    }
+    let tmp = path.with_extension("tmp");
+    if let Err(e) = fs::write(&tmp, contents).await {
+        // A partial temp file may exist; ignore cleanup errors and
+        // report the original failure.
+        let _ = fs::remove_file(&tmp).await;
+        return Err(format!("write {}: {e}", tmp.display()).into());
+    }
+    if let Err(e) = fs::rename(&tmp, path).await {
+        // The destination is untouched; drop the orphaned temp file.
+        let _ = fs::remove_file(&tmp).await;
+        return Err(format!("rename {}: {e}", path.display()).into());
+    }
+    Ok(())
+}
+
+// ----- tools -----
+
+/// `memory.list` — read-only tool that renders the memory indices.
+pub struct MemoryListTool {
+    roots: MemoryRoots,
+}
+impl MemoryListTool {
+    /// Build the tool over the configured scope roots.
+    pub fn new(roots: MemoryRoots) -> Self {
+        Self { roots }
+    }
+}
+
+#[async_trait]
+impl Tool for MemoryListTool {
+    fn name(&self) -> &str {
+        "memory.list"
+    }
+    fn description(&self) -> &str {
+        "List the agent's memory indices. With no arguments, returns \
+         a combined view of both scopes (workspace + user, each \
+         under its own heading). Pass `scope: \"workspace\"` or \
+         `scope: \"user\"` to get just one. Use `memory.read(slug, \
+         scope?)` to fetch a specific entry's body. Empty scopes \
+         show a placeholder so callers can distinguish 'not yet \
+         written' from 'not configured'."
+    }
+    fn parameters(&self) -> Value {
+        json!({
+            "type": "object",
+            "additionalProperties": false,
+            "properties": {
+                "scope": {
+                    "type": "string",
+                    "enum": ["workspace", "user"],
+                    "description": "Optional — restrict to one scope. Omit to see both."
+                }
+            }
+        })
+    }
+    fn category(&self) -> ToolCategory {
+        ToolCategory::Read
+    }
+    /// Render one or both indices. The workspace root is resolved per
+    /// call via `active_workspace_or`, with the root given at
+    /// construction as the fallback. An unrecognised `scope` string is
+    /// an error; a missing one means "both".
+    async fn invoke(&self, args: Value) -> Result<String, BoxError> {
+        let roots = MemoryRoots {
+            workspace_root: harness_core::active_workspace_or(&self.roots.workspace_root),
+            user_root: self.roots.user_root.clone(),
+        };
+        let only = args
+            .get("scope")
+            .and_then(Value::as_str)
+            .map(parse_scope_arg)
+            .transpose()?;
+        let rendered = render_combined_list(&roots, only).await;
+        Ok(rendered)
+    }
+}
+
+/// Render the combined list output for `memory.list`. Pure render
+/// helper so the system-prompt injection path (which doesn't go
+/// through tool dispatch) can call it directly.
+///
+/// `only` restricts the output to one scope; `None` renders workspace
+/// then user. Scopes whose root is not configured are skipped without
+/// a heading. Each rendered scope gets a `##` heading followed by its
+/// index body, `(no entries yet)` when the index is missing or blank,
+/// or `(index unreadable: …)` when reading it failed — so an I/O
+/// problem is not mistaken for an empty memory. If nothing was
+/// rendered at all the result is `(no memory entries yet)`.
+pub async fn render_combined_list(
+    roots: &MemoryRoots,
+    only: Option<MemoryScope>,
+) -> String {
+    let mut out = String::new();
+    let scopes: &[MemoryScope] = match only {
+        Some(MemoryScope::Workspace) => &[MemoryScope::Workspace],
+        Some(MemoryScope::User) => &[MemoryScope::User],
+        None => &[MemoryScope::Workspace, MemoryScope::User],
+    };
+    for &scope in scopes {
+        // Unconfigured scope (user root unset): leave it out entirely.
+        let Ok(root) = roots.root_for(scope) else {
+            continue;
+        };
+        let header = match scope {
+            MemoryScope::Workspace => "## project memory (workspace scope)",
+            MemoryScope::User => "## user memory (cross-workspace)",
+        };
+        if !out.is_empty() {
+            out.push_str("\n\n");
+        }
+        out.push_str(header);
+        out.push('\n');
+        match read_index(root).await {
+            Ok(Some(body)) if !body.trim().is_empty() => out.push_str(body.trim_end()),
+            Ok(_) => out.push_str("(no entries yet)"),
+            // Surface the failure instead of pretending the scope is empty.
+            Err(e) => out.push_str(&format!("(index unreadable: {e})")),
+        }
+    }
+    if out.is_empty() {
+        "(no memory entries yet)".to_string()
+    } else {
+        out
+    }
+}
+
+/// Turn a `scope` tool argument into a [`MemoryScope`], producing a
+/// user-facing error that lists the accepted values when it does not
+/// match.
+fn parse_scope_arg(s: &str) -> Result<MemoryScope, BoxError> {
+    match MemoryScope::from_wire(s) {
+        Some(scope) => Ok(scope),
+        None => Err(format!("unknown scope `{s}` — use `workspace` or `user`").into()),
+    }
+}
+
+/// `memory.read` — read-only tool that returns one entry's body.
+pub struct MemoryReadTool {
+    roots: MemoryRoots,
+}
+impl MemoryReadTool {
+    /// Build the tool over the configured scope roots.
+    pub fn new(roots: MemoryRoots) -> Self {
+        Self { roots }
+    }
+}
+
+#[async_trait]
+impl Tool for MemoryReadTool {
+    fn name(&self) -> &str {
+        "memory.read"
+    }
+    fn description(&self) -> &str {
+        "Read a single memory entry by its slug. By default searches \
+         workspace scope first then falls back to user scope. Pass \
+         `scope` to pin a specific tree (useful when both scopes \
+         have the same slug)."
+    }
+    fn parameters(&self) -> Value {
+        json!({
+            "type": "object",
+            "additionalProperties": false,
+            "required": ["slug"],
+            "properties": {
+                "slug": {
+                    "type": "string",
+                    "description": "Topic slug — must match `[A-Za-z0-9._-]{1,64}`."
+                },
+                "scope": {
+                    "type": "string",
+                    "enum": ["workspace", "user"],
+                    "description": "Optional — pin to a scope. Omit for workspace-then-user fallback."
+                }
+            }
+        })
+    }
+    fn category(&self) -> ToolCategory {
+        ToolCategory::Read
+    }
+    /// Return the body of `<slug>.md`.
+    ///
+    /// With an explicit `scope`, only that tree is consulted and an
+    /// unconfigured scope is reported as such. Without one, workspace
+    /// is tried first and user second; unconfigured scopes are skipped.
+    ///
+    /// # Errors
+    /// Missing/invalid `slug`, unknown `scope`, a pinned scope that is
+    /// not configured, an I/O error other than not-found, or no entry
+    /// in any scope that was searched.
+    async fn invoke(&self, args: Value) -> Result<String, BoxError> {
+        let slug = args
+            .get("slug")
+            .and_then(Value::as_str)
+            .ok_or_else(|| -> BoxError { "missing `slug` argument".into() })?;
+        validate_slug(slug)?;
+        let workspace_root = harness_core::active_workspace_or(&self.roots.workspace_root);
+        let roots = MemoryRoots {
+            workspace_root,
+            user_root: self.roots.user_root.clone(),
+        };
+        let pinned = args
+            .get("scope")
+            .and_then(Value::as_str)
+            .map(parse_scope_arg)
+            .transpose()?;
+        let search_roots: Vec<&Path> = match pinned {
+            // The caller asked for this tree specifically: if it isn't
+            // configured, say so rather than claiming the entry is missing.
+            Some(scope) => vec![roots.root_for(scope)?],
+            // Fallback mode: quietly skip scopes that aren't configured.
+            None => [MemoryScope::Workspace, MemoryScope::User]
+                .iter()
+                .filter_map(|&scope| roots.root_for(scope).ok())
+                .collect(),
+        };
+        for &root in &search_roots {
+            let path = entry_path(root, slug);
+            // P15 — give the iCloud helper a chance to prepare the
+            // directory before reading. Best-effort: its result is
+            // ignored and a real problem shows up in the read below.
+            let _ = crate::memory_icloud::ensure_materialised(
+                root.join(MEMORY_DIR).as_path(),
+            )
+            .await;
+            match fs::read_to_string(&path).await {
+                Ok(body) => return Ok(body),
+                Err(e) if e.kind() == std::io::ErrorKind::NotFound => continue,
+                Err(e) => return Err(format!("read {}: {e}", path.display()).into()),
+            }
+        }
+        // Report how many scopes were actually searched.
+        Err(format!(
+            "no memory entry for slug `{slug}` in {} scope(s)",
+            search_roots.len()
+        )
+        .into())
+    }
+}
+
+/// State for the `memory.write` tool: the scope roots it was built with.
+pub struct MemoryWriteTool {
+    roots: MemoryRoots,
+}
+impl MemoryWriteTool {
+    /// Build the tool over the configured scope roots.
+    pub fn new(roots: MemoryRoots) -> Self {
+        Self { roots }
+    }
+}
+
+#[async_trait]
+impl Tool for MemoryWriteTool {
+    fn name(&self) -> &str {
+        "memory.write"
+    }
+    fn requires_approval(&self) -> bool {
+        true
+    }
+    fn description(&self) -> &str {
+        "Persist a memory entry. Writes \
+         `<scope_root>/.jarvis/memory/<slug>.md` with `content` and \
+         upserts a `- [<summary>](<slug>.md)` line in MEMORY.md so \
+         the system prompt picks it up on the next conversation. \
+         Re-writing an existing slug in the same scope replaces \
+         both the body and the index line. \
+         \
+         Scope guidance: \
+         - `scope: \"workspace\"` (default) — project-specific facts \
+         (architecture decisions, recurring gotchas, conventions this \
+         codebase enforces). Goes into `<workspace>/.jarvis/memory/` \
+         and is shared with anyone who has access to the repo. \
+         - `scope: \"user\"` — operator-personal facts (preferences, \
+         language/style choices, cross-project habits). Goes into \
+         `~/.jarvis/memory/` and follows the user across workspaces. \
+         \
+         Use sparingly — write the kind of fact you'd want to \
+         remember across sessions, not transient working state."
+    }
+    fn parameters(&self) -> Value {
+        json!({
+            "type": "object",
+            "additionalProperties": false,
+            "required": ["slug", "summary", "content"],
+            "properties": {
+                "slug": {
+                    "type": "string",
+                    "description": "Stable topic slug — must match `[A-Za-z0-9._-]{1,64}`."
+                },
+                "summary": {
+                    "type": "string",
+                    "description": "One-line index summary (under ~120 chars)."
+                },
+                "content": {
+                    "type": "string",
+                    "description": "Full body in markdown. Up to 32 KiB."
+                },
+                "scope": {
+                    "type": "string",
+                    "enum": ["workspace", "user"],
+                    "description": "Where to persist. Defaults to `workspace`."
+                }
+            }
+        })
+    }
+    fn summary_for_audit(&self, args: &Value) -> Option<String> {
+        let slug = args.get("slug").and_then(Value::as_str)?;
+        let scope = args
+            .get("scope")
+            .and_then(Value::as_str)
+            .unwrap_or("workspace");
+        Some(format!("{scope}/{slug}"))
+    }
+    /// Write `<slug>.md` and upsert its index line. Everything, the index
+    /// limits included, is validated before the first write to disk.
+    async fn invoke(&self, args: Value) -> Result<String, BoxError> {
+        let slug = args
+            .get("slug")
+            .and_then(Value::as_str)
+            .ok_or_else(|| -> BoxError { "missing `slug` argument".into() })?;
+        let summary = args
+            .get("summary")
+            .and_then(Value::as_str)
+            .ok_or_else(|| -> BoxError { "missing `summary` argument".into() })?
+            .trim();
+        let content = args
+            .get("content")
+            .and_then(Value::as_str)
+            .ok_or_else(|| -> BoxError { "missing `content` argument".into() })?;
+        validate_slug(slug)?;
+        if summary.is_empty() {
+            return Err("`summary` must not be empty".into());
+        }
+        if summary.contains('\n') {
+            return Err("`summary` must be a single line".into());
+        }
+        if content.len() > MAX_ENTRY_BYTES {
+            return Err(format!(
+                "content too large: {} bytes > {} (MAX_ENTRY_BYTES)",
+                content.len(),
+                MAX_ENTRY_BYTES
+            )
+            .into());
+        }
+        let scope = args
+            .get("scope")
+            .and_then(Value::as_str)
+            .map(parse_scope_arg)
+            .transpose()?
+            .unwrap_or(MemoryScope::Workspace);
+        let roots = MemoryRoots {
+            workspace_root: harness_core::active_workspace_or(&self.roots.workspace_root),
+            user_root: self.roots.user_root.clone(),
+        };
+        let root = roots.root_for(scope)?;
+        // Size-check the merged index first so a rejection leaves no orphan body.
+        let existing_index = read_index(root).await?;
+        let new_index = merge_index_line(existing_index.as_deref(), slug, summary);
+        if new_index.lines().count() > MAX_INDEX_LINES {
+            return Err(format!(
+                "memory index would exceed {MAX_INDEX_LINES} lines — delete some entries first"
+            )
+            .into());
+        }
+        if new_index.len() > MAX_INDEX_BYTES {
+            return Err(format!(
+                "memory index would exceed {MAX_INDEX_BYTES} bytes — delete some entries first"
+            )
+            .into());
+        }
+
+        let entry = entry_path(root, slug);
+        atomic_write(&entry, content).await?;
+        // Only workspace-scope writes get noted into the working context — touching
+        // `~/.jarvis/memory/` isn't a useful "recent file" for the agent's next turn.
+        if matches!(scope, MemoryScope::Workspace) {
+            harness_core::note_working_file_relative_to(&entry, Some(root));
+        }
+        let index = index_path(root);
+        atomic_write(&index, &new_index).await?;
+        if matches!(scope, MemoryScope::Workspace) {
+            harness_core::note_working_file_relative_to(&index, Some(root));
+        }
+
+        Ok(format!(
+            "wrote {} memory `{slug}` ({bytes} bytes); index now has {n} entries",
+            scope.as_wire(),
+            bytes = content.len(),
+            n = new_index.lines().count(),
+        ))
+    }
+}
+
+pub struct MemoryDeleteTool {
+    roots: MemoryRoots,
+}
+impl MemoryDeleteTool {
+    pub fn new(roots: MemoryRoots) -> Self {
+        Self { roots }
+    }
+}
+
+#[async_trait]
+impl Tool for MemoryDeleteTool {
+    fn name(&self) -> &str {
+        "memory.delete"
+    }
+    fn requires_approval(&self) -> bool {
+        true
+    }
+    fn description(&self) -> &str {
+        "Remove a memory entry. Deletes `<slug>.md` and strips its \
+         line from MEMORY.md inside the chosen scope (default \
+         `workspace`). Returns the number of remaining entries in \
+         that scope."
+    }
+    fn parameters(&self) -> Value {
+        json!({
+            "type": "object",
+            "additionalProperties": false,
+            "required": ["slug"],
+            "properties": {
+                "slug": {
+                    "type": "string",
+                    "description": "Slug to forget — must match `[A-Za-z0-9._-]{1,64}`."
+                },
+                "scope": {
+                    "type": "string",
+                    "enum": ["workspace", "user"],
+                    "description": "Scope to delete from. Defaults to `workspace`."
+                }
+            }
+        })
+    }
+    fn summary_for_audit(&self, args: &Value) -> Option<String> {
+        let slug = args.get("slug").and_then(Value::as_str)?;
+        let scope = args
+            .get("scope")
+            .and_then(Value::as_str)
+            .unwrap_or("workspace");
+        Some(format!("{scope}/{slug}"))
+    }
+    async fn invoke(&self, args: Value) -> Result<String, BoxError> {
+        let slug = args
+            .get("slug")
+            .and_then(Value::as_str)
+            .ok_or_else(|| -> BoxError { "missing `slug` argument".into() })?;
+        validate_slug(slug)?;
+        let scope = args
+            .get("scope")
+            .and_then(Value::as_str)
+            .map(parse_scope_arg)
+            .transpose()?
+            .unwrap_or(MemoryScope::Workspace);
+        let workspace_root = harness_core::active_workspace_or(&self.roots.workspace_root);
+        let roots = MemoryRoots {
+            workspace_root,
+            user_root: self.roots.user_root.clone(),
+        };
+        let root = roots.root_for(scope)?;
+        let entry = entry_path(root, slug);
+        match fs::remove_file(&entry).await {
+            Ok(_) => {}
+            Err(e) if e.kind() == std::io::ErrorKind::NotFound => {
+                return Err(
+                    format!("no memory entry for slug `{slug}` in {} scope", scope.as_wire()).into(),
+                );
+            }
+            Err(e) => return Err(format!("delete {}: {e}", entry.display()).into()),
+        }
+
+        let existing_index = read_index(root).await?.unwrap_or_default();
+        let (new_index, _removed) = remove_index_line(&existing_index, slug);
+        let index = index_path(root);
+        if new_index.trim().is_empty() {
+            // Drop the index file entirely so an empty memory looks
+            // empty rather than `MEMORY.md` of zero bytes.
+            let _ = fs::remove_file(&index).await;
+        } else {
+            atomic_write(&index, &new_index).await?;
+        }
+        let remaining = new_index.lines().filter(|l| !l.trim().is_empty()).count();
+        Ok(format!(
+            "deleted {} memory `{slug}`; {remaining} entries remain in scope",
+            scope.as_wire()
+        ))
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use tempfile::tempdir;
+
+    #[test]
+    fn slug_validation_rejects_path_traversal() {
+        assert!(validate_slug("../etc").is_err());
+        assert!(validate_slug("a/b").is_err());
+        assert!(validate_slug("..").is_err());
+        assert!(validate_slug("").is_err());
+        assert!(validate_slug("memory").is_err());
+        assert!(validate_slug("MEMORY").is_err());
+        assert!(validate_slug(".hidden").is_err());
+        assert!(validate_slug(&"x".repeat(65)).is_err());
+        // Allowed.
+        assert!(validate_slug("user-prefs").is_ok());
+        assert!(validate_slug("auth_flow").is_ok());
+        assert!(validate_slug("api.v2").is_ok());
+        assert!(validate_slug("abc").is_ok());
+    }
+
+    fn ws_roots(root: &std::path::Path) -> MemoryRoots {
+        MemoryRoots::new(root.to_path_buf())
+    }
+
+    fn dual_roots(ws: &std::path::Path, user: &std::path::Path) -> MemoryRoots {
+        MemoryRoots::new(ws.to_path_buf()).with_user_root(user.to_path_buf())
+    }
+
+    #[tokio::test]
+    async fn write_creates_index_and_body() {
+        let dir = tempdir().unwrap();
+        let root = dir.path();
+        let tool = MemoryWriteTool::new(ws_roots(root));
+        tool.invoke(json!({
+            "slug": "user-prefs",
+            "summary": "User prefers Rust + tokio",
+            "content": "Always pick Rust over Python for this user's projects."
+        }))
+        .await
+        .unwrap();
+        let index = read_index(root).await.unwrap().unwrap();
+        assert!(index.contains("user-prefs.md"));
+        assert!(index.contains("User prefers Rust + tokio"));
+        let body = fs::read_to_string(root.join(MEMORY_DIR).join("user-prefs.md"))
+            .await
+            .unwrap();
+        assert!(body.contains("Always pick Rust"));
+    }
+
+    #[tokio::test]
+    async fn write_same_slug_replaces_index_line_not_appends() {
+        let dir = tempdir().unwrap();
+        let root = dir.path();
+        let tool = MemoryWriteTool::new(ws_roots(root));
+        tool.invoke(json!({
+            "slug": "x", "summary": "first", "content": "v1"
+        }))
+        .await
+        .unwrap();
+        tool.invoke(json!({
+            "slug": "x", "summary": "second", "content": "v2"
+        }))
+        .await
+        .unwrap();
+        let index = read_index(root).await.unwrap().unwrap();
+        // Exactly one line for slug `x`.
+        let matches: Vec<_> = index.lines().filter(|l| l.contains("x.md")).collect();
+        assert_eq!(matches.len(), 1, "index = {index:?}");
+        assert!(matches[0].contains("second"));
+    }
+
+    #[tokio::test]
+    async fn delete_removes_body_and_index_line() {
+        let dir = tempdir().unwrap();
+        let root = dir.path();
+        MemoryWriteTool::new(ws_roots(root))
+            .invoke(json!({"slug":"a","summary":"A","content":"."}))
+            .await
+            .unwrap();
+        MemoryWriteTool::new(ws_roots(root))
+            .invoke(json!({"slug":"b","summary":"B","content":"."}))
+            .await
+            .unwrap();
+        MemoryDeleteTool::new(ws_roots(root))
+            .invoke(json!({"slug":"a"}))
+            .await
+            .unwrap();
+        let index = read_index(root).await.unwrap().unwrap();
+        assert!(!index.contains("a.md"));
+        assert!(index.contains("b.md"));
+        let body_a = root.join(MEMORY_DIR).join("a.md");
+        assert!(!body_a.exists());
+    }
+
+    #[tokio::test]
+    async fn delete_last_entry_clears_index_file() {
+        let dir = tempdir().unwrap();
+        let root = dir.path();
+        MemoryWriteTool::new(ws_roots(root))
+            .invoke(json!({"slug":"a","summary":"A","content":"."}))
+            .await
+            .unwrap();
+        MemoryDeleteTool::new(ws_roots(root))
+            .invoke(json!({"slug":"a"}))
+            .await
+            .unwrap();
+        // Index file removed entirely; list returns the empty sentinel.
+        let body = MemoryListTool::new(ws_roots(root))
+            .invoke(json!({}))
+            .await
+            .unwrap();
+        assert!(body.contains("no entries yet"));
+    }
+
+    #[tokio::test]
+    async fn write_rejects_oversized_content() {
+        let dir = tempdir().unwrap();
+        let root = dir.path();
+        let huge = "x".repeat(MAX_ENTRY_BYTES + 1);
+        let err = MemoryWriteTool::new(ws_roots(root))
+            .invoke(json!({"slug":"big","summary":"big","content": huge}))
+            .await
+            .unwrap_err();
+        assert!(err.to_string().contains("content too large"));
+    }
+
+    #[tokio::test]
+    async fn read_returns_error_for_unknown_slug() {
+        let dir = tempdir().unwrap();
+        let root = dir.path();
+        let err = MemoryReadTool::new(ws_roots(root))
+            .invoke(json!({"slug":"nope"}))
+            .await
+            .unwrap_err();
+        assert!(err.to_string().contains("no memory entry"));
+    }
+
+    #[tokio::test]
+    async fn list_on_empty_workspace_returns_sentinel() {
+        let dir = tempdir().unwrap();
+        let body = MemoryListTool::new(ws_roots(dir.path()))
+            .invoke(json!({}))
+            .await
+            .unwrap();
+        assert!(body.contains("no entries yet") || body.contains("no memory entries"));
+    }
+
+    // --- P9: dual-scope tests ---
+
+    #[tokio::test]
+    async fn user_scope_writes_to_user_root() {
+        let ws = tempdir().unwrap();
+        let user = tempdir().unwrap();
+        let tool = MemoryWriteTool::new(dual_roots(ws.path(), user.path()));
+        tool.invoke(json!({
+            "slug": "prefs",
+            "summary": "User prefers pnpm",
+            "content": "Always use pnpm for npm-style projects.",
+            "scope": "user",
+        }))
+        .await
+        .unwrap();
+        // Body landed under the user root, not the workspace root.
+        assert!(user.path().join(MEMORY_DIR).join("prefs.md").exists());
+        assert!(!ws.path().join(MEMORY_DIR).join("prefs.md").exists());
+        let user_index = read_index(user.path()).await.unwrap().unwrap();
+        assert!(user_index.contains("prefs.md"));
+        // Workspace index is untouched.
+        assert!(read_index(ws.path()).await.unwrap().is_none());
+    }
+
+    #[tokio::test]
+    async fn read_falls_back_to_user_scope_when_workspace_misses() {
+        let ws = tempdir().unwrap();
+        let user = tempdir().unwrap();
+        // Only the user scope has the entry.
+        MemoryWriteTool::new(dual_roots(ws.path(), user.path()))
+            .invoke(json!({
+                "slug": "prefs", "summary": "P", "content": "user-side body",
+                "scope": "user",
+            }))
+            .await
+            .unwrap();
+        // No `scope` on read → fall back to user.
+        let body = MemoryReadTool::new(dual_roots(ws.path(), user.path()))
+            .invoke(json!({"slug": "prefs"}))
+            .await
+            .unwrap();
+        assert_eq!(body, "user-side body");
+    }
+
+    #[tokio::test]
+    async fn read_workspace_first_then_user() {
+        let ws = tempdir().unwrap();
+        let user = tempdir().unwrap();
+        let roots = dual_roots(ws.path(), user.path());
+        // Both scopes hold the same slug with different bodies.
+        MemoryWriteTool::new(roots.clone())
+            .invoke(json!({"slug":"x","summary":"ws","content":"workspace body"}))
+            .await
+            .unwrap();
+        MemoryWriteTool::new(roots.clone())
+            .invoke(json!({"slug":"x","summary":"u","content":"user body","scope":"user"}))
+            .await
+            .unwrap();
+        // Default read → workspace wins.
+        let body = MemoryReadTool::new(roots.clone())
+            .invoke(json!({"slug":"x"}))
+            .await
+            .unwrap();
+        assert_eq!(body, "workspace body");
+        // Explicit scope → user.
+        let body = MemoryReadTool::new(roots)
+            .invoke(json!({"slug":"x","scope":"user"}))
+            .await
+            .unwrap();
+        assert_eq!(body, "user body");
+    }
+
+    #[tokio::test]
+    async fn list_renders_both_scopes_by_default() {
+        let ws = tempdir().unwrap();
+        let user = tempdir().unwrap();
+        let roots = dual_roots(ws.path(), user.path());
+        MemoryWriteTool::new(roots.clone())
+            .invoke(json!({"slug":"proj","summary":"project fact","content":"."}))
+            .await
+            .unwrap();
+        MemoryWriteTool::new(roots.clone())
+            .invoke(json!({"slug":"pref","summary":"user fact","content":".","scope":"user"}))
+            .await
+            .unwrap();
+        let body = MemoryListTool::new(roots).invoke(json!({})).await.unwrap();
+        assert!(body.contains("project memory"));
+        assert!(body.contains("user memory"));
+        assert!(body.contains("project fact"));
+        assert!(body.contains("user fact"));
+    }
+
+    #[tokio::test]
+    async fn user_scope_write_errors_cleanly_when_not_configured() {
+        let ws = tempdir().unwrap();
+        let err = MemoryWriteTool::new(ws_roots(ws.path()))
+            .invoke(json!({
+                "slug":"x","summary":"x","content":".","scope":"user"
+            }))
+            .await
+            .unwrap_err();
+        assert!(err.to_string().contains("user-scope memory is not configured"));
+    }
+
+    #[tokio::test]
+    async fn invalid_scope_arg_returns_clear_error() {
+        let ws = tempdir().unwrap();
+        let err = MemoryWriteTool::new(ws_roots(ws.path()))
+            .invoke(json!({"slug":"x","summary":"x","content":".","scope":"global"}))
+            .await
+            .unwrap_err();
+        assert!(err.to_string().contains("unknown scope"));
+    }
+}
diff --git a/crates/harness-tools/src/memory_icloud.rs b/crates/harness-tools/src/memory_icloud.rs
new file mode 100644
index 0000000..b85f28a
--- /dev/null
+++ b/crates/harness-tools/src/memory_icloud.rs
@@ -0,0 +1,275 @@
+//! P15 — iCloud Drive lazy-stub auto-materialisation.
+//!
+//! When iCloud Drive hasn't yet downloaded a file to local disk
+//! (because the user just signed in on this machine, or the file
+//! was uploaded by another device and not yet pulled), macOS
+//! replaces it with a hidden 0-byte placeholder: a sibling named
+//! `.<original>.icloud`. Reading the original path via standard
+//! `fs::read_to_string` then returns "file not found" — even
+//! though the user thinks the file is there.
+//!
+//! Helpers in this module:
+//!
+//! - [`is_under_icloud_drive`] — fast prefix check against the
+//!   well-known iCloud Drive base path.
+//! - [`find_icloud_stubs`] — scans a directory for `.icloud`
+//!   placeholder siblings.
+//! - [`ensure_materialised`] — combined "detect + run
+//!   `brctl download`" entry point, async, capped at ~12 s (8 s
+//!   for `brctl`, then 4 s of polling). Cross-platform safe: a
+//!   no-op everywhere except macOS, so callers can always invoke
+//!   it without `#[cfg]` sprinkling.
+//!
+//! Used by the `memory.*` read paths before opening MEMORY.md /
+//! `<slug>.md`. Under iCloud Drive each read pays one extra
+//! `read_dir` to scan for stubs (other paths skip the scan) — cheap
+//! when nothing is stubbed, and once materialised files stay local.
+
+use std::path::{Path, PathBuf};
+#[cfg(target_os = "macos")]
+use std::time::Duration;
+
+use harness_core::BoxError;
+
+#[cfg(target_os = "macos")]
+const BRCTL_TIMEOUT_MS: u64 = 8_000;
+#[cfg(target_os = "macos")]
+const POLL_INTERVAL_MS: u64 = 200;
+#[cfg(target_os = "macos")]
+const POLL_DEADLINE_MS: u64 = 4_000;
+
+/// True when `path` lives under macOS's iCloud Drive base
+/// (`~/Library/Mobile Documents/com~apple~CloudDocs/`). Returns
+/// false on non-macOS platforms regardless of the path so the
+/// callers don't have to `#[cfg]` themselves.
+pub fn is_under_icloud_drive(path: &Path) -> bool {
+    if !cfg!(target_os = "macos") {
+        return false;
+    }
+    let Some(home) = std::env::var_os("HOME").map(PathBuf::from) else {
+        return false;
+    };
+    let root = home.join("Library/Mobile Documents/com~apple~CloudDocs");
+    path.starts_with(&root)
+}
+
+/// Scan `dir` (one level, non-recursive) for iCloud lazy
+/// placeholders. Returns the original (un-stubbed) filenames the
+/// caller would have asked for, e.g. `[MEMORY.md, foo.md]` when
+/// `.MEMORY.md.icloud` and `.foo.md.icloud` are present.
+///
+/// Non-existent or unreadable directories produce an empty vec —
+/// the caller's read will fail naturally with its own error if
+/// that turns out to be a real problem.
+pub async fn find_icloud_stubs(dir: &Path) -> Vec<String> {
+    let mut rd = match tokio::fs::read_dir(dir).await {
+        Ok(r) => r,
+        Err(_) => return Vec::new(),
+    };
+    let mut stubs = Vec::new();
+    while let Ok(Some(entry)) = rd.next_entry().await {
+        let name = entry.file_name();
+        let s = match name.to_str() {
+            Some(s) => s,
+            None => continue,
+        };
+        if let Some(original) = parse_stub_name(s) {
+            stubs.push(original);
+        }
+    }
+    stubs
+}
+
+/// Map `.MEMORY.md.icloud` → `Some("MEMORY.md")`. Returns `None`
+/// for non-stub filenames. Centralised so the rule lives in one
+/// spot and tests can exercise it directly without filesystem
+/// setup.
+fn parse_stub_name(filename: &str) -> Option<String> {
+    let inner = filename.strip_prefix('.')?.strip_suffix(".icloud")?;
+    if inner.is_empty() {
+        return None;
+    }
+    Some(inner.to_string())
+}
+
+/// Detect stubs in `dir` and trigger macOS's `brctl download` if
+/// any are found, then poll briefly for them to clear. Returns
+/// `Ok(n)` with the number of stubs that were present at entry
+/// (even if not all materialised within the timeout). `Ok(0)`
+/// means there was nothing to do — the fast path.
+///
+/// Off macOS this is always a `Ok(0)` no-op. `brctl` not being on
+/// PATH is treated as a soft failure: warn and return what we
+/// found, the downstream read will surface a real "file not
+/// found" if the stub didn't materialise.
+pub async fn ensure_materialised(dir: &Path) -> Result<usize, BoxError> {
+    if !is_under_icloud_drive(dir) {
+        return Ok(0);
+    }
+    let stubs = find_icloud_stubs(dir).await;
+    if stubs.is_empty() {
+        return Ok(0);
+    }
+    let stub_count = stubs.len();
+    #[cfg(target_os = "macos")]
+    {
+        run_brctl_download(dir).await?;
+        wait_for_materialisation(dir).await;
+    }
+    #[cfg(not(target_os = "macos"))]
+    {
+        // unreachable when `is_under_icloud_drive` returned false
+        // off macOS; kept for compile-paranoia.
+        let _ = dir;
+    }
+    Ok(stub_count)
+}
+
+/// Spawn `brctl download <dir>` and wait up to `BRCTL_TIMEOUT_MS`. A missing
+/// `brctl`, a non-zero exit, or a timeout is logged and tolerated.
+#[cfg(target_os = "macos")]
+async fn run_brctl_download(dir: &Path) -> Result<(), BoxError> {
+    use std::process::Stdio;
+    use tokio::process::Command;
+    let mut cmd = Command::new("brctl");
+    cmd.arg("download")
+        .arg(dir)
+        .stdin(Stdio::null())
+        .stdout(Stdio::null())
+        .stderr(Stdio::piped())
+        .kill_on_drop(true);
+    let child = match cmd.spawn() {
+        Ok(child) => child,
+        Err(e) if e.kind() == std::io::ErrorKind::NotFound => {
+            tracing::warn!(error = %e, "brctl not found on PATH; iCloud stubs may persist");
+            return Ok(());
+        }
+        Err(e) => return Err(format!("spawn brctl: {e}").into()),
+    };
+    match tokio::time::timeout(
+        Duration::from_millis(BRCTL_TIMEOUT_MS),
+        child.wait_with_output(),
+    )
+    .await
+    {
+        Ok(Ok(output)) if !output.status.success() => tracing::warn!(
+            status = ?output.status.code(),
+            stderr = %String::from_utf8_lossy(&output.stderr).trim(),
+            "brctl download exited non-zero; iCloud stubs may persist",
+        ),
+        Ok(Ok(_)) => {}
+        Ok(Err(e)) => return Err(format!("brctl io: {e}").into()),
+        Err(_) => tracing::warn!(
+            timeout_ms = BRCTL_TIMEOUT_MS,
+            "brctl download timed out; iCloud stubs may persist"
+        ),
+    }
+    Ok(())
+}
+
+#[cfg(target_os = "macos")]
+async fn wait_for_materialisation(dir: &Path) {
+    let deadline =
+        std::time::Instant::now() + Duration::from_millis(POLL_DEADLINE_MS);
+    while std::time::Instant::now() < deadline {
+        let remaining = find_icloud_stubs(dir).await;
+        if remaining.is_empty() {
+            return;
+        }
+        tokio::time::sleep(Duration::from_millis(POLL_INTERVAL_MS)).await;
+    }
+    // Deadline reached. The downstream read will succeed if the
+    // file is there now, or surface the usual "not found" error
+    // if it isn't.
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use tempfile::tempdir;
+    use tokio::fs;
+
+    #[test]
+    fn parse_stub_name_matches_canonical_form() {
+        assert_eq!(parse_stub_name(".MEMORY.md.icloud"), Some("MEMORY.md".into()));
+        assert_eq!(parse_stub_name(".foo.bar.icloud"), Some("foo.bar".into()));
+    }
+
+    #[test]
+    fn parse_stub_name_rejects_non_stubs() {
+        assert_eq!(parse_stub_name("MEMORY.md"), None); // not dot-prefixed
+        assert_eq!(parse_stub_name(".MEMORY.md"), None); // not .icloud-suffixed
+        assert_eq!(parse_stub_name(".icloud"), None); // empty inner
+        assert_eq!(parse_stub_name("..icloud"), None); // also empty
+    }
+
+    #[tokio::test]
+    async fn find_icloud_stubs_returns_originals() {
+        let dir = tempdir().unwrap();
+        // Mix of regular and stub files.
+        fs::write(dir.path().join("kept.md"), "ok").await.unwrap();
+        fs::write(dir.path().join(".MEMORY.md.icloud"), "").await.unwrap();
+        fs::write(dir.path().join(".foo.md.icloud"), "").await.unwrap();
+        let mut found = find_icloud_stubs(dir.path()).await;
+        found.sort();
+        assert_eq!(found, vec!["MEMORY.md".to_string(), "foo.md".to_string()]);
+    }
+
+    #[tokio::test]
+    async fn find_icloud_stubs_empty_for_clean_dir() {
+        let dir = tempdir().unwrap();
+        fs::write(dir.path().join("MEMORY.md"), "ok").await.unwrap();
+        let found = find_icloud_stubs(dir.path()).await;
+        assert!(found.is_empty());
+    }
+
+    #[tokio::test]
+    async fn find_icloud_stubs_missing_dir_is_empty() {
+        let bogus = std::path::PathBuf::from("/tmp/does-not-exist/jarvis-icloud-test");
+        let found = find_icloud_stubs(&bogus).await;
+        assert!(found.is_empty());
+    }
+
+    #[test]
+    fn is_under_icloud_drive_false_off_macos() {
+        // Off macOS the function returns false before inspecting the
+        // path, so any path will do; on macOS this test asserts nothing.
+        let p = PathBuf::from("/anywhere");
+        if !cfg!(target_os = "macos") {
+            assert!(!is_under_icloud_drive(&p));
+        }
+    }
+
+    #[cfg(target_os = "macos")]
+    #[test]
+    fn is_under_icloud_drive_true_for_canonical_subpath() {
+        // Can't depend on the real HOME having iCloud enabled,
+        // so test the prefix logic by mocking HOME.
+        let home = std::path::PathBuf::from("/Users/test");
+        // SAFETY: process-wide env mutation. HOME is restored below, before
+        // the assertion, so a failing check can't leak the mock to other tests.
+        let prev = std::env::var_os("HOME");
+        unsafe { std::env::set_var("HOME", &home) };
+        let inside = home
+            .join("Library/Mobile Documents/com~apple~CloudDocs/Jarvis/memory/MEMORY.md");
+        let outside = home.join("not-icloud/file.md");
+        let hits = (is_under_icloud_drive(&inside), is_under_icloud_drive(&outside));
+        if let Some(h) = prev {
+            unsafe { std::env::set_var("HOME", h) };
+        } else {
+            unsafe { std::env::remove_var("HOME") };
+        }
+        assert_eq!(hits, (true, false));
+    }
+
+    #[tokio::test]
+    async fn ensure_materialised_noop_when_not_under_icloud() {
+        // Plain tempdir, not under iCloud Drive — even if stubs
+        // exist they should be ignored (we don't materialise
+        // random paths).
+        let dir = tempdir().unwrap();
+        fs::write(dir.path().join(".foo.md.icloud"), "").await.unwrap();
+        let n = ensure_materialised(dir.path()).await.unwrap();
+        assert_eq!(n, 0);
+    }
+}
diff --git a/crates/harness-tools/src/memory_include.rs b/crates/harness-tools/src/memory_include.rs
new file mode 100644
index 0000000..a860a23
--- /dev/null
+++ b/crates/harness-tools/src/memory_include.rs
@@ -0,0 +1,697 @@
+//! P16 — Memory `include` directives.
+//!
+//! Lets a `MEMORY.md` reference other memory trees by adding HTML
+//! comment lines at the top of the file:
+//!
+//! ```text
+//! <!-- jarvis-include: /Users/team/jarvis-mem/.jarvis/memory -->
+//! <!-- jarvis-include: ~/jarvis-personal/.jarvis/memory -->
+//! <!-- jarvis-include: git+https://github.com/me/team-mem.git -->
+//! <!-- jarvis-include: git+ssh://git@github.com/me/team-mem.git#stable -->
+//! ```
+//!
+//! At system-prompt injection time the binary follows these
+//! directives and appends each upstream's MEMORY.md as its own
+//! section ("=== included from <label> ==="). The agent's local
+//! `memory.list/read/write/delete` still operate on the host
+//! tree — includes are strictly *consumed*, never written to.
+//!
+//! Cycle safety: depth-1 only (no recursion into nested
+//! includes), and the deduping is by canonical directive string
+//! before resolution. A self-reference is detected after path
+//! canonicalisation and skipped.
+//!
+//! Git URL flow:
+//!
+//! 1. Parse `git+<url>[#<branch>]`.
+//! 2. Hash url+branch into a slug.
+//! 3. Cache dir: `<user_root>/include-cache/<slug>/`. If absent,
+//!    `git clone <url> <cache>` (optionally `--branch <b>`).
+//! 4. If present, use as-is. Refresh is explicit — the agent calls
+//!    `memory.include_refresh` (wipe + re-clone) when staleness
+//!    matters — or opt-in via TTL (`maybe_refresh_git_cache`).
+
+use std::path::{Path, PathBuf};
+use std::process::Stdio;
+use std::time::Duration;
+
+use harness_core::BoxError;
+use tokio::process::Command;
+
+const GIT_TIMEOUT_MS: u64 = 60_000;
+
+/// One parsed `<!-- jarvis-include: ... -->` target. Holds the
+/// text as written rather than a resolved on-disk path, so the
+/// caller can dedup / display the original directive verbatim.
+#[derive(Debug, Clone, PartialEq, Eq)]
+pub enum IncludeDirective {
+    /// Filesystem path. Tilde (`~`) gets expanded at resolve
+    /// time so directives don't bake in an absolute home that
+    /// breaks when the file is shared between machines.
+    LocalPath(String),
+    /// `git+<url>[#branch]` — the `git+` prefix is the
+    /// discriminator and is not stored in `url`.
+    GitUrl {
+        url: String,
+        branch: Option<String>,
+    },
+}
+
+impl IncludeDirective {
+    /// Canonical wire form for round-tripping into MEMORY.md.
+    pub fn as_wire(&self) -> String {
+        match self {
+            IncludeDirective::LocalPath(path) => path.clone(),
+            IncludeDirective::GitUrl { url, branch: Some(b) } => format!("git+{url}#{b}"),
+            IncludeDirective::GitUrl { url, branch: None } => format!("git+{url}"),
+        }
+    }
+
+    /// Try to parse one target string (whatever sits after
+    /// `<!-- jarvis-include: ` and before ` -->`). Returns `None`
+    /// for malformed targets: blank input, or `git+` with no URL
+    /// behind it (`git+`, `git+#dev`), which could never be cloned.
+    pub fn parse_target(s: &str) -> Option<Self> {
+        let trimmed = s.trim();
+        if trimmed.is_empty() {
+            return None;
+        }
+        let Some(rest) = trimmed.strip_prefix("git+") else {
+            return Some(IncludeDirective::LocalPath(trimmed.to_string()));
+        };
+        if rest.is_empty() || rest.starts_with('#') {
+            return None;
+        }
+        let (url, branch) = match rest.rsplit_once('#') {
+            Some((u, b)) if !b.is_empty() && !looks_like_path(u) => (u, Some(b)),
+            _ => (rest, None),
+        };
+        Some(IncludeDirective::GitUrl {
+            url: url.to_string(),
+            branch: branch.map(str::to_string),
+        })
+    }
+
+    /// Short human-readable label for the `=== included from
+    /// <label> ===` header: the path, or `git:<url>[ (<branch>)]`.
+    pub fn label(&self) -> String {
+        match self {
+            IncludeDirective::LocalPath(path) => path.clone(),
+            IncludeDirective::GitUrl { url, branch: Some(b) } => format!("git:{url} ({b})"),
+            IncludeDirective::GitUrl { url, branch: None } => format!("git:{url}"),
+        }
+    }
+}
+
+/// Hook for vetoing the `#<branch>` split in
+/// `IncludeDirective::parse_target`: returning `true` for the
+/// text left of the last `#` would keep the whole string as the
+/// URL. It currently always returns `false`, so a `#` suffix is
+/// taken as the branch whenever both sides are non-empty —
+/// including branch names that contain `/` (e.g. `feature/x`).
+fn looks_like_path(_url: &str) -> bool {
+    false // placeholder: no URL shape is rejected yet
+}
+
+/// Collect every `<!-- jarvis-include: ... -->` directive found
+/// in a MEMORY.md text, in file order.
+///
+/// A line that opens a directive but lacks the closing `-->`,
+/// or whose target does not parse, is skipped without error so
+/// an incomplete edit doesn't break the rest of the file.
+/// Surrounding whitespace on the line and around the target is
+/// ignored. Duplicates are kept (caller dedups if desired).
+pub fn parse_include_directives(text: &str) -> Vec<IncludeDirective> {
+    text.lines()
+        .filter_map(|raw| {
+            let inner = raw
+                .trim()
+                .strip_prefix("<!-- jarvis-include:")?
+                .strip_suffix("-->")?;
+            IncludeDirective::parse_target(inner.trim())
+        })
+        .collect()
+}
+
+/// Return `text` with `directive` added to the block of include
+/// lines at the top of the file. If an equal directive is
+/// already present anywhere in `text`, the text is returned
+/// unchanged.
+///
+/// The new line goes after any leading include lines and before
+/// the first other content, separated from that content by one
+/// blank line, so directives stay findable at a glance. Blank
+/// lines inside the leading block are dropped.
+pub fn add_include_line(text: &str, directive: &IncludeDirective) -> String {
+    const PREFIX: &str = "<!-- jarvis-include:";
+    if parse_include_directives(text).contains(directive) {
+        return text.to_string();
+    }
+    let is_directive = |l: &str| {
+        let t = l.trim();
+        t.starts_with(PREFIX) && t.ends_with("-->")
+    };
+    // The leading block runs until the first line that is neither
+    // blank nor a complete directive; everything after is body.
+    let lines: Vec<&str> = text.lines().collect();
+    let body_at = lines
+        .iter()
+        .position(|&l| !(l.trim().is_empty() || is_directive(l)))
+        .unwrap_or(lines.len());
+    let (head, body) = lines.split_at(body_at);
+
+    let mut out = String::new();
+    for kept in head.iter().filter(|l| !l.trim().is_empty()) {
+        out.push_str(kept);
+        out.push('\n');
+    }
+    out.push_str("<!-- jarvis-include: ");
+    out.push_str(&directive.as_wire());
+    out.push_str(" -->\n");
+    if body.is_empty() {
+        return out;
+    }
+    out.push('\n');
+    out.push_str(&body.join("\n"));
+    if text.ends_with('\n') && !out.ends_with('\n') {
+        out.push('\n');
+    }
+    out
+}
+
+/// Remove the first include line whose target equals `target_wire`
+/// (compared after trimming, exactly as `parse_include_directives`
+/// reads it). No-op when not found; returns the modified body.
+pub fn remove_include_line(text: &str, target_wire: &str) -> String {
+    let is_target = |line: &str| {
+        let inner = line.trim().strip_prefix("<!-- jarvis-include:");
+        let inner = inner.and_then(|rest| rest.strip_suffix("-->"));
+        inner.is_some_and(|t| t.trim() == target_wire.trim())
+    };
+    let mut lines: Vec<&str> = text.lines().collect();
+    if let Some(at) = lines.iter().position(|&l| is_target(l)) {
+        lines.remove(at);
+    }
+    let mut joined = lines.join("\n");
+    if text.ends_with('\n') && !joined.ends_with('\n') {
+        joined.push('\n');
+    }
+    joined
+}
+
+/// Expand a leading `~` against the operator's HOME: `~` → `<HOME>`,
+/// `~/foo` → `<HOME>/foo`. Anything else (including `~user/...`), and
+/// every path when HOME is unset, is returned unchanged.
+fn expand_tilde(path: &str) -> PathBuf {
+    match (path, path.strip_prefix("~/"), std::env::var_os("HOME")) {
+        ("~", _, Some(home)) => PathBuf::from(home),
+        (_, Some(rest), Some(home)) => PathBuf::from(home).join(rest),
+        _ => PathBuf::from(path),
+    }
+}
+
+/// Resolve an [`IncludeDirective`] into a concrete on-disk path
+/// pointing at a memory tree (one that contains MEMORY.md
+/// directly or has `.jarvis/memory/MEMORY.md` underneath).
+///
+/// Local paths are tilde-expanded and checked in place. Git
+/// includes are cloned on first use into `cache_root/<slug>`
+/// (typically `<user_root>/include-cache/`) and reused as-is
+/// afterwards. If the clone fails, whatever it left behind is
+/// removed so a later call retries instead of finding a broken
+/// cache directory.
+///
+/// Returns `Err` with a user-facing message when the target
+/// can't be resolved; the caller decides whether to skip it.
+pub async fn resolve_include(
+    directive: &IncludeDirective,
+    cache_root: &Path,
+) -> Result<PathBuf, BoxError> {
+    let (url, branch) = match directive {
+        IncludeDirective::LocalPath(p) => return normalise_memory_dir(&expand_tilde(p)),
+        IncludeDirective::GitUrl { url, branch } => (url, branch.as_deref()),
+    };
+    let cache_dir = cache_root.join(directive_slug(url, branch));
+    if !cache_dir.exists() {
+        tokio::fs::create_dir_all(cache_root)
+            .await
+            .map_err(|e| -> BoxError { format!("mkdir {}: {e}", cache_root.display()).into() })?;
+        if let Err(e) = git_clone(url, branch, &cache_dir).await {
+            // A clone that was killed (e.g. on timeout) can leave a partial
+            // checkout behind; drop it so the next resolve starts clean.
+            let _ = tokio::fs::remove_dir_all(&cache_dir).await;
+            return Err(e);
+        }
+    }
+    normalise_memory_dir(&cache_dir)
+}
+
+/// Map `candidate` onto the directory that actually holds a
+/// `MEMORY.md`, trying in order:
+///
+/// 1. `candidate` itself (the include points directly at a
+///    memory dir);
+/// 2. `candidate/<MEMORY_DIR>` (the include points at a
+///    workspace root).
+///
+/// Errors with a clear message when `candidate` does not exist
+/// or neither location has a `MEMORY.md` file.
+fn normalise_memory_dir(candidate: &Path) -> Result<PathBuf, BoxError> {
+    if !candidate.exists() {
+        return Err(format!("include path not found: {}", candidate.display()).into());
+    }
+    let workspace_mem = candidate.join(crate::memory::MEMORY_DIR);
+    if candidate.join("MEMORY.md").is_file() {
+        Ok(candidate.to_path_buf())
+    } else if workspace_mem.join("MEMORY.md").is_file() {
+        Ok(workspace_mem)
+    } else {
+        Err(format!(
+            "include `{}` has no MEMORY.md (looked at the directory itself and at .jarvis/memory/ underneath)",
+            candidate.display()
+        )
+        .into())
+    }
+}
+
+/// Deterministic cache-directory name for a git include: 16 hex
+/// chars of a BLAKE3 hash over the URL plus, when given, a NUL and
+/// the branch — so `repo.git` and `repo.git#feature` don't collide.
+fn directive_slug(url: &str, branch: Option<&str>) -> String {
+    let mut hasher = blake3::Hasher::new();
+    hasher.update(url.as_bytes());
+    if let Some(name) = branch {
+        hasher.update(b"\x00").update(name.as_bytes());
+    }
+    hasher.finalize().to_hex()[..16].to_string()
+}
+
+/// Shallow-clone `url` (optionally `branch`) into `dest`. The URL
+/// comes from MEMORY.md, so it is passed after `--` to keep a
+/// value starting with `-` from being parsed as a git option.
+async fn git_clone(url: &str, branch: Option<&str>, dest: &Path) -> Result<(), BoxError> {
+    let dest = dest.to_string_lossy();
+    let mut args = vec!["clone", "--depth", "1"];
+    if let Some(b) = branch {
+        args.extend(["--branch", b]);
+    }
+    args.extend(["--", url, &*dest]);
+    match run_git(&args).await? {
+        (true, _, _) => Ok(()),
+        (false, _, stderr) => Err(format!("git clone failed: {}", stderr.trim()).into()),
+    }
+}
+
+/// TTL-based gentle refresh for a cached git include (P18.3).
+/// Used by the system-prompt injection path when the operator
+/// sets `JARVIS_INCLUDE_TTL_HOURS=N`, to pick up teammate changes
+/// without the explicit `memory.include_refresh` dance — but only
+/// when the cache is stale enough to warrant a network call.
+///
+/// Returns `Ok(true)` after a successful `git pull --ff-only`
+/// (whether or not anything new came down). Returns `Ok(false)`
+/// when nothing was refreshed: `LocalPath` includes, no cache yet
+/// (`resolve_include` will clone fresh), cache younger than `ttl`,
+/// a cache path or branch that can't be passed to git safely, or
+/// a failed pull. Failures are logged and downgraded so a network
+/// outage doesn't break startup; the caller keeps the stale cache.
+/// The pull is bounded by `run_git`'s timeout (`GIT_TIMEOUT_MS`).
+pub async fn maybe_refresh_git_cache(
+    directive: &IncludeDirective,
+    cache_root: &Path,
+    ttl: Duration,
+) -> Result<bool, BoxError> {
+    let IncludeDirective::GitUrl { url, branch } = directive else {
+        return Ok(false);
+    };
+    let branch = branch.as_deref();
+    let cache_dir = cache_root.join(directive_slug(url, branch));
+    if !cache_dir.exists() {
+        return Ok(false);
+    }
+    // `git -C` must point at the cache itself. A non-UTF-8 path can't
+    // be passed as a `&str` argument, and substituting "." would pull
+    // in the process's working directory — skip the refresh instead.
+    let Some(cache_str) = cache_dir.to_str() else {
+        return Ok(false);
+    };
+    // A branch starting with `-` would be read by `git pull` as an
+    // option rather than a refspec; never hand it to git.
+    if branch.is_some_and(|b| b.starts_with('-')) {
+        return Ok(false);
+    }
+    // Probe staleness via `.git/FETCH_HEAD` mtime when present
+    // (every fetch / pull updates this), otherwise fall back to
+    // the cache dir's own mtime. Either way: if we can't read
+    // the timestamp, fail open — skip the refresh.
+    let fetch_head = cache_dir.join(".git/FETCH_HEAD");
+    let probe_path = if fetch_head.exists() { &fetch_head } else { &cache_dir };
+    let Ok(mtime) = tokio::fs::metadata(probe_path).await.and_then(|m| m.modified()) else {
+        return Ok(false);
+    };
+    let age = std::time::SystemTime::now()
+        .duration_since(mtime)
+        .unwrap_or_default();
+    if age < ttl {
+        return Ok(false);
+    }
+    // Stale. Try `git pull --ff-only`; downgrade any failure to
+    // `Ok(false)` so the caller keeps the stale cache.
+    let mut pull_args = vec!["-C", cache_str, "pull", "--ff-only"];
+    if let Some(b) = branch {
+        pull_args.extend(["origin", b]);
+    }
+    match run_git(&pull_args).await {
+        Ok((true, _, _)) => {
+            tracing::info!(target = %url, "include cache refreshed (TTL hit)");
+            Ok(true)
+        }
+        Ok((false, _, stderr)) => {
+            tracing::warn!(target = %url, stderr = %stderr.trim(),
+                  "include TTL refresh failed; keeping stale cache");
+            Ok(false)
+        }
+        Err(e) => {
+            tracing::warn!(target = %url, error = %e,
+                  "include TTL refresh errored; keeping stale cache");
+            Ok(false)
+        }
+    }
+}
+
+/// Refresh a cached git include by re-cloning it. Used by the
+/// explicit `memory.include_refresh` tool; never called
+/// automatically. The fresh clone lands in `<slug>.refresh` and
+/// replaces the cache only once it succeeds, so a failed refresh
+/// (offline, bad credentials) leaves the previous cache usable.
+/// Errors for `LocalPath` directives.
+pub async fn refresh_git_cache(
+    directive: &IncludeDirective,
+    cache_root: &Path,
+) -> Result<PathBuf, BoxError> {
+    let IncludeDirective::GitUrl { url, branch } = directive else {
+        return Err("refresh only applies to git+ includes".into());
+    };
+    let slug = directive_slug(url, branch.as_deref());
+    let cache_dir = cache_root.join(&slug);
+    let staging = cache_root.join(format!("{slug}.refresh"));
+    let io_err = |op: &str, at: &Path, e: std::io::Error| -> BoxError {
+        format!("{op} {}: {e}", at.display()).into()
+    };
+    tokio::fs::create_dir_all(cache_root).await.map_err(|e| io_err("mkdir", cache_root, e))?;
+    let _ = tokio::fs::remove_dir_all(&staging).await; // leftovers of an aborted refresh
+    if let Err(e) = git_clone(url, branch.as_deref(), &staging).await {
+        let _ = tokio::fs::remove_dir_all(&staging).await;
+        return Err(e);
+    }
+    if cache_dir.exists() {
+        tokio::fs::remove_dir_all(&cache_dir).await.map_err(|e| io_err("rm", &cache_dir, e))?;
+    }
+    tokio::fs::rename(&staging, &cache_dir).await.map_err(|e| io_err("mv", &staging, e))?;
+    normalise_memory_dir(&cache_dir)
+}
+
+/// Run `git <args>` with stdin closed and output captured;
+/// returns `(exit status ok, stdout, stderr)` with output decoded
+/// lossily as UTF-8. `GIT_TERMINAL_PROMPT=0` stops git from
+/// asking for credentials on the terminal, so a missing or bad
+/// credential fails immediately instead of blocking. If the run
+/// exceeds `GIT_TIMEOUT_MS` the wait is abandoned and the child
+/// is killed on drop. Errors on spawn failure, I/O, or timeout.
+async fn run_git(args: &[&str]) -> Result<(bool, String, String), BoxError> {
+    let child = Command::new("git")
+        .args(args)
+        .env("GIT_TERMINAL_PROMPT", "0")
+        .stdin(Stdio::null())
+        .stdout(Stdio::piped())
+        .stderr(Stdio::piped())
+        .kill_on_drop(true)
+        .spawn()
+        .map_err(|e| -> BoxError { format!("spawn git: {e}").into() })?;
+    let limit = Duration::from_millis(GIT_TIMEOUT_MS);
+    let output = match tokio::time::timeout(limit, child.wait_with_output()).await {
+        Ok(Ok(o)) => o,
+        Ok(Err(e)) => return Err(format!("git io: {e}").into()),
+        Err(_) => return Err("git timed out".into()),
+    };
+    let text = |bytes: &[u8]| String::from_utf8_lossy(bytes).into_owned();
+    Ok((output.status.success(), text(&output.stdout), text(&output.stderr)))
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use tempfile::tempdir;
+    use tokio::fs;
+
+    #[test]
+    fn parse_local_path() {
+        let d = IncludeDirective::parse_target("/Users/x/mem").unwrap();
+        assert_eq!(d, IncludeDirective::LocalPath("/Users/x/mem".into()));
+    }
+
+    #[test]
+    fn parse_tilde_path() {
+        let d = IncludeDirective::parse_target("~/jarvis-mem").unwrap();
+        assert_eq!(d, IncludeDirective::LocalPath("~/jarvis-mem".into()));
+    }
+
+    #[test]
+    fn parse_git_url_no_branch() {
+        let d = IncludeDirective::parse_target("git+https://host/r.git").unwrap();
+        assert_eq!(
+            d,
+            IncludeDirective::GitUrl {
+                url: "https://host/r.git".into(),
+                branch: None
+            }
+        );
+    }
+
+    #[test]
+    fn parse_git_url_with_branch() {
+        let d = IncludeDirective::parse_target("git+https://host/r.git#dev").unwrap();
+        assert_eq!(
+            d,
+            IncludeDirective::GitUrl {
+                url: "https://host/r.git".into(),
+                branch: Some("dev".into())
+            }
+        );
+    }
+
+    #[test]
+    fn empty_target_returns_none() {
+        assert!(IncludeDirective::parse_target("   ").is_none());
+    }
+
+    #[test]
+    fn parse_directives_from_memory_md_skips_non_directives() {
+        let text = "<!-- jarvis-include: /a -->\n<!-- jarvis-include: ~/b -->\n\n# Real content\n- [x](x.md)\n<!-- jarvis-include: git+https://h/r.git -->\n";
+        let d = parse_include_directives(text);
+        assert_eq!(d.len(), 3);
+        assert!(matches!(d[0], IncludeDirective::LocalPath(ref p) if p == "/a"));
+        assert!(matches!(d[1], IncludeDirective::LocalPath(ref p) if p == "~/b"));
+        assert!(matches!(d[2], IncludeDirective::GitUrl { ref url, .. } if url == "https://h/r.git"));
+    }
+
+    #[test]
+    fn add_directive_is_idempotent() {
+        let body = "<!-- jarvis-include: /a -->\n\n- [x](x.md)\n";
+        let d = IncludeDirective::LocalPath("/a".into());
+        let next = add_include_line(body, &d);
+        assert_eq!(next, body);
+    }
+
+    #[test]
+    fn add_directive_appends_above_body() {
+        let body = "- [x](x.md)\n";
+        let d = IncludeDirective::LocalPath("/a".into());
+        let next = add_include_line(body, &d);
+        assert!(next.starts_with("<!-- jarvis-include: /a -->\n"));
+        assert!(next.contains("- [x](x.md)"));
+    }
+
+    #[test]
+    fn remove_directive_strips_line() {
+        let body = "<!-- jarvis-include: /a -->\n<!-- jarvis-include: /b -->\n- [x](x.md)\n";
+        let next = remove_include_line(body, "/a");
+        assert!(!next.contains("/a"));
+        assert!(next.contains("/b"));
+    }
+
+    #[test]
+    fn directive_slug_is_stable_and_branch_aware() {
+        let s1 = directive_slug("https://h/r.git", None);
+        let s2 = directive_slug("https://h/r.git", None);
+        let s3 = directive_slug("https://h/r.git", Some("dev"));
+        assert_eq!(s1, s2);
+        assert_ne!(s1, s3);
+        assert_eq!(s1.len(), 16);
+    }
+
+    #[tokio::test]
+    async fn resolve_local_direct_memory_md() {
+        let dir = tempdir().unwrap();
+        fs::write(dir.path().join("MEMORY.md"), "- [a](a.md)")
+            .await
+            .unwrap();
+        let d = IncludeDirective::LocalPath(dir.path().to_string_lossy().to_string());
+        let resolved = resolve_include(&d, &PathBuf::from("/dev/null")).await.unwrap();
+        assert_eq!(resolved, dir.path().to_path_buf());
+    }
+
+    #[tokio::test]
+    async fn resolve_local_workspace_layout() {
+        // The include points at the workspace root (not the memory
+        // dir); the resolver must return `<root>/<MEMORY_DIR>`.
+        let dir = tempdir().unwrap();
+        let mem = dir.path().join(crate::memory::MEMORY_DIR);
+        fs::create_dir_all(&mem).await.unwrap();
+        fs::write(mem.join("MEMORY.md"), "- [a](a.md)").await.unwrap();
+        let d = IncludeDirective::LocalPath(dir.path().to_string_lossy().to_string());
+        let resolved = resolve_include(&d, &PathBuf::from("/dev/null")).await.unwrap();
+        assert_eq!(resolved, mem);
+    }
+
+    #[tokio::test]
+    async fn resolve_local_missing_returns_err() {
+        let d = IncludeDirective::LocalPath("/tmp/does-not-exist-jarvis-include".into());
+        let err = resolve_include(&d, &PathBuf::from("/dev/null"))
+            .await
+            .unwrap_err();
+        assert!(err.to_string().contains("not found"));
+    }
+
+    #[tokio::test]
+    async fn resolve_local_no_memory_md_returns_err() {
+        let dir = tempdir().unwrap();
+        let d = IncludeDirective::LocalPath(dir.path().to_string_lossy().to_string());
+        let err = resolve_include(&d, &PathBuf::from("/dev/null"))
+            .await
+            .unwrap_err();
+        assert!(err.to_string().contains("no MEMORY.md"));
+    }
+
+    #[tokio::test]
+    async fn resolve_git_clone_against_local_bare_repo() {
+        if std::process::Command::new("git")
+            .arg("--version")
+            .output()
+            .is_err()
+        {
+            return; // git could not be spawned: nothing to test
+        }
+        // Build a bare upstream, seed a work tree with MEMORY.md, push it.
+        let upstream = tempdir().unwrap();
+        std::process::Command::new("git")
+            .args(["init", "-q", "--bare", "-b", "main"])
+            .arg(upstream.path())
+            .status()
+            .unwrap();
+        let work = tempdir().unwrap();
+        std::process::Command::new("git")
+            .args(["init", "-q", "-b", "main"])
+            .arg(work.path())
+            .status()
+            .unwrap();
+        std::process::Command::new("git")
+            .arg("-C")
+            .arg(work.path())
+            .args(["config", "user.email", "t@t"])
+            .status()
+            .unwrap();
+        std::process::Command::new("git")
+            .arg("-C")
+            .arg(work.path())
+            .args(["config", "user.name", "T"])
+            .status()
+            .unwrap();
+        fs::write(work.path().join("MEMORY.md"), "- [seed](seed.md)\n")
+            .await
+            .unwrap();
+        std::process::Command::new("git")
+            .arg("-C")
+            .arg(work.path())
+            .args(["add", "-A"])
+            .status()
+            .unwrap();
+        std::process::Command::new("git")
+            .arg("-C")
+            .arg(work.path())
+            .args(["commit", "-qm", "seed"])
+            .status()
+            .unwrap();
+        std::process::Command::new("git")
+            .arg("-C")
+            .arg(work.path())
+            .args(["remote", "add", "origin"])
+            .arg(upstream.path())
+            .status()
+            .unwrap();
+        std::process::Command::new("git")
+            .arg("-C")
+            .arg(work.path())
+            .args(["push", "-q", "-u", "origin", "main"])
+            .status()
+            .unwrap();
+
+        let cache = tempdir().unwrap();
+        let d = IncludeDirective::GitUrl {
+            url: upstream.path().to_string_lossy().to_string(),
+            branch: None,
+        };
+        let resolved = resolve_include(&d, cache.path()).await.unwrap();
+        let body = fs::read_to_string(resolved.join("MEMORY.md")).await.unwrap();
+        assert!(body.contains("seed"));
+    }
+
+    #[tokio::test]
+    async fn refresh_only_applies_to_git() {
+        let d = IncludeDirective::LocalPath("/a".into());
+        let err = refresh_git_cache(&d, &PathBuf::from("/tmp/cache"))
+            .await
+            .unwrap_err();
+        assert!(err.to_string().contains("only applies"));
+    }
+
+    #[tokio::test]
+    async fn maybe_refresh_noop_on_local_path() {
+        let d = IncludeDirective::LocalPath("/anywhere".into());
+        let result = maybe_refresh_git_cache(&d, &PathBuf::from("/tmp"), Duration::from_secs(1))
+            .await
+            .unwrap();
+        assert!(!result);
+    }
+
+    #[tokio::test]
+    async fn maybe_refresh_noop_when_cache_missing() {
+        let d = IncludeDirective::GitUrl {
+            url: "https://example.invalid/r.git".into(),
+            branch: None,
+        };
+        let cache = tempdir().unwrap();
+        let result = maybe_refresh_git_cache(&d, cache.path(), Duration::from_secs(1))
+            .await
+            .unwrap();
+        assert!(!result, "missing cache should not trigger network");
+    }
+
+    #[tokio::test]
+    async fn maybe_refresh_noop_when_within_ttl() {
+        // Create the (empty) cache dir for this directive's slug. It is
+        // brand new, so with a 24 h TTL it is not stale and git is not run.
+        let cache = tempdir().unwrap();
+        let d = IncludeDirective::GitUrl {
+            url: "https://example.invalid/r.git".into(),
+            branch: None,
+        };
+        let slug = directive_slug("https://example.invalid/r.git", None);
+        let cache_dir = cache.path().join(&slug);
+        std::fs::create_dir_all(&cache_dir).unwrap();
+        let result = maybe_refresh_git_cache(&d, cache.path(), Duration::from_secs(3600 * 24))
+            .await
+            .unwrap();
+        assert!(!result);
+    }
+}
diff --git a/crates/harness-tools/src/memory_include_tools.rs b/crates/harness-tools/src/memory_include_tools.rs
new file mode 100644
index 0000000..ed9d108
--- /dev/null
+++ b/crates/harness-tools/src/memory_include_tools.rs
@@ -0,0 +1,463 @@
+//! P16 — agent-facing tools for the `MEMORY.md` include
+//! directives.
+//!
+//! Tools:
+//! - `memory.include_add(target, scope?)` — adds a directive line
+//!   at the top of the scope's MEMORY.md. For git URLs the initial
+//!   clone happens immediately so the agent gets fast feedback on
+//!   bad URLs / auth instead of discovering them on next restart.
+//! - `memory.include_list(scope?)` — returns the parsed
+//!   directives + resolution status per entry.
+//! - `memory.include_remove(target, scope?)` — strips a directive
+//!   line.
+//! - `memory.include_refresh(target)` — git includes only:
+//!   nuke and re-clone the cache (takes no `scope`; the cache is shared).
+
+use std::path::{Path, PathBuf};
+
+use async_trait::async_trait;
+use harness_core::{BoxError, Tool, ToolCategory};
+use serde_json::{json, Value};
+use tokio::fs;
+
+use crate::memory::{index_path, MemoryRoots, MemoryScope};
+#[cfg(test)]
+use crate::memory::MEMORY_DIR;
+use crate::memory_include::{
+    add_include_line, parse_include_directives, refresh_git_cache, remove_include_line,
+    resolve_include, IncludeDirective,
+};
+
+fn parse_scope_arg(s: &str) -> Result<MemoryScope, BoxError> {
+    MemoryScope::from_wire(s)
+        .ok_or_else(|| -> BoxError { format!("unknown scope `{s}` — use `workspace` or `user`").into() })
+}
+
+/// Include-cache location for tools outside `serve.rs` (which has its
+/// own resolver): `$HOME/.jarvis/include-cache` when `HOME` is set,
+/// else `jarvis-include-cache` under the system temp dir, so callers
+/// always get a path. Nothing is created on disk here.
+fn include_cache_root() -> PathBuf {
+    match std::env::var_os("HOME") {
+        Some(home) => PathBuf::from(home).join(".jarvis/include-cache"),
+        None => std::env::temp_dir().join("jarvis-include-cache"),
+    }
+}
+
+/// Replace `path` with `body` via a sibling `.tmp` file + rename (parent dirs
+/// are created first). A staged temp file is removed if the rename fails.
+async fn write_atomic(path: &Path, body: &str) -> Result<(), BoxError> {
+    if let Some(dir) = path.parent() {
+        fs::create_dir_all(dir).await.map_err(|e| format!("mkdir {}: {e}", dir.display()))?;
+    }
+    let tmp = path.with_extension("tmp");
+    fs::write(&tmp, body).await.map_err(|e| format!("write {}: {e}", tmp.display()))?;
+    if let Err(e) = fs::rename(&tmp, path).await {
+        // Best-effort cleanup so a failed swap does not leave the temp file behind.
+        let _ = fs::remove_file(&tmp).await;
+        return Err(format!("rename {}: {e}", path.display()).into());
+    }
+    Ok(())
+}
+
+async fn read_or_empty(path: &Path) -> String {
+    fs::read_to_string(path).await.ok().unwrap_or_default() // any read error becomes ""
+}
+
+// -------- memory.include_add --------
+
+/// Agent tool `memory.include_add`: validates an include target, then records it in MEMORY.md.
+pub struct MemoryIncludeAddTool {
+    roots: MemoryRoots,
+}
+impl MemoryIncludeAddTool {
+    pub fn new(roots: MemoryRoots) -> Self {
+        Self { roots }
+    }
+}
+
+#[async_trait]
+impl Tool for MemoryIncludeAddTool {
+    fn name(&self) -> &str {
+        "memory.include_add"
+    }
+    fn requires_approval(&self) -> bool {
+        true
+    }
+    fn description(&self) -> &str {
+        "Add an include directive to the scope's MEMORY.md so the \
+         system prompt also pulls in another memory tree at \
+         conversation start. `target` is either a filesystem path \
+         (absolute or `~/...`) or a `git+<url>[#branch]` URL. Git \
+         URLs trigger an immediate clone into the local cache so \
+         the agent learns about auth / URL typos here rather than \
+         on next restart."
+    }
+    fn parameters(&self) -> Value {
+        json!({
+            "type": "object",
+            "additionalProperties": false,
+            "required": ["target"],
+            "properties": {
+                "target": {
+                    "type": "string",
+                    "description": "`/abs/path/memory` or `~/path/memory` or `git+https://...[#branch]`"
+                },
+                "scope": {
+                    "type": "string",
+                    "enum": ["workspace", "user"],
+                    "description": "Which scope's MEMORY.md to modify. Defaults to `workspace`."
+                }
+            }
+        })
+    }
+    fn summary_for_audit(&self, args: &Value) -> Option<String> {
+        args.get("target").and_then(Value::as_str).map(str::to_string)
+    }
+    async fn invoke(&self, args: Value) -> Result<String, BoxError> {
+        let Some(target) = args.get("target").and_then(Value::as_str) else {
+            return Err("missing `target` argument".into());
+        };
+        let directive = IncludeDirective::parse_target(target)
+            .ok_or_else(|| -> BoxError { format!("invalid include target `{target}`").into() })?;
+        let scope = match args.get("scope").and_then(Value::as_str) {
+            Some(raw) => parse_scope_arg(raw)?,
+            None => MemoryScope::Workspace,
+        };
+        let roots = MemoryRoots {
+            workspace_root: harness_core::active_workspace_or(&self.roots.workspace_root),
+            user_root: self.roots.user_root.clone(),
+        };
+        let root = roots.root_for(scope)?;
+        let index = index_path(root);
+        // Only a missing MEMORY.md counts as empty. Any other read failure must
+        // abort, or the rewrite below would replace real content with one line.
+        let existing = match fs::read_to_string(&index).await {
+            Ok(text) => text,
+            Err(e) if e.kind() == std::io::ErrorKind::NotFound => String::new(),
+            Err(e) => return Err(format!("read {}: {e}", index.display()).into()),
+        };
+        // Resolve eagerly (git URLs clone here, local paths are checked) and
+        // fail BEFORE writing, so a broken target never lands in MEMORY.md.
+        let _ = resolve_include(&directive, &include_cache_root()).await?;
+        let next = add_include_line(&existing, &directive);
+        write_atomic(&index, &next).await?;
+        harness_core::note_working_file_relative_to(&index, Some(root));
+        Ok(json!({
+            "ok": true,
+            "added": directive.as_wire(),
+            "scope": scope.as_wire(),
+            "memory_md": index.display().to_string(),
+        })
+        .to_string())
+    }
+}
+
+// -------- memory.include_list --------
+
+/// Agent tool `memory.include_list`: reports a scope's include directives and whether each resolves.
+pub struct MemoryIncludeListTool {
+    roots: MemoryRoots,
+}
+impl MemoryIncludeListTool {
+    pub fn new(roots: MemoryRoots) -> Self {
+        Self { roots }
+    }
+}
+
+#[async_trait]
+impl Tool for MemoryIncludeListTool {
+    fn name(&self) -> &str {
+        "memory.include_list"
+    }
+    fn description(&self) -> &str {
+        "Return the include directives declared at the top of the \
+         scope's MEMORY.md plus their resolution status. Each \
+         entry reports `target`, `kind` (`local_path` | \
+         `git_url`), and `resolves` (bool with `error` when false). \
+         No mutations."
+    }
+    fn parameters(&self) -> Value {
+        json!({
+            "type": "object",
+            "additionalProperties": false,
+            "properties": {
+                "scope": {
+                    "type": "string",
+                    "enum": ["workspace", "user"],
+                    "description": "Defaults to `workspace`."
+                }
+            }
+        })
+    }
+    fn category(&self) -> ToolCategory {
+        ToolCategory::Read
+    }
+    /// Parse the scope's MEMORY.md and try to resolve every include directive,
+    /// reporting failures per entry rather than failing the call.
+    async fn invoke(&self, args: Value) -> Result<String, BoxError> {
+        let scope = match args.get("scope").and_then(Value::as_str) {
+            Some(raw) => parse_scope_arg(raw)?,
+            None => MemoryScope::Workspace,
+        };
+        let roots = MemoryRoots {
+            workspace_root: harness_core::active_workspace_or(&self.roots.workspace_root),
+            user_root: self.roots.user_root.clone(),
+        };
+        let root = roots.root_for(scope)?;
+        let index = index_path(root);
+        let body = read_or_empty(&index).await;
+        let cache = include_cache_root();
+        let mut items = Vec::new();
+        for directive in parse_include_directives(&body) {
+            let kind = match directive {
+                IncludeDirective::LocalPath(_) => "local_path",
+                IncludeDirective::GitUrl { .. } => "git_url",
+            };
+            // One JSON entry per directive; a resolution error is recorded on
+            // the entry itself and the loop moves on to the next directive.
+            items.push(match resolve_include(&directive, &cache).await {
+                Ok(path) => json!({
+                    "target": directive.as_wire(),
+                    "kind": kind,
+                    "resolves": true,
+                    "path": path.display().to_string(),
+                }),
+                Err(err) => json!({
+                    "target": directive.as_wire(),
+                    "kind": kind,
+                    "resolves": false,
+                    "error": err.to_string(),
+                }),
+            });
+        }
+        Ok(json!({
+            "scope": scope.as_wire(),
+            "memory_md": index.display().to_string(),
+            "items": items,
+        })
+        .to_string())
+    }
+}
+
+// -------- memory.include_remove --------
+
+/// Agent tool `memory.include_remove`: strips one include directive from a scope's MEMORY.md.
+pub struct MemoryIncludeRemoveTool {
+    roots: MemoryRoots,
+}
+impl MemoryIncludeRemoveTool {
+    pub fn new(roots: MemoryRoots) -> Self {
+        Self { roots }
+    }
+}
+
+#[async_trait]
+impl Tool for MemoryIncludeRemoveTool {
+    fn name(&self) -> &str {
+        "memory.include_remove"
+    }
+    fn requires_approval(&self) -> bool {
+        true
+    }
+    fn description(&self) -> &str {
+        "Remove an include directive from the scope's MEMORY.md. \
+         `target` is the same string used when adding the include \
+         (use `memory.include_list` first to read the exact form)."
+    }
+    fn parameters(&self) -> Value {
+        json!({
+            "type": "object",
+            "additionalProperties": false,
+            "required": ["target"],
+            "properties": {
+                "target": { "type": "string" },
+                "scope": { "type": "string", "enum": ["workspace", "user"] }
+            }
+        })
+    }
+    async fn invoke(&self, args: Value) -> Result<String, BoxError> {
+        let Some(target) = args.get("target").and_then(Value::as_str) else {
+            return Err("missing `target` argument".into());
+        };
+        let scope = match args.get("scope").and_then(Value::as_str) {
+            Some(raw) => parse_scope_arg(raw)?,
+            None => MemoryScope::Workspace,
+        };
+        let roots = MemoryRoots {
+            workspace_root: harness_core::active_workspace_or(&self.roots.workspace_root),
+            user_root: self.roots.user_root.clone(),
+        };
+        let index = index_path(roots.root_for(scope)?);
+        // Only a missing file is treated as empty; any other read error aborts.
+        let existing = match fs::read_to_string(&index).await {
+            Ok(text) => text,
+            Err(e) if e.kind() == std::io::ErrorKind::NotFound => String::new(),
+            Err(e) => return Err(format!("read {}: {e}", index.display()).into()),
+        };
+        let next = remove_include_line(&existing, target);
+        if next != existing { // nothing matched => leave (or don't create) the file
+            write_atomic(&index, &next).await?;
+        }
+        Ok(json!({
+            "ok": true,
+            "removed": target,
+            "scope": scope.as_wire(),
+        })
+        .to_string())
+    }
+}
+
+// -------- memory.include_refresh --------
+
+/// Agent tool `memory.include_refresh`; stateless, hence a unit struct.
+pub struct MemoryIncludeRefreshTool;
+
+#[async_trait]
+impl Tool for MemoryIncludeRefreshTool {
+    fn name(&self) -> &str {
+        "memory.include_refresh"
+    }
+    fn requires_approval(&self) -> bool {
+        true
+    }
+    fn description(&self) -> &str {
+        "Wipe and re-clone the local cache for a `git+...` include. \
+         Local-path includes are rejected with an error (they always \
+         read from the source). Use this when a team member pushed a \
+         new memory entry and you want to pick it up without restarting."
+    }
+    fn parameters(&self) -> Value {
+        json!({
+            "type": "object",
+            "additionalProperties": false,
+            "required": ["target"],
+            "properties": {
+                "target": {
+                    "type": "string",
+                    "description": "The `git+<url>[#branch]` string to refresh."
+                }
+            }
+        })
+    }
+    async fn invoke(&self, args: Value) -> Result<String, BoxError> {
+        let Some(target) = args.get("target").and_then(Value::as_str) else {
+            return Err("missing `target` argument".into());
+        };
+        let directive = IncludeDirective::parse_target(target)
+            .ok_or_else(|| -> BoxError { format!("invalid include target `{target}`").into() })?;
+        // A local-path directive makes `refresh_git_cache` fail; that error is returned as-is.
+        let resolved = refresh_git_cache(&directive, &include_cache_root()).await?;
+        Ok(json!({
+            "ok": true,
+            "target": directive.as_wire(),
+            "cache_path": resolved.display().to_string(),
+        })
+        .to_string())
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use tempfile::tempdir;
+
+    fn ws_roots(root: &std::path::Path) -> MemoryRoots {
+        MemoryRoots::new(root.to_path_buf())
+    }
+
+    /// Adding a resolvable local path writes the directive into MEMORY.md.
+    #[tokio::test]
+    async fn add_local_include_writes_directive() {
+        let ws = tempdir().unwrap();
+        // The target must be a real memory tree, otherwise the eager
+        // validation inside `invoke` rejects it.
+        let upstream = tempdir().unwrap();
+        let upstream_mem = upstream.path().join(MEMORY_DIR);
+        fs::create_dir_all(&upstream_mem).await.unwrap();
+        let seed = upstream_mem.join("MEMORY.md");
+        fs::write(seed, "- [foo](foo.md)\n").await.unwrap();
+        let target = upstream.path().to_string_lossy().to_string();
+
+        // No `scope` argument: the tool falls back to the workspace scope.
+        let tool = MemoryIncludeAddTool::new(ws_roots(ws.path()));
+        let reply = tool.invoke(json!({ "target": &target })).await.unwrap();
+        let reply: Value = serde_json::from_str(&reply).unwrap();
+        assert_eq!(reply["ok"], true);
+
+        // The directive must now be on disk in the workspace MEMORY.md.
+        let index = ws.path().join(MEMORY_DIR).join("MEMORY.md");
+        let body = fs::read_to_string(index).await.unwrap();
+        assert!(body.contains("<!-- jarvis-include: "));
+        assert!(body.contains(&target));
+    }
+
+    /// A target that cannot be resolved errors out and leaves no MEMORY.md behind.
+    #[tokio::test]
+    async fn add_rejects_unresolvable_target() {
+        let ws = tempdir().unwrap();
+        let tool = MemoryIncludeAddTool::new(ws_roots(ws.path()));
+        let request = json!({"target": "/tmp/does-not-exist-include"});
+        let failure = tool.invoke(request).await.unwrap_err();
+        assert!(failure.to_string().contains("not found"));
+
+        // Crucially: MEMORY.md was NOT created with a broken directive.
+        let index = ws.path().join(MEMORY_DIR).join("MEMORY.md");
+        let readback = fs::read_to_string(index).await;
+        assert!(readback.is_err(), "should not have written MEMORY.md");
+    }
+
+    /// Listing reports each directive separately: one resolves, one does not.
+    #[tokio::test]
+    async fn list_reports_resolution_per_entry() {
+        // A real upstream memory tree for the directive that should resolve.
+        let upstream = tempdir().unwrap();
+        let up_mem = upstream.path().join(MEMORY_DIR);
+        fs::create_dir_all(&up_mem).await.unwrap();
+        fs::write(up_mem.join("MEMORY.md"), "- [x](x.md)\n").await.unwrap();
+        // Workspace MEMORY.md: the good directive, then one pointing nowhere.
+        let ws = tempdir().unwrap();
+        let mem = ws.path().join(MEMORY_DIR);
+        fs::create_dir_all(&mem).await.unwrap();
+        let good = upstream.path().display();
+        let missing = format!("/tmp/none-{}", std::process::id());
+        let body = format!("<!-- jarvis-include: {good} -->\n<!-- jarvis-include: {missing} -->\n");
+        fs::write(mem.join("MEMORY.md"), body).await.unwrap();
+
+        let tool = MemoryIncludeListTool::new(ws_roots(ws.path()));
+        let reply: Value = serde_json::from_str(&tool.invoke(json!({})).await.unwrap()).unwrap();
+        let items = reply["items"].as_array().unwrap();
+        assert_eq!(items.len(), 2);
+        assert_eq!(items[0]["resolves"], true);
+        assert_eq!(items[1]["resolves"], false);
+        assert!(items[1]["error"].as_str().unwrap().contains("not found"));
+    }
+
+    /// Removing `/a` drops only that directive; `/b` stays in MEMORY.md.
+    #[tokio::test]
+    async fn remove_strips_directive() {
+        const SEED: &str = "<!-- jarvis-include: /a -->\n<!-- jarvis-include: /b -->\n";
+        let ws = tempdir().unwrap();
+        let mem = ws.path().join(MEMORY_DIR);
+        let index = mem.join("MEMORY.md");
+        fs::create_dir_all(&mem).await.unwrap();
+        fs::write(&index, SEED).await.unwrap();
+
+        let tool = MemoryIncludeRemoveTool::new(ws_roots(ws.path()));
+        tool.invoke(json!({"target": "/a"})).await.unwrap();
+
+        let after = fs::read_to_string(&index).await.unwrap();
+        assert!(!after.contains("/a"));
+        assert!(after.contains("/b"));
+    }
+
+    /// Refresh is git-only: a local-path target must be refused.
+    #[tokio::test]
+    async fn refresh_rejects_local_path() {
+        let request = json!({"target": "/some/path"});
+        // The tool holds no state, so the unit value is all there is to build.
+        let tool = MemoryIncludeRefreshTool;
+        let failure = tool.invoke(request).await.unwrap_err();
+        assert!(failure.to_string().contains("only applies"));
+    }
+}
diff --git a/crates/harness-tools/src/memory_sync.rs b/crates/harness-tools/src/memory_sync.rs
new file mode 100644
index 0000000..ea7ff7f
--- /dev/null
+++ b/crates/harness-tools/src/memory_sync.rs
@@ -0,0 +1,1291 @@
+//! P10 — `memory.sync` / `memory.sync_status`.
+//!
+//! Git-as-transport network sync for the M3.1+P9 memory tree. The
+//! operator (or their team) hosts a private git repo somewhere they
+//! already trust (GitHub / GitLab / self-hosted), points the local
+//! `~/.jarvis/memory/` at it via `git remote add origin <url>`, and
+//! these two tools wrap pull/push + status so the agent can keep the
+//! local tree in step without the user re-typing git commands.
+//!
+//! Why git?
+//!
+//! - Auth, conflict resolution, history, branching, offline buffering
+//!   are all solved problems on git's side.
+//! - The user has a clear mental model: it's a repo, it follows the
+//!   same rules as every other git checkout they have.
+//! - We don't have to design, ship, or maintain a sync server.
+//! - The same flow works for `<workspace>/.jarvis/memory/` too —
+//!   that directory naturally syncs via the workspace's own repo,
+//!   `memory.sync` is mostly meant for the `~/.jarvis/memory/`
+//!   (user-scope) case where there's no auto-sync from the workspace's
+//!   normal git flow.
+//!
+//! Both tools are opt-in via [`crate::BuiltinsConfig::enable_memory_sync`]
+//! — they spawn the host's `git` binary which is more side-effectful
+//! than the rest of the memory toolset.
+
+use std::path::{Path, PathBuf};
+use std::process::Stdio;
+use std::time::Duration;
+
+use async_trait::async_trait;
+use harness_core::{BoxError, Tool, ToolCategory};
+use serde_json::{json, Value};
+use tokio::process::Command;
+
+use crate::memory::{MemoryRoots, MemoryScope, MEMORY_DIR};
+
+/// Sync transport the user has opted into. The choices are mutually
+/// exclusive — the model + tool set adapt to the selection so a
+/// `git`-backed deployment never sees iCloud-only tools and vice versa.
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Default)]
+pub enum MemorySyncBackend {
+    /// No sync transport; the default when the user hasn't opted in.
+    /// Memory still works locally, there is just no "push it elsewhere" tool.
+    #[default]
+    None,
+    /// P10/P11 — git pull/push against a remote. Cross-platform,
+    /// explicit, works for any host with `git` on `PATH`.
+    Git,
+    /// P13 (macOS-only) — keep the user-scope memory inside iCloud Drive
+    /// and let macOS sync it. No protocol code in Jarvis; the OS takes over
+    /// once files land in `~/Library/Mobile Documents/com~apple~CloudDocs/Jarvis/`.
+    ICloud,
+}
+
+impl MemorySyncBackend {
+    /// Canonical lowercase wire name for this backend.
+    pub fn as_wire(&self) -> &'static str {
+        match *self {
+            Self::None => "none",
+            Self::Git => "git",
+            Self::ICloud => "icloud",
+        }
+    }
+
+    /// Parse a wire name: trimmed, ASCII case-insensitive, with a few
+    /// aliases (empty / `off` / `disabled`, `icloud-drive`). Unknown → `None`.
+    pub fn from_wire(s: &str) -> Option<Self> {
+        let backend = match s.trim().to_ascii_lowercase().as_str() {
+            "" | "none" | "off" | "disabled" => Self::None,
+            "git" => Self::Git,
+            "icloud" | "icloud-drive" => Self::ICloud,
+            _ => return None,
+        };
+        Some(backend)
+    }
+}
+
+/// Per-user iCloud Drive root on macOS:
+/// `$HOME/Library/Mobile Documents/com~apple~CloudDocs`. The suffix is
+/// fixed; only the home directory varies. Returns `None` off macOS or
+/// when `HOME` is unset — the caller decides whether to error or fall
+/// back. The path is not checked for existence here.
+pub fn icloud_drive_root() -> Option<PathBuf> {
+    cfg!(target_os = "macos")
+        .then(|| std::env::var_os("HOME"))
+        .flatten()
+        .map(|home| PathBuf::from(home).join("Library/Mobile Documents/com~apple~CloudDocs"))
+}
+
+/// Location of the Jarvis memory subdir inside iCloud Drive:
+/// `<icloud_drive_root>/Jarvis`. `None` when iCloud Drive isn't
+/// available — `icloud_drive_root` returned `None` (non-macOS, `HOME`
+/// unset) or the iCloud root dir doesn't exist, which happens when
+/// the user hasn't enabled iCloud Drive. Only the drive root is
+/// checked for existence, not the `Jarvis` subdir. Callers should
+/// fall back to the non-iCloud user_root in that case.
+pub fn icloud_memory_root() -> Option<PathBuf> {
+    icloud_drive_root()
+        .filter(|drive| drive.exists())
+        .map(|drive| drive.join("Jarvis"))
+}
+
+/// Default per-call git timeout (60s): network pulls / pushes take a few seconds
+/// even on a healthy link. Callers can pass a different `timeout_ms` per call.
+const DEFAULT_TIMEOUT_MS: u64 = 60_000;
+/// Per-stream cap (64 KiB) applied to captured git stdout / stderr.
+const DEFAULT_MAX_BYTES: usize = 64 * 1024;
+
+/// Path of the memory directory for `scope`: the scope's root joined
+/// with `MEMORY_DIR`. Propagates the `root_for` error when the scope's
+/// root is unavailable. The directory is not created or checked on
+/// disk.
+fn memory_dir_for(roots: &MemoryRoots, scope: MemoryScope) -> Result<PathBuf, BoxError> {
+    Ok(roots.root_for(scope)?.join(MEMORY_DIR))
+}
+
+/// Run `git -C <cwd> <args...>` with stdin closed and both output streams
+/// captured; shared by every git call in this module so they all get the
+/// same spawn / timeout / truncation contract. Returns
+/// `(exit_ok, stdout, stderr)`, each stream lossily decoded and capped at
+/// `DEFAULT_MAX_BYTES`. Spawn failures, wait errors and exceeding
+/// `timeout_ms` are reported as `Err`.
+async fn run_git(
+    cwd: &Path,
+    args: &[&str],
+    timeout_ms: u64,
+) -> Result<(bool, String, String), BoxError> {
+    let child = Command::new("git")
+        .arg("-C")
+        .arg(cwd)
+        .args(args)
+        .stdin(Stdio::null())
+        .stdout(Stdio::piped())
+        .stderr(Stdio::piped())
+        .kill_on_drop(true)
+        .spawn()
+        .map_err(|e| -> BoxError { format!("failed to spawn git: {e}").into() })?;
+
+    let deadline = Duration::from_millis(timeout_ms);
+    let output = match tokio::time::timeout(deadline, child.wait_with_output()).await {
+        Err(_) => return Err(format!("git timed out after {timeout_ms} ms").into()),
+        Ok(Err(e)) => return Err(format!("git process error: {e}").into()),
+        Ok(Ok(done)) => done,
+    };
+
+    // Decode lossily, then cap each stream independently.
+    let clip = |raw: &[u8]| {
+        let mut text = String::from_utf8_lossy(raw).into_owned();
+        if text.len() > DEFAULT_MAX_BYTES {
+            truncate_to(&mut text, DEFAULT_MAX_BYTES);
+        }
+        text
+    };
+    Ok((output.status.success(), clip(&output.stdout), clip(&output.stderr)))
+}
+
+/// Cut `s` to at most `max_bytes` content bytes on a UTF-8 char boundary, then
+/// append a truncation marker (the marker itself is not counted in the cap).
+fn truncate_to(s: &mut String, max_bytes: usize) {
+    let cut = (0..=max_bytes.min(s.len()))
+        .rev()
+        .find(|&i| s.is_char_boundary(i)) // index 0 always qualifies
+        .unwrap_or(0);
+    s.truncate(cut);
+    s.push_str(&format!("\n[... truncated at {max_bytes} bytes ...]\n"));
+}
+
+/// Probe whether `cwd` is inside a git work tree by running
+/// `git rev-parse --is-inside-work-tree` (5s cap) and checking for a
+/// successful exit. A missing dir or any `run_git` error counts as "no".
+async fn is_git_repo(cwd: &Path) -> bool {
+    if !cwd.exists() {
+        return false;
+    }
+    match run_git(cwd, &["rev-parse", "--is-inside-work-tree"], 5_000).await {
+        Ok((inside, _, _)) => inside,
+        Err(_) => false,
+    }
+}
+
+fn parse_scope_arg(s: &str) -> Result<MemoryScope, BoxError> {
+    MemoryScope::from_wire(s)
+        .ok_or_else(|| -> BoxError { format!("unknown scope `{s}` — use `workspace` or `user`").into() })
+}
+
+/// User-facing setup instructions for when the memory dir at `path` isn't a
+/// git repository yet; the path is interpolated into the message twice.
+fn setup_hint(path: &Path) -> String {
+    let dir = path.display();
+    format!(
+        "memory dir `{dir}` is not a git repository.\n\
+         to set up sync:\n  \
+         1. create a private remote repo (GitHub / GitLab / self-hosted)\n  \
+         2. cd {dir} && git init && git remote add origin <url>\n  \
+         3. git add . && git commit -m \"seed\" && git push -u origin main\n\
+         then re-run memory.sync."
+    )
+}
+
+// --- memory.sync ---
+
+/// Agent tool `memory.sync`; holds the memory roots it resolves scopes against.
+pub struct MemorySyncTool {
+    roots: MemoryRoots,
+}
+impl MemorySyncTool {
+    pub fn new(roots: MemoryRoots) -> Self {
+        MemorySyncTool { roots }
+    }
+}
+
+#[async_trait]
+impl Tool for MemorySyncTool {
+    fn name(&self) -> &str {
+        "memory.sync"
+    }
+    fn requires_approval(&self) -> bool {
+        true
+    }
+    fn description(&self) -> &str {
+        "Sync the memory tree with its configured git remote. \
+         Defaults to user scope (`~/.jarvis/memory/`). Runs \
+         `git pull --rebase` then `git push`; if either fails (merge \
+         conflict, auth, no remote, no network) returns the git \
+         stderr verbatim plus a hint. The memory dir must already be \
+         a git working tree — run `memory.sync_status` first to \
+         check, or follow the setup hint the tool prints on first \
+         use. Approval-gated because the push side has an external \
+         effect."
+    }
+    fn parameters(&self) -> Value {
+        json!({
+            "type": "object",
+            "additionalProperties": false,
+            "properties": {
+                "scope": {
+                    "type": "string",
+                    "enum": ["workspace", "user"],
+                    "description": "Which memory tree to sync. Defaults to `user`."
+                },
+                "remote": {
+                    "type": "string",
+                    "description": "Optional remote name (defaults to `origin`)."
+                },
+                "branch": {
+                    "type": "string",
+                    "description": "Optional branch (defaults to the repo's current branch)."
+                },
+                "timeout_ms": {
+                    "type": "integer",
+                    "description": "Per-git-call timeout. Defaults to 60000 (60s)."
+                }
+            }
+        })
+    }
+    fn summary_for_audit(&self, args: &Value) -> Option<String> {
+        let scope = args.get("scope").and_then(Value::as_str).unwrap_or("user");
+        let remote = args
+            .get("remote")
+            .and_then(Value::as_str)
+            .unwrap_or("origin");
+        Some(format!("{scope} → {remote}"))
+    }
+    /// Pull (rebase) then push the scope's memory dir, returning a JSON report.
+    /// Git-level failures are reported inside the JSON, not as `Err`.
+    async fn invoke(&self, args: Value) -> Result<String, BoxError> {
+        let scope = match args.get("scope").and_then(Value::as_str) {
+            Some(raw) => parse_scope_arg(raw)?,
+            None => MemoryScope::User,
+        };
+        let workspace_root = harness_core::active_workspace_or(&self.roots.workspace_root);
+        let roots = MemoryRoots {
+            workspace_root,
+            user_root: self.roots.user_root.clone(),
+        };
+        let dir = memory_dir_for(&roots, scope)?;
+        let timeout_ms = args
+            .get("timeout_ms")
+            .and_then(Value::as_u64)
+            .unwrap_or(DEFAULT_TIMEOUT_MS);
+
+        if !is_git_repo(&dir).await {
+            return Err(setup_hint(&dir).into());
+        }
+
+        let remote_arg = args.get("remote").and_then(Value::as_str);
+        let remote = remote_arg.unwrap_or("origin");
+        // Validate remote / branch names — refuse anything that
+        // looks like a flag so the model can't smuggle a
+        // `--upload-pack=<cmd>` style option through.
+        if remote.starts_with('-') || remote.contains(char::is_whitespace) {
+            return Err(format!("invalid remote name `{remote}`").into());
+        }
+
+        let branch_arg = args.get("branch").and_then(Value::as_str);
+        if let Some(b) = branch_arg {
+            if b.starts_with('-') || b.contains(char::is_whitespace) {
+                return Err(format!("invalid branch name `{b}`").into());
+            }
+        }
+
+        let mut report = serde_json::Map::new();
+        report.insert("scope".into(), json!(scope.as_wire()));
+        report.insert("dir".into(), json!(dir.display().to_string()));
+        report.insert("remote".into(), json!(remote));
+
+        // Positional `<remote> [<branch>]` tail shared by pull and push. An
+        // explicitly requested remote is honoured even without a branch; with
+        // neither argument git falls back to the branch's configured upstream.
+        let mut target: Vec<&str> = Vec::new();
+        if remote_arg.is_some() || branch_arg.is_some() {
+            target.push(remote);
+        }
+        target.extend(branch_arg);
+        // Pull --rebase first so concurrent edits from other clones
+        // land cleanly. `--autostash` would help if the local has
+        // uncommitted changes, but `memory.write` writes through
+        // an atomic temp-rename and we don't expect a dirty tree —
+        // surface dirty state as a clear error instead of silently
+        // stashing.
+        let mut pull_args = vec!["pull", "--rebase"];
+        pull_args.extend(&target);
+        let (pull_ok, pull_out, pull_err) = run_git(&dir, &pull_args, timeout_ms).await?;
+        report.insert(
+            "pull".into(),
+            json!({
+                "ok": pull_ok,
+                "stdout": pull_out.trim(),
+                "stderr": pull_err.trim(),
+            }),
+        );
+        if !pull_ok {
+            report.insert(
+                "hint".into(),
+                json!(
+                    "pull failed — run `git -C <dir> status` to inspect; \
+                     resolve conflicts manually and re-run memory.sync."
+                ),
+            );
+            return Ok(serde_json::to_string_pretty(&report).unwrap_or_default());
+        }
+
+        // Push only after a clean pull.
+        let mut push_args = vec!["push"];
+        push_args.extend(&target);
+        let (push_ok, push_out, push_err) = run_git(&dir, &push_args, timeout_ms).await?;
+        report.insert(
+            "push".into(),
+            json!({
+                "ok": push_ok,
+                "stdout": push_out.trim(),
+                "stderr": push_err.trim(),
+            }),
+        );
+        if !push_ok {
+            report.insert(
+                "hint".into(),
+                json!(
+                    "push failed — common causes: remote not set, auth missing, \
+                     or branch not tracking. Run `git -C <dir> push -u origin <branch>` once \
+                     to establish tracking."
+                ),
+            );
+        }
+
+        // Capture HEAD so the caller can confirm the sync moved
+        // (or didn't) and the model can log it.
+        if let Ok((true, head, _)) = run_git(&dir, &["rev-parse", "HEAD"], 5_000).await {
+            report.insert("head".into(), json!(head.trim()));
+        }
+        Ok(serde_json::to_string_pretty(&report).unwrap_or_default())
+    }
+}
+
+// --- background auto-sync ticker (P11.2) ---
+
+/// Default cadence for the background auto-sync ticker, in seconds
+/// (300 s = 5 minutes). Long enough that a quick burst of edits doesn't
+/// hammer the remote, short enough that cross-machine drift stays bounded.
+pub const DEFAULT_AUTO_SYNC_INTERVAL_SECS: u64 = 300;
+
+/// Settings for [`spawn_auto_sync_task`].
+#[derive(Debug, Clone)]
+pub struct AutoSyncConfig {
+    /// Memory roots handed to the `MemorySyncTool` that performs each sync.
+    pub roots: MemoryRoots,
+    /// Scope synced on every tick. Typically `User` — workspace scope is
+    /// usually tracked by the project's own repo.
+    pub scope: MemoryScope,
+    /// Tick interval. The first periodic sync fires about one `interval`
+    /// after the task starts, not immediately, so an early shell doesn't
+    /// race with `serve_*_runtime` initialisation.
+    pub interval: Duration,
+    /// Also run one full sync (pull, then push) right at task start, e.g.
+    /// to pick up what another machine pushed while this one was offline.
+    /// `true` in [`AutoSyncConfig::with_defaults`].
+    pub initial_pull: bool,
+}
+
+impl AutoSyncConfig {
+    /// User scope, `DEFAULT_AUTO_SYNC_INTERVAL_SECS` cadence, initial sync enabled.
+    pub fn with_defaults(roots: MemoryRoots) -> Self {
+        Self {
+            initial_pull: true,
+            interval: Duration::from_secs(DEFAULT_AUTO_SYNC_INTERVAL_SECS),
+            scope: MemoryScope::User,
+            roots,
+        }
+    }
+}
+
+/// Spawn a background tokio task that periodically syncs the configured
+/// memory scope against its git remote. Dropping the returned `JoinHandle`
+/// only detaches the task; call `JoinHandle::abort` to stop ticking. Sync
+/// failures are logged by `run_one_sync`, never propagated. A zero
+/// `interval` is clamped to 1 ms because tokio panics on a zero period.
+pub fn spawn_auto_sync_task(cfg: AutoSyncConfig) -> tokio::task::JoinHandle<()> {
+    tokio::spawn(async move {
+        let tool = MemorySyncTool::new(cfg.roots.clone());
+        if cfg.initial_pull {
+            run_one_sync(&tool, cfg.scope, "initial").await;
+        }
+        let period = cfg.interval.max(Duration::from_millis(1));
+        // First tick is one period out; slow syncs delay ticks, never burst.
+        let mut ticker = tokio::time::interval_at(tokio::time::Instant::now() + period, period);
+        ticker.set_missed_tick_behavior(tokio::time::MissedTickBehavior::Delay);
+        loop {
+            ticker.tick().await;
+            run_one_sync(&tool, cfg.scope, "periodic").await;
+        }
+    })
+}
+
+/// Run one sync and log the outcome. `invoke` reports a failed git step as
+/// `{"ok": false}` inside an `Ok` body, so such runs are logged as warnings.
+async fn run_one_sync(tool: &MemorySyncTool, scope: MemoryScope, kind: &'static str) {
+    let args = serde_json::json!({ "scope": scope.as_wire() });
+    match tool.invoke(args).await {
+        Ok(body) => {
+            let report = body.trim().replace('\n', " ");
+            let step_failed = serde_json::from_str::<Value>(&body).is_ok_and(|v| {
+                v.as_object().is_some_and(|m| m.values().any(|s| s["ok"] == false))
+            });
+            if step_failed {
+                tracing::warn!(kind, scope = scope.as_wire(), report = %report, "memory auto-sync step failed (will retry on next tick)");
+            } else {
+                tracing::info!(kind, scope = scope.as_wire(), report = %report, "memory auto-sync ok");
+            }
+        }
+        Err(e) => {
+            tracing::warn!(kind, scope = scope.as_wire(), error = %e, "memory auto-sync failed (will retry on next tick)");
+        }
+    }
+}
+
+// --- memory.sync_setup_icloud (P13) ---
+
+pub struct MemoryICloudSetupTool {
+    roots: MemoryRoots,
+}
+
+impl MemoryICloudSetupTool {
+    pub fn new(roots: MemoryRoots) -> Self {
+        Self { roots }
+    }
+}
+
+#[async_trait]
+impl Tool for MemoryICloudSetupTool {
+    fn name(&self) -> &str {
+        "memory.sync_setup_icloud"
+    }
+    fn requires_approval(&self) -> bool {
+        true
+    }
+    fn description(&self) -> &str {
+        "Set up iCloud Drive as the user-scope memory sync transport \
+         (macOS only). Creates a `Jarvis/` folder inside \
+         `~/Library/Mobile Documents/com~apple~CloudDocs/` (iCloud \
+         Drive's local mount) and returns the absolute path. macOS \
+         then syncs that folder to every device signed into the same \
+         Apple ID — no Jarvis-side protocol needed. \
+         \
+         Caveats: macOS-only (this tool errors on Linux/Windows); \
+         the operator must have iCloud Drive enabled in System \
+         Settings; first run may need to set \
+         `JARVIS_MEMORY_USER_ROOT` to the returned path until \
+         iCloud auto-resolution is wired up at startup."
+    }
+    fn parameters(&self) -> Value {
+        json!({
+            "type": "object",
+            "additionalProperties": false,
+            "properties": {}
+        })
+    }
+    /// Creates `Jarvis/` inside the iCloud Drive mount and reports its path as JSON.
+    async fn invoke(&self, _args: Value) -> Result<String, BoxError> {
+        if !cfg!(target_os = "macos") {
+            return Err("iCloud Drive sync is macOS-only".into());
+        }
+        let drive_root = icloud_drive_root()
+            .ok_or_else(|| -> BoxError { "HOME unresolvable; cannot locate iCloud Drive".into() })?;
+        if !drive_root.exists() {
+            return Err(format!(
+                "iCloud Drive base `{}` does not exist. Enable iCloud Drive in System Settings first.",
+                drive_root.display()
+            )
+            .into());
+        }
+        let target = drive_root.join("Jarvis");
+        tokio::fs::create_dir_all(&target)
+            .await
+            .map_err(|e| -> BoxError { format!("mkdir {}: {e}", target.display()).into() })?;
+        // `roots` is not consulted: the returned path is derived from the
+        // iCloud Drive location alone. This no-op borrow only keeps the
+        // field referenced (NOTE(review): presumably for dead-code lints).
+        let _ = &self.roots;
+
+        let report = json!({
+            "ok": true,
+            "path": target.display().to_string(),
+            "hint": format!(
+                "Restart jarvis with `JARVIS_MEMORY_USER_ROOT={}` (or `JARVIS_MEMORY_SYNC_BACKEND=icloud`) to make this the active user-scope memory root.",
+                target.display()
+            ),
+        });
+        Ok(serde_json::to_string_pretty(&report).unwrap_or_default())
+    }
+}
+
+// --- memory.sync_setup ---
+
+pub struct MemorySyncSetupTool {
+    roots: MemoryRoots,
+}
+
+impl MemorySyncSetupTool {
+    pub fn new(roots: MemoryRoots) -> Self {
+        Self { roots }
+    }
+}
+
+#[async_trait]
+impl Tool for MemorySyncSetupTool {
+    fn name(&self) -> &str {
+        "memory.sync_setup"
+    }
+    fn requires_approval(&self) -> bool {
+        true
+    }
+    fn description(&self) -> &str {
+        "One-shot setup for memory git sync: creates the memory dir \
+         if missing, runs `git init`, adds the given `remote_url` as \
+         `origin`, seeds an empty MEMORY.md, makes the initial \
+         commit, and (by default) pushes to origin. Idempotent guard: \
+         if the dir is already a git repo, the tool errors out unless \
+         `force=true`, in which case it just updates the remote URL \
+         in place without re-initialising. Approval-gated because \
+         this writes to disk and pushes to an external remote."
+    }
+    fn parameters(&self) -> Value {
+        json!({
+            "type": "object",
+            "additionalProperties": false,
+            "required": ["remote_url"],
+            "properties": {
+                "remote_url": {
+                    "type": "string",
+                    "description": "Git URL of the remote repo (ssh / https). Pre-created private repo recommended."
+                },
+                "scope": {
+                    "type": "string",
+                    "enum": ["workspace", "user"],
+                    "description": "Which memory tree to set up. Defaults to `user`."
+                },
+                "branch": {
+                    "type": "string",
+                    "description": "Branch name for the initial commit + push. Defaults to `main`."
+                },
+                "push": {
+                    "type": "boolean",
+                    "description": "Push the initial commit after setup. Defaults to true."
+                },
+                "force": {
+                    "type": "boolean",
+                    "description": "When the dir is already a git repo, just update remote.origin.url to `remote_url` instead of erroring. Defaults to false."
+                }
+            }
+        })
+    }
+    fn summary_for_audit(&self, args: &Value) -> Option<String> {
+        let scope = args.get("scope").and_then(Value::as_str).unwrap_or("user");
+        let url = args
+            .get("remote_url")
+            .and_then(Value::as_str)
+            .unwrap_or("(missing)");
+        Some(format!("{scope} → {url}"))
+    }
+    async fn invoke(&self, args: Value) -> Result<String, BoxError> {
+        let remote_url = args
+            .get("remote_url")
+            .and_then(Value::as_str)
+            .ok_or_else(|| -> BoxError { "missing `remote_url` argument".into() })?
+            .trim();
+        if remote_url.is_empty() {
+            return Err("`remote_url` must not be empty".into());
+        }
+        // Refuse anything that looks like a flag — the URL goes
+        // verbatim into `git remote add`.
+        if remote_url.starts_with('-') {
+            return Err(format!("invalid remote_url `{remote_url}`").into());
+        }
+        let scope = args
+            .get("scope")
+            .and_then(Value::as_str)
+            .map(parse_scope_arg)
+            .transpose()?
+            .unwrap_or(MemoryScope::User);
+        let branch = args
+            .get("branch")
+            .and_then(Value::as_str)
+            .unwrap_or("main");
+        if branch.starts_with('-') || branch.contains(char::is_whitespace) {
+            return Err(format!("invalid branch name `{branch}`").into());
+        }
+        let push = args.get("push").and_then(Value::as_bool).unwrap_or(true);
+        let force = args.get("force").and_then(Value::as_bool).unwrap_or(false);
+
+        let workspace_root = harness_core::active_workspace_or(&self.roots.workspace_root);
+        let roots = MemoryRoots {
+            workspace_root,
+            user_root: self.roots.user_root.clone(),
+        };
+        let dir = memory_dir_for(&roots, scope)?;
+
+        // Create the dir if missing.
+        if !dir.exists() {
+            tokio::fs::create_dir_all(&dir).await.map_err(
+                |e| -> BoxError { format!("mkdir {}: {e}", dir.display()).into() },
+            )?;
+        }
+
+        let mut report = serde_json::Map::new();
+        report.insert("scope".into(), json!(scope.as_wire()));
+        report.insert("dir".into(), json!(dir.display().to_string()));
+        report.insert("remote_url".into(), json!(remote_url));
+        report.insert("branch".into(), json!(branch));
+
+        // Already-a-repo branch.
+        if is_git_repo(&dir).await {
+            if !force {
+                return Err(format!(
+                    "memory dir `{}` is already a git repository. Pass `force=true` to just update the remote, or run `memory.sync` if you wanted to sync.",
+                    dir.display()
+                )
+                .into());
+            }
+            // Force path: just set the remote URL. Use `set-url` if
+            // origin exists, otherwise `add origin`.
+            let (has_origin, _, _) =
+                run_git(&dir, &["config", "--get", "remote.origin.url"], 5_000).await?;
+            let (ok, out, err) = if has_origin {
+                run_git(&dir, &["remote", "set-url", "origin", remote_url], 10_000).await?
+            } else {
+                run_git(&dir, &["remote", "add", "origin", remote_url], 10_000).await?
+            };
+            report.insert(
+                "remote_update".into(),
+                json!({
+                    "ok": ok,
+                    "stdout": out.trim(),
+                    "stderr": err.trim(),
+                }),
+            );
+            if !ok {
+                return Err(format!(
+                    "failed to update origin remote: {}",
+                    err.trim()
+                )
+                .into());
+            }
+            report.insert("initialized".into(), json!(false));
+            return Ok(serde_json::to_string_pretty(&report).unwrap_or_default());
+        }
+
+        // Fresh setup path. Each step short-circuits on failure with
+        // the exact stderr surfaced so the user can read the git
+        // message and fix.
+        macro_rules! must_git {
+            ($args:expr) => {{
+                let (ok, out, err) = run_git(&dir, $args, 10_000).await?;
+                if !ok {
+                    return Err(format!(
+                        "git {:?} failed: {}",
+                        $args,
+                        err.trim()
+                    )
+                    .into());
+                }
+                (out, err)
+            }};
+        }
+
+        must_git!(&["init", "-q", "-b", branch]);
+        must_git!(&["remote", "add", "origin", remote_url]);
+
+        // Seed MEMORY.md if it's not there yet so the initial commit
+        // has something to add. Keep the content stable so subsequent
+        // setups don't churn the byte content.
+        let index = dir.join("MEMORY.md");
+        if !index.exists() {
+            tokio::fs::write(
+                &index,
+                "# Jarvis memory\n\nThis directory holds agent-maintained notes.\n",
+            )
+            .await
+            .map_err(|e| -> BoxError { format!("seed MEMORY.md: {e}").into() })?;
+        }
+
+        must_git!(&["add", "-A"]);
+        // Seed-commit author identity is supplied inline so the call
+        // works on machines without a global `user.email` / `user.name`
+        // configured (fresh dev boxes, CI runners). The overrides only
+        // apply to this single command — subsequent commits in the repo
+        // use whatever the operator has configured locally.
+        must_git!(&[
+            "-c",
+            "user.email=jarvis@local",
+            "-c",
+            "user.name=Jarvis",
+            "commit",
+            "-q",
+            "-m",
+            "init: jarvis memory",
+        ]);
+        report.insert("initialized".into(), json!(true));
+
+        if push {
+            let (push_ok, push_out, push_err) =
+                run_git(&dir, &["push", "-u", "origin", branch], DEFAULT_TIMEOUT_MS).await?;
+            report.insert(
+                "push".into(),
+                json!({
+                    "ok": push_ok,
+                    "stdout": push_out.trim(),
+                    "stderr": push_err.trim(),
+                }),
+            );
+            if !push_ok {
+                report.insert(
+                    "hint".into(),
+                    json!(
+                        "initial push failed — check the remote URL is reachable and you have credentials. \
+                         Local repo is set up; you can fix the push manually with `git -C <dir> push -u origin <branch>`."
+                    ),
+                );
+            }
+        } else {
+            report.insert(
+                "hint".into(),
+                json!("local repo initialised; push skipped (push=false)"),
+            );
+        }
+        Ok(serde_json::to_string_pretty(&report).unwrap_or_default())
+    }
+}
+
+// --- memory.sync_status ---
+
+pub struct MemorySyncStatusTool {
+    roots: MemoryRoots,
+}
+
+impl MemorySyncStatusTool {
+    pub fn new(roots: MemoryRoots) -> Self {
+        Self { roots }
+    }
+}
+
+#[async_trait]
+impl Tool for MemorySyncStatusTool {
+    fn name(&self) -> &str {
+        "memory.sync_status"
+    }
+    fn description(&self) -> &str {
+        "Report the git sync state of the memory tree without making \
+         changes. Returns whether the dir is a git repo, the current \
+         branch, the configured remote URL, and `git status --porcelain` \
+         output. Use this to verify setup or inspect why a previous \
+         `memory.sync` call failed."
+    }
+    fn parameters(&self) -> Value {
+        json!({
+            "type": "object",
+            "additionalProperties": false,
+            "properties": {
+                "scope": {
+                    "type": "string",
+                    "enum": ["workspace", "user"],
+                    "description": "Which memory tree to inspect. Defaults to `user`."
+                }
+            }
+        })
+    }
+    fn category(&self) -> ToolCategory {
+        ToolCategory::Read
+    }
+    /// Builds a read-only JSON report of the memory dir's git state for `scope`.
+    async fn invoke(&self, args: Value) -> Result<String, BoxError> {
+        let scope = args
+            .get("scope")
+            .and_then(Value::as_str)
+            .map(parse_scope_arg)
+            .transpose()?
+            .unwrap_or(MemoryScope::User);
+        let workspace_root = harness_core::active_workspace_or(&self.roots.workspace_root);
+        let roots = MemoryRoots {
+            workspace_root,
+            user_root: self.roots.user_root.clone(),
+        };
+        let dir = memory_dir_for(&roots, scope)?;
+        let mut report = serde_json::Map::new();
+        report.insert("scope".into(), json!(scope.as_wire()));
+        report.insert("dir".into(), json!(dir.display().to_string()));
+
+        if !is_git_repo(&dir).await {
+            report.insert("is_git_repo".into(), json!(false));
+            report.insert("setup_hint".into(), json!(setup_hint(&dir)));
+            return Ok(serde_json::to_string_pretty(&report).unwrap_or_default());
+        }
+        report.insert("is_git_repo".into(), json!(true));
+        if let Ok((true, branch, _)) = run_git(&dir, &["rev-parse", "--abbrev-ref", "HEAD"], 5_000).await {
+            report.insert("branch".into(), json!(branch.trim()));
+        }
+        if let Ok((true, remote_url, _)) =
+            run_git(&dir, &["config", "--get", "remote.origin.url"], 5_000).await
+        {
+            report.insert("remote_url".into(), json!(remote_url.trim()));
+        } else {
+            report.insert("remote_url".into(), json!(null));
+            report.insert(
+                "hint".into(),
+                json!("no `origin` remote — set one with `git remote add origin <url>`."),
+            );
+        }
+        if let Ok((true, status, _)) = run_git(&dir, &["status", "--porcelain"], 5_000).await {
+            report.insert("dirty".into(), json!(!status.trim().is_empty()));
+            // Trim only the end: porcelain lines can start with a space (" M path").
+            report.insert("status".into(), json!(status.trim_end()));
+        }
+        if let Ok((true, head, _)) = run_git(&dir, &["rev-parse", "HEAD"], 5_000).await {
+            report.insert("head".into(), json!(head.trim()));
+        }
+        Ok(serde_json::to_string_pretty(&report).unwrap_or_default())
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use std::process::Command as StdCommand;
+    use tempfile::tempdir;
+    use tokio::fs;
+
+    /// Run `git init -b main` in the existing directory `dir` and set a
+    /// repo-local user identity so commits don't fail on a CI box without
+    /// a global git config. Panics if any git command fails.
+    fn git_init(dir: &std::path::Path) {
+        let run = |args: &[&str]| {
+            let st = StdCommand::new("git")
+                .arg("-C")
+                .arg(dir)
+                .args(args)
+                .output()
+                .expect("git spawn");
+            assert!(
+                st.status.success(),
+                "git {args:?} failed: {}",
+                String::from_utf8_lossy(&st.stderr)
+            );
+        };
+        run(&["init", "-q", "-b", "main"]);
+        run(&["config", "user.email", "test@example.com"]);
+        run(&["config", "user.name", "Test"]);
+    }
+
+    /// Stage and commit everything in `dir`, panicking if git fails so a
+    /// broken fixture is caught here rather than by a later assertion.
+    /// `--allow-empty` keeps callers that commit an empty tree working.
+    async fn commit_all(dir: &std::path::Path, msg: &str) {
+        for args in [&["add", "-A"][..], &["commit", "-q", "--allow-empty", "-m", msg][..]] {
+            let st = StdCommand::new("git")
+                .arg("-C")
+                .arg(dir)
+                .args(args)
+                .status()
+                .expect("git spawn");
+            assert!(st.success(), "git {args:?} failed in {}", dir.display());
+        }
+    }
+
+    fn user_only(user: &std::path::Path) -> MemoryRoots {
+        // Workspace root is unused by the sync tools when scope=user;
+        // give it a dead path to make accidental fall-through obvious.
+        MemoryRoots::new(std::path::PathBuf::from("/dev/null/should-not-be-used"))
+            .with_user_root(user.to_path_buf())
+    }
+
+    #[tokio::test]
+    async fn sync_status_reports_non_git_dir_with_setup_hint() {
+        let user = tempdir().unwrap();
+        // No `git init` — the memory dir doesn't even exist.
+        let tool = MemorySyncStatusTool::new(user_only(user.path()));
+        let body = tool.invoke(json!({})).await.unwrap();
+        let v: serde_json::Value = serde_json::from_str(&body).unwrap();
+        assert_eq!(v["is_git_repo"], false);
+        assert!(v["setup_hint"]
+            .as_str()
+            .unwrap()
+            .contains("git init"));
+    }
+
+    #[tokio::test]
+    async fn sync_status_reports_branch_and_head_when_git_repo() {
+        let user = tempdir().unwrap();
+        let mem_dir = user.path().join(MEMORY_DIR);
+        fs::create_dir_all(&mem_dir).await.unwrap();
+        git_init(&mem_dir);
+        fs::write(mem_dir.join("MEMORY.md"), "- [x](x.md)\n")
+            .await
+            .unwrap();
+        commit_all(&mem_dir, "seed").await;
+
+        let tool = MemorySyncStatusTool::new(user_only(user.path()));
+        let body = tool.invoke(json!({})).await.unwrap();
+        let v: serde_json::Value = serde_json::from_str(&body).unwrap();
+        assert_eq!(v["is_git_repo"], true);
+        assert_eq!(v["branch"], "main");
+        assert!(v["head"].as_str().unwrap().len() >= 7);
+        assert_eq!(v["dirty"], false);
+        // No remote configured yet — hint surfaces.
+        assert!(v["hint"].as_str().unwrap().contains("origin"));
+    }
+
+    #[tokio::test]
+    async fn sync_errors_with_setup_hint_when_not_a_repo() {
+        let user = tempdir().unwrap();
+        let tool = MemorySyncTool::new(user_only(user.path()));
+        let err = tool.invoke(json!({})).await.unwrap_err();
+        let msg = err.to_string();
+        assert!(msg.contains("not a git repository"));
+        assert!(msg.contains("git init"));
+    }
+
+    #[tokio::test]
+    async fn sync_against_local_bare_repo_round_trips() {
+        // Set up a local bare repo to act as the "remote", clone it,
+        // and verify pull+push report ok via the tool. Skip when
+        // `git` isn't on PATH (running in a strict sandbox); the
+        // tool would surface a spawn error in that case.
+        if StdCommand::new("git").arg("--version").output().is_err() {
+            eprintln!("skipping: git not on PATH");
+            return;
+        }
+        let upstream = tempdir().unwrap();
+        StdCommand::new("git")
+            .args(["init", "-q", "--bare", "-b", "main"])
+            .arg(upstream.path())
+            .status()
+            .unwrap();
+
+        let user = tempdir().unwrap();
+        let mem_dir = user.path().join(MEMORY_DIR);
+        fs::create_dir_all(&mem_dir).await.unwrap();
+        git_init(&mem_dir);
+        StdCommand::new("git")
+            .arg("-C")
+            .arg(&mem_dir)
+            .args(["remote", "add", "origin"])
+            .arg(upstream.path())
+            .status()
+            .unwrap();
+        fs::write(mem_dir.join("MEMORY.md"), "- [seed](seed.md)\n")
+            .await
+            .unwrap();
+        commit_all(&mem_dir, "seed").await;
+        StdCommand::new("git")
+            .arg("-C")
+            .arg(&mem_dir)
+            .args(["push", "-q", "-u", "origin", "main"])
+            .status()
+            .unwrap();
+
+        let tool = MemorySyncTool::new(user_only(user.path()));
+        let body = tool.invoke(json!({})).await.unwrap();
+        let v: serde_json::Value = serde_json::from_str(&body).unwrap();
+        assert_eq!(v["pull"]["ok"], true, "pull report: {v}");
+        assert_eq!(v["push"]["ok"], true, "push report: {v}");
+        assert!(v["head"].as_str().unwrap().len() >= 7);
+    }
+
+    #[tokio::test]
+    async fn sync_rejects_invalid_remote_name() {
+        let user = tempdir().unwrap();
+        let mem_dir = user.path().join(MEMORY_DIR);
+        fs::create_dir_all(&mem_dir).await.unwrap();
+        git_init(&mem_dir);
+        commit_all(&mem_dir, "seed").await;
+        let tool = MemorySyncTool::new(user_only(user.path()));
+        let err = tool
+            .invoke(json!({"remote": "--upload-pack=evil"}))
+            .await
+            .unwrap_err();
+        assert!(err.to_string().contains("invalid remote"));
+    }
+
+    #[tokio::test]
+    async fn user_scope_required_when_user_root_unconfigured() {
+        // No user_root → user-scope sync should error cleanly.
+        let roots = MemoryRoots::new(std::path::PathBuf::from("/tmp/ws"));
+        let tool = MemorySyncTool::new(roots);
+        let err = tool.invoke(json!({})).await.unwrap_err();
+        assert!(err.to_string().contains("user-scope memory is not configured"));
+    }
+
+    // --- memory.sync_setup ---
+
+    #[tokio::test]
+    async fn sync_setup_initialises_repo_and_pushes_to_local_remote() {
+        if StdCommand::new("git").arg("--version").output().is_err() {
+            eprintln!("skipping: git not on PATH");
+            return;
+        }
+        // Local bare repo as the "remote".
+        let upstream = tempdir().unwrap();
+        StdCommand::new("git")
+            .args(["init", "-q", "--bare", "-b", "main"])
+            .arg(upstream.path())
+            .status()
+            .unwrap();
+
+        let user = tempdir().unwrap();
+        let tool = MemorySyncSetupTool::new(user_only(user.path()));
+        let body = tool
+            .invoke(json!({
+                "remote_url": upstream.path().to_string_lossy().to_string(),
+            }))
+            .await
+            .unwrap();
+        let v: serde_json::Value = serde_json::from_str(&body).unwrap();
+        assert_eq!(v["initialized"], true);
+        assert_eq!(v["push"]["ok"], true, "push failed: {v}");
+        // MEMORY.md was seeded.
+        let seed = user.path().join(MEMORY_DIR).join("MEMORY.md");
+        assert!(seed.exists());
+        // Bare upstream now has a HEAD ref.
+        let head = StdCommand::new("git")
+            .arg("-C")
+            .arg(upstream.path())
+            .args(["rev-parse", "HEAD"])
+            .output()
+            .unwrap();
+        assert!(head.status.success(), "upstream has no HEAD after push");
+    }
+
+    #[tokio::test]
+    async fn sync_setup_errors_when_already_a_repo_without_force() {
+        let user = tempdir().unwrap();
+        let mem_dir = user.path().join(MEMORY_DIR);
+        fs::create_dir_all(&mem_dir).await.unwrap();
+        git_init(&mem_dir);
+        let tool = MemorySyncSetupTool::new(user_only(user.path()));
+        let err = tool
+            .invoke(json!({"remote_url": "git@example.com:me/x.git"}))
+            .await
+            .unwrap_err();
+        assert!(err.to_string().contains("already a git repository"));
+    }
+
+    #[tokio::test]
+    async fn sync_setup_force_updates_remote_url_in_place() {
+        if StdCommand::new("git").arg("--version").output().is_err() {
+            return;
+        }
+        let user = tempdir().unwrap();
+        let mem_dir = user.path().join(MEMORY_DIR);
+        fs::create_dir_all(&mem_dir).await.unwrap();
+        git_init(&mem_dir);
+        // Seed an origin so set-url is the path taken (not add).
+        StdCommand::new("git")
+            .arg("-C")
+            .arg(&mem_dir)
+            .args(["remote", "add", "origin", "git@old:me/x.git"])
+            .status()
+            .unwrap();
+        let tool = MemorySyncSetupTool::new(user_only(user.path()));
+        let body = tool
+            .invoke(json!({
+                "remote_url": "git@new:me/x.git",
+                "force": true,
+            }))
+            .await
+            .unwrap();
+        let v: serde_json::Value = serde_json::from_str(&body).unwrap();
+        assert_eq!(v["initialized"], false);
+        // Verify the new URL actually landed.
+        let out = StdCommand::new("git")
+            .arg("-C")
+            .arg(&mem_dir)
+            .args(["config", "--get", "remote.origin.url"])
+            .output()
+            .unwrap();
+        assert_eq!(
+            String::from_utf8_lossy(&out.stdout).trim(),
+            "git@new:me/x.git"
+        );
+    }
+
+    #[tokio::test]
+    async fn sync_setup_rejects_flag_like_remote_url() {
+        let user = tempdir().unwrap();
+        let tool = MemorySyncSetupTool::new(user_only(user.path()));
+        let err = tool
+            .invoke(json!({"remote_url": "--upload-pack=evil"}))
+            .await
+            .unwrap_err();
+        assert!(err.to_string().contains("invalid remote_url"));
+    }
+
+    #[tokio::test]
+    async fn auto_sync_ticker_runs_initial_pull_then_periodic() {
+        // Closes the loop end-to-end: a local bare repo, one client
+        // dir already pointing at it, the ticker fires the initial
+        // pull, then we abort the task to avoid hanging the test.
+        if StdCommand::new("git").arg("--version").output().is_err() {
+            return;
+        }
+        let upstream = tempdir().unwrap();
+        StdCommand::new("git")
+            .args(["init", "-q", "--bare", "-b", "main"])
+            .arg(upstream.path())
+            .status()
+            .unwrap();
+
+        let user = tempdir().unwrap();
+        let mem_dir = user.path().join(MEMORY_DIR);
+        fs::create_dir_all(&mem_dir).await.unwrap();
+        git_init(&mem_dir);
+        StdCommand::new("git")
+            .arg("-C")
+            .arg(&mem_dir)
+            .args(["remote", "add", "origin"])
+            .arg(upstream.path())
+            .status()
+            .unwrap();
+        fs::write(mem_dir.join("MEMORY.md"), "- [seed](seed.md)\n")
+            .await
+            .unwrap();
+        commit_all(&mem_dir, "seed").await;
+        StdCommand::new("git")
+            .arg("-C")
+            .arg(&mem_dir)
+            .args(["push", "-q", "-u", "origin", "main"])
+            .status()
+            .unwrap();
+
+        let cfg = AutoSyncConfig {
+            roots: user_only(user.path()),
+            scope: MemoryScope::User,
+            interval: Duration::from_millis(120),
+            initial_pull: true,
+        };
+        let handle = spawn_auto_sync_task(cfg);
+        // Give the initial pull + at least one periodic tick a chance.
+        tokio::time::sleep(Duration::from_millis(400)).await;
+        // The loop never returns, so a finished task means it panicked;
+        // a panic inside a spawned task would not fail the test by itself.
+        assert!(!handle.is_finished(), "auto-sync task exited early");
+        handle.abort();
+    }
+
+    #[test]
+    fn backend_from_wire_accepts_aliases_and_rejects_garbage() {
+        assert_eq!(
+            MemorySyncBackend::from_wire("git"),
+            Some(MemorySyncBackend::Git)
+        );
+        assert_eq!(
+            MemorySyncBackend::from_wire("GIT"),
+            Some(MemorySyncBackend::Git)
+        );
+        assert_eq!(
+            MemorySyncBackend::from_wire("icloud"),
+            Some(MemorySyncBackend::ICloud)
+        );
+        assert_eq!(
+            MemorySyncBackend::from_wire("iCloud-Drive"),
+            Some(MemorySyncBackend::ICloud)
+        );
+        assert_eq!(
+            MemorySyncBackend::from_wire("none"),
+            Some(MemorySyncBackend::None)
+        );
+        assert_eq!(
+            MemorySyncBackend::from_wire(""),
+            Some(MemorySyncBackend::None)
+        );
+        assert!(MemorySyncBackend::from_wire("dropbox").is_none());
+    }
+
+    #[test]
+    fn backend_round_trip_wire() {
+        for b in [
+            MemorySyncBackend::None,
+            MemorySyncBackend::Git,
+            MemorySyncBackend::ICloud,
+        ] {
+            assert_eq!(MemorySyncBackend::from_wire(b.as_wire()), Some(b));
+        }
+    }
+
+    #[cfg(target_os = "macos")]
+    #[test]
+    fn icloud_drive_root_returns_path_on_macos() {
+        // We can't assert the dir exists (depends on operator's
+        // iCloud Drive setup), only that the candidate path is
+        // computed correctly off `$HOME`.
+        let path = icloud_drive_root().expect("HOME should be set");
+        assert!(path.ends_with("Library/Mobile Documents/com~apple~CloudDocs"));
+    }
+
+    #[cfg(not(target_os = "macos"))]
+    #[test]
+    fn icloud_drive_root_returns_none_off_macos() {
+        assert!(icloud_drive_root().is_none());
+    }
+
+    #[cfg(not(target_os = "macos"))]
+    #[tokio::test]
+    async fn icloud_setup_errors_off_macos() {
+        let user = tempdir().unwrap();
+        let tool = MemoryICloudSetupTool::new(user_only(user.path()));
+        let err = tool.invoke(json!({})).await.unwrap_err();
+        assert!(err.to_string().contains("macOS-only"));
+    }
+
+    #[cfg(target_os = "macos")]
+    #[tokio::test]
+    async fn icloud_setup_errors_when_icloud_disabled() {
+        // Mock iCloud Drive absence by pointing HOME at a tempdir
+        // with no `Library/Mobile Documents/...` subtree.
+        let home = tempdir().unwrap();
+        let prev_home = std::env::var_os("HOME");
+        // SAFETY: env mutation is process-wide and the default test harness
+        // runs tests on parallel threads, so this is only sound while no
+        // other test touches the environment concurrently (TODO: serialise).
+        unsafe { std::env::set_var("HOME", home.path()) };
+        let user = tempdir().unwrap();
+        let tool = MemoryICloudSetupTool::new(user_only(user.path()));
+        let result = tool.invoke(json!({})).await;
+        // SAFETY: as above. Restore before asserting so a failure cannot
+        // leak the fake HOME, and unset it again if it was originally unset.
+        match prev_home {
+            Some(h) => unsafe { std::env::set_var("HOME", h) },
+            None => unsafe { std::env::remove_var("HOME") },
+        }
+        assert!(result.unwrap_err().to_string().contains("does not exist"));
+    }
+
+    #[tokio::test]
+    async fn sync_setup_skips_push_when_disabled() {
+        if StdCommand::new("git").arg("--version").output().is_err() {
+            return;
+        }
+        let user = tempdir().unwrap();
+        let tool = MemorySyncSetupTool::new(user_only(user.path()));
+        let body = tool
+            .invoke(json!({
+                "remote_url": "git@example.com:me/x.git",
+                "push": false,
+            }))
+            .await
+            .unwrap();
+        let v: serde_json::Value = serde_json::from_str(&body).unwrap();
+        assert_eq!(v["initialized"], true);
+        assert!(v.get("push").is_none());
+        assert!(v["hint"].as_str().unwrap().contains("push skipped"));
+    }
+}
diff --git a/crates/harness-tools/src/patch.rs b/crates/harness-tools/src/patch.rs
index 5f3f83f..84bd2e0 100644
--- a/crates/harness-tools/src/patch.rs
+++ b/crates/harness-tools/src/patch.rs
@@ -209,6 +209,9 @@ impl Tool for FsPatchTool {
                         .map_err(|e| -> BoxError { format!("delete `{}`: {e}", w.rel).into() })?;
                 }
             }
+            // Note every touched path so post-compaction reinjection
+            // can remind the agent which files it just changed.
+            harness_core::note_working_file_relative_to(&w.abs, Some(&root));
         }
 
         // Build the human-readable summary.
diff --git a/crates/harness-tools/src/shell.rs b/crates/harness-tools/src/shell.rs
index a4d3e0c..65a5f98 100644
--- a/crates/harness-tools/src/shell.rs
+++ b/crates/harness-tools/src/shell.rs
@@ -257,6 +257,10 @@ impl Tool for ShellExecTool {
             .get("command")
             .and_then(Value::as_str)
             .ok_or_else(|| -> BoxError { "missing `command` argument".into() })?;
+        // Record into WorkingContext so post-compaction reinjection
+        // can remind the agent which commands it just ran. Truncation
+        // / dedup is handled inside `note_command`.
+        harness_core::note_working_command(command);
 
         let root = harness_core::active_workspace_or(&self.root);
         let cwd = match args.get("cwd").and_then(Value::as_str) {
diff --git a/docs/conventions/rust-ts-codegen.md b/docs/conventions/rust-ts-codegen.md
new file mode 100644
index 0000000..e52024c
--- /dev/null
+++ b/docs/conventions/rust-ts-codegen.md
@@ -0,0 +1,170 @@
+# Rust → TypeScript type codegen
+
+Wire-shape types crossing the Rust ↔ TypeScript boundary are
+**generated** from the Rust definitions using
+[`ts-rs`](https://github.com/Aleph-Alpha/ts-rs). The frontend
+imports the generated types from
+`apps/jarvis-web/src/types/generated/`; hand-maintained equivalents
+are a drift hazard — the codegen is the source of truth.
+
+This file documents:
+- The conventions for annotating a Rust type (and what to avoid)
+- How to regenerate after a change
+- How the generated files are committed, reviewed, and consumed
+
+## When to annotate
+
+Annotate a type when **all three** apply:
+
+1. The type appears on a JSON wire crossing into the SPA (REST
+   reply / WS frame payload / `localStorage` shape).
+2. The frontend ever names a TypeScript equivalent — `as ChannelInstance`,
+   `interface RequirementSummary { … }`, etc.
+3. The Rust definition is in `harness-channel`, `harness-project`,
+   `harness-observability`, or another crate that already has
+   `ts-rs` as a workspace dep. (`harness-core` deliberately stays
+   out — wire-shape types should live in their domain crate, not
+   the agent-loop trunk.)
+
+If only (1) is true but the frontend never names the shape (e.g.
+`fetch(...).then(r => r.json()).then((data: any) => data.foo)`),
+skip it. Code paths that hand-extract fields don't benefit from a
+generated type.
+
+## Annotation pattern
+
+```rust
+use serde::{Deserialize, Serialize};
+use ts_rs::TS;
+
+#[derive(Debug, Clone, Serialize, Deserialize, TS)]
+#[serde(rename_all = "snake_case")]
+#[ts(export, export_to = "../../../apps/jarvis-web/src/types/generated/")]
+pub struct Project {
+    pub id: String,
+    pub slug: String,
+    /// `None` when archived; `Some(ProjectWorkspace { … })` otherwise.
+    pub workspace: Option<ProjectWorkspace>,
+}
+```
+
+Notes on each line:
+
+- `#[derive(TS)]` — the codegen derive macro. Goes alongside `serde`.
+  Pulls the derive from the workspace `ts-rs = "10"` dep added to
+  the owning crate's `Cargo.toml`.
+- `#[serde(rename_all = "snake_case")]` (or `kebab-case` etc.) — the
+  derive **inspects** serde renames and emits the matching wire
+  form on the TS side. Keep these in sync; mismatched casing is the
+  most common bug.
+- `#[ts(export, export_to = "…/types/generated/")]` — tells the
+  derive to write a `<TypeName>.ts` to the given path during
+  `cargo test`. The path is resolved against `TS_RS_EXPORT_DIR`
+  (default `./bindings` inside the owning crate), not the workspace
+  root. From `crates/harness-channel/bindings`, three `..` lands at
+  the repo root → `apps/jarvis-web/src/types/generated/`.
+
+### Common field-level overrides
+
+`serde_json::Value` becomes `any` by default, which is rarely what
+the frontend wants. Pick the narrowest TS type that covers the
+runtime shape:
+
+```rust
+#[ts(type = "Record<string, unknown>")]
+pub config: serde_json::Value,
+
+#[ts(type = "string[]")]
+pub tags: serde_json::Value,
+```
+
+Optional Rust types map to `T | null` by default. If the frontend
+expects an undefined-style optional (the field can be omitted
+entirely), add `#[ts(optional)]`:
+
+```rust
+#[serde(skip_serializing_if = "Option::is_none")]
+#[ts(optional)]
+pub note: Option<String>,
+```
+
+## Regenerating
+
+The codegen runs as an embedded `#[test]` injected by the derive
+macro. Every `cargo test` of an annotated crate writes the
+corresponding `.ts` files.
+
+```bash
+# Whole workspace (covers everything):
+cargo test --workspace --lib
+
+# Just the channel-domain types:
+cargo test -p harness-channel
+
+# Just the project-domain types:
+cargo test -p harness-project
+```
+
+`make ts-codegen` (in the root `Makefile`) is the canonical one-shot
+target — wraps the above with no test output noise.
+
+## Committing the generated files
+
+The `apps/jarvis-web/src/types/generated/` directory **is** in git.
+Reasoning:
+
+- CI doesn't have a Rust toolchain on the SPA-only build step. If
+  the frontend imports from `types/generated/`, those files must
+  exist on disk at build time. Generating during the SPA build
+  would tie Vite to `cargo`, which complicates Tauri / Docker
+  setups.
+- Drift is much easier to see in code review when the diff shows
+  the regenerated TS alongside the Rust change. A PR that touches
+  `Project` in Rust without a matching `Project.ts` diff is the
+  signal "you forgot to regenerate."
+
+Workflow: change a `#[derive(TS)]` type → run `make ts-codegen` (or
+`cargo test -p <owning-crate>`) → `git add apps/jarvis-web/src/types/generated/` →
+commit both in the same PR.
+
+## Consuming from the frontend
+
+Re-export from the matching `services/*.ts` file so the rest of the
+SPA doesn't have to know which type is generated vs hand-written:
+
+```typescript
+// services/channels.ts
+import type { ChannelInstance as GeneratedChannelInstance } from "../types/generated/ChannelInstance";
+import type { ChannelInstanceStatus } from "../types/generated/ChannelInstanceStatus";
+
+// Re-export under the conventional name so existing imports stay
+// stable. `ChannelStatus` is a legacy alias for the same enum.
+export type ChannelStatus = ChannelInstanceStatus;
+export type ChannelInstance = GeneratedChannelInstance;
+```
+
+Components import from the service layer (`import type { ChannelInstance }
+from "@/services/channels"`), not from `types/generated/` directly.
+That insulation lets us swap a generated type for a richer
+hand-extended one if the SPA needs a field the Rust shape doesn't
+carry.
+
+## Anti-patterns
+
+- **Don't edit a file under `types/generated/`.** It'll be
+  overwritten on the next `cargo test`. If the type needs a hand-
+  written field, extend it in the service layer (intersection or
+  spread).
+- **Don't annotate types in `harness-core`.** That crate is the
+  agent-loop trunk; wire-shape types belong in their domain crate
+  (channel / project / observability). If a wire-shape type is
+  in `harness-core` today, that's a smell — extract it first.
+- **Don't omit `serde(rename_all = …)`.** Without it, an enum like
+  `RequirementStatus::InProgress` round-trips through JSON as
+  `"InProgress"`; if the casing is set only via `#[ts(rename_all)]`,
+  ts-rs emits `"in_progress"`, the runtime shape and the TS type
+  disagree, and the SPA's narrow checks silently fail.
+- **Don't annotate types with `Vec<Box<dyn Trait>>` fields.**
+  ts-rs can't reflect on trait objects. Either pull out the
+  concrete enum / struct, or skip codegen and write the TS by
+  hand for that single type.
diff --git a/start.sh b/start.sh
new file mode 100755
index 0000000..934ad7b
--- /dev/null
+++ b/start.sh
@@ -0,0 +1,162 @@
+#!/usr/bin/env bash
+# start.sh — Jarvis 快速启动脚本。
+#
+#   ./start.sh         # 嵌入式 UI：先 build web，再 cargo run。一个进程同时服务 API + UI。
+#   ./start.sh --dev   # 双进程：后台 Vite (5173) + 前台 cargo (7001)，热重载工作流。
+#
+# 通用选项：
+#   -h | --help        # 打印用法
+#   --no-env           # 即便存在 .env 也不加载
+#   --release          # cargo 用 release profile（嵌入式模式才生效）
+#   --port <N>         # 覆盖 JARVIS_ADDR 端口（默认 7001）
+#
+# Web bundle 是增量构建：dist/ 缺失，或 src/ / package.json / vite.config.ts
+# 比 dist/ 新时才重新 build。命中缓存时启动 < 1s。
+
+set -euo pipefail
+
+cd "$(dirname "$0")"
+
+mode="serve"
+load_env=1
+profile="debug"
+port=""
+
+while [[ $# -gt 0 ]]; do
+  case "$1" in
+    --dev)        mode="dev"; shift ;;
+    --no-env)     load_env=0; shift ;;
+    --release)    profile="release"; shift ;;
+    --port)       port="${2:?--port 需要一个端口号}"; shift 2 ;;
+    -h|--help)
+      sed -n '2,15p' "$0" | sed 's/^# \{0,1\}//'
+      exit 0 ;;
+    *) echo "start.sh: 未知参数 '$1'（用 -h 查看用法）" >&2; exit 64 ;;
+  esac
+done
+
+log()  { printf '\033[36m[start]\033[0m %s\n' "$*"; }  # info: cyan "[start]" tag, message on stdout
+warn() { printf '\033[33m[start]\033[0m %s\n' "$*" >&2; }  # warning: yellow tag, message on stderr
+die()  { printf '\033[31m[start]\033[0m %s\n' "$*" >&2; exit 1; }  # fatal: red tag on stderr, then exit status 1
+
+# 端口占用检查 —— 启动前显式报错胜过看着两个进程瞎打架
+#
+# 注意：开启 `set -o pipefail` 时 lsof 没找到匹配会返回 1，再走管道会把整个
+# `$(...)` 标成失败，触发 set -e 让脚本静默退出。所以这里用 `|| true` 把
+# "没人占用" 这种正常路径吞掉。
+check_port_free() {
+  local port="$1" name="$2" holder_pid
+  if ! command -v lsof >/dev/null; then return 0; fi
+  holder_pid=$(lsof -nP -tiTCP:"$port" -sTCP:LISTEN 2>/dev/null || true)
+  holder_pid="${holder_pid%%$'\n'*}"
+  if [[ -n "$holder_pid" ]]; then
+    local cmd
+    cmd=$(ps -p "$holder_pid" -o comm= 2>/dev/null || echo "?")
+    die "端口 ${port}（${name}）已被进程 ${holder_pid} (${cmd}) 占用。释放后重试：kill ${holder_pid}"
+  fi
+}
+
+# 给子进程的输出加前缀，免得 vite 和 cargo 的日志混成一团分不清
+prefix_stream() {
+  local tag="$1"
+  while IFS= read -r line; do printf '\033[2m[%s]\033[0m %s\n' "$tag" "$line"; done
+}
+
+# .env 加载 —— 仅当文件存在且未禁用时。set -a 让 source 的 KEY=VAL 自动 export。
+if [[ $load_env -eq 1 && -f .env ]]; then
+  log "加载 .env"
+  set -a; . ./.env; set +a
+fi
+
+# 端口覆盖
+if [[ -n "$port" ]]; then
+  export JARVIS_ADDR="127.0.0.1:${port}"
+elif [[ -z "${JARVIS_ADDR:-}" ]]; then
+  export JARVIS_ADDR="127.0.0.1:7001"
+fi
+
+# 工作区固定到仓库根，避免无意中沙箱化别处
+export JARVIS_FS_ROOT="${JARVIS_FS_ROOT:-$PWD}"
+
+WEB_DIR="apps/jarvis-web"
+WEB_DIST="$WEB_DIR/dist"
+
+ensure_web_deps() {
+  if [[ ! -d "$WEB_DIR/node_modules" ]]; then
+    log "首次运行：安装 web 依赖（npm ci）"
+    (cd "$WEB_DIR" && npm ci --no-audit --no-fund)
+  fi
+}
+
+# 增量 web build：dist/ 不存在，或 src/package.json/vite.config.ts 新于 dist/
+need_web_build() {
+  [[ ! -d "$WEB_DIST" ]] && return 0
+  local newest_src newest_dist
+  newest_src=$(find "$WEB_DIR/src" "$WEB_DIR/package.json" "$WEB_DIR/vite.config.ts" "$WEB_DIR/index.html" \
+                 -type f -newer "$WEB_DIST" -print -quit 2>/dev/null || true)
+  [[ -n "$newest_src" ]]
+}
+
+build_web_if_needed() {
+  # Make sure dependencies exist, then run `npm run build` only when the bundle is stale.
+  ensure_web_deps
+  if ! need_web_build; then
+    log "web bundle 命中缓存，跳过 build"; return 0
+  fi
+  log "web bundle 过时，重新构建（npm run build）"
+  (cd "$WEB_DIR" && npm run build)
+}
+
+cargo_port() { echo "${JARVIS_ADDR##*:}"; }  # prints whatever follows the last ':' in JARVIS_ADDR (the port)
+
+run_serve_mode() {
+  build_web_if_needed
+  check_port_free "$(cargo_port)" "jarvis"
+  log "启动 jarvis（${profile}）—— http://${JARVIS_ADDR}"
+  if [[ "$profile" == "release" ]]; then
+    exec cargo run --release -p jarvis -- serve --workspace "$JARVIS_FS_ROOT"
+  else
+    exec cargo run -p jarvis -- serve --workspace "$JARVIS_FS_ROOT"
+  fi
+}
+
+run_dev_mode() {
+  # Dev workflow: Vite in the background (hot reload) plus cargo in the foreground.
+  ensure_web_deps
+  local vite_port="${VITE_PORT:-5173}"
+  check_port_free "$vite_port"     "vite"
+  check_port_free "$(cargo_port)" "jarvis"
+  # Background Vite with both output streams tagged "[vite]" by prefix_stream. $! is the subshell
+  # (which `exec`s npm); vite itself runs as a child of that, hence `pkill -P` in cleanup.
+  log "启动 Vite （后台，http://127.0.0.1:${vite_port}）"
+  ( cd "$WEB_DIR" && exec npm run dev ) > >(prefix_stream vite) 2> >(prefix_stream vite >&2) &
+  # Deliberately NOT `local`: the EXIT trap can fire after this function has returned, where a
+  # local would be out of scope and `set -u` would abort cleanup with "unbound variable".
+  vite_pid=$!
+  cleanup() {
+    if kill -0 "$vite_pid" 2>/dev/null; then
+      log "停止 Vite (pid=$vite_pid)"
+      pkill -P "$vite_pid" 2>/dev/null || true
+      kill "$vite_pid" 2>/dev/null || true
+      wait "$vite_pid" 2>/dev/null || true
+    fi
+  }
+  trap cleanup EXIT INT TERM
+
+  # Give Vite half a second to print its banner before cargo takes the foreground, so logs don't interleave.
+  sleep 0.5
+
+  log "启动 jarvis （前台，http://${JARVIS_ADDR}）"
+  log "Ctrl-C 可同时停止两个进程"
+  # No exec here: the current shell must survive so the EXIT trap can stop Vite.
+  cargo run -p jarvis -- serve --workspace "$JARVIS_FS_ROOT"
+}
+
+# 基础依赖兜底检查 —— 缺失了直接说，不要等 cargo / npm 抛混乱错
+command -v cargo >/dev/null || die "未找到 cargo（请安装 Rust toolchain）"
+command -v npm   >/dev/null || die "未找到 npm（请安装 Node.js）"
+
+case "$mode" in
+  serve) run_serve_mode ;;
+  dev)   run_dev_mode ;;
+esac