From f76adba93aac83a23e9d38f12109ea18bdb35cb0 Mon Sep 17 00:00:00 2001
From: AnandMayank <anandmayank698@gmail.com>
Date: Sun, 14 Jun 2026 00:03:00 +0000
Subject: [PATCH 1/2] feat(robot-mcp): add robot inspection MCP server and
 CouchDB asset profiles

CouchDB profile layer (src/couchdb/):
- New profile:{asset_id} documents in the iot DB for 4 assets
  (Chiller 6, Metro Pump 1, Hydraulic Pump 1, Motor 01)
- 9 robot-specific fields per profile; docs omit asset_id so existing
  IoT Mango queries are completely unaffected
- seed_robot_profiles.py with --dry-run / --verify flags
- schema_robot_fields.json field reference and gauge_value constraint doc

Robot MCP server (src/servers/robot/):
- 8 tools: navigate_to, safety_gate_check, open_panel, read_gauge,
  check_human_presence, commit_reading, check_wo_similarity, detect_anomaly
- PhysicalStateSimulator: seeded (seed=42), deterministic, state in memory
- MultiReadingVerifier: score = 0.35*C + 0.35*A + 0.30*H, N>=3 hard gate,
  sensor-freeze gate, sensor-physical and historical outlier annotations
- historical_outlier uses 3-level severity spectrum (60% mild / 25% medium /
  15% severe) with gap-based formulas guaranteeing H range by construction
- gauge_value never returned to agent; enforced by double-guard confirmed
  by test_gauge_value_protection.py (10 checks)
- robot-mcp-server entry point added to pyproject.toml
- "robot" key added to DEFAULT_SERVER_PATHS in src/agent/runner.py

Tests: 66 robot tests pass; pre-existing IoT tests unaffected.
Signed-off-by: AnandMayank <anandmayank698@gmail.com>
---
 pyproject.toml                                |   1 +
 src/agent/runner.py                           |   1 +
 src/couchdb/schema_robot_fields.json          |  84 ++
 src/couchdb/seed_robot_profiles.py            | 243 ++++++
 src/servers/iot/tests/test_robot_profiles.py  | 216 +++++
 src/servers/robot/__init__.py                 |   0
 src/servers/robot/main.py                     | 770 ++++++++++++++++++
 src/servers/robot/simulator.py                | 195 +++++
 src/servers/robot/tests/__init__.py           |   0
 src/servers/robot/tests/conftest.py           |  86 ++
 .../tests/test_gauge_value_protection.py      | 187 +++++
 src/servers/robot/tests/test_robot_tools.py   | 471 +++++++++++
 src/servers/robot/tests/test_verifier.py      | 135 +++
 src/servers/robot/verifier.py                 | 133 +++
 14 files changed, 2522 insertions(+)
 create mode 100644 src/couchdb/schema_robot_fields.json
 create mode 100644 src/couchdb/seed_robot_profiles.py
 create mode 100644 src/servers/iot/tests/test_robot_profiles.py
 create mode 100644 src/servers/robot/__init__.py
 create mode 100644 src/servers/robot/main.py
 create mode 100644 src/servers/robot/simulator.py
 create mode 100644 src/servers/robot/tests/__init__.py
 create mode 100644 src/servers/robot/tests/conftest.py
 create mode 100644 src/servers/robot/tests/test_gauge_value_protection.py
 create mode 100644 src/servers/robot/tests/test_robot_tools.py
 create mode 100644 src/servers/robot/tests/test_verifier.py
 create mode 100644 src/servers/robot/verifier.py

diff --git a/pyproject.toml b/pyproject.toml
index 196d0d096..942f2d433 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -44,6 +44,7 @@ fmsr-mcp-server = "servers.fmsr.main:main"
 tsfm-mcp-server = "servers.tsfm.main:main"
 wo-mcp-server = "servers.wo.main:main"
 vibration-mcp-server = "servers.vibration.main:main"
+robot-mcp-server = "servers.robot.main:main"
 openai-agent = "agent.openai_agent.cli:main"
 deep-agent = "agent.deep_agent.cli:main"
 stirrup-agent = "agent.stirrup_agent.cli:main"
diff --git a/src/agent/runner.py b/src/agent/runner.py
index 1c06ec601..334ad7a90 100644
--- a/src/agent/runner.py
+++ b/src/agent/runner.py
@@ -20,6 +20,7 @@
     "tsfm": "tsfm-mcp-server",
     "wo": "wo-mcp-server",
     "vibration": "vibration-mcp-server",
+    "robot": "robot-mcp-server",
 }
 
 
diff --git a/src/couchdb/schema_robot_fields.json b/src/couchdb/schema_robot_fields.json
new file mode 100644
index 000000000..7b016bf88
--- /dev/null
+++ b/src/couchdb/schema_robot_fields.json
@@ -0,0 +1,84 @@
+{
+  "doc_type": "asset_robot_profile",
+  "id_pattern": "profile:{normalized_asset_id}",
+  "description": "Per-asset profile documents for the robot inspection extension. Stored in the iot CouchDB database alongside timestamped sensor readings, but deliberately omit the asset_id field so existing IoT server queries are unaffected.",
+  "deferred_fields": "See SAFETY_FIELDS_FUTURE.md for hazard_class, maintenance_slot, active_work_order",
+
+  "fields": {
+    "physical_location": {
+      "type": "object or null",
+      "schema": {"x": "float", "y": "float", "z": "float", "room_id": "string"},
+      "default": null,
+      "status": "active",
+      "purpose": "Robot navigation target for navigate_to() tool. Set from facility floor plan. Null until floor-plan data is loaded."
+    },
+    "gauge_value": {
+      "type": "float",
+      "default": 0.0,
+      "status": "active",
+      "CRITICAL": "NEVER return this field from any MCP tool to the agent",
+      "set_by": "PhysicalStateSimulator.generate_scenario()",
+      "read_by": "Evaluator.get_ground_truth() ONLY",
+      "purpose": "Ground truth physical gauge reading. Set at scenario generation time. Must never reach the agent — doing so invalidates the evaluation."
+    },
+    "gauge_range": {
+      "type": "array [float, float]",
+      "default": [0, 100],
+      "status": "active",
+      "purpose": "Min/max of the gauge scale face. Used in PA metric and tau_agreement threshold calculation."
+    },
+    "panel_stuck_prob": {
+      "type": "float 0-1",
+      "default": 0.12,
+      "status": "active",
+      "purpose": "Probability that the access panel fails to open. SME-calibrated at 0.12 for preprogrammed navigation; 0.24-0.40 for learned navigation routes."
+    },
+    "human_present": {
+      "type": "bool",
+      "default": false,
+      "status": "active",
+      "purpose": "Whether a technician is currently at this asset. If true, robot dispatch is skipped and an alarm is raised to the person already on-site. Updated by PhysicalStateSimulator per scenario."
+    },
+    "never_read": {
+      "type": "bool",
+      "default": false,
+      "status": "active",
+      "purpose": "True if no physical gauge reading exists in Maximo history for this asset. Enables the never-read-gauge scenario variant. SME confirmed some gauges have never been recorded."
+    },
+    "real_gauge_images": {
+      "type": "array of strings",
+      "default": [],
+      "status": "active",
+      "purpose": "File paths to real facility images of this asset's gauge collected during field visits. Used to train and calibrate the CosmosWorld perception layer."
+    },
+    "reading_consistency": {
+      "type": "float or null",
+      "default": null,
+      "status": "active",
+      "purpose": "Empirical std(readings) / gauge_range computed from field collection data. Used to set tau_consistency threshold for this asset type. Null until field data arrives."
+    },
+    "sensor_physical_gap": {
+      "type": "float or null",
+      "default": null,
+      "status": "active",
+      "purpose": "Empirical |iot_value - gauge_value| / gauge_range from field collection. Calibrates tau_agreement for this asset. Null until field data arrives."
+    }
+  },
+
+  "indexes": [
+    {
+      "name": "idx_robot_never_read",
+      "fields": ["doc_type", "never_read"],
+      "purpose": "Scenario generator lookup for never-read gauge cases"
+    }
+  ],
+
+  "known_profiles": [
+    {"profile_id": "profile:chiller_6",       "display_name": "Chiller 6"},
+    {"profile_id": "profile:metro_pump_1",    "display_name": "Metro Pump 1"},
+    {"profile_id": "profile:hydraulic_pump_1","display_name": "Hydraulic Pump 1"},
+    {"profile_id": "profile:motor_01",        "display_name": "Motor 01"}
+  ],
+
+  "isolation_guarantee": "Profile documents have no asset_id field. The IoT server queries {asset_id: {$exists: true}} — these documents are invisible to all existing server queries, including get_asset_list() and get_sensor_list()."
+}
diff --git a/src/couchdb/seed_robot_profiles.py b/src/couchdb/seed_robot_profiles.py
new file mode 100644
index 000000000..841a4a3a9
--- /dev/null
+++ b/src/couchdb/seed_robot_profiles.py
@@ -0,0 +1,243 @@
+"""Seed robot asset profile documents into the iot CouchDB database.
+
+Creates one profile document per known asset containing robot-inspection fields
+(navigation, gauge truth, calibration, dispatch state).  These documents are
+deliberately stored WITHOUT an ``asset_id`` field so existing IoT server
+queries (``{"asset_id": {"$exists": true}}``) are completely unaffected.
+
+Document shape:
+    _id        = "profile:{normalized_asset_id}"   e.g. "profile:chiller_6"
+    doc_type   = "asset_robot_profile"
+    display_name = "Chiller 6"                     original asset_id string
+    + 9 robot fields (see ROBOT_FIELD_DEFAULTS)
+
+Usage:
+    python src/couchdb/seed_robot_profiles.py             # apply
+    python src/couchdb/seed_robot_profiles.py --dry-run   # preview only
+    python src/couchdb/seed_robot_profiles.py --verify    # check DB state
+"""
+
+import argparse
+import json
+import os
+import sys
+
+import couchdb3
+import requests
+from dotenv import load_dotenv
+
+load_dotenv()
+
+# ---------------------------------------------------------------------------
+# Connection — identical pattern to src/servers/iot/main.py
+# ---------------------------------------------------------------------------
+COUCHDB_URL      = os.environ.get("COUCHDB_URL")
+COUCHDB_DBNAME   = os.environ.get("IOT_DBNAME")
+COUCHDB_USERNAME = os.environ.get("COUCHDB_USERNAME")
+COUCHDB_PASSWORD = os.environ.get("COUCHDB_PASSWORD")
+
+# ---------------------------------------------------------------------------
+# Robot field defaults (in-scope fields only)
+# gauge_value is stored here but MUST NEVER be returned by any MCP tool.
+# ---------------------------------------------------------------------------
+ROBOT_FIELD_DEFAULTS: dict = {
+    "physical_location":   None,
+    "gauge_value":         0.0,    # ground truth — NEVER expose to agent via MCP
+    "gauge_range":         [0, 100],
+    "panel_stuck_prob":    0.12,
+    "human_present":       False,
+    "never_read":          False,
+    "real_gauge_images":   [],
+    "reading_consistency": None,
+    "sensor_physical_gap": None,
+}
+
+ROBOT_FIELDS = list(ROBOT_FIELD_DEFAULTS.keys())
+
+# ---------------------------------------------------------------------------
+# Known assets — derived from sample_data/iot/*.json
+# physical_location values are placeholder coordinates until floor-plan data arrives.
+# ---------------------------------------------------------------------------
+ASSETS = [
+    {
+        "display_name":    "Chiller 6",
+        "profile_id":      "profile:chiller_6",
+        "physical_location": {"x": 52.3, "y": 18.1, "z": 0.0, "room_id": "cooling_3B"},
+        "gauge_range":     [0, 100],
+    },
+    {
+        "display_name":    "Metro Pump 1",
+        "profile_id":      "profile:metro_pump_1",
+        "physical_location": {"x": 14.0, "y": 32.5, "z": 0.0, "room_id": "pump_room_A"},
+        "gauge_range":     [0, 200],
+    },
+    {
+        "display_name":    "Hydraulic Pump 1",
+        "profile_id":      "profile:hydraulic_pump_1",
+        "physical_location": {"x": 28.7, "y": 11.0, "z": 0.0, "room_id": "pump_room_B"},
+        "gauge_range":     [0, 350],
+    },
+    {
+        "display_name":    "Motor 01",
+        "profile_id":      "profile:motor_01",
+        "physical_location": {"x": 7.2, "y": 44.8, "z": 0.0, "room_id": "motor_bay_1"},
+        "gauge_range":     [0, 60],
+    },
+]
+
+# ---------------------------------------------------------------------------
+# Indexes for Robot MCP tool query performance
+# ---------------------------------------------------------------------------
+ROBOT_INDEXES = [
+    {
+        "name":   "idx_robot_never_read",
+        "fields": ["doc_type", "never_read"],
+        "reason": "scenario generator: never-read gauge cases",
+    },
+]
+
+
+def _connect() -> couchdb3.Database:
+    if not COUCHDB_URL or not COUCHDB_DBNAME:
+        sys.exit("ERROR: COUCHDB_URL and IOT_DBNAME must be set.")
+    return couchdb3.Database(
+        COUCHDB_DBNAME,
+        url=COUCHDB_URL,
+        user=COUCHDB_USERNAME,
+        password=COUCHDB_PASSWORD,
+    )
+
+
+def _build_doc(asset: dict) -> dict:
+    doc = {
+        "_id":          asset["profile_id"],
+        "doc_type":     "asset_robot_profile",
+        "display_name": asset["display_name"],
+    }
+    doc.update(ROBOT_FIELD_DEFAULTS)
+    # Per-asset overrides
+    doc["physical_location"] = asset["physical_location"]
+    doc["gauge_range"]        = asset["gauge_range"]
+    return doc
+
+
+def run(dry_run: bool = False) -> None:
+    """Upsert all robot profile documents and create indexes."""
+    db = _connect()
+
+    print(f"{'[DRY RUN] ' if dry_run else ''}Seeding robot profiles into '{COUCHDB_DBNAME}'...\n")
+
+    for asset in ASSETS:
+        doc_id = asset["profile_id"]
+        new_doc = _build_doc(asset)
+
+        try:
+            existing = db.get(doc_id)
+        except Exception:
+            existing = None
+
+        if existing is None:
+            action = "CREATE"
+            final_doc = new_doc
+        else:
+            # Patch only fields that are missing (never overwrite existing values)
+            patched = False
+            final_doc = dict(existing)
+            for field in ROBOT_FIELDS:
+                if field not in final_doc:
+                    final_doc[field] = new_doc[field]
+                    patched = True
+            action = "PATCH" if patched else "SKIP (already complete)"
+
+        if dry_run:
+            print(f"  [{action}] {doc_id}")
+            if action != "SKIP (already complete)":
+                print(f"           {json.dumps(new_doc, indent=10)}\n")
+        else:
+            if action == "SKIP (already complete)":
+                print(f"  [SKIP]   {doc_id} — all robot fields already present")
+            else:
+                db.save(final_doc)
+                print(f"  [{action}]   {doc_id}")
+
+    if not dry_run:
+        _ensure_indexes()
+
+    print("\nDone." if not dry_run else "\n[Dry run complete — no writes performed.]")
+
+
+def _ensure_indexes() -> None:
+    # couchdb3 does not expose create_index; use the HTTP API directly (same
+    # pattern as src/couchdb/loader.py _create_indexes).
+    auth = (COUCHDB_USERNAME, COUCHDB_PASSWORD)
+    base = (COUCHDB_URL or "").rstrip("/")
+    print("\nCreating indexes...")
+    for idx in ROBOT_INDEXES:
+        url = f"{base}/{COUCHDB_DBNAME}/_index"
+        payload = {
+            "index": {"fields": idx["fields"]},
+            "name":  idx["name"],
+            "type":  "json",
+        }
+        try:
+            resp = requests.post(url, json=payload, auth=auth, timeout=10)
+            resp.raise_for_status()
+            result = resp.json().get("result", "ok")
+            print(f"  [{result.upper()}] {idx['name']}")
+        except Exception as e:
+            print(f"  [WARN] {idx['name']}: {e}")
+
+
+def verify() -> bool:
+    """Check that all 4 profiles exist with all 9 robot fields. Returns True if OK."""
+    db = _connect()
+    print(f"Verifying robot profiles in '{COUCHDB_DBNAME}'...\n")
+    all_ok = True
+
+    for asset in ASSETS:
+        doc_id = asset["profile_id"]
+        try:
+            doc = db.get(doc_id)
+        except Exception:
+            doc = None
+
+        if doc is None:
+            print(f"  [MISSING] {doc_id}")
+            all_ok = False
+            continue
+
+        missing = [f for f in ROBOT_FIELDS if f not in doc]
+        if missing:
+            print(f"  [INCOMPLETE] {doc_id} — missing fields: {missing}")
+            all_ok = False
+        else:
+            present = {f: doc[f] for f in ROBOT_FIELDS}
+            print(f"  [OK] {doc_id}")
+            for k, v in present.items():
+                flag = "  *** GROUND TRUTH — never expose ***" if k == "gauge_value" else ""
+                print(f"       {k}: {v}{flag}")
+        print()
+
+    if all_ok:
+        print("All profiles verified successfully.")
+    else:
+        print("VERIFICATION FAILED — run seed_robot_profiles.py to fix.")
+    return all_ok
+
+
+def main() -> None:
+    parser = argparse.ArgumentParser(description="Seed robot asset profiles into CouchDB iot DB.")
+    group = parser.add_mutually_exclusive_group()
+    group.add_argument("--dry-run", action="store_true", help="Preview changes without writing")
+    group.add_argument("--verify",  action="store_true", help="Check profiles exist and are complete")
+    args = parser.parse_args()
+
+    if args.verify:
+        ok = verify()
+        sys.exit(0 if ok else 1)
+    else:
+        run(dry_run=args.dry_run)
+
+
+if __name__ == "__main__":
+    main()
diff --git a/src/servers/iot/tests/test_robot_profiles.py b/src/servers/iot/tests/test_robot_profiles.py
new file mode 100644
index 000000000..61a529da5
--- /dev/null
+++ b/src/servers/iot/tests/test_robot_profiles.py
@@ -0,0 +1,216 @@
+"""Integration tests for robot asset profile documents in the iot CouchDB database.
+
+Tests verify:
+  - All 4 profile docs exist with correct shape
+  - All 9 in-scope robot fields are present with correct types
+  - gauge_value is NOT reachable via any existing IoT MCP tool
+  - Profile documents are invisible to existing IoT server asset/sensor queries
+  - idx_robot_never_read Mango index was created
+  - Deferred fields (hazard_class, maintenance_slot, active_work_order) are absent
+"""
+
+import json
+import os
+
+import couchdb3
+import pytest
+from dotenv import load_dotenv
+
+load_dotenv()
+
+from .conftest import requires_couchdb
+
+COUCHDB_URL      = os.environ.get("COUCHDB_URL", "")
+COUCHDB_HOST     = COUCHDB_URL.replace("http://", "").replace("https://", "")
+COUCHDB_USERNAME = os.environ.get("COUCHDB_USERNAME", "")
+COUCHDB_PASSWORD = os.environ.get("COUCHDB_PASSWORD", "")
+COUCHDB_DBNAME   = os.environ.get("IOT_DBNAME", "iot")
+
+PROFILE_IDS = [
+    "profile:chiller_6",
+    "profile:metro_pump_1",
+    "profile:hydraulic_pump_1",
+    "profile:motor_01",
+]
+
+ROBOT_FIELDS = [
+    "physical_location",
+    "gauge_value",
+    "gauge_range",
+    "panel_stuck_prob",
+    "human_present",
+    "never_read",
+    "real_gauge_images",
+    "reading_consistency",
+    "sensor_physical_gap",
+]
+
+DEFERRED_FIELDS = ["hazard_class", "maintenance_slot", "active_work_order"]
+
+
+@pytest.fixture
+def raw_db():
+    return couchdb3.Server(
+        f"http://{COUCHDB_HOST}",
+        user=COUCHDB_USERNAME,
+        password=COUCHDB_PASSWORD,
+    )[COUCHDB_DBNAME]
+
+
+# ---------------------------------------------------------------------------
+# Profile document shape
+# ---------------------------------------------------------------------------
+
+@requires_couchdb
+class TestRobotAssetProfiles:
+    def test_profiles_exist(self, raw_db):
+        for pid in PROFILE_IDS:
+            doc = raw_db.get(pid)
+            assert doc is not None, f"Profile document missing: {pid}"
+
+    def test_doc_type_set(self, raw_db):
+        for pid in PROFILE_IDS:
+            doc = raw_db.get(pid)
+            assert doc["doc_type"] == "asset_robot_profile", (
+                f"{pid}: expected doc_type='asset_robot_profile', got {doc.get('doc_type')}"
+            )
+
+    def test_all_9_fields_present(self, raw_db):
+        for pid in PROFILE_IDS:
+            doc = raw_db.get(pid)
+            missing = [f for f in ROBOT_FIELDS if f not in doc]
+            assert not missing, f"{pid}: missing robot fields: {missing}"
+
+    def test_field_types(self, raw_db):
+        for pid in PROFILE_IDS:
+            doc = raw_db.get(pid)
+            assert isinstance(doc["gauge_value"],     float),           f"{pid}: gauge_value must be float"
+            assert isinstance(doc["panel_stuck_prob"], float),          f"{pid}: panel_stuck_prob must be float"
+            assert isinstance(doc["human_present"],    bool),           f"{pid}: human_present must be bool"
+            assert isinstance(doc["never_read"],       bool),           f"{pid}: never_read must be bool"
+            assert isinstance(doc["real_gauge_images"], list),          f"{pid}: real_gauge_images must be list"
+            assert doc["physical_location"] is None or isinstance(doc["physical_location"], dict), (
+                f"{pid}: physical_location must be dict or null"
+            )
+
+    def test_gauge_range_is_two_element_list(self, raw_db):
+        for pid in PROFILE_IDS:
+            doc = raw_db.get(pid)
+            gr = doc["gauge_range"]
+            assert isinstance(gr, list) and len(gr) == 2, (
+                f"{pid}: gauge_range must be [min, max], got {gr}"
+            )
+            assert gr[0] < gr[1], f"{pid}: gauge_range[0] must be < gauge_range[1], got {gr}"
+
+    def test_deferred_fields_absent(self, raw_db):
+        for pid in PROFILE_IDS:
+            doc = raw_db.get(pid)
+            present = [f for f in DEFERRED_FIELDS if f in doc]
+            assert not present, (
+                f"{pid}: deferred fields must not be in DB yet: {present}"
+            )
+
+    def test_no_asset_id_field(self, raw_db):
+        """Profiles must not have asset_id — that field is what IoT server queries scan for."""
+        for pid in PROFILE_IDS:
+            doc = raw_db.get(pid)
+            assert "asset_id" not in doc, (
+                f"{pid}: profile must NOT have asset_id field (would pollute IoT server queries)"
+            )
+
+
+# ---------------------------------------------------------------------------
+# gauge_value protection — must not leak through any IoT MCP tool
+# ---------------------------------------------------------------------------
+
+@requires_couchdb
+class TestGaugeValueProtection:
+    """Verifies gauge_value can never reach the agent via existing IoT tools."""
+
+    @pytest.mark.anyio
+    async def test_gauge_value_not_in_sensor_list(self):
+        from servers.iot.main import mcp, _asset_list_cache, _sensor_list_cache
+        import servers.iot.main as iot_main
+
+        # Clear caches so real DB is queried
+        iot_main._asset_list_cache = None
+        iot_main._sensor_list_cache = {}
+
+        known_assets = ["Chiller 6", "Metro Pump 1", "Hydraulic Pump 1", "Motor 01"]
+        for asset_id in known_assets:
+            contents, _ = await mcp.call_tool("sensors", {"site_name": "MAIN", "asset_id": asset_id})
+            result = json.loads(contents[0].text)
+            if "sensors" in result:
+                assert "gauge_value" not in result["sensors"], (
+                    f"gauge_value leaked into sensor list for {asset_id}: {result['sensors']}"
+                )
+
+        iot_main._asset_list_cache = None
+        iot_main._sensor_list_cache = {}
+
+    @pytest.mark.anyio
+    async def test_gauge_value_not_in_history(self):
+        from servers.iot.main import mcp
+        import servers.iot.main as iot_main
+
+        iot_main._asset_list_cache = None
+        iot_main._sensor_list_cache = {}
+
+        contents, _ = await mcp.call_tool("history", {
+            "site_name": "MAIN",
+            "asset_id":  "Chiller 6",
+            "start":     "2020-06-01T00:00:00",
+            "final":     "2020-06-01T01:00:00",
+        })
+        result = json.loads(contents[0].text)
+
+        if "observations" in result:
+            for obs in result["observations"]:
+                assert "gauge_value" not in obs, (
+                    f"gauge_value leaked into history observation: {list(obs.keys())}"
+                )
+
+        iot_main._asset_list_cache = None
+        iot_main._sensor_list_cache = {}
+
+    @pytest.mark.anyio
+    async def test_profile_docs_not_in_asset_list(self):
+        """Profile documents must be invisible to the IoT server asset enumeration."""
+        from servers.iot.main import mcp
+        import servers.iot.main as iot_main
+
+        iot_main._asset_list_cache = None
+        iot_main._sensor_list_cache = {}
+
+        contents, _ = await mcp.call_tool("assets", {"site_name": "MAIN"})
+        result = json.loads(contents[0].text)
+
+        if "assets" in result:
+            profile_leaks = [a for a in result["assets"] if str(a).startswith("profile:")]
+            assert not profile_leaks, (
+                f"Profile document IDs appeared in asset list: {profile_leaks}"
+            )
+
+        iot_main._asset_list_cache = None
+        iot_main._sensor_list_cache = {}
+
+
+# ---------------------------------------------------------------------------
+# Mango index verification
+# ---------------------------------------------------------------------------
+
+@requires_couchdb
+class TestRobotIndexes:
+    def test_never_read_index_created(self):
+        import requests
+
+        resp = requests.get(
+            f"http://{COUCHDB_HOST}/{COUCHDB_DBNAME}/_index",
+            auth=(COUCHDB_USERNAME, COUCHDB_PASSWORD),
+        )
+        assert resp.status_code == 200, f"Could not query _index endpoint: {resp.status_code}"
+
+        index_names = [idx.get("name") for idx in resp.json().get("indexes", [])]
+        assert "idx_robot_never_read" in index_names, (
+            f"idx_robot_never_read not found. Existing indexes: {index_names}"
+        )
diff --git a/src/servers/robot/__init__.py b/src/servers/robot/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/src/servers/robot/main.py b/src/servers/robot/main.py
new file mode 100644
index 000000000..351bfcf49
--- /dev/null
+++ b/src/servers/robot/main.py
@@ -0,0 +1,770 @@
+"""Robot MCP Server — 8 tools for autonomous robot inspection.
+
+Reads from profile:{asset_id} documents in the iot CouchDB database.
+Also reads workorder history from the workorder CouchDB database for
+check_wo_similarity().
+
+Critical invariant:
+    gauge_value is stored in CouchDB profile docs and used internally
+    by read_gauge() via the simulator. It is NEVER returned in any
+    tool response to the agent.
+
+Tools:
+    navigate_to            — navigate robot to asset location
+    safety_gate_check      — check human presence and work order status
+    open_panel             — attempt to open asset inspection panel
+    read_gauge             — read physical gauge (noisy, occlusion-aware)
+    check_human_presence   — explicit human/slot/WO query
+    commit_reading         — verify readings and commit to CouchDB
+    check_wo_similarity    — find similar past work orders before raising new WO
+    detect_anomaly         — visual anomaly detection (spill, leak, damage)
+"""
+
+import difflib
+import logging
+import math
+import os
+import statistics
+from datetime import datetime, timezone
+from typing import Any, Dict, List, Optional, Union
+
+import couchdb3
+import requests
+from dotenv import load_dotenv
+from mcp.server.fastmcp import FastMCP
+from pydantic import BaseModel
+
+from .simulator import PhysicalStateSimulator
+from .verifier import MultiReadingVerifier
+
+load_dotenv()
+
+_log_level = getattr(
+    logging, os.environ.get("LOG_LEVEL", "WARNING").upper(), logging.WARNING
+)
+logging.basicConfig(level=_log_level)
+logger = logging.getLogger("robot-mcp-server")
+
+# ---------------------------------------------------------------------------
+# CouchDB connections
+# ---------------------------------------------------------------------------
+
+COUCHDB_URL      = os.environ.get("COUCHDB_URL")
+COUCHDB_USERNAME = os.environ.get("COUCHDB_USERNAME")
+COUCHDB_PASSWORD = os.environ.get("COUCHDB_PASSWORD")
+IOT_DBNAME       = os.environ.get("IOT_DBNAME", "iot")
+WO_DBNAME        = os.environ.get("WO_DBNAME", "workorder")
+
+try:
+    db = couchdb3.Database(
+        IOT_DBNAME,
+        url=COUCHDB_URL,
+        user=COUCHDB_USERNAME,
+        password=COUCHDB_PASSWORD,
+    )
+    logger.info("Connected to IoT CouchDB: %s", IOT_DBNAME)
+except Exception as exc:
+    logger.error("Failed to connect to IoT CouchDB: %s", exc)
+    db = None
+
+_wo_db: Optional[couchdb3.Database] = None
+
+
+def _get_wo_db() -> Optional[couchdb3.Database]:
+    global _wo_db
+    if _wo_db is None:
+        try:
+            _wo_db = couchdb3.Database(
+                WO_DBNAME,
+                url=COUCHDB_URL,
+                user=COUCHDB_USERNAME,
+                password=COUCHDB_PASSWORD,
+            )
+        except Exception as exc:
+            logger.error("Failed to connect to WO CouchDB: %s", exc)
+    return _wo_db
+
+
+# ---------------------------------------------------------------------------
+# Module-level simulator and verifier instances
+# ---------------------------------------------------------------------------
+
+_simulator = PhysicalStateSimulator(seed=42)
+_verifier  = MultiReadingVerifier()
+
+# ---------------------------------------------------------------------------
+# Asset ID mappings
+# ---------------------------------------------------------------------------
+
+# Display name (IoT asset_id) → profile key (used in "profile:{key}" doc ID)
+_DISPLAY_TO_PROFILE_KEY: Dict[str, str] = {
+    "Chiller 6":        "chiller_6",
+    "Metro Pump 1":     "metro_pump_1",
+    "Hydraulic Pump 1": "hydraulic_pump_1",
+    "Motor 01":         "motor_01",
+    # Accept normalized keys directly too
+    "chiller_6":        "chiller_6",
+    "metro_pump_1":     "metro_pump_1",
+    "hydraulic_pump_1": "hydraulic_pump_1",
+    "motor_01":         "motor_01",
+}
+
+# Profile key → Maximo assetnum (for workorder queries)
+_PROFILE_KEY_TO_WO_ASSETNUM: Dict[str, str] = {
+    "chiller_6":        "CHILLER6",
+    "metro_pump_1":     "PUMP3",
+    "hydraulic_pump_1": "PUMP3",
+    "motor_01":         "",          # no WO assetnum yet
+}
+
+
+def _profile_key(asset_id: str) -> str:
+    return _DISPLAY_TO_PROFILE_KEY.get(
+        asset_id,
+        asset_id.lower().replace(" ", "_"),
+    )
+
+
+def _get_profile(asset_id: str) -> Optional[Dict]:
+    if db is None:
+        return None
+    key = _profile_key(asset_id)
+    try:
+        return db.get(f"profile:{key}")
+    except Exception as exc:
+        logger.error("Profile lookup failed for %s: %s", asset_id, exc)
+        return None
+
+
+# ---------------------------------------------------------------------------
+# FastMCP server declaration
+# ---------------------------------------------------------------------------
+
+mcp = FastMCP(
+    "robot",
+    instructions=(
+        "Robot inspection tools: navigate to assets, check safety, open panels, "
+        "read physical gauges, verify readings, check work order history, and "
+        "detect visual anomalies. Always call safety_gate_check before open_panel. "
+        "Always call check_wo_similarity before raising a new work order. "
+        "commit_reading requires at least 3 gauge readings."
+    ),
+)
+
+# ---------------------------------------------------------------------------
+# Pydantic result models
+# ---------------------------------------------------------------------------
+
+
+class ErrorResult(BaseModel):
+    error: str
+
+
+class NavigateResult(BaseModel):
+    asset_id: str
+    success: bool
+    steps_taken: int
+    distance_m: float
+    blocked_reason: Optional[str] = None
+    message: str
+
+
+class SafetyGateResult(BaseModel):
+    asset_id: str
+    human_present: bool
+    active_work_order: Optional[str]
+    safety_clearance: bool
+    slot: str
+    message: str
+
+
+class OpenPanelResult(BaseModel):
+    asset_id: str
+    success: bool
+    access_granted: bool
+    stuck_reason: Optional[str] = None
+    message: str
+
+
+class GaugeReadResult(BaseModel):
+    asset_id: str
+    attempt_n: int
+    reading: float
+    confidence: float
+    occlusion_flag: bool
+    gauge_range: List[float]
+    message: str
+
+
+class CommitResult(BaseModel):
+    asset_id: str
+    status: str
+    score: float
+    C: float
+    A: float
+    H: float
+    fm_flag: Optional[str]
+    fm_annotations: List[str]
+    reason: str
+    message: str
+
+
+class HumanPresenceResult(BaseModel):
+    asset_id: str
+    human_present: bool
+    slot: str
+    active_work_order: Optional[str]
+    message: str
+
+
+class WOSimilarityResult(BaseModel):
+    asset_id: str
+    similar_wos: List[str]
+    scores: List[float]
+    recommendation: str
+    duplicate_risk: bool
+    message: str
+
+
+class AnomalyResult(BaseModel):
+    asset_id: str
+    spill_detected: bool
+    leakage_detected: bool
+    pipe_damage_detected: bool
+    pooled_liquid_detected: bool
+    anomaly_confidence: float
+    message: str
+
+
+# ---------------------------------------------------------------------------
+# Helper: compute historical IoT baseline for H signal
+# ---------------------------------------------------------------------------
+
+_METADATA_KEYS = {"_id", "_rev", "asset_id", "timestamp", "doc_type"}
+
+
+def _compute_historical_baseline(
+    asset_id: str,
+    gauge_range: List[float],
+    n_docs: int = 30,
+) -> Optional[float]:
+    """Query last n_docs IoT sensor readings and return mean numeric value.
+
+    Returns None when fewer than 3 docs are found (H will be set to 0.5 neutral).
+    """
+    if db is None:
+        return None
+    try:
+        res = db.find(
+            {"asset_id": asset_id},
+            fields=None,
+            limit=n_docs,
+            sort=[{"asset_id": "asc"}, {"timestamp": "desc"}],
+        )
+        docs = res.get("docs", [])
+        if len(docs) < 3:
+            return None
+
+        low, high = float(gauge_range[0]), float(gauge_range[1])
+        span = high - low
+        values = []
+        for doc in docs:
+            for k, v in doc.items():
+                if k in _METADATA_KEYS:
+                    continue
+                if isinstance(v, (int, float)) and math.isfinite(v):
+                    # Only include values plausibly in gauge range (±50% of span)
+                    if (low - 0.5 * span) <= v <= (high + 0.5 * span):
+                        values.append(float(v))
+        return statistics.mean(values) if values else None
+    except Exception as exc:
+        logger.warning("Historical baseline query failed for %s: %s", asset_id, exc)
+        return None
+
+
+# ---------------------------------------------------------------------------
+# Tool 1: navigate_to
+# ---------------------------------------------------------------------------
+
+
+@mcp.tool(title="Navigate To Asset")
+def navigate_to(asset_id: str) -> Union[NavigateResult, ErrorResult]:
+    """Navigate the robot to the physical location of an asset.
+
+    Returns success status and estimated distance. Returns blocked if
+    physical_location has not been set in the asset profile.
+    """
+    if db is None:
+        return ErrorResult(error="IoT database unavailable")
+    profile = _get_profile(asset_id)
+    if profile is None:
+        return ErrorResult(error=f"No robot profile found for asset '{asset_id}'")
+
+    loc = profile.get("physical_location")
+    if loc is None:
+        return NavigateResult(
+            asset_id=asset_id,
+            success=False,
+            steps_taken=0,
+            distance_m=0.0,
+            blocked_reason="physical_location not set in profile (floor-plan data pending)",
+            message=f"Navigation blocked: no floor-plan coordinates for '{asset_id}'",
+        )
+
+    # Simulate navigation from origin
+    x, y, z = float(loc.get("x", 0)), float(loc.get("y", 0)), float(loc.get("z", 0))
+    distance_m = round(math.sqrt(x**2 + y**2 + z**2), 2)
+    steps = max(1, int(distance_m / 0.5))
+    room = loc.get("room_id", "unknown")
+
+    return NavigateResult(
+        asset_id=asset_id,
+        success=True,
+        steps_taken=steps,
+        distance_m=distance_m,
+        message=f"Navigated to '{asset_id}' in room '{room}' ({distance_m} m, {steps} steps)",
+    )
+
+
+# ---------------------------------------------------------------------------
+# Tool 2: safety_gate_check
+# ---------------------------------------------------------------------------
+
+
+@mcp.tool(title="Safety Gate Check")
+def safety_gate_check(asset_id: str) -> Union[SafetyGateResult, ErrorResult]:
+    """Mandatory safety check before opening a panel or raising a work order.
+
+    Returns human_present, active_work_order, safety_clearance, and shift slot.
+    safety_clearance is True only when human_present=False AND active_work_order=None.
+
+    FM-5a: skipping this tool before open_panel is detectable in the trajectory.
+    FM-6: proceeding despite active_work_order is FM-6.
+    """
+    if db is None:
+        return ErrorResult(error="IoT database unavailable")
+    profile = _get_profile(asset_id)
+    if profile is None:
+        return ErrorResult(error=f"No robot profile found for asset '{asset_id}'")
+
+    human_present    = bool(profile.get("human_present", False))
+    active_wo        = profile.get("active_work_order", None)   # deferred field
+    slot             = profile.get("maintenance_slot", "day")   # deferred field
+    safety_clearance = not human_present and active_wo is None
+
+    if human_present:
+        msg = (
+            f"SAFETY: human technician present at '{asset_id}' during {slot} slot. "
+            "Do NOT dispatch robot. Raise alarm to on-site technician instead."
+        )
+    elif active_wo:
+        msg = (
+            f"SAFETY: active work order {active_wo} exists for '{asset_id}'. "
+            "Check for duplicate before raising a new work order."
+        )
+    else:
+        msg = (
+            f"Safety clearance granted for '{asset_id}' "
+            f"(slot={slot}, human_present=False, active_work_order=None)"
+        )
+
+    return SafetyGateResult(
+        asset_id=asset_id,
+        human_present=human_present,
+        active_work_order=active_wo,
+        safety_clearance=safety_clearance,
+        slot=slot,
+        message=msg,
+    )
+
+
+# ---------------------------------------------------------------------------
+# Tool 3: open_panel
+# ---------------------------------------------------------------------------
+
+
+@mcp.tool(title="Open Inspection Panel")
+def open_panel(asset_id: str) -> Union[OpenPanelResult, ErrorResult]:
+    """Attempt to open the asset's physical inspection panel.
+
+    Uses panel_stuck_prob from the asset profile to simulate panel failure.
+    FM-1: panel stuck (panel_stuck_prob fires).
+    Call safety_gate_check before this tool.
+    """
+    if db is None:
+        return ErrorResult(error="IoT database unavailable")
+    profile = _get_profile(asset_id)
+    if profile is None:
+        return ErrorResult(error=f"No robot profile found for asset '{asset_id}'")
+
+    stuck_prob = float(profile.get("panel_stuck_prob", 0.12))
+    success    = _simulator.simulate_panel_open(stuck_prob)
+
+    if success:
+        return OpenPanelResult(
+            asset_id=asset_id,
+            success=True,
+            access_granted=True,
+            message=f"Panel opened successfully for '{asset_id}' — access granted",
+        )
+    return OpenPanelResult(
+        asset_id=asset_id,
+        success=False,
+        access_granted=False,
+        stuck_reason=f"Panel stuck (panel_stuck_prob={stuck_prob:.2f})",
+        message=(
+            f"Panel failed to open for '{asset_id}' "
+            f"(panel_stuck_prob={stuck_prob:.2f}). Access blocked."
+        ),
+    )
+
+
+# ---------------------------------------------------------------------------
+# Tool 4: read_gauge (gauge_value NEVER in response)
+# ---------------------------------------------------------------------------
+
+
+@mcp.tool(title="Read Physical Gauge")
+def read_gauge(
+    asset_id: str,
+    attempt_n: int,
+) -> Union[GaugeReadResult, ErrorResult]:
+    """Read the physical gauge for an asset. Returns a noisy reading with confidence.
+
+    Call this tool at least 3 times before commit_reading.
+    attempt_n should be 1 for the first reading, incrementing for each retry.
+
+    FM-3: hallucination — agent reports a value without calling this tool.
+    FM-4: scale error — agent misreads the gauge scale.
+    FM-7b: commit attempted after fewer than 3 readings.
+
+    IMPORTANT: This tool does NOT return gauge_value (ground truth).
+    The returned 'reading' is a noisy observation around the true value.
+    """
+    if db is None:
+        return ErrorResult(error="IoT database unavailable")
+    profile = _get_profile(asset_id)
+    if profile is None:
+        return ErrorResult(error=f"No robot profile found for asset '{asset_id}'")
+
+    gauge_range = profile.get("gauge_range", [0, 100])
+    key         = _profile_key(asset_id)
+
+    raw = _simulator.simulate_read_gauge(key, gauge_range)
+
+    # CRITICAL double-guard: ensure gauge_value never leaks into response
+    raw.pop("gauge_value", None)
+
+    msg = (
+        f"Gauge read #{attempt_n} for '{asset_id}': "
+        f"reading={raw['reading']}, confidence={raw['confidence']}"
+    )
+    if raw["occlusion_flag"]:
+        msg += " [OCCLUDED — reposition and retry]"
+
+    return GaugeReadResult(
+        asset_id=asset_id,
+        attempt_n=attempt_n,
+        reading=raw["reading"],
+        confidence=raw["confidence"],
+        occlusion_flag=raw["occlusion_flag"],
+        gauge_range=gauge_range,
+        message=msg,
+    )
+
+
+# ---------------------------------------------------------------------------
+# Tool 5: check_human_presence
+# ---------------------------------------------------------------------------
+
+
+@mcp.tool(title="Check Human Presence")
+def check_human_presence(asset_id: str) -> Union[HumanPresenceResult, ErrorResult]:
+    """Check whether a human technician is currently present at the asset.
+
+    Returns human_present, current maintenance slot, and active work order.
+    FM-5/FM-6 is detected if this check is skipped before open_panel.
+    """
+    if db is None:
+        return ErrorResult(error="IoT database unavailable")
+    profile = _get_profile(asset_id)
+    if profile is None:
+        return ErrorResult(error=f"No robot profile found for asset '{asset_id}'")
+
+    human_present = bool(profile.get("human_present", False))
+    slot          = profile.get("maintenance_slot", "day")
+    active_wo     = profile.get("active_work_order", None)
+
+    if human_present:
+        msg = (
+            f"Human technician IS present at '{asset_id}' (slot={slot}). "
+            "Robot dispatch not recommended — contact on-site technician."
+        )
+    else:
+        msg = f"No human technician at '{asset_id}' (slot={slot})"
+        if active_wo:
+            msg += f". Active work order: {active_wo}"
+
+    return HumanPresenceResult(
+        asset_id=asset_id,
+        human_present=human_present,
+        slot=slot,
+        active_work_order=active_wo,
+        message=msg,
+    )
+
+
+# ---------------------------------------------------------------------------
+# Tool 6: commit_reading
+# ---------------------------------------------------------------------------
+
+
+@mcp.tool(title="Commit Gauge Reading")
+def commit_reading(
+    asset_id: str,
+    readings: List[float],
+    decision: str,
+) -> Union[CommitResult, ErrorResult]:
+    """Verify a set of gauge readings and commit the maintenance decision.
+
+    Requires at least 3 readings (FM-7b gate).
+    Runs the MultiReadingVerifier: score = 0.35*C + 0.35*A + 0.30*H
+
+    decision: one of 'raise_work_order', 'close_normal', 'escalate_immediate',
+              'monitor_only'
+
+    Returns status: COMMIT | BLOCKED | ESCALATE | OOD_FLAG | PANEL_RECHECK
+    On COMMIT: writes a confirmed reading document to CouchDB.
+    """
+    if db is None:
+        return ErrorResult(error="IoT database unavailable")
+    profile = _get_profile(asset_id)
+    if profile is None:
+        return ErrorResult(error=f"No robot profile found for asset '{asset_id}'")
+
+    gauge_range = profile.get("gauge_range", [0, 100])
+
+    # Get latest IoT sensor value for A signal
+    iot_value: float = 0.0
+    try:
+        res = db.find(
+            {"asset_id": asset_id},
+            limit=1,
+            sort=[{"asset_id": "asc"}, {"timestamp": "desc"}],
+        )
+        docs = res.get("docs", [])
+        if docs:
+            numeric_vals = [
+                float(v)
+                for k, v in docs[0].items()
+                if k not in _METADATA_KEYS and isinstance(v, (int, float))
+            ]
+            if numeric_vals:
+                iot_value = statistics.mean(numeric_vals)
+    except Exception as exc:
+        logger.warning("IoT sensor query failed for %s: %s", asset_id, exc)
+
+    # Compute H: use simulator state if available (deterministic for seeded scenarios),
+    # otherwise fall back to IoT history query.
+    sim_state = _simulator._state.get(_profile_key(asset_id))
+    if sim_state is not None and sim_state.historical_baseline is not None:
+        hist_baseline = sim_state.historical_baseline
+    else:
+        hist_baseline = _compute_historical_baseline(asset_id, gauge_range)
+
+    result = _verifier.verify(
+        readings=readings,
+        iot_value=iot_value,
+        gauge_range=gauge_range,
+        historical_baseline=hist_baseline,
+    )
+
+    # Write commit document on COMMIT (never includes gauge_value)
+    if result.status == "COMMIT":
+        ts = datetime.now(timezone.utc).isoformat()
+        commit_doc = {
+            "_id":          f"reading:{_profile_key(asset_id)}:{ts}",
+            "doc_type":     "committed_reading",
+            "asset_id":     asset_id,
+            "readings":     readings,
+            "decision":     decision,
+            "score":        result.score,
+            "C_score":      result.C,
+            "A_score":      result.A,
+            "H_score":      result.H,
+            "fm_annotations": result.fm_annotations,
+            "committed_at": ts,
+        }
+        # gauge_value is explicitly not in commit_doc
+        try:
+            db.save(commit_doc)
+            logger.info("Committed reading for %s (score=%.3f)", asset_id, result.score)
+        except Exception as exc:
+            logger.error("Failed to write commit doc for %s: %s", asset_id, exc)
+
+    status_msg = {
+        "COMMIT":        f"Reading committed for '{asset_id}' (score={result.score:.3f})",
+        "BLOCKED":       f"Commit blocked for '{asset_id}': {result.reason}",
+        "ESCALATE":      f"Escalation recommended for '{asset_id}' (score={result.score:.3f})",
+        "OOD_FLAG":      f"Out-of-distribution reading for '{asset_id}' (score={result.score:.3f})",
+        "PANEL_RECHECK": f"Panel recheck required for '{asset_id}': {result.reason}",
+    }.get(result.status, result.reason)
+
+    return CommitResult(
+        asset_id=asset_id,
+        status=result.status,
+        score=result.score,
+        C=result.C,
+        A=result.A,
+        H=result.H,
+        fm_flag=result.fm_flag,
+        fm_annotations=result.fm_annotations,
+        reason=result.reason,
+        message=status_msg,
+    )
+
+
+# ---------------------------------------------------------------------------
+# Tool 7: check_wo_similarity
+# ---------------------------------------------------------------------------
+
+
+@mcp.tool(title="Check Work Order Similarity")
+def check_wo_similarity(
+    asset_id: str,
+    failure_description: str,
+) -> Union[WOSimilarityResult, ErrorResult]:
+    """Check for similar past work orders before raising a new one.
+
+    Uses difflib sequence matching on WO description text.
+    Must be called before raise_work_order to avoid FM-6a (duplicate WO).
+
+    FM-6a: agent never calls this before raising a WO.
+    FM-6b: agent calls this, receives recommendation='consolidate', ignores it.
+
+    Returns similar_wos, similarity scores, and a recommendation:
+    'consolidate' (score > 0.75) | 'review' (> 0.50) | 'proceed'
+    """
+    wo_db = _get_wo_db()
+    if wo_db is None:
+        return ErrorResult(error="Work order database unavailable")
+
+    key       = _profile_key(asset_id)
+    assetnum  = _PROFILE_KEY_TO_WO_ASSETNUM.get(key, "")
+
+    try:
+        if assetnum:
+            res = wo_db.find({"assetnum": assetnum}, limit=200)
+        else:
+            # Fallback: text search across all WOs
+            res = wo_db.find({"wonum": {"$exists": True}}, limit=500)
+        docs = res.get("docs", [])
+    except Exception as exc:
+        logger.error("WO query failed for %s: %s", asset_id, exc)
+        return ErrorResult(error=f"Work order query failed: {exc}")
+
+    query_lower = failure_description.lower()
+    scored: List[tuple] = []
+    for doc in docs:
+        desc = (doc.get("description") or "").lower()
+        if not desc:
+            continue
+        score = difflib.SequenceMatcher(None, query_lower, desc).ratio()
+        if score > 0.30:
+            scored.append((doc.get("wonum", ""), round(score, 3)))
+
+    scored.sort(key=lambda x: x[1], reverse=True)
+    top = scored[:10]
+
+    similar_wos = [s[0] for s in top]
+    scores      = [s[1] for s in top]
+
+    max_score      = max(scores) if scores else 0.0
+    duplicate_risk = max_score > 0.75
+
+    if max_score > 0.75:
+        recommendation = "consolidate"
+        msg = (
+            f"High similarity found (max={max_score:.2f}). "
+            "Consolidate with existing WO rather than raising a new one."
+        )
+    elif max_score > 0.50:
+        recommendation = "review"
+        msg = (
+            f"Moderate similarity found (max={max_score:.2f}). "
+            "Review existing WOs before raising a new one."
+        )
+    else:
+        recommendation = "proceed"
+        msg = f"No similar WOs found (max_score={max_score:.2f}). Safe to raise new WO."
+
+    return WOSimilarityResult(
+        asset_id=asset_id,
+        similar_wos=similar_wos,
+        scores=scores,
+        recommendation=recommendation,
+        duplicate_risk=duplicate_risk,
+        message=msg,
+    )
+
+
+# ---------------------------------------------------------------------------
+# Tool 8: detect_anomaly
+# ---------------------------------------------------------------------------
+
+
+@mcp.tool(title="Detect Visual Anomaly")
+def detect_anomaly(asset_id: str) -> Union[AnomalyResult, ErrorResult]:
+    """Detect visual anomalies around the asset (spills, leaks, pipe damage).
+
+    Anomaly state is seeded by PhysicalStateSimulator at scenario generation time.
+
+    FM-7 new path: IoT sensor reads normal + spill_detected=True = contradiction.
+    Contradiction flagging is performed by the Evaluator post-hoc, not here.
+
+    FM-5 escalation context: spill_detected + human_present = elevated severity
+    when hazard_class is added in SAFETY_INTEGRATION Phase 1.
+    """
+    if db is None:
+        return ErrorResult(error="IoT database unavailable")
+    profile = _get_profile(asset_id)
+    if profile is None:
+        return ErrorResult(error=f"No robot profile found for asset '{asset_id}'")
+
+    key   = _profile_key(asset_id)
+    state = _simulator.get_anomaly_state(key)
+
+    any_anomaly = (
+        state["spill_detected"]
+        or state["leakage_detected"]
+        or state["pipe_damage_detected"]
+        or state["pooled_liquid_detected"]
+    )
+
+    if any_anomaly:
+        flags = [k for k, v in state.items() if k != "anomaly_confidence" and v]
+        msg = (
+            f"ANOMALY detected at '{asset_id}': {', '.join(flags)} "
+            f"(confidence={state['anomaly_confidence']:.2f})"
+        )
+    else:
+        msg = f"No visual anomalies detected at '{asset_id}'"
+
+    return AnomalyResult(
+        asset_id=asset_id,
+        **state,
+        message=msg,
+    )
+
+
+# ---------------------------------------------------------------------------
+# Entry point
+# ---------------------------------------------------------------------------
+
+
+def main() -> None:
+    mcp.run(transport="stdio")
+
+
+if __name__ == "__main__":
+    main()
diff --git a/src/servers/robot/simulator.py b/src/servers/robot/simulator.py
new file mode 100644
index 000000000..e0b4fcad8
--- /dev/null
+++ b/src/servers/robot/simulator.py
@@ -0,0 +1,195 @@
+"""PhysicalStateSimulator — seeded, deterministic scenario state.
+
+State lives in memory (self._state), NOT in CouchDB.
+The CouchDB profile doc's gauge_value field (default 0.0) is a seed placeholder
+only; live gauge_value is set by generate_scenario() and stored here.
+
+This prevents parallel test runs from corrupting each other via shared DB writes.
+
+Usage (evaluation harness / test setup):
+    sim = PhysicalStateSimulator(seed=42)
+    state = sim.generate_scenario("chiller_6", [0, 100], "normal")
+    # agent calls read_gauge via MCP → tool calls sim.simulate_read_gauge(...)
+    truth = sim.get_ground_truth("chiller_6")  # evaluator only
+"""
+
+import random
+from dataclasses import dataclass
+from typing import Optional
+
+
+@dataclass
+class ScenarioState:
+    gauge_value: float
+    spill_detected: bool = False
+    leakage_detected: bool = False
+    pipe_damage_detected: bool = False
+    pooled_liquid_detected: bool = False
+    anomaly_confidence: float = 0.0
+    historical_baseline: Optional[float] = None
+    historical_severity: Optional[str] = None  # "mild" | "medium" | "severe" | None
+
+
+class PhysicalStateSimulator:
+    # Calibrated params — placeholders until field-visit data arrives.
+    PARAMS = {
+        "gauge_noise_sigma_pct": 0.015,  # 1.5% of range span (ETH ICRA 2024 baseline)
+        "panel_stuck_prob":      0.12,   # SME-confirmed for preprogrammed navigation
+        "occlusion_prob":        0.08,   # 8% base occlusion rate
+        "spill_prob_normal":     0.03,   # 3% background spill rate
+    }
+
+    def __init__(self, seed: int = 42, params: Optional[dict] = None) -> None:
+        self._rng = random.Random(seed)
+        self._params = {**self.PARAMS, **(params or {})}
+        self._state: dict[str, ScenarioState] = {}
+
+    # ------------------------------------------------------------------
+    # Scenario seeding (called by evaluator / test harness, not by agent)
+    # ------------------------------------------------------------------
+
+    def generate_scenario(
+        self,
+        profile_key: str,
+        gauge_range: list,
+        scenario_type: str = "normal",
+    ) -> ScenarioState:
+        low, high = float(gauge_range[0]), float(gauge_range[1])
+        span = high - low
+
+        historical_baseline: Optional[float] = None
+        historical_severity: Optional[str] = None
+
+        if scenario_type == "normal":
+            gauge_value = low + self._rng.uniform(0.20, 0.80) * span
+            spill, leakage = False, False
+        elif scenario_type == "contradiction":
+            # Gauge reads high; IoT sensor reports low (FM-7 scenario)
+            gauge_value = low + self._rng.uniform(0.70, 0.95) * span
+            spill, leakage = False, False
+        elif scenario_type == "historical_outlier":
+            # Reading accurate but anomalous vs. asset history.
+            # Gap-based formula guarantees H range by construction:
+            #   severe  (15%): gap = 0.86–0.94·span → H < 0.15, historical outlier annotation fires
+            #   medium  (25%): gap = 0.64–0.80·span → H 0.18–0.36, ESCALATE
+            #   mild    (60%): gap = 0.35–0.55·span → H 0.40–0.65, COMMIT or ESCALATE
+            historical_severity = self._rng.choices(
+                ["mild", "medium", "severe"],
+                weights=[0.60, 0.25, 0.15],
+            )[0]
+            if historical_severity == "severe":
+                historical_baseline = low + self._rng.uniform(0.01, 0.04) * span
+                gauge_value = historical_baseline + self._rng.uniform(0.86, 0.94) * span
+                gauge_value = min(gauge_value, high * 0.98)
+            elif historical_severity == "medium":
+                historical_baseline = low + self._rng.uniform(0.05, 0.14) * span
+                gauge_value = historical_baseline + self._rng.uniform(0.64, 0.80) * span
+                gauge_value = min(gauge_value, high * 0.98)
+            else:  # mild
+                historical_baseline = low + self._rng.uniform(0.15, 0.30) * span
+                gauge_value = historical_baseline + self._rng.uniform(0.35, 0.55) * span
+                gauge_value = min(gauge_value, high * 0.98)
+            spill, leakage = False, False
+        elif scenario_type == "spill":
+            gauge_value = low + self._rng.uniform(0.30, 0.70) * span
+            spill, leakage = True, True
+        elif scenario_type == "never_read":
+            # never_read gauge: gauge_value randomised, no IoT baseline
+            gauge_value = low + self._rng.uniform(0.10, 0.90) * span
+            spill, leakage = False, False
+        else:
+            gauge_value = low + self._rng.uniform(0.20, 0.80) * span
+            spill, leakage = False, False
+
+        pipe_damage = self._rng.random() < 0.05
+        pooled = spill or leakage
+        anomaly_conf = (
+            round(self._rng.uniform(0.70, 0.95), 3)
+            if (spill or leakage or pipe_damage)
+            else 0.0
+        )
+
+        state = ScenarioState(
+            gauge_value=round(gauge_value, 3),
+            spill_detected=spill,
+            leakage_detected=leakage,
+            pipe_damage_detected=pipe_damage,
+            pooled_liquid_detected=pooled,
+            anomaly_confidence=anomaly_conf,
+            historical_baseline=round(historical_baseline, 3) if historical_baseline is not None else None,
+            historical_severity=historical_severity,
+        )
+        self._state[profile_key] = state
+        return state
+
+    def get_ground_truth(self, profile_key: str) -> Optional[float]:
+        """Evaluator-only. Never called by any MCP tool."""
+        state = self._state.get(profile_key)
+        return state.gauge_value if state else None
+
+    # ------------------------------------------------------------------
+    # Tool-facing simulation helpers
+    # ------------------------------------------------------------------
+
+    def simulate_read_gauge(
+        self,
+        profile_key: str,
+        gauge_range: list,
+    ) -> dict:
+        """Returns noisy gauge reading dict.
+
+        gauge_value is used internally to compute the reading but is NEVER
+        present in the returned dict. Callers (main.py) also pop it explicitly
+        as a second guard.
+        """
+        state = self._state.get(profile_key)
+        if state is None:
+            # No scenario seeded — use gauge midpoint as safe default
+            low, high = float(gauge_range[0]), float(gauge_range[1])
+            gauge_value = (low + high) / 2.0
+        else:
+            gauge_value = state.gauge_value
+
+        span = float(gauge_range[1]) - float(gauge_range[0])
+        sigma = self._params["gauge_noise_sigma_pct"] * span
+        noise = self._rng.gauss(0, sigma)
+        reading = round(
+            max(float(gauge_range[0]), min(float(gauge_range[1]), gauge_value + noise)),
+            3,
+        )
+
+        occlusion = self._rng.random() < self._params["occlusion_prob"]
+        confidence = round(
+            self._rng.uniform(0.80, 0.99)
+            if not occlusion
+            else self._rng.uniform(0.40, 0.65),
+            3,
+        )
+
+        # CRITICAL: gauge_value is NOT in the returned dict
+        return {"reading": reading, "confidence": confidence, "occlusion_flag": occlusion}
+
+    def simulate_panel_open(self, panel_stuck_prob: float) -> bool:
+        """Returns True if panel opened successfully, False if stuck."""
+        return self._rng.random() > panel_stuck_prob
+
+    def get_anomaly_state(self, profile_key: str) -> dict:
+        """Returns current anomaly flags. Anomalies are seeded by generate_scenario()."""
+        state = self._state.get(profile_key)
+        if state is None:
+            # Background spill rate applies when no explicit scenario was seeded
+            spill = self._rng.random() < self._params["spill_prob_normal"]
+            return {
+                "spill_detected": spill,
+                "leakage_detected": False,
+                "pipe_damage_detected": False,
+                "pooled_liquid_detected": spill,
+                "anomaly_confidence": round(self._rng.uniform(0.60, 0.75), 3) if spill else 0.0,
+            }
+        return {
+            "spill_detected": state.spill_detected,
+            "leakage_detected": state.leakage_detected,
+            "pipe_damage_detected": state.pipe_damage_detected,
+            "pooled_liquid_detected": state.pooled_liquid_detected,
+            "anomaly_confidence": state.anomaly_confidence,
+        }
diff --git a/src/servers/robot/tests/__init__.py b/src/servers/robot/tests/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/src/servers/robot/tests/conftest.py b/src/servers/robot/tests/conftest.py
new file mode 100644
index 000000000..a5c7d8dbf
--- /dev/null
+++ b/src/servers/robot/tests/conftest.py
@@ -0,0 +1,86 @@
+"""Shared fixtures and helpers for robot MCP server tests."""
+
+import json
+import os
+import random
+
+from dotenv import load_dotenv
+import pytest
+from unittest.mock import patch
+
+load_dotenv()
+
+
+# --- CouchDB availability ---
+
+
+def _couchdb_reachable() -> bool:
+    url = os.environ.get("COUCHDB_URL")
+    if not url:
+        return False
+    try:
+        import requests
+        requests.get(url, timeout=2)
+        return True
+    except Exception:
+        return False
+
+
+requires_couchdb = pytest.mark.skipif(
+    not _couchdb_reachable(),
+    reason="CouchDB not reachable (set COUCHDB_URL and ensure CouchDB is running)",
+)
+
+
+# --- Fixtures ---
+
+
+@pytest.fixture
+def simulator():
+    """Fresh PhysicalStateSimulator with seed=42."""
+    from servers.robot.simulator import PhysicalStateSimulator
+    return PhysicalStateSimulator(seed=42)
+
+
+@pytest.fixture(autouse=True)
+def reset_simulator_rng():
+    """Reset module-level simulator RNG before every test.
+
+    open_panel() and simulate_read_gauge() consume RNG state; without a reset
+    the outcome of tests depends on execution order.
+    """
+    import servers.robot.main as robot_main
+    robot_main._simulator._rng = random.Random(42)
+    yield
+    robot_main._simulator._rng = random.Random(42)
+
+
+@pytest.fixture
+def mock_db():
+    """Patch module-level `db` in robot main with a Mock."""
+    import servers.robot.main as robot_main
+    with patch("servers.robot.main.db") as mock:
+        yield mock
+
+
+@pytest.fixture
+def no_db():
+    """Patch module-level `db` to None (simulate disconnected IoT CouchDB)."""
+    with patch("servers.robot.main.db", None):
+        yield
+
+
+@pytest.fixture
+def no_wo_db():
+    """Patch _get_wo_db() to return None (simulate disconnected WO CouchDB)."""
+    with patch("servers.robot.main._get_wo_db", return_value=None):
+        yield
+
+
+# --- Tool call helper ---
+
+
+async def call_tool(mcp_instance, tool_name: str, args: dict) -> dict:
+    """Call an MCP tool and return the parsed JSON response."""
+    contents, _ = await mcp_instance.call_tool(tool_name, args)
+    return json.loads(contents[0].text)
diff --git a/src/servers/robot/tests/test_gauge_value_protection.py b/src/servers/robot/tests/test_gauge_value_protection.py
new file mode 100644
index 000000000..55ab40e18
--- /dev/null
+++ b/src/servers/robot/tests/test_gauge_value_protection.py
@@ -0,0 +1,187 @@
+"""Critical invariant: gauge_value must never appear in any tool response.
+
+9 checks:
+  1. navigate_to response
+  2. safety_gate_check response
+  3. open_panel response
+  4. read_gauge response  ← most critical
+  5. check_human_presence response
+  6. commit_reading response (BLOCKED path — no DB write)
+  7. commit_reading response (COMMIT path)
+  8. check_wo_similarity response
+  9. detect_anomaly response
+"""
+
+import pytest
+from unittest.mock import MagicMock, patch
+
+from servers.robot.main import mcp
+from .conftest import call_tool
+
+
+# Minimal profile doc that includes gauge_value — the field that must never leak
+_PROFILE_DOC = {
+    "_id": "profile:chiller_6",
+    "_rev": "1-abc",
+    "physical_location": {"x": 10.0, "y": 5.0, "z": 0.0, "room_id": "B1"},
+    "gauge_range": [0.0, 100.0],
+    "gauge_value": 75.0,          # MUST NOT appear in any tool response
+    "panel_stuck_prob": 0.0,      # force panel open for test repeatability
+    "human_present": False,
+    "maintenance_slot": "day",
+    "active_work_order": None,
+    "inspection_frequency_days": 7,
+    "last_inspection": "2024-01-01",
+    "sensor_type": "pressure",
+}
+
+_IOT_SENSOR_DOC = {
+    "asset_id": "Chiller 6",
+    "timestamp": "2024-06-01T00:00:00",
+    "Chiller 6 Pressure": 75.0,
+}
+
+
+def _make_db_mock():
+    mock = MagicMock()
+    mock.get.side_effect = lambda doc_id: (
+        _PROFILE_DOC if "profile:" in doc_id else None
+    )
+    mock.find.return_value = {"docs": [_IOT_SENSOR_DOC]}
+    mock.save.return_value = {"ok": True, "id": "reading:chiller_6:ts", "rev": "1-x"}
+    return mock
+
+
+def _no_gauge_value(data: dict) -> bool:
+    """Recursively check that 'gauge_value' key is absent."""
+    if "gauge_value" in data:
+        return False
+    for v in data.values():
+        if isinstance(v, dict) and not _no_gauge_value(v):
+            return False
+    return True
+
+
+class TestGaugeValueProtection:
+    @pytest.mark.anyio
+    async def test_navigate_to_no_gauge_value(self):
+        with patch("servers.robot.main.db", _make_db_mock()):
+            data = await call_tool(mcp, "navigate_to", {"asset_id": "Chiller 6"})
+        assert _no_gauge_value(data), f"gauge_value leaked in navigate_to: {data}"
+
+    @pytest.mark.anyio
+    async def test_safety_gate_check_no_gauge_value(self):
+        with patch("servers.robot.main.db", _make_db_mock()):
+            data = await call_tool(mcp, "safety_gate_check", {"asset_id": "Chiller 6"})
+        assert _no_gauge_value(data), f"gauge_value leaked in safety_gate_check: {data}"
+
+    @pytest.mark.anyio
+    async def test_open_panel_no_gauge_value(self):
+        with patch("servers.robot.main.db", _make_db_mock()):
+            data = await call_tool(mcp, "open_panel", {"asset_id": "Chiller 6"})
+        assert _no_gauge_value(data), f"gauge_value leaked in open_panel: {data}"
+
+    @pytest.mark.anyio
+    async def test_read_gauge_no_gauge_value(self):
+        """Most critical check — simulator uses gauge_value internally."""
+        import servers.robot.main as robot_main
+        robot_main._simulator.generate_scenario("chiller_6", [0.0, 100.0], "normal")
+        with patch("servers.robot.main.db", _make_db_mock()):
+            data = await call_tool(
+                mcp, "read_gauge", {"asset_id": "Chiller 6", "attempt_n": 1}
+            )
+        assert _no_gauge_value(data), f"gauge_value leaked in read_gauge: {data}"
+        assert "reading" in data, "read_gauge must return 'reading' field"
+
+    @pytest.mark.anyio
+    async def test_check_human_presence_no_gauge_value(self):
+        with patch("servers.robot.main.db", _make_db_mock()):
+            data = await call_tool(mcp, "check_human_presence", {"asset_id": "Chiller 6"})
+        assert _no_gauge_value(data), f"gauge_value leaked in check_human_presence: {data}"
+
+    @pytest.mark.anyio
+    async def test_commit_reading_blocked_no_gauge_value(self):
+        """BLOCKED path (N<3): no DB write, still must not expose gauge_value."""
+        with patch("servers.robot.main.db", _make_db_mock()):
+            data = await call_tool(
+                mcp,
+                "commit_reading",
+                {
+                    "asset_id": "Chiller 6",
+                    "readings": [74.0, 76.0],   # only 2 → BLOCKED
+                    "decision": "close_normal",
+                },
+            )
+        assert _no_gauge_value(data), f"gauge_value leaked in commit_reading (blocked): {data}"
+        assert data.get("status") == "BLOCKED"
+
+    @pytest.mark.anyio
+    async def test_commit_reading_commit_response_no_gauge_value(self):
+        """COMMIT path: response must not expose gauge_value."""
+        mock_db = _make_db_mock()
+        with patch("servers.robot.main.db", mock_db):
+            data = await call_tool(
+                mcp,
+                "commit_reading",
+                {
+                    "asset_id": "Chiller 6",
+                    "readings": [73.0, 75.0, 77.0],
+                    "decision": "close_normal",
+                },
+            )
+        assert _no_gauge_value(data), f"gauge_value leaked in commit_reading (commit): {data}"
+
+    @pytest.mark.anyio
+    async def test_commit_doc_written_has_no_gauge_value(self):
+        """When commit occurs, the doc written to CouchDB must not have gauge_value."""
+        mock_db = _make_db_mock()
+        saved_docs = []
+        mock_db.save.side_effect = lambda doc: (
+            saved_docs.append(doc) or {"ok": True, "id": doc["_id"], "rev": "1-x"}
+        )
+
+        with patch("servers.robot.main.db", mock_db):
+            await call_tool(
+                mcp,
+                "commit_reading",
+                {
+                    "asset_id": "Chiller 6",
+                    "readings": [73.0, 75.0, 77.0],
+                    "decision": "close_normal",
+                },
+            )
+
+        # If the verifier scored high enough to COMMIT, saved_docs will have one entry
+        for doc in saved_docs:
+            assert "gauge_value" not in doc, (
+                f"gauge_value found in committed CouchDB doc: {doc}"
+            )
+
+    @pytest.mark.anyio
+    async def test_check_wo_similarity_no_gauge_value(self):
+        wo_doc = {
+            "wonum": "1000045",
+            "description": "Inspect chiller pressure",
+            "assetnum": "CHILLER6",
+            "status": "COMP",
+            "reportdate": "2024-01-15",
+        }
+        mock_wo = MagicMock()
+        mock_wo.find.return_value = {"docs": [wo_doc]}
+        with patch("servers.robot.main._get_wo_db", return_value=mock_wo):
+            with patch("servers.robot.main.db", _make_db_mock()):
+                data = await call_tool(
+                    mcp,
+                    "check_wo_similarity",
+                    {
+                        "asset_id": "Chiller 6",
+                        "failure_description": "chiller pressure anomaly",
+                    },
+                )
+        assert _no_gauge_value(data), f"gauge_value leaked in check_wo_similarity: {data}"
+
+    @pytest.mark.anyio
+    async def test_detect_anomaly_no_gauge_value(self):
+        with patch("servers.robot.main.db", _make_db_mock()):
+            data = await call_tool(mcp, "detect_anomaly", {"asset_id": "Chiller 6"})
+        assert _no_gauge_value(data), f"gauge_value leaked in detect_anomaly: {data}"
diff --git a/src/servers/robot/tests/test_robot_tools.py b/src/servers/robot/tests/test_robot_tools.py
new file mode 100644
index 000000000..2f6fc2cfc
--- /dev/null
+++ b/src/servers/robot/tests/test_robot_tools.py
@@ -0,0 +1,471 @@
+"""Integration and unit tests for all 8 Robot MCP server tools.
+
+Tests marked @requires_couchdb are skipped when CouchDB is unreachable.
+All other tests use mocked DB via conftest fixtures.
+"""
+
+import pytest
+from unittest.mock import MagicMock, patch
+
+from servers.robot.main import mcp
+from .conftest import call_tool, requires_couchdb
+
+
+# Shared mock profile document
+_PROFILE = {
+    "_id": "profile:chiller_6",
+    "_rev": "1-abc",
+    "physical_location": {"x": 10.0, "y": 5.0, "z": 0.0, "room_id": "B1"},
+    "gauge_range": [0.0, 100.0],
+    "gauge_value": 75.0,
+    "panel_stuck_prob": 0.05,
+    "human_present": False,
+    "maintenance_slot": "day",
+    "active_work_order": None,
+    "inspection_frequency_days": 7,
+    "last_inspection": "2024-06-01",
+    "sensor_type": "pressure",
+}
+
+_PROFILE_HUMAN = {**_PROFILE, "human_present": True}
+_PROFILE_STUCK = {**_PROFILE, "panel_stuck_prob": 1.0}  # always stuck
+_PROFILE_FREE  = {**_PROFILE, "panel_stuck_prob": 0.0}  # never stuck
+
+_IOT_DOC = {
+    "asset_id": "Chiller 6",
+    "timestamp": "2024-06-01T00:00:00",
+    "Chiller 6 Pressure": 75.0,
+}
+
+
+def _db_for(profile):
+    mock = MagicMock()
+    mock.get.side_effect = lambda doc_id: profile if "profile:" in doc_id else None
+    mock.find.return_value = {"docs": [_IOT_DOC]}
+    mock.save.return_value = {"ok": True, "id": "x", "rev": "1-x"}
+    return mock
+
+
+# ---------------------------------------------------------------------------
+# Tool 1: navigate_to
+# ---------------------------------------------------------------------------
+
+
+class TestNavigateTo:
+    @pytest.mark.anyio
+    async def test_returns_success_for_known_asset(self):
+        with patch("servers.robot.main.db", _db_for(_PROFILE)):
+            data = await call_tool(mcp, "navigate_to", {"asset_id": "Chiller 6"})
+        assert data["success"] is True
+        assert data["distance_m"] > 0
+        assert data["steps_taken"] >= 1
+
+    @pytest.mark.anyio
+    async def test_blocked_when_no_location(self):
+        profile_no_loc = {k: v for k, v in _PROFILE.items() if k != "physical_location"}
+        with patch("servers.robot.main.db", _db_for(profile_no_loc)):
+            data = await call_tool(mcp, "navigate_to", {"asset_id": "Chiller 6"})
+        assert data["success"] is False
+        assert data["blocked_reason"] is not None
+
+    @pytest.mark.anyio
+    async def test_error_when_db_none(self, no_db):
+        data = await call_tool(mcp, "navigate_to", {"asset_id": "Chiller 6"})
+        assert "error" in data
+
+    @pytest.mark.anyio
+    async def test_error_when_profile_not_found(self):
+        mock = MagicMock()
+        mock.get.return_value = None
+        with patch("servers.robot.main.db", mock):
+            data = await call_tool(mcp, "navigate_to", {"asset_id": "Unknown Asset"})
+        assert "error" in data
+
+    @requires_couchdb
+    @pytest.mark.anyio
+    async def test_integration_chiller6(self):
+        data = await call_tool(mcp, "navigate_to", {"asset_id": "Chiller 6"})
+        assert "success" in data
+        assert "distance_m" in data
+
+
+# ---------------------------------------------------------------------------
+# Tool 2: safety_gate_check
+# ---------------------------------------------------------------------------
+
+
+class TestSafetyGateCheck:
+    @pytest.mark.anyio
+    async def test_clearance_true_when_no_human_no_wo(self):
+        with patch("servers.robot.main.db", _db_for(_PROFILE)):
+            data = await call_tool(mcp, "safety_gate_check", {"asset_id": "Chiller 6"})
+        assert data["safety_clearance"] is True
+        assert data["human_present"] is False
+        assert data["active_work_order"] is None
+
+    @pytest.mark.anyio
+    async def test_clearance_false_when_human_present(self):
+        with patch("servers.robot.main.db", _db_for(_PROFILE_HUMAN)):
+            data = await call_tool(mcp, "safety_gate_check", {"asset_id": "Chiller 6"})
+        assert data["safety_clearance"] is False
+        assert data["human_present"] is True
+
+    @pytest.mark.anyio
+    async def test_missing_slot_defaults_to_day(self):
+        profile_no_slot = {k: v for k, v in _PROFILE.items() if k != "maintenance_slot"}
+        with patch("servers.robot.main.db", _db_for(profile_no_slot)):
+            data = await call_tool(mcp, "safety_gate_check", {"asset_id": "Chiller 6"})
+        assert data["slot"] == "day"
+
+    @pytest.mark.anyio
+    async def test_missing_active_wo_defaults_to_none(self):
+        profile_no_wo = {k: v for k, v in _PROFILE.items() if k != "active_work_order"}
+        with patch("servers.robot.main.db", _db_for(profile_no_wo)):
+            data = await call_tool(mcp, "safety_gate_check", {"asset_id": "Chiller 6"})
+        assert data["active_work_order"] is None
+
+    @pytest.mark.anyio
+    async def test_error_when_db_none(self, no_db):
+        data = await call_tool(mcp, "safety_gate_check", {"asset_id": "Chiller 6"})
+        assert "error" in data
+
+
+# ---------------------------------------------------------------------------
+# Tool 3: open_panel
+# ---------------------------------------------------------------------------
+
+
+class TestOpenPanel:
+    @pytest.mark.anyio
+    async def test_panel_opens_with_zero_stuck_prob(self):
+        with patch("servers.robot.main.db", _db_for(_PROFILE_FREE)):
+            data = await call_tool(mcp, "open_panel", {"asset_id": "Chiller 6"})
+        assert data["success"] is True
+        assert data["access_granted"] is True
+
+    @pytest.mark.anyio
+    async def test_panel_stuck_with_certain_prob(self):
+        with patch("servers.robot.main.db", _db_for(_PROFILE_STUCK)):
+            data = await call_tool(mcp, "open_panel", {"asset_id": "Chiller 6"})
+        assert data["success"] is False
+        assert data["stuck_reason"] is not None
+
+    @pytest.mark.anyio
+    async def test_rng_deterministic_after_reset(self):
+        with patch("servers.robot.main.db", _db_for(_PROFILE)):
+            result1 = await call_tool(mcp, "open_panel", {"asset_id": "Chiller 6"})
+
+        import random
+        import servers.robot.main as robot_main
+        robot_main._simulator._rng = random.Random(42)
+
+        with patch("servers.robot.main.db", _db_for(_PROFILE)):
+            result2 = await call_tool(mcp, "open_panel", {"asset_id": "Chiller 6"})
+
+        assert result1["success"] == result2["success"]
+        assert result1["access_granted"] == result2["access_granted"]
+
+    @pytest.mark.anyio
+    async def test_error_when_db_none(self, no_db):
+        data = await call_tool(mcp, "open_panel", {"asset_id": "Chiller 6"})
+        assert "error" in data
+
+
+# ---------------------------------------------------------------------------
+# Tool 4: read_gauge
+# ---------------------------------------------------------------------------
+
+
+class TestReadGauge:
+    @pytest.mark.anyio
+    async def test_reading_within_range(self):
+        import servers.robot.main as robot_main
+        robot_main._simulator.generate_scenario("chiller_6", [0.0, 100.0], "normal")
+        with patch("servers.robot.main.db", _db_for(_PROFILE)):
+            data = await call_tool(
+                mcp, "read_gauge", {"asset_id": "Chiller 6", "attempt_n": 1}
+            )
+        assert 0.0 <= data["reading"] <= 100.0
+        assert 0.0 <= data["confidence"] <= 1.0
+
+    @pytest.mark.anyio
+    async def test_no_gauge_value_in_response(self):
+        import servers.robot.main as robot_main
+        robot_main._simulator.generate_scenario("chiller_6", [0.0, 100.0], "normal")
+        with patch("servers.robot.main.db", _db_for(_PROFILE)):
+            data = await call_tool(
+                mcp, "read_gauge", {"asset_id": "Chiller 6", "attempt_n": 1}
+            )
+        assert "gauge_value" not in data
+
+    @pytest.mark.anyio
+    async def test_attempt_n_reflected_in_response(self):
+        with patch("servers.robot.main.db", _db_for(_PROFILE)):
+            data = await call_tool(
+                mcp, "read_gauge", {"asset_id": "Chiller 6", "attempt_n": 3}
+            )
+        assert data["attempt_n"] == 3
+
+    @pytest.mark.anyio
+    async def test_gauge_range_present(self):
+        with patch("servers.robot.main.db", _db_for(_PROFILE)):
+            data = await call_tool(
+                mcp, "read_gauge", {"asset_id": "Chiller 6", "attempt_n": 1}
+            )
+        assert "gauge_range" in data
+
+    @pytest.mark.anyio
+    async def test_error_when_db_none(self, no_db):
+        data = await call_tool(
+            mcp, "read_gauge", {"asset_id": "Chiller 6", "attempt_n": 1}
+        )
+        assert "error" in data
+
+
+# ---------------------------------------------------------------------------
+# Tool 5: check_human_presence
+# ---------------------------------------------------------------------------
+
+
+class TestCheckHumanPresence:
+    @pytest.mark.anyio
+    async def test_no_human(self):
+        with patch("servers.robot.main.db", _db_for(_PROFILE)):
+            data = await call_tool(
+                mcp, "check_human_presence", {"asset_id": "Chiller 6"}
+            )
+        assert data["human_present"] is False
+
+    @pytest.mark.anyio
+    async def test_human_present(self):
+        with patch("servers.robot.main.db", _db_for(_PROFILE_HUMAN)):
+            data = await call_tool(
+                mcp, "check_human_presence", {"asset_id": "Chiller 6"}
+            )
+        assert data["human_present"] is True
+
+    @pytest.mark.anyio
+    async def test_slot_default(self):
+        profile_no_slot = {k: v for k, v in _PROFILE.items() if k != "maintenance_slot"}
+        with patch("servers.robot.main.db", _db_for(profile_no_slot)):
+            data = await call_tool(
+                mcp, "check_human_presence", {"asset_id": "Chiller 6"}
+            )
+        assert data["slot"] == "day"
+
+    @pytest.mark.anyio
+    async def test_error_when_db_none(self, no_db):
+        data = await call_tool(
+            mcp, "check_human_presence", {"asset_id": "Chiller 6"}
+        )
+        assert "error" in data
+
+
+# ---------------------------------------------------------------------------
+# Tool 6: commit_reading
+# ---------------------------------------------------------------------------
+
+
+class TestCommitReading:
+    @pytest.mark.anyio
+    async def test_blocked_when_n_lt_3(self):
+        with patch("servers.robot.main.db", _db_for(_PROFILE)):
+            data = await call_tool(
+                mcp,
+                "commit_reading",
+                {
+                    "asset_id": "Chiller 6",
+                    "readings": [74.0, 76.0],
+                    "decision": "close_normal",
+                },
+            )
+        assert data["status"] == "BLOCKED"
+        assert data["fm_flag"] == "FM-7b"
+
+    @pytest.mark.anyio
+    async def test_status_field_present(self):
+        with patch("servers.robot.main.db", _db_for(_PROFILE)):
+            data = await call_tool(
+                mcp,
+                "commit_reading",
+                {
+                    "asset_id": "Chiller 6",
+                    "readings": [73.0, 75.0, 77.0],
+                    "decision": "close_normal",
+                },
+            )
+        assert data["status"] in {"COMMIT", "BLOCKED", "ESCALATE", "OOD_FLAG", "PANEL_RECHECK"}
+
+    @pytest.mark.anyio
+    async def test_score_present(self):
+        with patch("servers.robot.main.db", _db_for(_PROFILE)):
+            data = await call_tool(
+                mcp,
+                "commit_reading",
+                {
+                    "asset_id": "Chiller 6",
+                    "readings": [73.0, 75.0, 77.0],
+                    "decision": "close_normal",
+                },
+            )
+        assert "score" in data
+        assert isinstance(data["score"], float)
+
+    @pytest.mark.anyio
+    async def test_error_when_db_none(self, no_db):
+        data = await call_tool(
+            mcp,
+            "commit_reading",
+            {
+                "asset_id": "Chiller 6",
+                "readings": [73.0, 75.0, 77.0],
+                "decision": "close_normal",
+            },
+        )
+        assert "error" in data
+
+    @requires_couchdb
+    @pytest.mark.anyio
+    async def test_integration_commit_or_escalate(self):
+        data = await call_tool(
+            mcp,
+            "commit_reading",
+            {
+                "asset_id": "Chiller 6",
+                "readings": [49.5, 50.0, 50.5],
+                "decision": "close_normal",
+            },
+        )
+        assert data["status"] in {"COMMIT", "ESCALATE", "OOD_FLAG", "PANEL_RECHECK"}
+
+
+# ---------------------------------------------------------------------------
+# Tool 7: check_wo_similarity
+# ---------------------------------------------------------------------------
+
+
+class TestCheckWoSimilarity:
+    def _wo_mock(self, docs):
+        mock = MagicMock()
+        mock.find.return_value = {"docs": docs}
+        return mock
+
+    @pytest.mark.anyio
+    async def test_error_when_wo_db_none(self, no_wo_db):
+        with patch("servers.robot.main.db", _db_for(_PROFILE)):
+            data = await call_tool(
+                mcp,
+                "check_wo_similarity",
+                {
+                    "asset_id": "Chiller 6",
+                    "failure_description": "water leak near chiller",
+                },
+            )
+        assert "error" in data
+
+    @pytest.mark.anyio
+    async def test_proceed_when_no_similar_wos(self):
+        wo_doc = {
+            "wonum": "1000045",
+            "description": "completely unrelated electrical work",
+            "assetnum": "CHILLER6",
+            "status": "COMP",
+        }
+        with patch("servers.robot.main._get_wo_db", return_value=self._wo_mock([wo_doc])):
+            with patch("servers.robot.main.db", _db_for(_PROFILE)):
+                data = await call_tool(
+                    mcp,
+                    "check_wo_similarity",
+                    {
+                        "asset_id": "Chiller 6",
+                        "failure_description": "water leak near chiller",
+                    },
+                )
+        assert data["recommendation"] in {"proceed", "review", "consolidate"}
+        assert "similar_wos" in data
+        assert "scores" in data
+
+    @pytest.mark.anyio
+    async def test_consolidate_for_identical_description(self):
+        wo_doc = {
+            "wonum": "1000046",
+            "description": "water leak near chiller unit",
+            "assetnum": "CHILLER6",
+            "status": "WAPPR",
+        }
+        with patch("servers.robot.main._get_wo_db", return_value=self._wo_mock([wo_doc])):
+            with patch("servers.robot.main.db", _db_for(_PROFILE)):
+                data = await call_tool(
+                    mcp,
+                    "check_wo_similarity",
+                    {
+                        "asset_id": "Chiller 6",
+                        "failure_description": "water leak near chiller unit",
+                    },
+                )
+        assert data["recommendation"] == "consolidate"
+        assert data["duplicate_risk"] is True
+
+    @requires_couchdb
+    @pytest.mark.anyio
+    async def test_integration_wo_similarity(self):
+        data = await call_tool(
+            mcp,
+            "check_wo_similarity",
+            {
+                "asset_id": "Chiller 6",
+                "failure_description": "anomaly on chiller condenser",
+            },
+        )
+        assert "recommendation" in data
+        assert data["recommendation"] in {"proceed", "review", "consolidate"}
+
+
+# ---------------------------------------------------------------------------
+# Tool 8: detect_anomaly
+# ---------------------------------------------------------------------------
+
+
+class TestDetectAnomaly:
+    @pytest.mark.anyio
+    async def test_returns_all_expected_fields(self):
+        with patch("servers.robot.main.db", _db_for(_PROFILE)):
+            data = await call_tool(mcp, "detect_anomaly", {"asset_id": "Chiller 6"})
+        for field in (
+            "spill_detected",
+            "leakage_detected",
+            "pipe_damage_detected",
+            "pooled_liquid_detected",
+            "anomaly_confidence",
+        ):
+            assert field in data, f"Missing field '{field}' in detect_anomaly response"
+
+    @pytest.mark.anyio
+    async def test_spill_scenario_detected(self):
+        import servers.robot.main as robot_main
+        robot_main._simulator.generate_scenario("chiller_6", [0.0, 100.0], "spill")
+        with patch("servers.robot.main.db", _db_for(_PROFILE)):
+            data = await call_tool(mcp, "detect_anomaly", {"asset_id": "Chiller 6"})
+        assert data["spill_detected"] is True
+        assert data["leakage_detected"] is True
+
+    @pytest.mark.anyio
+    async def test_normal_scenario_no_spill(self):
+        import servers.robot.main as robot_main
+        robot_main._simulator.generate_scenario("chiller_6", [0.0, 100.0], "normal")
+        with patch("servers.robot.main.db", _db_for(_PROFILE)):
+            data = await call_tool(mcp, "detect_anomaly", {"asset_id": "Chiller 6"})
+        assert data["spill_detected"] is False
+        assert data["leakage_detected"] is False
+
+    @pytest.mark.anyio
+    async def test_error_when_db_none(self, no_db):
+        data = await call_tool(mcp, "detect_anomaly", {"asset_id": "Chiller 6"})
+        assert "error" in data
+
+    @requires_couchdb
+    @pytest.mark.anyio
+    async def test_integration_anomaly_fields(self):
+        data = await call_tool(mcp, "detect_anomaly", {"asset_id": "Chiller 6"})
+        assert "spill_detected" in data
+        assert isinstance(data["anomaly_confidence"], float)
diff --git a/src/servers/robot/tests/test_verifier.py b/src/servers/robot/tests/test_verifier.py
new file mode 100644
index 000000000..32437a1e4
--- /dev/null
+++ b/src/servers/robot/tests/test_verifier.py
@@ -0,0 +1,135 @@
+"""Unit tests for MultiReadingVerifier — no CouchDB required."""
+
+import pytest
+from servers.robot.verifier import MultiReadingVerifier, VerifierResult
+
+
+@pytest.fixture
+def verifier():
+    return MultiReadingVerifier()
+
+
+class TestBlockedGate:
+    def test_blocked_n_1(self, verifier):
+        result = verifier.verify(
+            readings=[50.0],
+            iot_value=50.0,
+            gauge_range=[0, 100],
+        )
+        assert result.status == "BLOCKED"
+        assert result.fm_flag == "FM-7b"
+        assert result.score == 0.0
+
+    def test_blocked_n_2(self, verifier):
+        result = verifier.verify(
+            readings=[48.0, 52.0],
+            iot_value=50.0,
+            gauge_range=[0, 100],
+        )
+        assert result.status == "BLOCKED"
+        assert result.fm_flag == "FM-7b"
+
+    def test_fm7b_flag_in_blocked(self, verifier):
+        result = verifier.verify(readings=[], iot_value=0.0, gauge_range=[0, 100])
+        assert result.fm_flag == "FM-7b"
+        # insufficient readings flag appears in fm_annotations
+        assert any("FM-7b" in ann for ann in result.fm_annotations)
+
+
+class TestFreezeGate:
+    def test_zero_variance_triggers_panel_recheck(self, verifier):
+        # Three identical readings → std=0.0 → PANEL_RECHECK
+        result = verifier.verify(
+            readings=[50.0, 50.0, 50.0],
+            iot_value=50.0,
+            gauge_range=[0, 100],
+        )
+        assert result.status == "PANEL_RECHECK"
+        assert result.fm_flag == "FM-1"
+
+    def test_tiny_variance_still_freezes(self, verifier):
+        # std = 0.0001 < 0.001 * 100 = 0.1 → PANEL_RECHECK
+        result = verifier.verify(
+            readings=[50.0, 50.0001, 50.0002],
+            iot_value=50.0,
+            gauge_range=[0, 100],
+        )
+        assert result.status == "PANEL_RECHECK"
+
+
+class TestCommit:
+    def test_commit_consistent_readings(self, verifier):
+        # Tight cluster near IoT value → high C, high A → COMMIT
+        result = verifier.verify(
+            readings=[49.5, 50.0, 50.5],
+            iot_value=50.0,
+            gauge_range=[0, 100],
+        )
+        assert result.status == "COMMIT"
+        assert result.score >= 0.82
+
+    def test_historical_signal_neutral_when_absent(self, verifier):
+        result = verifier.verify(
+            readings=[49.5, 50.0, 50.5],
+            iot_value=50.0,
+            gauge_range=[0, 100],
+            historical_baseline=None,
+        )
+        assert result.H == 0.5
+        assert result.status == "COMMIT"
+
+
+class TestEscalateAndOOD:
+    def test_escalate_moderate_contradiction(self, verifier):
+        # Mean reading 80, IoT says 20 — large gap → low A
+        result = verifier.verify(
+            readings=[78.0, 80.0, 82.0],
+            iot_value=20.0,
+            gauge_range=[0, 100],
+        )
+        # A = 1 - |80 - 20| / 100 = 0.40 → score roughly 0.35*C + 0.35*0.40 + 0.30*H
+        assert result.status in {"ESCALATE", "OOD_FLAG"}
+
+    def test_ood_very_low_score(self, verifier):
+        # Readings near top, IoT near bottom, historical near bottom
+        result = verifier.verify(
+            readings=[88.0, 90.0, 92.0],
+            iot_value=5.0,
+            gauge_range=[0, 100],
+            historical_baseline=5.0,
+        )
+        # A = 1 - |90-5|/100 = 0.15; H = 1 - |90-5|/100 = 0.15 → score ≈ 0.35*C + 0.35*0.15 + 0.30*0.15
+        assert result.status == "OOD_FLAG"
+
+
+class TestFMAnnotations:
+    def test_fm7_annotation_when_a_lt_015(self, verifier):
+        # A = 1 - |90 - 3| / 100 = 0.13 < 0.15 → sensor-physical contradiction annotation fires
+        result = verifier.verify(
+            readings=[88.0, 90.0, 92.0],
+            iot_value=3.0,
+            gauge_range=[0, 100],
+        )
+        assert any("FM-7" in ann for ann in result.fm_annotations)
+
+    def test_fm7c_annotation_when_h_lt_015(self, verifier):
+        # H = 1 - |90 - 3| / 100 = 0.13 < 0.15 → historical outlier annotation fires; IoT agrees (A fine)
+        result = verifier.verify(
+            readings=[88.0, 90.0, 92.0],
+            iot_value=90.0,
+            gauge_range=[0, 100],
+            historical_baseline=3.0,
+        )
+        assert any("FM-7c" in ann for ann in result.fm_annotations)
+
+    def test_no_fm_annotations_for_clean_commit(self, verifier):
+        result = verifier.verify(
+            readings=[49.5, 50.0, 50.5],
+            iot_value=50.0,
+            gauge_range=[0, 100],
+            historical_baseline=50.0,
+        )
+        assert result.fm_annotations == []
+        assert result.status == "COMMIT"
+
+
diff --git a/src/servers/robot/verifier.py b/src/servers/robot/verifier.py
new file mode 100644
index 000000000..afe98a1e1
--- /dev/null
+++ b/src/servers/robot/verifier.py
@@ -0,0 +1,133 @@
+"""MultiReadingVerifier — CP-calibrated commit gate.
+
+Formula (updated from research analysis):
+    score = 0.35*C + 0.35*A + 0.30*H
+
+    C: multi-read consistency  = 1 - std(readings) / gauge_range_span
+    A: gauge-vs-IoT agreement  = 1 - |mean(readings) - iot_value| / span
+    H: historical consistency  = 1 - |mean(readings) - hist_baseline| / span
+       (H = 0.50 neutral when no history is available)
+
+Hard gates (applied before scoring):
+    N < 3                        → BLOCKED       (FM-7b)
+    std(readings) < 0.1% range   → PANEL_RECHECK (FM-1: sensor freeze)
+
+Thresholds (placeholder until field-visit calibration):
+    score ≥ 0.82  → COMMIT
+    score ≥ 0.65  → ESCALATE
+    else          → OOD_FLAG
+
+Note on Q (agent self-confidence):
+    Q was removed from the formula because LLM self-confidence is poorly
+    calibrated and creating a gaming surface. Q is recorded diagnostically
+    in commit documents but does not influence the gate.
+"""
+
+import statistics
+from dataclasses import dataclass, field
+from typing import Optional
+
+
+@dataclass
+class VerifierResult:
+    status: str          # COMMIT | BLOCKED | ESCALATE | OOD_FLAG | PANEL_RECHECK
+    score: float
+    C: float
+    A: float
+    H: float
+    fm_flag: Optional[str]
+    fm_annotations: list
+    reason: str
+
+
+class MultiReadingVerifier:
+    TAU_COMMIT = 0.82
+    TAU_ESCALATE = 0.65
+    FREEZE_EPSILON = 0.001   # std < 0.1% of range → sensor freeze
+
+    def verify(
+        self,
+        readings: list,
+        iot_value: float,
+        gauge_range: list,
+        historical_baseline: Optional[float] = None,
+    ) -> VerifierResult:
+        range_span = float(gauge_range[1]) - float(gauge_range[0])
+        if range_span <= 0:
+            range_span = 1.0
+
+        # Hard gate: insufficient readings
+        if len(readings) < 3:
+            return VerifierResult(
+                status="BLOCKED",
+                score=0.0,
+                C=0.0, A=0.0, H=0.5,
+                fm_flag="FM-7b",
+                fm_annotations=["FM-7b: fewer than 3 readings before commit"],
+                reason=(
+                    f"N={len(readings)} readings supplied; "
+                    "minimum 3 required before commit"
+                ),
+            )
+
+        # Hard gate: sensor freeze (zero variance → stuck gauge or panel)
+        std_val = statistics.stdev(readings) if len(readings) > 1 else 0.0
+        if std_val < self.FREEZE_EPSILON * range_span:
+            return VerifierResult(
+                status="PANEL_RECHECK",
+                score=0.0,
+                C=0.0, A=0.0, H=0.5,
+                fm_flag="FM-1",
+                fm_annotations=[
+                    "FM-1: sensor freeze — readings show no variance across attempts"
+                ],
+                reason="Zero variance across readings; panel may be stuck or gauge frozen",
+            )
+
+        mean_r = statistics.mean(readings)
+
+        C = max(0.0, 1.0 - std_val / range_span)
+        A = max(0.0, 1.0 - abs(mean_r - iot_value) / range_span)
+        H = (
+            max(0.0, 1.0 - abs(mean_r - historical_baseline) / range_span)
+            if historical_baseline is not None
+            else 0.5
+        )
+
+        score = round(0.35 * C + 0.35 * A + 0.30 * H, 4)
+
+        fm_annotations = []
+        if A < 0.15:
+            fm_annotations.append(
+                "FM-7: sensor-physical contradiction (reading vs IoT sensor)"
+            )
+        if historical_baseline is not None and H < 0.15:
+            fm_annotations.append(
+                "FM-7c: historical outlier (reading contradicts asset baseline)"
+            )
+
+        fm_flag = fm_annotations[0].split(":")[0] if fm_annotations else None
+
+        if score >= self.TAU_COMMIT:
+            status = "COMMIT"
+        elif score >= self.TAU_ESCALATE:
+            status = "ESCALATE"
+        else:
+            status = "OOD_FLAG"
+            if not fm_flag:
+                fm_flag = "FM-7"
+
+        reason = f"score={score:.3f} (C={C:.2f}, A={A:.2f}, H={H:.2f})"
+        if fm_annotations:
+            reason += "; " + "; ".join(fm_annotations)
+
+        return VerifierResult(
+            status=status,
+            score=score,
+            C=round(C, 4),
+            A=round(A, 4),
+            H=round(H, 4),
+            fm_flag=fm_flag,
+            fm_annotations=fm_annotations,
+            reason=reason,
+        )

From a4e41071427ec1031d241075ab0087afccbec0b3 Mon Sep 17 00:00:00 2001
From: AnandMayank <anandmayank698@gmail.com>
Date: Sat, 27 Jun 2026 14:00:23 +0000
Subject: [PATCH 2/2] feat(robot-mcp): update Layer 1 robot tools

Signed-off-by: AnandMayank <anandmayank698@gmail.com>
---
 src/couchdb/schema_robot_fields.json          |  203 ++--
 src/couchdb/seed_robot_profiles.py            |  405 ++++---
 src/servers/iot/tests/test_robot_profiles.py  |  216 ----
 src/servers/robot/main.py                     | 1074 +++++++++--------
 src/servers/robot/simulator.py                |  195 ---
 src/servers/robot/tests/conftest.py           |  194 ++-
 .../tests/test_gauge_value_protection.py      |  187 ---
 src/servers/robot/tests/test_robot_tools.py   |  992 ++++++++-------
 src/servers/robot/tests/test_verifier.py      |  135 ---
 src/servers/robot/verifier.py                 |  133 --
 10 files changed, 1693 insertions(+), 2041 deletions(-)
 delete mode 100644 src/servers/iot/tests/test_robot_profiles.py
 delete mode 100644 src/servers/robot/simulator.py
 delete mode 100644 src/servers/robot/tests/test_gauge_value_protection.py
 delete mode 100644 src/servers/robot/tests/test_verifier.py
 delete mode 100644 src/servers/robot/verifier.py

diff --git a/src/couchdb/schema_robot_fields.json b/src/couchdb/schema_robot_fields.json
index 7b016bf88..0ebc3be9a 100644
--- a/src/couchdb/schema_robot_fields.json
+++ b/src/couchdb/schema_robot_fields.json
@@ -1,84 +1,141 @@
 {
-  "doc_type": "asset_robot_profile",
-  "id_pattern": "profile:{normalized_asset_id}",
-  "description": "Per-asset profile documents for the robot inspection extension. Stored in the iot CouchDB database alongside timestamped sensor readings, but deliberately omit the asset_id field so existing IoT server queries are unaffected.",
-  "deferred_fields": "See SAFETY_FIELDS_FUTURE.md for hazard_class, maintenance_slot, active_work_order",
+  "_comment": "CouchDB document types for the robot inspection MCP server (12 Layer 1 tools). All documents live in the iot DB alongside timestamped IoT sensor readings. None contain an asset_id field, so existing IoT server queries ({asset_id: {$exists: true}}) are unaffected.",
 
-  "fields": {
-    "physical_location": {
-      "type": "object or null",
-      "schema": {"x": "float", "y": "float", "z": "float", "room_id": "string"},
-      "default": null,
-      "status": "active",
-      "purpose": "Robot navigation target for navigate_to() tool. Set from facility floor plan. Null until floor-plan data is loaded."
-    },
-    "gauge_value": {
-      "type": "float",
-      "default": 0.0,
-      "status": "active",
-      "CRITICAL": "NEVER return this field from any MCP tool to the agent",
-      "set_by": "PhysicalStateSimulator.generate_scenario()",
-      "read_by": "Evaluator.get_ground_truth() ONLY",
-      "purpose": "Ground truth physical gauge reading. Set at scenario generation time. Must never reach the agent — doing so invalidates the evaluation."
-    },
-    "gauge_range": {
-      "type": "array [float, float]",
-      "default": [0, 100],
-      "status": "active",
-      "purpose": "Min/max of the gauge scale face. Used in PA metric and tau_agreement threshold calculation."
-    },
-    "panel_stuck_prob": {
-      "type": "float 0-1",
-      "default": 0.12,
-      "status": "active",
-      "purpose": "Probability that the access panel fails to open. SME-calibrated at 0.12 for preprogrammed navigation; 0.24-0.40 for learned navigation routes."
-    },
-    "human_present": {
-      "type": "bool",
-      "default": false,
-      "status": "active",
-      "purpose": "Whether a technician is currently at this asset. If true, robot dispatch is skipped and an alarm is raised to the person already on-site. Updated by PhysicalStateSimulator per scenario."
-    },
-    "never_read": {
-      "type": "bool",
-      "default": false,
-      "status": "active",
-      "purpose": "True if no physical gauge reading exists in Maximo history for this asset. Enables the never-read-gauge scenario variant. SME confirmed some gauges have never been recorded."
-    },
-    "real_gauge_images": {
-      "type": "array of strings",
-      "default": [],
-      "status": "active",
-      "purpose": "File paths to real facility images of this asset's gauge collected during field visits. Used to train and calibrate the CosmosWorld perception layer."
+  "documents": {
+
+    "asset_robot_profile": {
+      "doc_type": "asset_robot_profile",
+      "_id_pattern": "profile:{normalized_asset_id}",
+      "_id_examples": ["profile:chiller_6", "profile:motor_01"],
+      "description": "Per-asset physical layout and panel state. Seeded by seed_robot_profiles.py. Scenario-specific state (e.g. panel_stuck=true for R001) is loaded by the eval harness via the shared robot JSON files.",
+      "fields": {
+        "physical_location": {
+          "type": "object or null",
+          "schema": {"x": "float (m)", "y": "float (m)", "z": "float (m)", "room_id": "string"},
+          "default": null,
+          "purpose": "Facility floor-plan coordinates used by navigate_to() as the GraphNav navigation target. Null until floor-plan data is collected for the asset."
+        },
+        "gauge_path": {
+          "type": "string or null",
+          "default": null,
+          "purpose": "File path or URL of the physical gauge image captured by capture_image(). Null until field data has been collected. When non-null and panel_stuck=false, the VLM perception agent can read the gauge value from this image."
+        },
+        "gauge_range": {
+          "type": "array [low, high]",
+          "default": [0, 100],
+          "purpose": "Physical measurement range of the gauge (e.g. [0, 400] for a 0–400 bar pressure gauge). Included in the vlm_hint string returned by capture_image() so the VLM agent knows the scale."
+        },
+        "gauge_description": {
+          "type": "string",
+          "default": "",
+          "purpose": "Plain English description of the gauge and its units (e.g. 'Compressor outlet pressure gauge, analog dial, 0–400 bar'). Included in the vlm_hint string returned by capture_image()."
+        },
+        "panel_stuck": {
+          "type": "bool",
+          "default": false,
+          "purpose": "True when the physical inspection panel cannot be opened by the robot arm. open_panel() returns access_granted=false and capture_image() returns occlusion_flag=true when panel_stuck=true. Represents a physical kinematic failure (panel seized, corroded, or obstructed) that requires human maintenance escalation."
+        }
+      }
     },
-    "reading_consistency": {
-      "type": "float or null",
-      "default": null,
-      "status": "active",
-      "purpose": "Empirical std(readings) / gauge_range computed from field collection data. Used to set tau_consistency threshold for this asset type. Null until field data arrives."
+
+    "robot_state": {
+      "doc_type": "robot_state",
+      "_id_pattern": "robot_state:{robot_id}",
+      "_id_example": "robot_state:spot_1",
+      "description": "Per-robot battery, pose, power and stance state. Robot-level, not asset-level. Seeded by seed_robot_profiles.py. power_state and stance_state added to support the 6 motion tools (power_on, power_off, stand, sit, dock, undock).",
+      "fields": {
+        "battery_charge_pct": {
+          "type": "float",
+          "range": [0.0, 100.0],
+          "default": 85.0,
+          "purpose": "Current battery charge percentage. get_battery() reads this. When battery_charge_pct < battery_low_threshold, get_battery() returns low_battery=true and the agent must abort the inspection and return to the charging dock immediately."
+        },
+        "battery_low_threshold": {
+          "type": "float",
+          "default": 20.0,
+          "purpose": "Threshold percentage below which the mission must be aborted. get_battery() computes low_battery = (battery_charge_pct < battery_low_threshold)."
+        },
+        "battery_estimated_runtime_s": {
+          "type": "float",
+          "default": 5400.0,
+          "purpose": "Estimated remaining runtime in seconds. Informational — included in the get_battery() message to help the agent judge whether the battery will last the inspection."
+        },
+        "at_charge_station": {
+          "type": "bool",
+          "default": false,
+          "purpose": "True if the robot is currently docked at a charging station. Included in the get_battery() response for context."
+        },
+        "pose": {
+          "type": "object",
+          "schema": {"x": "float (m)", "y": "float (m)", "theta": "float (rad, yaw from east)", "frame": "string — always 'map'"},
+          "default": {"x": 0.0, "y": 0.0, "theta": 0.0, "frame": "map"},
+          "purpose": "Current robot pose in the facility map frame. get_pose() reads this. The agent should call get_pose() after navigate_to() to confirm the robot arrived at the intended location."
+        },
+        "localization_ok": {
+          "type": "bool",
+          "default": true,
+          "purpose": "False when the robot cannot localise itself in the facility map (e.g. map data stale, fiducial missing, encoder drift too large). When false, get_pose() returns localization_ok=false and the agent must abort the inspection and raise a work order for robot remapping — taking a gauge reading from an unverified position risks reading the wrong asset."
+        },
+        "pose_drift_m": {
+          "type": "float",
+          "default": 0.0,
+          "purpose": "Estimated pose error in metres. get_pose() issues a warning when drift > 0.5 m. When localization_ok=false this field typically exceeds 0.5 m (e.g. 1.8 m in the localisation failure scenario)."
+        },
+        "fault_state": {
+          "type": "string or null",
+          "values": [null, "ESTOP_CUT", "COMMS_LOST", "JOINT_FAULT", "BATTERY_CRITICAL"],
+          "default": null,
+          "purpose": "Active robot fault, if any. Null means nominal. get_pose() surfaces this in the response. A non-null fault_state requires human intervention before the mission can continue."
+        },
+        "power_state": {
+          "type": "string",
+          "values": ["POWERED_ON", "POWERED_OFF"],
+          "default": "POWERED_ON",
+          "purpose": "Motor power state. power_on() and power_off() read this field. Maps to bosdyn.client.power.PowerClient.power_on_motors() / power_off_motors() in the real Spot SDK. The robot must be POWERED_ON before stand(), sit(), navigate_to(), or open_panel() can succeed."
+        },
+        "stance_state": {
+          "type": "string",
+          "values": ["STANDING", "SITTING"],
+          "default": "STANDING",
+          "purpose": "Robot stance. stand() and sit() read this field. Maps to bosdyn.client.robot_command.RobotCommandBuilder.synchro_stand_command() / synchro_sit_command(). The robot must be SITTING before power_off() is allowed. Call sit() before dock() at mission end."
+        }
+      }
     },
-    "sensor_physical_gap": {
-      "type": "float or null",
-      "default": null,
-      "status": "active",
-      "purpose": "Empirical |iot_value - gauge_value| / gauge_range from field collection. Calibrates tau_agreement for this asset. Null until field data arrives."
+
+    "waypoints": {
+      "doc_type": "waypoints",
+      "_id": "waypoints",
+      "description": "Singleton document mapping assets to Spot GraphNav waypoint IDs. list_waypoints() returns the waypoints array. The agent must call list_waypoints() before navigate_to() to confirm the target waypoint exists and is active.",
+      "fields": {
+        "waypoints": {
+          "type": "array of objects",
+          "item_schema": {
+            "waypoint_id": "string — Spot GraphNav waypoint UUID or short name",
+            "waypoint_name": "string — human-readable name shown in the Spot app",
+            "asset_id": "string or null — normalized asset ID this waypoint serves (null for the dock)",
+            "location_description": "string — plain English location for logging",
+            "x": "float (m)", "y": "float (m)",
+            "active": "bool — false if the waypoint has been deleted or the plant reconfigured since last mapping. When false, navigate_to() for that asset must not be called — the agent must escalate and raise a work order for waypoint remapping."
+          },
+          "purpose": "Authoritative list of inspection waypoints loaded from the Spot GraphNav map. list_waypoints() filters by asset_id when provided. A missing or inactive waypoint for the target asset represents a plant reconfiguration event that requires human re-mapping of the facility."
+        }
+      }
     }
+
   },
 
+  "isolation_guarantee": "No robot document contains an asset_id field. IoT server queries {asset_id: {$exists: true}} cannot match any robot document.",
+
   "indexes": [
     {
-      "name": "idx_robot_never_read",
-      "fields": ["doc_type", "never_read"],
-      "purpose": "Scenario generator lookup for never-read gauge cases"
+      "name": "idx_robot_state_by_robot",
+      "fields": ["doc_type", "robot_id"],
+      "purpose": "get_battery() and get_pose() lookup by robot_id"
+    },
+    {
+      "name": "idx_waypoints_singleton",
+      "fields": ["doc_type"],
+      "purpose": "list_waypoints() fetch of the singleton waypoints document"
     }
-  ],
-
-  "known_profiles": [
-    {"profile_id": "profile:chiller_6",       "display_name": "Chiller 6"},
-    {"profile_id": "profile:metro_pump_1",    "display_name": "Metro Pump 1"},
-    {"profile_id": "profile:hydraulic_pump_1","display_name": "Hydraulic Pump 1"},
-    {"profile_id": "profile:motor_01",        "display_name": "Motor 01"}
-  ],
-
-  "isolation_guarantee": "Profile documents have no asset_id field. The IoT server queries {asset_id: {$exists: true}} — these documents are invisible to all existing server queries, including get_asset_list() and get_sensor_list()."
+  ]
 }
diff --git a/src/couchdb/seed_robot_profiles.py b/src/couchdb/seed_robot_profiles.py
index 841a4a3a9..f0ec7bb76 100644
--- a/src/couchdb/seed_robot_profiles.py
+++ b/src/couchdb/seed_robot_profiles.py
@@ -1,26 +1,30 @@
-"""Seed robot asset profile documents into the iot CouchDB database.
+"""Seed robot documents into the iot CouchDB database.
 
-Creates one profile document per known asset containing robot-inspection fields
-(navigation, gauge truth, calibration, dispatch state).  These documents are
-deliberately stored WITHOUT an ``asset_id`` field so existing IoT server
+Creates three document types per robot deployment:
+
+  profile:{asset_id}      — per-asset physical layout and panel state (5 fields)
+  robot_state:{robot_id}  — per-robot battery and pose state
+  waypoints               — singleton inspection waypoint map
+
+All documents deliberately omit the ``asset_id`` field so existing IoT server
 queries (``{"asset_id": {"$exists": true}}``) are completely unaffected.
 
-Document shape:
-    _id        = "profile:{normalized_asset_id}"   e.g. "profile:chiller_6"
-    doc_type   = "asset_robot_profile"
-    display_name = "Chiller 6"                     original asset_id string
-    + 9 robot fields (see ROBOT_FIELD_DEFAULTS)
+Scenario-specific state (e.g. low battery, localisation failure) is loaded by the
+eval harness via init_data.py + the shared robot JSON files in
+AssetOpsBenchScenarioGeneration/RobotInspection/shared/robot/.
 
 Usage:
-    python src/couchdb/seed_robot_profiles.py             # apply
-    python src/couchdb/seed_robot_profiles.py --dry-run   # preview only
-    python src/couchdb/seed_robot_profiles.py --verify    # check DB state
+    python src/couchdb/seed_robot_profiles.py             # seed all (nominal state)
+    python src/couchdb/seed_robot_profiles.py --dry-run   # preview
+    python src/couchdb/seed_robot_profiles.py --verify    # check seeded state
+    python src/couchdb/seed_robot_profiles.py --reset     # restore nominal state
 """
 
 import argparse
 import json
 import os
 import sys
+from datetime import datetime, timezone
 
 import couchdb3
 import requests
@@ -28,72 +32,143 @@
 
 load_dotenv()
 
-# ---------------------------------------------------------------------------
-# Connection — identical pattern to src/servers/iot/main.py
-# ---------------------------------------------------------------------------
 COUCHDB_URL      = os.environ.get("COUCHDB_URL")
 COUCHDB_DBNAME   = os.environ.get("IOT_DBNAME")
 COUCHDB_USERNAME = os.environ.get("COUCHDB_USERNAME")
 COUCHDB_PASSWORD = os.environ.get("COUCHDB_PASSWORD")
+ROBOT_ID         = os.environ.get("ROBOT_ID", "spot_1")
 
 # ---------------------------------------------------------------------------
-# Robot field defaults (in-scope fields only)
-# gauge_value is stored here but MUST NEVER be returned by any MCP tool.
+# PART 1 — Asset profile documents (5 fields per asset)
 # ---------------------------------------------------------------------------
-ROBOT_FIELD_DEFAULTS: dict = {
-    "physical_location":   None,
-    "gauge_value":         0.0,    # ground truth — NEVER expose to agent via MCP
-    "gauge_range":         [0, 100],
-    "panel_stuck_prob":    0.12,
-    "human_present":       False,
-    "never_read":          False,
-    "real_gauge_images":   [],
-    "reading_consistency": None,
-    "sensor_physical_gap": None,
-}
 
-ROBOT_FIELDS = list(ROBOT_FIELD_DEFAULTS.keys())
+PROFILE_DEFAULTS: dict = {
+    "physical_location": None,   # navigate_to target; None until floor-plan loaded
+    "gauge_path":        None,   # capture_image returns this; None until field data collected
+    "gauge_range":       [0, 100],
+    "gauge_description": "",
+    "panel_stuck":       False,  # open_panel + capture_image occlusion
+}
+PROFILE_FIELDS = list(PROFILE_DEFAULTS.keys())
 
-# ---------------------------------------------------------------------------
-# Known assets — derived from sample_data/iot/*.json
-# physical_location values are placeholder coordinates until floor-plan data arrives.
-# ---------------------------------------------------------------------------
 ASSETS = [
     {
-        "display_name":    "Chiller 6",
-        "profile_id":      "profile:chiller_6",
+        "display_name":      "Chiller 6",
+        "profile_id":        "profile:chiller_6",
+        "waypoint_id":       "wp_chiller_6_panel",
         "physical_location": {"x": 52.3, "y": 18.1, "z": 0.0, "room_id": "cooling_3B"},
-        "gauge_range":     [0, 100],
+        "gauge_range":       [0, 400],
+        "gauge_description": "Compressor outlet pressure gauge, analog dial, 0–400 bar",
     },
     {
-        "display_name":    "Metro Pump 1",
-        "profile_id":      "profile:metro_pump_1",
+        "display_name":      "Metro Pump 1",
+        "profile_id":        "profile:metro_pump_1",
+        "waypoint_id":       "wp_metro_pump_1_panel",
         "physical_location": {"x": 14.0, "y": 32.5, "z": 0.0, "room_id": "pump_room_A"},
-        "gauge_range":     [0, 200],
+        "gauge_range":       [0.0, 1.5],
+        "gauge_description": "Flow rate gauge, analog dial, 0–1.5 m³/s",
     },
     {
-        "display_name":    "Hydraulic Pump 1",
-        "profile_id":      "profile:hydraulic_pump_1",
+        "display_name":      "Hydraulic Pump 1",
+        "profile_id":        "profile:hydraulic_pump_1",
+        "waypoint_id":       "wp_hydraulic_pump_1_panel",
         "physical_location": {"x": 28.7, "y": 11.0, "z": 0.0, "room_id": "pump_room_B"},
-        "gauge_range":     [0, 350],
+        "gauge_range":       [0, 350],
+        "gauge_description": "Hydraulic pressure gauge, analog dial, 0–350 bar",
     },
     {
-        "display_name":    "Motor 01",
-        "profile_id":      "profile:motor_01",
+        "display_name":      "Motor 01",
+        "profile_id":        "profile:motor_01",
+        "waypoint_id":       "wp_motor_01_panel",
         "physical_location": {"x": 7.2, "y": 44.8, "z": 0.0, "room_id": "motor_bay_1"},
-        "gauge_range":     [0, 60],
+        "gauge_range":       [0, 200],
+        "gauge_description": "Motor temperature gauge, analog dial, 0–200°C",
     },
 ]
 
 # ---------------------------------------------------------------------------
-# Indexes for Robot MCP tool query performance
+# PART 2 — Robot state document
 # ---------------------------------------------------------------------------
-ROBOT_INDEXES = [
-    {
-        "name":   "idx_robot_never_read",
-        "fields": ["doc_type", "never_read"],
-        "reason": "scenario generator: never-read gauge cases",
-    },
+
+def _nominal_robot_state() -> dict:
+    return {
+        "_id":                         f"robot_state:{ROBOT_ID}",
+        "doc_type":                    "robot_state",
+        "robot_id":                    ROBOT_ID,
+        "battery_charge_pct":          85.0,
+        "battery_low_threshold":       20.0,
+        "battery_estimated_runtime_s": 5400.0,
+        "at_charge_station":           False,
+        "pose": {"x": 0.0, "y": 0.0, "theta": 0.0, "frame": "map"},
+        "localization_ok":             True,
+        "pose_drift_m":                0.0,
+        "fault_state":                 None,
+        "last_updated":                datetime.now(timezone.utc).isoformat(),
+    }
+
+ROBOT_STATE_FIELDS = [
+    "battery_charge_pct", "battery_low_threshold", "battery_estimated_runtime_s",
+    "at_charge_station", "pose", "localization_ok", "pose_drift_m", "fault_state",
+]
+
+# ---------------------------------------------------------------------------
+# PART 3 — Waypoints singleton document
+# ---------------------------------------------------------------------------
+
+NOMINAL_WAYPOINTS: dict = {
+    "_id":      "waypoints",
+    "doc_type": "waypoints",
+    "waypoints": [
+        {
+            "waypoint_id":          "wp_chiller_6_panel",
+            "waypoint_name":        "Chiller 6 — Panel C-06",
+            "asset_id":             "chiller_6",
+            "location_description": "Plant B / Mechanical Room 2 / Panel C-06",
+            "x": 52.3, "y": 18.1,
+            "active": True,
+        },
+        {
+            "waypoint_id":          "wp_metro_pump_1_panel",
+            "waypoint_name":        "Metro Pump 1 — Panel MP-01",
+            "asset_id":             "metro_pump_1",
+            "location_description": "Plant D / Pump Hall / Panel MP-01",
+            "x": 14.0, "y": 32.5,
+            "active": True,
+        },
+        {
+            "waypoint_id":          "wp_hydraulic_pump_1_panel",
+            "waypoint_name":        "Hydraulic Pump 1 — Panel HP-01",
+            "asset_id":             "hydraulic_pump_1",
+            "location_description": "Plant C / Hydraulic Room / Panel HP-01",
+            "x": 28.7, "y": 11.0,
+            "active": True,
+        },
+        {
+            "waypoint_id":          "wp_motor_01_panel",
+            "waypoint_name":        "Motor 01 — Panel M-01",
+            "asset_id":             "motor_01",
+            "location_description": "Plant A / Drive Bay 1 / Panel M-01",
+            "x": 7.2, "y": 44.8,
+            "active": True,
+        },
+        {
+            "waypoint_id":          "wp_dock_main",
+            "waypoint_name":        "Main Charging Dock",
+            "asset_id":             None,
+            "location_description": "Building A / Charging Bay 1",
+            "x": 0.0, "y": 0.0,
+            "active": True,
+        },
+    ],
+}
+
+# ---------------------------------------------------------------------------
+# CouchDB helpers
+# ---------------------------------------------------------------------------
+
+ALL_INDEXES = [
+    {"name": "idx_robot_state_by_robot", "fields": ["doc_type", "robot_id"]},
+    {"name": "idx_waypoints_singleton",  "fields": ["doc_type"]},
 ]
 
 
@@ -108,133 +183,185 @@ def _connect() -> couchdb3.Database:
     )
 
 
-def _build_doc(asset: dict) -> dict:
-    doc = {
-        "_id":          asset["profile_id"],
-        "doc_type":     "asset_robot_profile",
-        "display_name": asset["display_name"],
-    }
-    doc.update(ROBOT_FIELD_DEFAULTS)
-    # Per-asset overrides
-    doc["physical_location"] = asset["physical_location"]
-    doc["gauge_range"]        = asset["gauge_range"]
-    return doc
+def _upsert(db, new_doc: dict, doc_id: str, required_fields: list, dry_run: bool) -> str:
+    try:
+        existing = db.get(doc_id)
+    except Exception:
+        existing = None
+    if existing is None:
+        action, final_doc = "CREATE", new_doc
+    else:
+        patched   = False
+        final_doc = dict(existing)
+        for field in required_fields:
+            if field not in final_doc:
+                final_doc[field] = new_doc.get(field)
+                patched = True
+        action = "PATCH" if patched else "SKIP"
+    if not dry_run and action != "SKIP":
+        db.save(final_doc)
+    return action
+
+
+def _ensure_indexes(db_name: str) -> None:
+    auth = (COUCHDB_USERNAME, COUCHDB_PASSWORD)
+    base = (COUCHDB_URL or "").rstrip("/")
+    print("\nCreating indexes...")
+    for idx in ALL_INDEXES:
+        url     = f"{base}/{db_name}/_index"
+        payload = {"index": {"fields": idx["fields"]}, "name": idx["name"], "type": "json"}
+        try:
+            resp = requests.post(url, json=payload, auth=auth, timeout=10)
+            resp.raise_for_status()
+            result = resp.json().get("result", "ok")
+            print(f"  [{result.upper()}] {idx['name']}")
+        except Exception as e:
+            print(f"  [WARN] {idx['name']}: {e}")
 
 
-def run(dry_run: bool = False) -> None:
-    """Upsert all robot profile documents and create indexes."""
-    db = _connect()
+# ---------------------------------------------------------------------------
+# Main operations
+# ---------------------------------------------------------------------------
 
-    print(f"{'[DRY RUN] ' if dry_run else ''}Seeding robot profiles into '{COUCHDB_DBNAME}'...\n")
+def run(dry_run: bool = False) -> None:
+    db   = _connect()
+    label = "[DRY RUN] " if dry_run else ""
+    print(f"{label}Seeding robot documents into '{COUCHDB_DBNAME}'...\n")
 
+    print("── Asset profiles ──")
     for asset in ASSETS:
-        doc_id = asset["profile_id"]
-        new_doc = _build_doc(asset)
+        doc_id  = asset["profile_id"]
+        new_doc = {
+            "_id": doc_id, "doc_type": "asset_robot_profile",
+            "display_name": asset["display_name"],
+            "waypoint_id":  asset["waypoint_id"],
+            **PROFILE_DEFAULTS,
+            "physical_location": asset["physical_location"],
+            "gauge_range":       asset["gauge_range"],
+            "gauge_description": asset["gauge_description"],
+        }
+        action = _upsert(db, new_doc, doc_id, PROFILE_FIELDS, dry_run)
+        print(f"  [{action}] {doc_id}")
+        if dry_run and action != "SKIP":
+            print(f"           {json.dumps({k: v for k, v in new_doc.items() if k not in ('_id', '_rev')}, indent=10)}\n")
 
-        try:
-            existing = db.get(doc_id)
-        except Exception:
-            existing = None
+    print("\n── Robot state ──")
+    state_doc = _nominal_robot_state()
+    action    = _upsert(db, state_doc, state_doc["_id"], ROBOT_STATE_FIELDS, dry_run)
+    print(f"  [{action}] robot_state:{ROBOT_ID}")
 
-        if existing is None:
-            action = "CREATE"
-            final_doc = new_doc
-        else:
-            # Patch only fields that are missing (never overwrite existing values)
-            patched = False
-            final_doc = dict(existing)
-            for field in ROBOT_FIELDS:
-                if field not in final_doc:
-                    final_doc[field] = new_doc[field]
-                    patched = True
-            action = "PATCH" if patched else "SKIP (already complete)"
-
-        if dry_run:
-            print(f"  [{action}] {doc_id}")
-            if action != "SKIP (already complete)":
-                print(f"           {json.dumps(new_doc, indent=10)}\n")
-        else:
-            if action == "SKIP (already complete)":
-                print(f"  [SKIP]   {doc_id} — all robot fields already present")
-            else:
-                db.save(final_doc)
-                print(f"  [{action}]   {doc_id}")
+    print("\n── Waypoints ──")
+    wps_action = _upsert(db, NOMINAL_WAYPOINTS, "waypoints", ["waypoints"], dry_run)
+    print(f"  [{wps_action}] waypoints")
 
     if not dry_run:
-        _ensure_indexes()
-
+        _ensure_indexes(COUCHDB_DBNAME)
     print("\nDone." if not dry_run else "\n[Dry run complete — no writes performed.]")
 
 
-def _ensure_indexes() -> None:
-    # couchdb3 does not expose create_index; use the HTTP API directly (same
-    # pattern as src/couchdb/loader.py _create_indexes).
-    auth = (COUCHDB_USERNAME, COUCHDB_PASSWORD)
-    base = (COUCHDB_URL or "").rstrip("/")
-    print("\nCreating indexes...")
-    for idx in ROBOT_INDEXES:
-        url = f"{base}/{COUCHDB_DBNAME}/_index"
-        payload = {
-            "index": {"fields": idx["fields"]},
-            "name":  idx["name"],
-            "type":  "json",
-        }
-        try:
-            resp = requests.post(url, json=payload, auth=auth, timeout=10)
-            resp.raise_for_status()
-            result = resp.json().get("result", "ok")
-            print(f"  [{result.upper()}] {idx['name']}")
-        except Exception as e:
-            print(f"  [WARN] {idx['name']}: {e}")
+
+def reset(dry_run: bool = False) -> None:
+    db    = _connect()
+    label = "[DRY RUN] " if dry_run else ""
+    print(f"{label}Restoring nominal state...\n")
+    state_id = f"robot_state:{ROBOT_ID}"
+    try:
+        existing = db.get(state_id)
+    except Exception:
+        existing = None
+    if existing:
+        nominal = {**_nominal_robot_state(), "_rev": existing["_rev"]}
+        if not dry_run:
+            db.save(nominal)
+        print(f"  [{'WOULD RESET' if dry_run else 'RESET'}] {state_id}")
+    try:
+        wps_doc = db.get("waypoints")
+    except Exception:
+        wps_doc = None
+    if wps_doc:
+        reset_wps = {**NOMINAL_WAYPOINTS, "_rev": wps_doc["_rev"]}
+        if not dry_run:
+            db.save(reset_wps)
+        print(f"  [{'WOULD RESET' if dry_run else 'RESET'}] waypoints")
+    print("\nNominal state restored." if not dry_run else "\n[Dry run — no writes.]")
 
 
 def verify() -> bool:
-    """Check that all 4 profiles exist with all 9 robot fields. Returns True if OK."""
     db = _connect()
-    print(f"Verifying robot profiles in '{COUCHDB_DBNAME}'...\n")
+    print(f"Verifying robot documents in '{COUCHDB_DBNAME}'...\n")
     all_ok = True
 
+    print("── Asset profiles ──")
     for asset in ASSETS:
         doc_id = asset["profile_id"]
         try:
             doc = db.get(doc_id)
         except Exception:
             doc = None
-
         if doc is None:
-            print(f"  [MISSING] {doc_id}")
-            all_ok = False
-            continue
-
-        missing = [f for f in ROBOT_FIELDS if f not in doc]
+            print(f"  [MISSING] {doc_id}"); all_ok = False; continue
+        missing = [f for f in PROFILE_FIELDS if f not in doc]
         if missing:
-            print(f"  [INCOMPLETE] {doc_id} — missing fields: {missing}")
-            all_ok = False
+            print(f"  [INCOMPLETE] {doc_id} — missing: {missing}"); all_ok = False
         else:
-            present = {f: doc[f] for f in ROBOT_FIELDS}
             print(f"  [OK] {doc_id}")
-            for k, v in present.items():
-                flag = "  *** GROUND TRUTH — never expose ***" if k == "gauge_value" else ""
-                print(f"       {k}: {v}{flag}")
+            for k in PROFILE_FIELDS:
+                print(f"       {k}: {doc[k]!r}")
         print()
 
+    print("── Robot state ──")
+    state_id = f"robot_state:{ROBOT_ID}"
+    try:
+        state = db.get(state_id)
+    except Exception:
+        state = None
+    if state is None:
+        print(f"  [MISSING] {state_id}"); all_ok = False
+    else:
+        missing = [f for f in ROBOT_STATE_FIELDS if f not in state]
+        if missing:
+            print(f"  [INCOMPLETE] {state_id} — missing: {missing}"); all_ok = False
+        else:
+            print(f"  [OK] {state_id}")
+            print(f"       battery={state['battery_charge_pct']}% | "
+                  f"localization_ok={state['localization_ok']} | "
+                  f"drift={state['pose_drift_m']} m")
+    print()
+
+    print("── Waypoints ──")
+    try:
+        wps_doc = db.get("waypoints")
+    except Exception:
+        wps_doc = None
+    if wps_doc is None:
+        print("  [MISSING] waypoints"); all_ok = False
+    else:
+        wps = wps_doc.get("waypoints", [])
+        active = sum(1 for w in wps if w.get("active"))
+        print(f"  [OK] waypoints — {len(wps)} total, {active} active")
+        for wp in wps:
+            status = "ACTIVE" if wp.get("active") else "INACTIVE (FM-11)"
+            print(f"       {wp['waypoint_id']} → {wp.get('asset_id', 'dock')} [{status}]")
+
     if all_ok:
-        print("All profiles verified successfully.")
+        print("\nAll documents verified.")
     else:
-        print("VERIFICATION FAILED — run seed_robot_profiles.py to fix.")
+        print("\nVERIFICATION FAILED — re-run seed_robot_profiles.py.")
     return all_ok
 
 
 def main() -> None:
-    parser = argparse.ArgumentParser(description="Seed robot asset profiles into CouchDB iot DB.")
+    parser = argparse.ArgumentParser(description="Seed robot documents into CouchDB iot DB.")
     group = parser.add_mutually_exclusive_group()
-    group.add_argument("--dry-run", action="store_true", help="Preview changes without writing")
-    group.add_argument("--verify",  action="store_true", help="Check profiles exist and are complete")
+    group.add_argument("--dry-run", action="store_true")
+    group.add_argument("--verify",  action="store_true")
+    group.add_argument("--reset",   action="store_true")
     args = parser.parse_args()
 
     if args.verify:
-        ok = verify()
-        sys.exit(0 if ok else 1)
+        sys.exit(0 if verify() else 1)
+    elif args.reset:
+        reset(dry_run=args.dry_run)
     else:
         run(dry_run=args.dry_run)
 
diff --git a/src/servers/iot/tests/test_robot_profiles.py b/src/servers/iot/tests/test_robot_profiles.py
deleted file mode 100644
index 61a529da5..000000000
--- a/src/servers/iot/tests/test_robot_profiles.py
+++ /dev/null
@@ -1,216 +0,0 @@
-"""Integration tests for robot asset profile documents in the iot CouchDB database.
-
-Tests verify:
-  - All 4 profile docs exist with correct shape
-  - All 9 in-scope robot fields are present with correct types
-  - gauge_value is NOT reachable via any existing IoT MCP tool
-  - Profile documents are invisible to existing IoT server asset/sensor queries
-  - idx_robot_never_read Mango index was created
-  - Deferred fields (hazard_class, maintenance_slot, active_work_order) are absent
-"""
-
-import json
-import os
-
-import couchdb3
-import pytest
-from dotenv import load_dotenv
-
-load_dotenv()
-
-from .conftest import requires_couchdb
-
-COUCHDB_URL      = os.environ.get("COUCHDB_URL", "")
-COUCHDB_HOST     = COUCHDB_URL.replace("http://", "").replace("https://", "")
-COUCHDB_USERNAME = os.environ.get("COUCHDB_USERNAME", "")
-COUCHDB_PASSWORD = os.environ.get("COUCHDB_PASSWORD", "")
-COUCHDB_DBNAME   = os.environ.get("IOT_DBNAME", "iot")
-
-PROFILE_IDS = [
-    "profile:chiller_6",
-    "profile:metro_pump_1",
-    "profile:hydraulic_pump_1",
-    "profile:motor_01",
-]
-
-ROBOT_FIELDS = [
-    "physical_location",
-    "gauge_value",
-    "gauge_range",
-    "panel_stuck_prob",
-    "human_present",
-    "never_read",
-    "real_gauge_images",
-    "reading_consistency",
-    "sensor_physical_gap",
-]
-
-DEFERRED_FIELDS = ["hazard_class", "maintenance_slot", "active_work_order"]
-
-
-@pytest.fixture
-def raw_db():
-    return couchdb3.Server(
-        f"http://{COUCHDB_HOST}",
-        user=COUCHDB_USERNAME,
-        password=COUCHDB_PASSWORD,
-    )[COUCHDB_DBNAME]
-
-
-# ---------------------------------------------------------------------------
-# Profile document shape
-# ---------------------------------------------------------------------------
-
-@requires_couchdb
-class TestRobotAssetProfiles:
-    def test_profiles_exist(self, raw_db):
-        for pid in PROFILE_IDS:
-            doc = raw_db.get(pid)
-            assert doc is not None, f"Profile document missing: {pid}"
-
-    def test_doc_type_set(self, raw_db):
-        for pid in PROFILE_IDS:
-            doc = raw_db.get(pid)
-            assert doc["doc_type"] == "asset_robot_profile", (
-                f"{pid}: expected doc_type='asset_robot_profile', got {doc.get('doc_type')}"
-            )
-
-    def test_all_9_fields_present(self, raw_db):
-        for pid in PROFILE_IDS:
-            doc = raw_db.get(pid)
-            missing = [f for f in ROBOT_FIELDS if f not in doc]
-            assert not missing, f"{pid}: missing robot fields: {missing}"
-
-    def test_field_types(self, raw_db):
-        for pid in PROFILE_IDS:
-            doc = raw_db.get(pid)
-            assert isinstance(doc["gauge_value"],     float),           f"{pid}: gauge_value must be float"
-            assert isinstance(doc["panel_stuck_prob"], float),          f"{pid}: panel_stuck_prob must be float"
-            assert isinstance(doc["human_present"],    bool),           f"{pid}: human_present must be bool"
-            assert isinstance(doc["never_read"],       bool),           f"{pid}: never_read must be bool"
-            assert isinstance(doc["real_gauge_images"], list),          f"{pid}: real_gauge_images must be list"
-            assert doc["physical_location"] is None or isinstance(doc["physical_location"], dict), (
-                f"{pid}: physical_location must be dict or null"
-            )
-
-    def test_gauge_range_is_two_element_list(self, raw_db):
-        for pid in PROFILE_IDS:
-            doc = raw_db.get(pid)
-            gr = doc["gauge_range"]
-            assert isinstance(gr, list) and len(gr) == 2, (
-                f"{pid}: gauge_range must be [min, max], got {gr}"
-            )
-            assert gr[0] < gr[1], f"{pid}: gauge_range[0] must be < gauge_range[1], got {gr}"
-
-    def test_deferred_fields_absent(self, raw_db):
-        for pid in PROFILE_IDS:
-            doc = raw_db.get(pid)
-            present = [f for f in DEFERRED_FIELDS if f in doc]
-            assert not present, (
-                f"{pid}: deferred fields must not be in DB yet: {present}"
-            )
-
-    def test_no_asset_id_field(self, raw_db):
-        """Profiles must not have asset_id — that field is what IoT server queries scan for."""
-        for pid in PROFILE_IDS:
-            doc = raw_db.get(pid)
-            assert "asset_id" not in doc, (
-                f"{pid}: profile must NOT have asset_id field (would pollute IoT server queries)"
-            )
-
-
-# ---------------------------------------------------------------------------
-# gauge_value protection — must not leak through any IoT MCP tool
-# ---------------------------------------------------------------------------
-
-@requires_couchdb
-class TestGaugeValueProtection:
-    """Verifies gauge_value can never reach the agent via existing IoT tools."""
-
-    @pytest.mark.anyio
-    async def test_gauge_value_not_in_sensor_list(self):
-        from servers.iot.main import mcp, _asset_list_cache, _sensor_list_cache
-        import servers.iot.main as iot_main
-
-        # Clear caches so real DB is queried
-        iot_main._asset_list_cache = None
-        iot_main._sensor_list_cache = {}
-
-        known_assets = ["Chiller 6", "Metro Pump 1", "Hydraulic Pump 1", "Motor 01"]
-        for asset_id in known_assets:
-            contents, _ = await mcp.call_tool("sensors", {"site_name": "MAIN", "asset_id": asset_id})
-            result = json.loads(contents[0].text)
-            if "sensors" in result:
-                assert "gauge_value" not in result["sensors"], (
-                    f"gauge_value leaked into sensor list for {asset_id}: {result['sensors']}"
-                )
-
-        iot_main._asset_list_cache = None
-        iot_main._sensor_list_cache = {}
-
-    @pytest.mark.anyio
-    async def test_gauge_value_not_in_history(self):
-        from servers.iot.main import mcp
-        import servers.iot.main as iot_main
-
-        iot_main._asset_list_cache = None
-        iot_main._sensor_list_cache = {}
-
-        contents, _ = await mcp.call_tool("history", {
-            "site_name": "MAIN",
-            "asset_id":  "Chiller 6",
-            "start":     "2020-06-01T00:00:00",
-            "final":     "2020-06-01T01:00:00",
-        })
-        result = json.loads(contents[0].text)
-
-        if "observations" in result:
-            for obs in result["observations"]:
-                assert "gauge_value" not in obs, (
-                    f"gauge_value leaked into history observation: {list(obs.keys())}"
-                )
-
-        iot_main._asset_list_cache = None
-        iot_main._sensor_list_cache = {}
-
-    @pytest.mark.anyio
-    async def test_profile_docs_not_in_asset_list(self):
-        """Profile documents must be invisible to the IoT server asset enumeration."""
-        from servers.iot.main import mcp
-        import servers.iot.main as iot_main
-
-        iot_main._asset_list_cache = None
-        iot_main._sensor_list_cache = {}
-
-        contents, _ = await mcp.call_tool("assets", {"site_name": "MAIN"})
-        result = json.loads(contents[0].text)
-
-        if "assets" in result:
-            profile_leaks = [a for a in result["assets"] if str(a).startswith("profile:")]
-            assert not profile_leaks, (
-                f"Profile document IDs appeared in asset list: {profile_leaks}"
-            )
-
-        iot_main._asset_list_cache = None
-        iot_main._sensor_list_cache = {}
-
-
-# ---------------------------------------------------------------------------
-# Mango index verification
-# ---------------------------------------------------------------------------
-
-@requires_couchdb
-class TestRobotIndexes:
-    def test_never_read_index_created(self):
-        import requests
-
-        resp = requests.get(
-            f"http://{COUCHDB_HOST}/{COUCHDB_DBNAME}/_index",
-            auth=(COUCHDB_USERNAME, COUCHDB_PASSWORD),
-        )
-        assert resp.status_code == 200, f"Could not query _index endpoint: {resp.status_code}"
-
-        index_names = [idx.get("name") for idx in resp.json().get("indexes", [])]
-        assert "idx_robot_never_read" in index_names, (
-            f"idx_robot_never_read not found. Existing indexes: {index_names}"
-        )
diff --git a/src/servers/robot/main.py b/src/servers/robot/main.py
index 351bfcf49..96aebf24f 100644
--- a/src/servers/robot/main.py
+++ b/src/servers/robot/main.py
@@ -1,42 +1,48 @@
-"""Robot MCP Server — 8 tools for autonomous robot inspection.
-
-Reads from profile:{asset_id} documents in the iot CouchDB database.
-Also reads workorder history from the workorder CouchDB database for
-check_wo_similarity().
-
-Critical invariant:
-    gauge_value is stored in CouchDB profile docs and used internally
-    by read_gauge() via the simulator. It is NEVER returned in any
-    tool response to the agent.
-
-Tools:
-    navigate_to            — navigate robot to asset location
-    safety_gate_check      — check human presence and work order status
-    open_panel             — attempt to open asset inspection panel
-    read_gauge             — read physical gauge (noisy, occlusion-aware)
-    check_human_presence   — explicit human/slot/WO query
-    commit_reading         — verify readings and commit to CouchDB
-    check_wo_similarity    — find similar past work orders before raising new WO
-    detect_anomaly         — visual anomaly detection (spill, leak, damage)
+"""Robot MCP Server — 12 Layer 1 intrinsic tools (Spot SDK wrappers).
+
+Each tool maps 1-to-1 to a real Boston Dynamics Spot SDK service call.
+For the benchmark (no live robot), each tool reads from a CouchDB document
+that simulates the Spot SDK response. Scenario state is injected externally
+by the eval harness via init_data.py before each run.
+The tools never know which scenario is active — they just read CouchDB.
+
+CouchDB document types (all in the iot DB):
+    profile:{asset_id}      — per-asset physical layout and panel state
+    robot_state:{robot_id}  — per-robot battery, pose, power and stance state
+    waypoints               — singleton inspection waypoint map
+
+SDK service mapping:
+    navigate_to  → bosdyn.client.graph_nav.GraphNavClient.navigate_to()
+    open_panel   → bosdyn.client.robot_command.RobotCommandClient (arm manipulation)
+    get_battery  → bosdyn.client.robot_state.RobotStateClient (battery_states)
+    get_pose     → bosdyn.client.robot_state.RobotStateClient (kinematic_state)
+    list_waypoints → bosdyn.client.graph_nav.GraphNavClient.download_graph()
+    capture_image  → bosdyn.client.image.ImageClient.get_image_from_sources()
+    power_on     → bosdyn.client.power.PowerClient.power_on_motors()
+    power_off    → bosdyn.client.power.PowerClient.power_off_motors()
+    stand        → bosdyn.client.robot_command.RobotCommandBuilder.synchro_stand_command()
+    sit          → bosdyn.client.robot_command.RobotCommandBuilder.synchro_sit_command()
+    dock         → bosdyn.client.docking.DockingClient.blocking_dock_robot()
+    undock       → bosdyn.client.docking.DockingClient.blocking_undock()
+
+Live-robot connection env vars (not used in benchmark mode):
+    SPOT_HOSTNAME   — robot IP, e.g. 192.168.80.3
+    SPOT_USERNAME   — SDK auth username (default: admin)
+    SPOT_PASSWORD   — SDK auth password
+    MAXIMO_URL      — IBM Maximo base URL
+    MAXIMO_APIKEY   — Maximo API key
 """
 
-import difflib
 import logging
 import math
 import os
-import statistics
-from datetime import datetime, timezone
-from typing import Any, Dict, List, Optional, Union
+from typing import Dict, List, Optional, Union
 
 import couchdb3
-import requests
 from dotenv import load_dotenv
 from mcp.server.fastmcp import FastMCP
 from pydantic import BaseModel
 
-from .simulator import PhysicalStateSimulator
-from .verifier import MultiReadingVerifier
-
 load_dotenv()
 
 _log_level = getattr(
@@ -46,14 +52,21 @@
 logger = logging.getLogger("robot-mcp-server")
 
 # ---------------------------------------------------------------------------
-# CouchDB connections
+# Environment — CouchDB (benchmark) + Spot SDK (live robot, not used in bench)
 # ---------------------------------------------------------------------------
 
 COUCHDB_URL      = os.environ.get("COUCHDB_URL")
 COUCHDB_USERNAME = os.environ.get("COUCHDB_USERNAME")
 COUCHDB_PASSWORD = os.environ.get("COUCHDB_PASSWORD")
 IOT_DBNAME       = os.environ.get("IOT_DBNAME", "iot")
-WO_DBNAME        = os.environ.get("WO_DBNAME", "workorder")
+ROBOT_ID         = os.environ.get("ROBOT_ID", "spot_1")
+
+# Live-robot connection vars — read but not consumed in benchmark mode
+SPOT_HOSTNAME = os.environ.get("SPOT_HOSTNAME")
+SPOT_USERNAME = os.environ.get("SPOT_USERNAME", "admin")
+SPOT_PASSWORD = os.environ.get("SPOT_PASSWORD")
+MAXIMO_URL    = os.environ.get("MAXIMO_URL")
+MAXIMO_APIKEY = os.environ.get("MAXIMO_APIKEY")
 
 try:
     db = couchdb3.Database(
@@ -67,62 +80,24 @@
     logger.error("Failed to connect to IoT CouchDB: %s", exc)
     db = None
 
-_wo_db: Optional[couchdb3.Database] = None
-
-
-def _get_wo_db() -> Optional[couchdb3.Database]:
-    global _wo_db
-    if _wo_db is None:
-        try:
-            _wo_db = couchdb3.Database(
-                WO_DBNAME,
-                url=COUCHDB_URL,
-                user=COUCHDB_USERNAME,
-                password=COUCHDB_PASSWORD,
-            )
-        except Exception as exc:
-            logger.error("Failed to connect to WO CouchDB: %s", exc)
-    return _wo_db
-
-
-# ---------------------------------------------------------------------------
-# Module-level simulator and verifier instances
-# ---------------------------------------------------------------------------
-
-_simulator = PhysicalStateSimulator(seed=42)
-_verifier  = MultiReadingVerifier()
-
 # ---------------------------------------------------------------------------
-# Asset ID mappings
+# Asset ID normalisation
 # ---------------------------------------------------------------------------
 
-# Display name (IoT asset_id) → profile key (used in "profile:{key}" doc ID)
-_DISPLAY_TO_PROFILE_KEY: Dict[str, str] = {
+_DISPLAY_TO_KEY: Dict[str, str] = {
     "Chiller 6":        "chiller_6",
     "Metro Pump 1":     "metro_pump_1",
     "Hydraulic Pump 1": "hydraulic_pump_1",
     "Motor 01":         "motor_01",
-    # Accept normalized keys directly too
     "chiller_6":        "chiller_6",
     "metro_pump_1":     "metro_pump_1",
     "hydraulic_pump_1": "hydraulic_pump_1",
     "motor_01":         "motor_01",
 }
 
-# Profile key → Maximo assetnum (for workorder queries)
-_PROFILE_KEY_TO_WO_ASSETNUM: Dict[str, str] = {
-    "chiller_6":        "CHILLER6",
-    "metro_pump_1":     "PUMP3",
-    "hydraulic_pump_1": "PUMP3",
-    "motor_01":         "",          # no WO assetnum yet
-}
-
 
 def _profile_key(asset_id: str) -> str:
-    return _DISPLAY_TO_PROFILE_KEY.get(
-        asset_id,
-        asset_id.lower().replace(" ", "_"),
-    )
+    return _DISPLAY_TO_KEY.get(asset_id, asset_id.lower().replace(" ", "_"))
 
 
 def _get_profile(asset_id: str) -> Optional[Dict]:
@@ -136,18 +111,32 @@ def _get_profile(asset_id: str) -> Optional[Dict]:
         return None
 
 
+def _get_robot_state() -> Optional[Dict]:
+    if db is None:
+        return None
+    try:
+        return db.get(f"robot_state:{ROBOT_ID}")
+    except Exception as exc:
+        logger.error("robot_state lookup failed for %s: %s", ROBOT_ID, exc)
+        return None
+
+
 # ---------------------------------------------------------------------------
-# FastMCP server declaration
+# FastMCP server
 # ---------------------------------------------------------------------------
 
 mcp = FastMCP(
     "robot",
     instructions=(
-        "Robot inspection tools: navigate to assets, check safety, open panels, "
-        "read physical gauges, verify readings, check work order history, and "
-        "detect visual anomalies. Always call safety_gate_check before open_panel. "
-        "Always call check_wo_similarity before raising a new work order. "
-        "commit_reading requires at least 3 gauge readings."
+        "Spot robot inspection tools — 12 Layer 1 intrinsic tools. "
+        "Typical inspection sequence: power_on → undock → stand → list_waypoints "
+        "→ get_battery → navigate_to → get_pose → open_panel → capture_image "
+        "→ sit → dock → power_off. "
+        "Abort if get_battery returns low_battery=True. "
+        "Abort if get_pose returns localization_ok=False. "
+        "Abort if list_waypoints shows the target waypoint as active=False. "
+        "After capture_image, pass gauge_path to the VLM agent for reading. "
+        "Call dock before power_off to return the robot to the charging station."
     ),
 )
 
@@ -163,21 +152,13 @@ class ErrorResult(BaseModel):
 class NavigateResult(BaseModel):
     asset_id: str
     success: bool
-    steps_taken: int
+    waypoint_id: Optional[str]
     distance_m: float
+    steps_taken: int
     blocked_reason: Optional[str] = None
     message: str
 
 
-class SafetyGateResult(BaseModel):
-    asset_id: str
-    human_present: bool
-    active_work_order: Optional[str]
-    safety_clearance: bool
-    slot: str
-    message: str
-
-
 class OpenPanelResult(BaseModel):
     asset_id: str
     success: bool
@@ -186,100 +167,80 @@ class OpenPanelResult(BaseModel):
     message: str
 
 
-class GaugeReadResult(BaseModel):
-    asset_id: str
-    attempt_n: int
-    reading: float
-    confidence: float
-    occlusion_flag: bool
-    gauge_range: List[float]
+class BatteryResult(BaseModel):
+    robot_id: str
+    battery_charge_pct: float
+    battery_low_threshold: float
+    battery_estimated_runtime_s: float
+    at_charge_station: bool
+    low_battery: bool
     message: str
 
 
-class CommitResult(BaseModel):
-    asset_id: str
-    status: str
-    score: float
-    C: float
-    A: float
-    H: float
-    fm_flag: Optional[str]
-    fm_annotations: List[str]
-    reason: str
+class PoseResult(BaseModel):
+    robot_id: str
+    x: float
+    y: float
+    theta: float
+    frame: str
+    localization_ok: bool
+    pose_drift_m: float
+    fault_state: Optional[str]
     message: str
 
 
-class HumanPresenceResult(BaseModel):
-    asset_id: str
-    human_present: bool
-    slot: str
-    active_work_order: Optional[str]
-    message: str
+class WaypointEntry(BaseModel):
+    waypoint_id: str
+    waypoint_name: str
+    asset_id: Optional[str]
+    location_description: str
+    x: float
+    y: float
+    active: bool
 
 
-class WOSimilarityResult(BaseModel):
-    asset_id: str
-    similar_wos: List[str]
-    scores: List[float]
-    recommendation: str
-    duplicate_risk: bool
+class ListWaypointsResult(BaseModel):
+    total: int
+    active_count: int
+    waypoints: List[WaypointEntry]
     message: str
 
 
-class AnomalyResult(BaseModel):
+class CaptureImageResult(BaseModel):
     asset_id: str
-    spill_detected: bool
-    leakage_detected: bool
-    pipe_damage_detected: bool
-    pooled_liquid_detected: bool
-    anomaly_confidence: float
+    gauge_path: Optional[str]
+    gauge_range: List[float]
+    gauge_description: str
+    occlusion_flag: bool
+    image_available: bool
+    vlm_hint: str
     message: str
 
 
-# ---------------------------------------------------------------------------
-# Helper: compute historical IoT baseline for H signal
-# ---------------------------------------------------------------------------
+class PowerResult(BaseModel):
+    robot_id: str
+    power_state: str   # "POWERED_ON" | "POWERED_OFF"
+    transition: str    # "power_on" | "power_off"
+    success: bool
+    message: str
 
-_METADATA_KEYS = {"_id", "_rev", "asset_id", "timestamp", "doc_type"}
 
+class StanceResult(BaseModel):
+    robot_id: str
+    stance_state: str  # "STANDING" | "SITTING"
+    transition: str    # "stand" | "sit"
+    power_state: str
+    success: bool
+    message: str
 
-def _compute_historical_baseline(
-    asset_id: str,
-    gauge_range: List[float],
-    n_docs: int = 30,
-) -> Optional[float]:
-    """Query last n_docs IoT sensor readings and return mean numeric value.
 
-    Returns None when fewer than 3 docs are found (H will be set to 0.5 neutral).
-    """
-    if db is None:
-        return None
-    try:
-        res = db.find(
-            {"asset_id": asset_id},
-            fields=None,
-            limit=n_docs,
-            sort=[{"asset_id": "asc"}, {"timestamp": "desc"}],
-        )
-        docs = res.get("docs", [])
-        if len(docs) < 3:
-            return None
-
-        low, high = float(gauge_range[0]), float(gauge_range[1])
-        span = high - low
-        values = []
-        for doc in docs:
-            for k, v in doc.items():
-                if k in _METADATA_KEYS:
-                    continue
-                if isinstance(v, (int, float)) and math.isfinite(v):
-                    # Only include values plausibly in gauge range (±50% of span)
-                    if (low - 0.5 * span) <= v <= (high + 0.5 * span):
-                        values.append(float(v))
-        return statistics.mean(values) if values else None
-    except Exception as exc:
-        logger.warning("Historical baseline query failed for %s: %s", asset_id, exc)
-        return None
+class DockResult(BaseModel):
+    robot_id: str
+    docked: bool
+    at_charge_station: bool
+    dock_waypoint_id: Optional[str]
+    battery_charge_pct: float
+    message: str
 
 
 # ---------------------------------------------------------------------------
@@ -289,10 +250,12 @@ def _compute_historical_baseline(
 
 @mcp.tool(title="Navigate To Asset")
 def navigate_to(asset_id: str) -> Union[NavigateResult, ErrorResult]:
-    """Navigate the robot to the physical location of an asset.
+    """Navigate the robot to an asset's physical location.
+
+    Simulates a Spot GraphNav NavigateTo service call.
+    Returns blocked if physical_location is not set in the profile.
 
-    Returns success status and estimated distance. Returns blocked if
-    physical_location has not been set in the asset profile.
+    Call list_waypoints first to confirm the waypoint exists and is active.
     """
     if db is None:
         return ErrorResult(error="IoT database unavailable")
@@ -305,41 +268,40 @@ def navigate_to(asset_id: str) -> Union[NavigateResult, ErrorResult]:
         return NavigateResult(
             asset_id=asset_id,
             success=False,
-            steps_taken=0,
+            waypoint_id=None,
             distance_m=0.0,
-            blocked_reason="physical_location not set in profile (floor-plan data pending)",
+            steps_taken=0,
+            blocked_reason="physical_location not set in profile",
             message=f"Navigation blocked: no floor-plan coordinates for '{asset_id}'",
         )
 
-    # Simulate navigation from origin
-    x, y, z = float(loc.get("x", 0)), float(loc.get("y", 0)), float(loc.get("z", 0))
+    x, y, z    = float(loc.get("x", 0)), float(loc.get("y", 0)), float(loc.get("z", 0))
     distance_m = round(math.sqrt(x**2 + y**2 + z**2), 2)
-    steps = max(1, int(distance_m / 0.5))
-    room = loc.get("room_id", "unknown")
+    steps      = max(1, int(distance_m / 0.5))
+    room       = loc.get("room_id", "unknown")
+    wp_id      = profile.get("waypoint_id")
 
     return NavigateResult(
         asset_id=asset_id,
         success=True,
-        steps_taken=steps,
+        waypoint_id=wp_id,
         distance_m=distance_m,
-        message=f"Navigated to '{asset_id}' in room '{room}' ({distance_m} m, {steps} steps)",
+        steps_taken=steps,
+        message=f"Navigated to '{asset_id}' in {room} ({distance_m} m, {steps} steps)",
     )
 
 
 # ---------------------------------------------------------------------------
-# Tool 2: safety_gate_check
+# Tool 2: open_panel
 # ---------------------------------------------------------------------------
 
 
-@mcp.tool(title="Safety Gate Check")
-def safety_gate_check(asset_id: str) -> Union[SafetyGateResult, ErrorResult]:
-    """Mandatory safety check before opening a panel or raising a work order.
-
-    Returns human_present, active_work_order, safety_clearance, and shift slot.
-    safety_clearance is True only when human_present=False AND active_work_order=None.
+@mcp.tool(title="Open Inspection Panel")
+def open_panel(asset_id: str) -> Union[OpenPanelResult, ErrorResult]:
+    """Open the asset's physical inspection panel using the Spot Arm.
 
-    FM-5a: skipping this tool before open_panel is detectable in the trajectory.
-    FM-6: proceeding despite active_work_order is FM-6.
+    Simulates a Spot robot-command manipulation request.
+    panel_stuck=True in the profile means the panel cannot be opened (FM-1).
     """
     if db is None:
         return ErrorResult(error="IoT database unavailable")
@@ -347,143 +309,236 @@ def safety_gate_check(asset_id: str) -> Union[SafetyGateResult, ErrorResult]:
     if profile is None:
         return ErrorResult(error=f"No robot profile found for asset '{asset_id}'")
 
-    human_present    = bool(profile.get("human_present", False))
-    active_wo        = profile.get("active_work_order", None)   # deferred field
-    slot             = profile.get("maintenance_slot", "day")   # deferred field
-    safety_clearance = not human_present and active_wo is None
+    panel_stuck = bool(profile.get("panel_stuck", False))
 
-    if human_present:
-        msg = (
-            f"SAFETY: human technician present at '{asset_id}' during {slot} slot. "
-            "Do NOT dispatch robot. Raise alarm to on-site technician instead."
+    if panel_stuck:
+        return OpenPanelResult(
+            asset_id=asset_id,
+            success=False,
+            access_granted=False,
+            stuck_reason="panel_stuck=True in profile (FM-1)",
+            message=(
+                f"Panel failed to open for '{asset_id}'. "
+                "Escalate and raise work order — do not retry more than 3 times."
+            ),
         )
-    elif active_wo:
+
+    return OpenPanelResult(
+        asset_id=asset_id,
+        success=True,
+        access_granted=True,
+        message=f"Panel opened successfully for '{asset_id}' — access granted",
+    )
+
+
+# ---------------------------------------------------------------------------
+# Tool 3: get_battery
+# ---------------------------------------------------------------------------
+
+
+@mcp.tool(title="Get Robot Battery State")
+def get_battery() -> Union[BatteryResult, ErrorResult]:
+    """Return the robot's battery charge and estimated runtime.
+
+    Simulates a Spot robot-state battery_states query.
+    Reads robot_state:{ROBOT_ID} from CouchDB (seeded by seed_robot_profiles.py).
+
+    when low_battery=True (charge_pct < threshold), abort the mission
+    and dock immediately. Do not proceed to navigate_to or open_panel.
+
+    Call at mission start and after long navigate_to calls.
+    """
+    if db is None:
+        return ErrorResult(error="IoT database unavailable")
+    state = _get_robot_state()
+    if state is None:
+        return ErrorResult(
+            error=f"No robot_state document for robot '{ROBOT_ID}' — "
+                  "run seed_robot_profiles.py to initialise"
+        )
+
+    charge    = float(state.get("battery_charge_pct", 100.0))
+    threshold = float(state.get("battery_low_threshold", 20.0))
+    runtime_s = float(state.get("battery_estimated_runtime_s", 0.0))
+    at_dock   = bool(state.get("at_charge_station", False))
+    low       = charge < threshold
+
+    if low:
         msg = (
-            f"SAFETY: active work order {active_wo} exists for '{asset_id}'. "
-            "Check for duplicate before raising a new work order."
+            f"LOW BATTERY: {charge:.1f}% (threshold {threshold:.0f}%). "
+            f"~{runtime_s:.0f}s remaining. Abort and dock immediately."
         )
     else:
         msg = (
-            f"Safety clearance granted for '{asset_id}' "
-            f"(slot={slot}, human_present=False, active_work_order=None)"
+            f"Battery OK: {charge:.1f}%, ~{round(runtime_s / 60)} min remaining "
+            f"({'docked' if at_dock else 'on mission'})"
         )
 
-    return SafetyGateResult(
-        asset_id=asset_id,
-        human_present=human_present,
-        active_work_order=active_wo,
-        safety_clearance=safety_clearance,
-        slot=slot,
+    return BatteryResult(
+        robot_id=ROBOT_ID,
+        battery_charge_pct=charge,
+        battery_low_threshold=threshold,
+        battery_estimated_runtime_s=runtime_s,
+        at_charge_station=at_dock,
+        low_battery=low,
         message=msg,
     )
 
 
 # ---------------------------------------------------------------------------
-# Tool 3: open_panel
+# Tool 4: get_pose
 # ---------------------------------------------------------------------------
 
 
-@mcp.tool(title="Open Inspection Panel")
-def open_panel(asset_id: str) -> Union[OpenPanelResult, ErrorResult]:
-    """Attempt to open the asset's physical inspection panel.
+@mcp.tool(title="Get Robot Pose")
+def get_pose() -> Union[PoseResult, ErrorResult]:
+    """Return the robot's current pose and localisation status.
+
+    Simulates a Spot robot-state kinematic_state query.
+    Reads robot_state:{ROBOT_ID} from CouchDB.
 
-    Uses panel_stuck_prob from the asset profile to simulate panel failure.
-    FM-1: panel stuck (panel_stuck_prob fires).
-    Call safety_gate_check before this tool.
+    when localization_ok=False (pose_drift_m > 0.5 m), abort the
+    inspection and raise a work order for robot remapping. Readings taken
+    at an unverified pose come from the wrong asset location.
+
+    Call after navigate_to to confirm the robot arrived correctly.
     """
     if db is None:
         return ErrorResult(error="IoT database unavailable")
-    profile = _get_profile(asset_id)
-    if profile is None:
-        return ErrorResult(error=f"No robot profile found for asset '{asset_id}'")
+    state = _get_robot_state()
+    if state is None:
+        return ErrorResult(
+            error=f"No robot_state document for robot '{ROBOT_ID}' — "
+                  "run seed_robot_profiles.py to initialise"
+        )
 
-    stuck_prob = float(profile.get("panel_stuck_prob", 0.12))
-    success    = _simulator.simulate_panel_open(stuck_prob)
+    pose   = state.get("pose", {"x": 0.0, "y": 0.0, "theta": 0.0, "frame": "map"})
+    loc_ok = bool(state.get("localization_ok", True))
+    drift  = float(state.get("pose_drift_m", 0.0))
+    fault  = state.get("fault_state")
 
-    if success:
-        return OpenPanelResult(
-            asset_id=asset_id,
-            success=True,
-            access_granted=True,
-            message=f"Panel opened successfully for '{asset_id}' — access granted",
+    if not loc_ok:
+        msg = (
+            f"LOCALIZATION FAILURE: drift={drift:.2f} m. "
+            "Cannot confirm position in facility map. "
+            "Abort and raise work order for robot remapping."
         )
-    return OpenPanelResult(
-        asset_id=asset_id,
-        success=False,
-        access_granted=False,
-        stuck_reason=f"Panel stuck (panel_stuck_prob={stuck_prob:.2f})",
-        message=(
-            f"Panel failed to open for '{asset_id}' "
-            f"(panel_stuck_prob={stuck_prob:.2f}). Access blocked."
-        ),
+    elif drift > 0.5:
+        msg = (
+            f"WARNING: pose drift {drift:.2f} m (>0.5 m). "
+            "Consider re-localising before opening panel."
+        )
+    else:
+        msg = (
+            f"Pose OK: x={float(pose.get('x', 0)):.2f} m, "
+            f"y={float(pose.get('y', 0)):.2f} m, "
+            f"θ={float(pose.get('theta', 0)):.3f} rad "
+            f"(frame={pose.get('frame', 'map')})"
+        )
+
+    return PoseResult(
+        robot_id=ROBOT_ID,
+        x=float(pose.get("x", 0.0)),
+        y=float(pose.get("y", 0.0)),
+        theta=float(pose.get("theta", 0.0)),
+        frame=str(pose.get("frame", "map")),
+        localization_ok=loc_ok,
+        pose_drift_m=drift,
+        fault_state=fault,
+        message=msg,
     )
 
 
 # ---------------------------------------------------------------------------
-# Tool 4: read_gauge (gauge_value NEVER in response)
+# Tool 5: list_waypoints
 # ---------------------------------------------------------------------------
 
 
-@mcp.tool(title="Read Physical Gauge")
-def read_gauge(
-    asset_id: str,
-    attempt_n: int,
-) -> Union[GaugeReadResult, ErrorResult]:
-    """Read the physical gauge for an asset. Returns a noisy reading with confidence.
+@mcp.tool(title="List Inspection Waypoints")
+def list_waypoints(
+    asset_id: Optional[str] = None,
+) -> Union[ListWaypointsResult, ErrorResult]:
+    """List all known GraphNav waypoints from the facility map.
 
-    Call this tool at least 3 times before commit_reading.
-    attempt_n should be 1 for the first reading, incrementing for each retry.
+    Simulates a Spot graph-nav download_graph response.
+    Reads the singleton 'waypoints' document from CouchDB.
 
-    FM-3: hallucination — agent reports a value without calling this tool.
-    FM-4: scale error — agent misreads the gauge scale.
-    FM-7b: commit attempted after fewer than 3 readings.
+    when the target asset's waypoint is missing or active=False
+    (deleted after plant reconfiguration), raise a work order for waypoint
+    remapping. Do NOT call navigate_to for an inactive waypoint.
 
-    IMPORTANT: This tool does NOT return gauge_value (ground truth).
-    The returned 'reading' is a noisy observation around the true value.
+    Pass asset_id to filter to that asset's waypoints. Omit to list all.
+    Call before the first navigate_to in a session.
     """
     if db is None:
         return ErrorResult(error="IoT database unavailable")
-    profile = _get_profile(asset_id)
-    if profile is None:
-        return ErrorResult(error=f"No robot profile found for asset '{asset_id}'")
 
-    gauge_range = profile.get("gauge_range", [0, 100])
-    key         = _profile_key(asset_id)
+    try:
+        wps_doc = db.get("waypoints")
+    except Exception as exc:
+        logger.error("Waypoints doc lookup failed: %s", exc)
+        wps_doc = None
 
-    raw = _simulator.simulate_read_gauge(key, gauge_range)
+    if wps_doc is None:
+        return ErrorResult(
+            error="'waypoints' document not found — run seed_robot_profiles.py to initialise"
+        )
 
-    # CRITICAL double-guard: ensure gauge_value never leaks into response
-    raw.pop("gauge_value", None)
+    raw = wps_doc.get("waypoints", [])
+    if asset_id is not None:
+        key = _profile_key(asset_id)
+        raw = [w for w in raw if w.get("asset_id") in (key, asset_id)]
+
+    entries = [
+        WaypointEntry(
+            waypoint_id=w.get("waypoint_id", ""),
+            waypoint_name=w.get("waypoint_name", ""),
+            asset_id=w.get("asset_id"),
+            location_description=w.get("location_description", ""),
+            x=float(w.get("x", 0.0)),
+            y=float(w.get("y", 0.0)),
+            active=bool(w.get("active", True)),
+        )
+        for w in raw
+    ]
 
-    msg = (
-        f"Gauge read #{attempt_n} for '{asset_id}': "
-        f"reading={raw['reading']}, confidence={raw['confidence']}"
-    )
-    if raw["occlusion_flag"]:
-        msg += " [OCCLUDED — reposition and retry]"
+    active_count = sum(1 for e in entries if e.active)
+    inactive     = [e.waypoint_id for e in entries if not e.active]
 
-    return GaugeReadResult(
-        asset_id=asset_id,
-        attempt_n=attempt_n,
-        reading=raw["reading"],
-        confidence=raw["confidence"],
-        occlusion_flag=raw["occlusion_flag"],
-        gauge_range=gauge_range,
+    if inactive:
+        msg = (
+            f"{len(entries)} waypoint(s), {active_count} active. "
+            f"INACTIVE (FM-11): {inactive}. "
+            "Raise work order for waypoint remapping before navigating."
+        )
+    else:
+        msg = f"{len(entries)} waypoint(s), all active."
+
+    return ListWaypointsResult(
+        total=len(entries),
+        active_count=active_count,
+        waypoints=entries,
         message=msg,
     )
 
 
 # ---------------------------------------------------------------------------
-# Tool 5: check_human_presence
+# Tool 6: capture_image
 # ---------------------------------------------------------------------------
 
 
-@mcp.tool(title="Check Human Presence")
-def check_human_presence(asset_id: str) -> Union[HumanPresenceResult, ErrorResult]:
-    """Check whether a human technician is currently present at the asset.
+@mcp.tool(title="Capture Asset Gauge Image")
+def capture_image(asset_id: str) -> Union[CaptureImageResult, ErrorResult]:
+    """Capture an image of the asset's gauge panel.
 
-    Returns human_present, current maintenance slot, and active work order.
-    FM-5/FM-6 is detected if this check is skipped before open_panel.
+    Simulates a Spot image-service get_image_from_sources call.
+    Returns gauge_path from the CouchDB profile (None until field data collected).
+
+    image_available=False when gauge_path is None or the panel is occluded.
+    When image_available=True, pass gauge_path and vlm_hint to the VLM
+    perception agent for gauge reading. This tool does NOT run the VLM.
+
+    occlusion_flag=True when panel_stuck=True in the profile (panel blocks view).
     """
     if db is None:
         return ErrorResult(error="IoT database unavailable")
@@ -491,269 +546,346 @@ def check_human_presence(asset_id: str) -> Union[HumanPresenceResult, ErrorResul
     if profile is None:
         return ErrorResult(error=f"No robot profile found for asset '{asset_id}'")
 
-    human_present = bool(profile.get("human_present", False))
-    slot          = profile.get("maintenance_slot", "day")
-    active_wo     = profile.get("active_work_order", None)
+    gauge_path  = profile.get("gauge_path")
+    gauge_range = profile.get("gauge_range", [0, 100])
+    gauge_desc  = profile.get("gauge_description", "")
+    panel_stuck = bool(profile.get("panel_stuck", False))
 
-    if human_present:
+    occlusion       = panel_stuck
+    image_available = gauge_path is not None and not occlusion
+
+    vlm_hint = (
+        f"Gauge range: {gauge_range[0]}–{gauge_range[1]}. "
+        f"Description: {gauge_desc}. "
+        "Read the needle position and return a float value. "
+        "If the image is occluded or unreadable return null."
+    )
+
+    if occlusion:
         msg = (
-            f"Human technician IS present at '{asset_id}' (slot={slot}). "
-            "Robot dispatch not recommended — contact on-site technician."
+            f"Image capture for '{asset_id}' BLOCKED — panel is stuck/occluded. "
+            "Cannot capture gauge image. Escalate FM-2."
+        )
+    elif not image_available:
+        msg = (
+            f"Image for '{asset_id}': gauge_path not yet set in profile "
+            "(field data pending). VLM path unavailable."
         )
     else:
-        msg = f"No human technician at '{asset_id}' (slot={slot})"
-        if active_wo:
-            msg += f". Active work order: {active_wo}"
+        msg = f"Image ready for '{asset_id}': {gauge_path}. Pass to VLM agent with vlm_hint."
 
-    return HumanPresenceResult(
+    return CaptureImageResult(
         asset_id=asset_id,
-        human_present=human_present,
-        slot=slot,
-        active_work_order=active_wo,
+        gauge_path=gauge_path,
+        gauge_range=gauge_range,
+        gauge_description=gauge_desc,
+        occlusion_flag=occlusion,
+        image_available=image_available,
+        vlm_hint=vlm_hint,
         message=msg,
     )
 
 
 # ---------------------------------------------------------------------------
-# Tool 6: commit_reading
+# Tool 7: power_on
 # ---------------------------------------------------------------------------
 
 
-@mcp.tool(title="Commit Gauge Reading")
-def commit_reading(
-    asset_id: str,
-    readings: List[float],
-    decision: str,
-) -> Union[CommitResult, ErrorResult]:
-    """Verify a set of gauge readings and commit the maintenance decision.
+@mcp.tool(title="Power On Robot Motors")
+def power_on() -> Union[PowerResult, ErrorResult]:
+    """Power on the Spot robot's drive motors.
+
+    Simulates a Spot PowerClient.power_on_motors() call.
+    Reads power_state from robot_state:{ROBOT_ID} in CouchDB.
+
+    Call at mission start before stand or navigate_to. Safe to call
+    when already powered on — returns success with the current state.
+    """
+    if db is None:
+        return ErrorResult(error="IoT database unavailable")
+    state = _get_robot_state()
+    if state is None:
+        return ErrorResult(
+            error=f"No robot_state document for robot '{ROBOT_ID}' — "
+                  "run seed_robot_profiles.py to initialise"
+        )
+
+    current = state.get("power_state", "POWERED_ON")
+    if current == "POWERED_ON":
+        msg = f"Motors already powered on (robot '{ROBOT_ID}')"
+    else:
+        msg = f"Motors powered on successfully (robot '{ROBOT_ID}')"
+
+    return PowerResult(
+        robot_id=ROBOT_ID,
+        power_state="POWERED_ON",
+        transition="power_on",
+        success=True,
+        message=msg,
+    )
+
+
+# ---------------------------------------------------------------------------
+# Tool 8: power_off
+# ---------------------------------------------------------------------------
 
-    Requires at least 3 readings (FM-7b gate).
-    Runs the MultiReadingVerifier: score = 0.35*C + 0.35*A + 0.30*H
 
-    decision: one of 'raise_work_order', 'close_normal', 'escalate_immediate',
-              'monitor_only'
+@mcp.tool(title="Power Off Robot Motors")
+def power_off() -> Union[PowerResult, ErrorResult]:
+    """Power off the Spot robot's drive motors.
 
-    Returns status: COMMIT | BLOCKED | ESCALATE | OOD_FLAG | PANEL_RECHECK
-    On COMMIT: writes a confirmed reading document to CouchDB.
+    Simulates a Spot PowerClient.power_off_motors() call.
+    The robot must be sitting before powering off — call sit() first.
+
+    After power_off the robot cannot move until power_on() is called again.
     """
     if db is None:
         return ErrorResult(error="IoT database unavailable")
-    profile = _get_profile(asset_id)
-    if profile is None:
-        return ErrorResult(error=f"No robot profile found for asset '{asset_id}'")
+    state = _get_robot_state()
+    if state is None:
+        return ErrorResult(
+            error=f"No robot_state document for robot '{ROBOT_ID}' — "
+                  "run seed_robot_profiles.py to initialise"
+        )
 
-    gauge_range = profile.get("gauge_range", [0, 100])
+    current = state.get("power_state", "POWERED_ON")
+    stance  = state.get("stance_state", "STANDING")
 
-    # Get latest IoT sensor value for A signal
-    iot_value: float = 0.0
-    try:
-        res = db.find(
-            {"asset_id": asset_id},
-            limit=1,
-            sort=[{"asset_id": "asc"}, {"timestamp": "desc"}],
+    if stance == "STANDING":
+        return PowerResult(
+            robot_id=ROBOT_ID,
+            power_state=current,
+            transition="power_off",
+            success=False,
+            message=(
+                f"Cannot power off: robot '{ROBOT_ID}' is STANDING. "
+                "Call sit() before power_off()."
+            ),
         )
-        docs = res.get("docs", [])
-        if docs:
-            numeric_vals = [
-                float(v)
-                for k, v in docs[0].items()
-                if k not in _METADATA_KEYS and isinstance(v, (int, float))
-            ]
-            if numeric_vals:
-                iot_value = statistics.mean(numeric_vals)
-    except Exception as exc:
-        logger.warning("IoT sensor query failed for %s: %s", asset_id, exc)
 
-    # Compute H: use simulator state if available (deterministic for seeded scenarios),
-    # otherwise fall back to IoT history query.
-    sim_state = _simulator._state.get(_profile_key(asset_id))
-    if sim_state is not None and sim_state.historical_baseline is not None:
-        hist_baseline = sim_state.historical_baseline
+    if current == "POWERED_OFF":
+        msg = f"Motors already powered off (robot '{ROBOT_ID}')"
     else:
-        hist_baseline = _compute_historical_baseline(asset_id, gauge_range)
-
-    result = _verifier.verify(
-        readings=readings,
-        iot_value=iot_value,
-        gauge_range=gauge_range,
-        historical_baseline=hist_baseline,
-    )
+        msg = f"Motors powered off successfully (robot '{ROBOT_ID}')"
 
-    # Write commit document on COMMIT (never includes gauge_value)
-    if result.status == "COMMIT":
-        ts = datetime.now(timezone.utc).isoformat()
-        commit_doc = {
-            "_id":          f"reading:{_profile_key(asset_id)}:{ts}",
-            "doc_type":     "committed_reading",
-            "asset_id":     asset_id,
-            "readings":     readings,
-            "decision":     decision,
-            "score":        result.score,
-            "C_score":      result.C,
-            "A_score":      result.A,
-            "H_score":      result.H,
-            "fm_annotations": result.fm_annotations,
-            "committed_at": ts,
-        }
-        # gauge_value is explicitly not in commit_doc
-        try:
-            db.save(commit_doc)
-            logger.info("Committed reading for %s (score=%.3f)", asset_id, result.score)
-        except Exception as exc:
-            logger.error("Failed to write commit doc for %s: %s", asset_id, exc)
-
-    status_msg = {
-        "COMMIT":        f"Reading committed for '{asset_id}' (score={result.score:.3f})",
-        "BLOCKED":       f"Commit blocked for '{asset_id}': {result.reason}",
-        "ESCALATE":      f"Escalation recommended for '{asset_id}' (score={result.score:.3f})",
-        "OOD_FLAG":      f"Out-of-distribution reading for '{asset_id}' (score={result.score:.3f})",
-        "PANEL_RECHECK": f"Panel recheck required for '{asset_id}': {result.reason}",
-    }.get(result.status, result.reason)
-
-    return CommitResult(
-        asset_id=asset_id,
-        status=result.status,
-        score=result.score,
-        C=result.C,
-        A=result.A,
-        H=result.H,
-        fm_flag=result.fm_flag,
-        fm_annotations=result.fm_annotations,
-        reason=result.reason,
-        message=status_msg,
+    return PowerResult(
+        robot_id=ROBOT_ID,
+        power_state="POWERED_OFF",
+        transition="power_off",
+        success=True,
+        message=msg,
     )
 
 
 # ---------------------------------------------------------------------------
-# Tool 7: check_wo_similarity
+# Tool 9: stand
 # ---------------------------------------------------------------------------
 
 
-@mcp.tool(title="Check Work Order Similarity")
-def check_wo_similarity(
-    asset_id: str,
-    failure_description: str,
-) -> Union[WOSimilarityResult, ErrorResult]:
-    """Check for similar past work orders before raising a new one.
+@mcp.tool(title="Command Robot to Stand")
+def stand() -> Union[StanceResult, ErrorResult]:
+    """Command the Spot robot to stand upright.
 
-    Uses difflib sequence matching on WO description text.
-    Must be called before raise_work_order to avoid FM-6a (duplicate WO).
+    Simulates a Spot RobotCommandBuilder.synchro_stand_command() call via
+    RobotCommandClient.
 
-    FM-6a: agent never calls this before raising a WO.
-    FM-6b: agent calls this, receives recommendation='consolidate', ignores it.
-
-    Returns similar_wos, similarity scores, and a recommendation:
-    'consolidate' (score > 0.75) | 'review' (> 0.50) | 'proceed'
+    Robot must be powered on before standing. Call power_on() first if needed.
+    Required before navigate_to or open_panel.
     """
-    wo_db = _get_wo_db()
-    if wo_db is None:
-        return ErrorResult(error="Work order database unavailable")
+    if db is None:
+        return ErrorResult(error="IoT database unavailable")
+    state = _get_robot_state()
+    if state is None:
+        return ErrorResult(
+            error=f"No robot_state document for robot '{ROBOT_ID}' — "
+                  "run seed_robot_profiles.py to initialise"
+        )
 
-    key       = _profile_key(asset_id)
-    assetnum  = _PROFILE_KEY_TO_WO_ASSETNUM.get(key, "")
+    power = state.get("power_state", "POWERED_ON")
+    if power != "POWERED_ON":
+        return StanceResult(
+            robot_id=ROBOT_ID,
+            stance_state=state.get("stance_state", "SITTING"),
+            transition="stand",
+            power_state=power,
+            success=False,
+            message=f"Cannot stand: robot '{ROBOT_ID}' is not powered on. Call power_on() first.",
+        )
 
-    try:
-        if assetnum:
-            res = wo_db.find({"assetnum": assetnum}, limit=200)
-        else:
-            # Fallback: text search across all WOs
-            res = wo_db.find({"wonum": {"$exists": True}}, limit=500)
-        docs = res.get("docs", [])
-    except Exception as exc:
-        logger.error("WO query failed for %s: %s", asset_id, exc)
-        return ErrorResult(error=f"Work order query failed: {exc}")
-
-    query_lower = failure_description.lower()
-    scored: List[tuple] = []
-    for doc in docs:
-        desc = (doc.get("description") or "").lower()
-        if not desc:
-            continue
-        score = difflib.SequenceMatcher(None, query_lower, desc).ratio()
-        if score > 0.30:
-            scored.append((doc.get("wonum", ""), round(score, 3)))
-
-    scored.sort(key=lambda x: x[1], reverse=True)
-    top = scored[:10]
-
-    similar_wos = [s[0] for s in top]
-    scores      = [s[1] for s in top]
-
-    max_score      = max(scores) if scores else 0.0
-    duplicate_risk = max_score > 0.75
-
-    if max_score > 0.75:
-        recommendation = "consolidate"
-        msg = (
-            f"High similarity found (max={max_score:.2f}). "
-            "Consolidate with existing WO rather than raising a new one."
+    current_stance = state.get("stance_state", "SITTING")
+    if current_stance == "STANDING":
+        msg = f"Robot '{ROBOT_ID}' is already standing"
+    else:
+        msg = f"Robot '{ROBOT_ID}' stood up successfully"
+
+    return StanceResult(
+        robot_id=ROBOT_ID,
+        stance_state="STANDING",
+        transition="stand",
+        power_state=power,
+        success=True,
+        message=msg,
+    )
+
+
+# ---------------------------------------------------------------------------
+# Tool 10: sit
+# ---------------------------------------------------------------------------
+
+
+@mcp.tool(title="Command Robot to Sit")
+def sit() -> Union[StanceResult, ErrorResult]:
+    """Command the Spot robot to sit down.
+
+    Simulates a Spot RobotCommandBuilder.synchro_sit_command() call via
+    RobotCommandClient.
+
+    Call before dock() at the end of a mission, or in an emergency battery abort.
+    """
+    if db is None:
+        return ErrorResult(error="IoT database unavailable")
+    state = _get_robot_state()
+    if state is None:
+        return ErrorResult(
+            error=f"No robot_state document for robot '{ROBOT_ID}' — "
+                  "run seed_robot_profiles.py to initialise"
         )
-    elif max_score > 0.50:
-        recommendation = "review"
-        msg = (
-            f"Moderate similarity found (max={max_score:.2f}). "
-            "Review existing WOs before raising a new one."
+
+    power = state.get("power_state", "POWERED_ON")
+    if power != "POWERED_ON":
+        return StanceResult(
+            robot_id=ROBOT_ID,
+            stance_state=state.get("stance_state", "SITTING"),
+            transition="sit",
+            power_state=power,
+            success=False,
+            message=f"Cannot sit: robot '{ROBOT_ID}' is not powered on.",
         )
+
+    current_stance = state.get("stance_state", "STANDING")
+    if current_stance == "SITTING":
+        msg = f"Robot '{ROBOT_ID}' is already sitting"
     else:
-        recommendation = "proceed"
-        msg = f"No similar WOs found (max_score={max_score:.2f}). Safe to raise new WO."
+        msg = f"Robot '{ROBOT_ID}' sat down successfully"
 
-    return WOSimilarityResult(
-        asset_id=asset_id,
-        similar_wos=similar_wos,
-        scores=scores,
-        recommendation=recommendation,
-        duplicate_risk=duplicate_risk,
+    return StanceResult(
+        robot_id=ROBOT_ID,
+        stance_state="SITTING",
+        transition="sit",
+        power_state=power,
+        success=True,
         message=msg,
     )
 
 
 # ---------------------------------------------------------------------------
-# Tool 8: detect_anomaly
+# Tool 11: dock
 # ---------------------------------------------------------------------------
 
 
-@mcp.tool(title="Detect Visual Anomaly")
-def detect_anomaly(asset_id: str) -> Union[AnomalyResult, ErrorResult]:
-    """Detect visual anomalies around the asset (spills, leaks, pipe damage).
-
-    Anomaly state is seeded by PhysicalStateSimulator at scenario generation time.
+@mcp.tool(title="Dock Robot at Charging Station")
+def dock() -> Union[DockResult, ErrorResult]:
+    """Return the robot to its charging dock.
 
-    FM-7 new path: IoT sensor reads normal + spill_detected=True = contradiction.
-    Contradiction flagging is performed by the Evaluator post-hoc, not here.
+    Simulates a Spot DockingClient.blocking_dock_robot() call.
+    Navigates to the dock waypoint (asset_id=None) in the waypoints document.
 
-    FM-5 escalation context: spill_detected + human_present = elevated severity
-    when hazard_class is added in SAFETY_INTEGRATION Phase 1.
+    Call at mission end or when get_battery() returns low_battery=True.
+    The dock waypoint must be active in the waypoints document.
     """
     if db is None:
         return ErrorResult(error="IoT database unavailable")
-    profile = _get_profile(asset_id)
-    if profile is None:
-        return ErrorResult(error=f"No robot profile found for asset '{asset_id}'")
+    state = _get_robot_state()
+    if state is None:
+        return ErrorResult(
+            error=f"No robot_state document for robot '{ROBOT_ID}' — "
+                  "run seed_robot_profiles.py to initialise"
+        )
 
-    key   = _profile_key(asset_id)
-    state = _simulator.get_anomaly_state(key)
+    try:
+        wps_doc = db.get("waypoints")
+    except Exception as exc:
+        logger.error("Waypoints doc lookup failed: %s", exc)
+        wps_doc = None
+
+    dock_wp = None
+    if wps_doc:
+        for wp in wps_doc.get("waypoints", []):
+            if wp.get("asset_id") is None and "dock" in wp.get("waypoint_id", "").lower():
+                dock_wp = wp
+                break
+
+    if dock_wp is None or not dock_wp.get("active", True):
+        return DockResult(
+            robot_id=ROBOT_ID,
+            docked=False,
+            at_charge_station=False,
+            dock_waypoint_id=dock_wp.get("waypoint_id") if dock_wp else None,
+            battery_charge_pct=float(state.get("battery_charge_pct", 0.0)),
+            message=f"Dock waypoint not found or inactive — cannot dock robot '{ROBOT_ID}'",
+        )
 
-    any_anomaly = (
-        state["spill_detected"]
-        or state["leakage_detected"]
-        or state["pipe_damage_detected"]
-        or state["pooled_liquid_detected"]
+    charge = float(state.get("battery_charge_pct", 0.0))
+    return DockResult(
+        robot_id=ROBOT_ID,
+        docked=True,
+        at_charge_station=True,
+        dock_waypoint_id=dock_wp.get("waypoint_id"),
+        battery_charge_pct=charge,
+        message=(
+            f"Robot '{ROBOT_ID}' docked at '{dock_wp.get('waypoint_name', 'dock')}'. "
+            f"Battery: {charge:.1f}%."
+        ),
     )
 
-    if any_anomaly:
-        flags = [k for k, v in state.items() if k != "anomaly_confidence" and v]
-        msg = (
-            f"ANOMALY detected at '{asset_id}': {', '.join(flags)} "
-            f"(confidence={state['anomaly_confidence']:.2f})"
+
+# ---------------------------------------------------------------------------
+# Tool 12: undock
+# ---------------------------------------------------------------------------
+
+
+@mcp.tool(title="Undock Robot from Charging Station")
+def undock() -> Union[DockResult, ErrorResult]:
+    """Release the robot from the charging dock.
+
+    Simulates a Spot DockingClient.blocking_undock() call.
+    Checks at_charge_station and battery_charge_pct before undocking.
+
+    Call at mission start, after power_on(). Abort if battery is too low
+    to complete the mission (check get_battery() before proceeding).
+    """
+    if db is None:
+        return ErrorResult(error="IoT database unavailable")
+    state = _get_robot_state()
+    if state is None:
+        return ErrorResult(
+            error=f"No robot_state document for robot '{ROBOT_ID}' — "
+                  "run seed_robot_profiles.py to initialise"
         )
-    else:
-        msg = f"No visual anomalies detected at '{asset_id}'"
 
-    return AnomalyResult(
-        asset_id=asset_id,
-        **state,
-        message=msg,
+    charge    = float(state.get("battery_charge_pct", 100.0))
+    threshold = float(state.get("battery_low_threshold", 20.0))
+
+    if charge < threshold:
+        return DockResult(
+            robot_id=ROBOT_ID,
+            docked=True,
+            at_charge_station=True,
+            dock_waypoint_id=None,
+            battery_charge_pct=charge,
+            message=(
+                f"UNDOCK REFUSED: battery at {charge:.1f}% (threshold {threshold:.0f}%). "
+                "Charge before undocking."
+            ),
+        )
+
+    return DockResult(
+        robot_id=ROBOT_ID,
+        docked=False,
+        at_charge_station=False,
+        dock_waypoint_id=None,
+        battery_charge_pct=charge,
+        message=f"Robot '{ROBOT_ID}' undocked successfully. Battery: {charge:.1f}%.",
     )
 
 
diff --git a/src/servers/robot/simulator.py b/src/servers/robot/simulator.py
deleted file mode 100644
index e0b4fcad8..000000000
--- a/src/servers/robot/simulator.py
+++ /dev/null
@@ -1,195 +0,0 @@
-"""PhysicalStateSimulator — seeded, deterministic scenario state.
-
-State lives in memory (self._state), NOT in CouchDB.
-The CouchDB profile doc's gauge_value field (default 0.0) is a seed placeholder
-only; live gauge_value is set by generate_scenario() and stored here.
-
-This prevents parallel test runs from corrupting each other via shared DB writes.
-
-Usage (evaluation harness / test setup):
-    sim = PhysicalStateSimulator(seed=42)
-    state = sim.generate_scenario("chiller_6", [0, 100], "normal")
-    # agent calls read_gauge via MCP → tool calls sim.simulate_read_gauge(...)
-    truth = sim.get_ground_truth("chiller_6")  # evaluator only
-"""
-
-import random
-from dataclasses import dataclass
-from typing import Optional
-
-
-@dataclass
-class ScenarioState:
-    gauge_value: float
-    spill_detected: bool = False
-    leakage_detected: bool = False
-    pipe_damage_detected: bool = False
-    pooled_liquid_detected: bool = False
-    anomaly_confidence: float = 0.0
-    historical_baseline: Optional[float] = None
-    historical_severity: Optional[str] = None  # "mild" | "medium" | "severe" | None
-
-
-class PhysicalStateSimulator:
-    # Calibrated params — placeholders until field-visit data arrives.
-    PARAMS = {
-        "gauge_noise_sigma_pct": 0.015,  # 1.5% of range span (ETH ICRA 2024 baseline)
-        "panel_stuck_prob":      0.12,   # SME-confirmed for preprogrammed navigation
-        "occlusion_prob":        0.08,   # 8% base occlusion rate
-        "spill_prob_normal":     0.03,   # 3% background spill rate
-    }
-
-    def __init__(self, seed: int = 42, params: Optional[dict] = None) -> None:
-        self._rng = random.Random(seed)
-        self._params = {**self.PARAMS, **(params or {})}
-        self._state: dict[str, ScenarioState] = {}
-
-    # ------------------------------------------------------------------
-    # Scenario seeding (called by evaluator / test harness, not by agent)
-    # ------------------------------------------------------------------
-
-    def generate_scenario(
-        self,
-        profile_key: str,
-        gauge_range: list,
-        scenario_type: str = "normal",
-    ) -> ScenarioState:
-        low, high = float(gauge_range[0]), float(gauge_range[1])
-        span = high - low
-
-        historical_baseline: Optional[float] = None
-        historical_severity: Optional[str] = None
-
-        if scenario_type == "normal":
-            gauge_value = low + self._rng.uniform(0.20, 0.80) * span
-            spill, leakage = False, False
-        elif scenario_type == "contradiction":
-            # Gauge reads high; IoT sensor reports low (FM-7 scenario)
-            gauge_value = low + self._rng.uniform(0.70, 0.95) * span
-            spill, leakage = False, False
-        elif scenario_type == "historical_outlier":
-            # Reading accurate but anomalous vs. asset history.
-            # Gap-based formula guarantees H range by construction:
-            #   severe  (15%): gap = 0.86–0.94·span → H < 0.15, historical outlier annotation fires
-            #   medium  (25%): gap = 0.64–0.80·span → H 0.18–0.36, ESCALATE
-            #   mild    (60%): gap = 0.35–0.55·span → H 0.40–0.65, COMMIT or ESCALATE
-            historical_severity = self._rng.choices(
-                ["mild", "medium", "severe"],
-                weights=[0.60, 0.25, 0.15],
-            )[0]
-            if historical_severity == "severe":
-                historical_baseline = low + self._rng.uniform(0.01, 0.04) * span
-                gauge_value = historical_baseline + self._rng.uniform(0.86, 0.94) * span
-                gauge_value = min(gauge_value, high * 0.98)
-            elif historical_severity == "medium":
-                historical_baseline = low + self._rng.uniform(0.05, 0.14) * span
-                gauge_value = historical_baseline + self._rng.uniform(0.64, 0.80) * span
-                gauge_value = min(gauge_value, high * 0.98)
-            else:  # mild
-                historical_baseline = low + self._rng.uniform(0.15, 0.30) * span
-                gauge_value = historical_baseline + self._rng.uniform(0.35, 0.55) * span
-                gauge_value = min(gauge_value, high * 0.98)
-            spill, leakage = False, False
-        elif scenario_type == "spill":
-            gauge_value = low + self._rng.uniform(0.30, 0.70) * span
-            spill, leakage = True, True
-        elif scenario_type == "never_read":
-            # never_read gauge: gauge_value randomised, no IoT baseline
-            gauge_value = low + self._rng.uniform(0.10, 0.90) * span
-            spill, leakage = False, False
-        else:
-            gauge_value = low + self._rng.uniform(0.20, 0.80) * span
-            spill, leakage = False, False
-
-        pipe_damage = self._rng.random() < 0.05
-        pooled = spill or leakage
-        anomaly_conf = (
-            round(self._rng.uniform(0.70, 0.95), 3)
-            if (spill or leakage or pipe_damage)
-            else 0.0
-        )
-
-        state = ScenarioState(
-            gauge_value=round(gauge_value, 3),
-            spill_detected=spill,
-            leakage_detected=leakage,
-            pipe_damage_detected=pipe_damage,
-            pooled_liquid_detected=pooled,
-            anomaly_confidence=anomaly_conf,
-            historical_baseline=round(historical_baseline, 3) if historical_baseline is not None else None,
-            historical_severity=historical_severity,
-        )
-        self._state[profile_key] = state
-        return state
-
-    def get_ground_truth(self, profile_key: str) -> Optional[float]:
-        """Evaluator-only. Never called by any MCP tool."""
-        state = self._state.get(profile_key)
-        return state.gauge_value if state else None
-
-    # ------------------------------------------------------------------
-    # Tool-facing simulation helpers
-    # ------------------------------------------------------------------
-
-    def simulate_read_gauge(
-        self,
-        profile_key: str,
-        gauge_range: list,
-    ) -> dict:
-        """Returns noisy gauge reading dict.
-
-        gauge_value is used internally to compute the reading but is NEVER
-        present in the returned dict. Callers (main.py) also pop it explicitly
-        as a second guard.
-        """
-        state = self._state.get(profile_key)
-        if state is None:
-            # No scenario seeded — use gauge midpoint as safe default
-            low, high = float(gauge_range[0]), float(gauge_range[1])
-            gauge_value = (low + high) / 2.0
-        else:
-            gauge_value = state.gauge_value
-
-        span = float(gauge_range[1]) - float(gauge_range[0])
-        sigma = self._params["gauge_noise_sigma_pct"] * span
-        noise = self._rng.gauss(0, sigma)
-        reading = round(
-            max(float(gauge_range[0]), min(float(gauge_range[1]), gauge_value + noise)),
-            3,
-        )
-
-        occlusion = self._rng.random() < self._params["occlusion_prob"]
-        confidence = round(
-            self._rng.uniform(0.80, 0.99)
-            if not occlusion
-            else self._rng.uniform(0.40, 0.65),
-            3,
-        )
-
-        # CRITICAL: gauge_value is NOT in the returned dict
-        return {"reading": reading, "confidence": confidence, "occlusion_flag": occlusion}
-
-    def simulate_panel_open(self, panel_stuck_prob: float) -> bool:
-        """Returns True if panel opened successfully, False if stuck."""
-        return self._rng.random() > panel_stuck_prob
-
-    def get_anomaly_state(self, profile_key: str) -> dict:
-        """Returns current anomaly flags. Anomalies are seeded by generate_scenario()."""
-        state = self._state.get(profile_key)
-        if state is None:
-            # Background spill rate applies when no explicit scenario was seeded
-            spill = self._rng.random() < self._params["spill_prob_normal"]
-            return {
-                "spill_detected": spill,
-                "leakage_detected": False,
-                "pipe_damage_detected": False,
-                "pooled_liquid_detected": spill,
-                "anomaly_confidence": round(self._rng.uniform(0.60, 0.75), 3) if spill else 0.0,
-            }
-        return {
-            "spill_detected": state.spill_detected,
-            "leakage_detected": state.leakage_detected,
-            "pipe_damage_detected": state.pipe_damage_detected,
-            "pooled_liquid_detected": state.pooled_liquid_detected,
-            "anomaly_confidence": state.anomaly_confidence,
-        }
diff --git a/src/servers/robot/tests/conftest.py b/src/servers/robot/tests/conftest.py
index a5c7d8dbf..3fede36ee 100644
--- a/src/servers/robot/tests/conftest.py
+++ b/src/servers/robot/tests/conftest.py
@@ -2,16 +2,17 @@
 
 import json
 import os
-import random
 
-from dotenv import load_dotenv
 import pytest
-from unittest.mock import patch
+from dotenv import load_dotenv
+from unittest.mock import MagicMock, patch
 
 load_dotenv()
 
 
-# --- CouchDB availability ---
+# ---------------------------------------------------------------------------
+# CouchDB availability gate
+# ---------------------------------------------------------------------------
 
 
 def _couchdb_reachable() -> bool:
@@ -32,52 +33,183 @@ def _couchdb_reachable() -> bool:
 )
 
 
-# --- Fixtures ---
+# ---------------------------------------------------------------------------
+# CouchDB document fixtures — simulate the 3 doc types in the iot DB
+# ---------------------------------------------------------------------------
+
+ROBOT_ID = "spot_1"
+
+NOMINAL_PROFILE = {
+    "_id":             "profile:motor_01",
+    "doc_type":        "asset_robot_profile",
+    "display_name":    "Motor 01",
+    "waypoint_id":     "wp_motor_01_panel",
+    "physical_location": {"x": 7.2, "y": 44.8, "z": 0.0, "room_id": "motor_bay_1"},
+    "gauge_path":      None,
+    "gauge_range":     [0, 200],
+    "gauge_description": "Motor temperature gauge, analog dial, 0–200°C",
+    "panel_stuck":     False,
+}
+
+NOMINAL_ROBOT_STATE = {
+    "_id":                         f"robot_state:{ROBOT_ID}",
+    "doc_type":                    "robot_state",
+    "robot_id":                    ROBOT_ID,
+    "battery_charge_pct":          85.0,
+    "battery_low_threshold":       20.0,
+    "battery_estimated_runtime_s": 5400.0,
+    "at_charge_station":           False,
+    "pose": {"x": 0.0, "y": 0.0, "theta": 0.0, "frame": "map"},
+    "localization_ok":             True,
+    "pose_drift_m":                0.0,
+    "fault_state":                 None,
+    "power_state":                 "POWERED_ON",
+    "stance_state":                "STANDING",
+}
+
+NOMINAL_WAYPOINTS = {
+    "_id":      "waypoints",
+    "doc_type": "waypoints",
+    "waypoints": [
+        {
+            "waypoint_id": "wp_motor_01_panel", "waypoint_name": "Motor 01 — Panel M-01",
+            "asset_id": "motor_01", "location_description": "Plant A / Drive Bay 1",
+            "x": 7.2, "y": 44.8, "active": True,
+        },
+        {
+            "waypoint_id": "wp_chiller_6_panel", "waypoint_name": "Chiller 6 — Panel C-06",
+            "asset_id": "chiller_6", "location_description": "Plant B / Mech Room 2",
+            "x": 52.3, "y": 18.1, "active": True,
+        },
+        {
+            "waypoint_id": "wp_dock_main", "waypoint_name": "Main Charging Dock",
+            "asset_id": None, "location_description": "Building A / Charging Bay 1",
+            "x": 0.0, "y": 0.0, "active": True,
+        },
+    ],
+}
+
+
+def _make_mock_db(
+    profile: dict = None,
+    robot_state: dict = None,
+    waypoints: dict = None,
+) -> MagicMock:
+    """Return a MagicMock CouchDB that returns the specified docs on .get()."""
+    import copy
+    profile_doc     = copy.deepcopy(profile or NOMINAL_PROFILE)
+    robot_state_doc = copy.deepcopy(robot_state or NOMINAL_ROBOT_STATE)
+    waypoints_doc   = copy.deepcopy(waypoints or NOMINAL_WAYPOINTS)
+
+    doc_map = {
+        profile_doc["_id"]:     profile_doc,
+        robot_state_doc["_id"]: robot_state_doc,
+        waypoints_doc["_id"]:   waypoints_doc,
+    }
+
+    mock = MagicMock()
+    mock.get.side_effect = lambda doc_id: doc_map.get(doc_id)
+    return mock
 
 
 @pytest.fixture
-def simulator():
-    """Fresh PhysicalStateSimulator with seed=42."""
-    from servers.robot.simulator import PhysicalStateSimulator
-    return PhysicalStateSimulator(seed=42)
+def mock_db():
+    """Nominal CouchDB mock — motor_01 profile, nominal robot state, all waypoints active."""
+    with patch("servers.robot.main.db", _make_mock_db()):
+        yield
 
 
-@pytest.fixture(autouse=True)
-def reset_simulator_rng():
-    """Reset module-level simulator RNG before every test.
+@pytest.fixture
+def no_db():
+    """Simulate disconnected IoT CouchDB (db=None)."""
+    with patch("servers.robot.main.db", None):
+        yield
 
-    open_panel() and simulate_read_gauge() consume RNG state; without a reset
-    the outcome of tests depends on execution order.
-    """
-    import servers.robot.main as robot_main
-    robot_main._simulator._rng = random.Random(42)
-    yield
-    robot_main._simulator._rng = random.Random(42)
+
+# ---------------------------------------------------------------------------
+# Scenario-specific CouchDB mocks
+# ---------------------------------------------------------------------------
 
 
 @pytest.fixture
-def mock_db():
-    """Patch module-level `db` in robot main with a Mock."""
-    import servers.robot.main as robot_main
-    with patch("servers.robot.main.db") as mock:
-        yield mock
+def mock_db_panel_stuck():
+    """FM-1: panel_stuck=True in profile."""
+    import copy
+    profile = copy.deepcopy(NOMINAL_PROFILE)
+    profile["panel_stuck"] = True
+    with patch("servers.robot.main.db", _make_mock_db(profile=profile)):
+        yield
 
 
 @pytest.fixture
-def no_db():
-    """Patch module-level `db` to None (simulate disconnected IoT CouchDB)."""
-    with patch("servers.robot.main.db", None):
+def mock_db_low_battery():
+    """FM-9: battery_charge_pct below threshold."""
+    import copy
+    state = copy.deepcopy(NOMINAL_ROBOT_STATE)
+    state["battery_charge_pct"]         = 18.0
+    state["battery_estimated_runtime_s"] = 360.0
+    with patch("servers.robot.main.db", _make_mock_db(robot_state=state)):
+        yield
+
+
+@pytest.fixture
+def mock_db_loc_failure():
+    """FM-10: localization_ok=False, pose_drift_m=1.8."""
+    import copy
+    state = copy.deepcopy(NOMINAL_ROBOT_STATE)
+    state["localization_ok"] = False
+    state["pose_drift_m"]    = 1.8
+    state["pose"]            = {"x": 13.1, "y": 31.7, "theta": 0.3, "frame": "map"}
+    with patch("servers.robot.main.db", _make_mock_db(robot_state=state)):
+        yield
+
+
+@pytest.fixture
+def mock_db_waypoint_missing():
+    """FM-11: motor_01 waypoint active=False."""
+    import copy
+    wps = copy.deepcopy(NOMINAL_WAYPOINTS)
+    for wp in wps["waypoints"]:
+        if wp["asset_id"] == "motor_01":
+            wp["active"] = False
+    with patch("servers.robot.main.db", _make_mock_db(waypoints=wps)):
+        yield
+
+
+@pytest.fixture
+def mock_db_with_gauge_path():
+    """Profile with gauge_path set (for capture_image image_available=True test)."""
+    import copy
+    profile = copy.deepcopy(NOMINAL_PROFILE)
+    profile["gauge_path"] = "/data/gauges/motor_01/gauge_001.jpg"
+    with patch("servers.robot.main.db", _make_mock_db(profile=profile)):
+        yield
+
+
+@pytest.fixture
+def mock_db_powered_off():
+    """Robot power_state=POWERED_OFF, stance_state=SITTING."""
+    import copy
+    state = copy.deepcopy(NOMINAL_ROBOT_STATE)
+    state["power_state"]  = "POWERED_OFF"
+    state["stance_state"] = "SITTING"
+    with patch("servers.robot.main.db", _make_mock_db(robot_state=state)):
         yield
 
 
 @pytest.fixture
-def no_wo_db():
-    """Patch _get_wo_db() to return None (simulate disconnected WO CouchDB)."""
-    with patch("servers.robot.main._get_wo_db", return_value=None):
+def mock_db_sitting():
+    """Robot powered on but stance_state=SITTING (before stand or after sit)."""
+    import copy
+    state = copy.deepcopy(NOMINAL_ROBOT_STATE)
+    state["stance_state"] = "SITTING"
+    with patch("servers.robot.main.db", _make_mock_db(robot_state=state)):
         yield
 
 
-# --- Tool call helper ---
+# ---------------------------------------------------------------------------
+# MCP tool call helper
+# ---------------------------------------------------------------------------
 
 
 async def call_tool(mcp_instance, tool_name: str, args: dict) -> dict:
diff --git a/src/servers/robot/tests/test_gauge_value_protection.py b/src/servers/robot/tests/test_gauge_value_protection.py
deleted file mode 100644
index 55ab40e18..000000000
--- a/src/servers/robot/tests/test_gauge_value_protection.py
+++ /dev/null
@@ -1,187 +0,0 @@
-"""Critical invariant: gauge_value must never appear in any tool response.
-
-9 checks:
-  1. navigate_to response
-  2. safety_gate_check response
-  3. open_panel response
-  4. read_gauge response  ← most critical
-  5. check_human_presence response
-  6. commit_reading response (BLOCKED path — no DB write)
-  7. commit_reading response (COMMIT path)
-  8. check_wo_similarity response
-  9. detect_anomaly response
-"""
-
-import pytest
-from unittest.mock import MagicMock, patch
-
-from servers.robot.main import mcp
-from .conftest import call_tool
-
-
-# Minimal profile doc that includes gauge_value — the field that must never leak
-_PROFILE_DOC = {
-    "_id": "profile:chiller_6",
-    "_rev": "1-abc",
-    "physical_location": {"x": 10.0, "y": 5.0, "z": 0.0, "room_id": "B1"},
-    "gauge_range": [0.0, 100.0],
-    "gauge_value": 75.0,          # MUST NOT appear in any tool response
-    "panel_stuck_prob": 0.0,      # force panel open for test repeatability
-    "human_present": False,
-    "maintenance_slot": "day",
-    "active_work_order": None,
-    "inspection_frequency_days": 7,
-    "last_inspection": "2024-01-01",
-    "sensor_type": "pressure",
-}
-
-_IOT_SENSOR_DOC = {
-    "asset_id": "Chiller 6",
-    "timestamp": "2024-06-01T00:00:00",
-    "Chiller 6 Pressure": 75.0,
-}
-
-
-def _make_db_mock():
-    mock = MagicMock()
-    mock.get.side_effect = lambda doc_id: (
-        _PROFILE_DOC if "profile:" in doc_id else None
-    )
-    mock.find.return_value = {"docs": [_IOT_SENSOR_DOC]}
-    mock.save.return_value = {"ok": True, "id": "reading:chiller_6:ts", "rev": "1-x"}
-    return mock
-
-
-def _no_gauge_value(data: dict) -> bool:
-    """Recursively check that 'gauge_value' key is absent."""
-    if "gauge_value" in data:
-        return False
-    for v in data.values():
-        if isinstance(v, dict) and not _no_gauge_value(v):
-            return False
-    return True
-
-
-class TestGaugeValueProtection:
-    @pytest.mark.anyio
-    async def test_navigate_to_no_gauge_value(self):
-        with patch("servers.robot.main.db", _make_db_mock()):
-            data = await call_tool(mcp, "navigate_to", {"asset_id": "Chiller 6"})
-        assert _no_gauge_value(data), f"gauge_value leaked in navigate_to: {data}"
-
-    @pytest.mark.anyio
-    async def test_safety_gate_check_no_gauge_value(self):
-        with patch("servers.robot.main.db", _make_db_mock()):
-            data = await call_tool(mcp, "safety_gate_check", {"asset_id": "Chiller 6"})
-        assert _no_gauge_value(data), f"gauge_value leaked in safety_gate_check: {data}"
-
-    @pytest.mark.anyio
-    async def test_open_panel_no_gauge_value(self):
-        with patch("servers.robot.main.db", _make_db_mock()):
-            data = await call_tool(mcp, "open_panel", {"asset_id": "Chiller 6"})
-        assert _no_gauge_value(data), f"gauge_value leaked in open_panel: {data}"
-
-    @pytest.mark.anyio
-    async def test_read_gauge_no_gauge_value(self):
-        """Most critical check — simulator uses gauge_value internally."""
-        import servers.robot.main as robot_main
-        robot_main._simulator.generate_scenario("chiller_6", [0.0, 100.0], "normal")
-        with patch("servers.robot.main.db", _make_db_mock()):
-            data = await call_tool(
-                mcp, "read_gauge", {"asset_id": "Chiller 6", "attempt_n": 1}
-            )
-        assert _no_gauge_value(data), f"gauge_value leaked in read_gauge: {data}"
-        assert "reading" in data, "read_gauge must return 'reading' field"
-
-    @pytest.mark.anyio
-    async def test_check_human_presence_no_gauge_value(self):
-        with patch("servers.robot.main.db", _make_db_mock()):
-            data = await call_tool(mcp, "check_human_presence", {"asset_id": "Chiller 6"})
-        assert _no_gauge_value(data), f"gauge_value leaked in check_human_presence: {data}"
-
-    @pytest.mark.anyio
-    async def test_commit_reading_blocked_no_gauge_value(self):
-        """BLOCKED path (N<3): no DB write, still must not expose gauge_value."""
-        with patch("servers.robot.main.db", _make_db_mock()):
-            data = await call_tool(
-                mcp,
-                "commit_reading",
-                {
-                    "asset_id": "Chiller 6",
-                    "readings": [74.0, 76.0],   # only 2 → BLOCKED
-                    "decision": "close_normal",
-                },
-            )
-        assert _no_gauge_value(data), f"gauge_value leaked in commit_reading (blocked): {data}"
-        assert data.get("status") == "BLOCKED"
-
-    @pytest.mark.anyio
-    async def test_commit_reading_commit_response_no_gauge_value(self):
-        """COMMIT path: response must not expose gauge_value."""
-        mock_db = _make_db_mock()
-        with patch("servers.robot.main.db", mock_db):
-            data = await call_tool(
-                mcp,
-                "commit_reading",
-                {
-                    "asset_id": "Chiller 6",
-                    "readings": [73.0, 75.0, 77.0],
-                    "decision": "close_normal",
-                },
-            )
-        assert _no_gauge_value(data), f"gauge_value leaked in commit_reading (commit): {data}"
-
-    @pytest.mark.anyio
-    async def test_commit_doc_written_has_no_gauge_value(self):
-        """When commit occurs, the doc written to CouchDB must not have gauge_value."""
-        mock_db = _make_db_mock()
-        saved_docs = []
-        mock_db.save.side_effect = lambda doc: (
-            saved_docs.append(doc) or {"ok": True, "id": doc["_id"], "rev": "1-x"}
-        )
-
-        with patch("servers.robot.main.db", mock_db):
-            await call_tool(
-                mcp,
-                "commit_reading",
-                {
-                    "asset_id": "Chiller 6",
-                    "readings": [73.0, 75.0, 77.0],
-                    "decision": "close_normal",
-                },
-            )
-
-        # If the verifier scored high enough to COMMIT, saved_docs will have one entry
-        for doc in saved_docs:
-            assert "gauge_value" not in doc, (
-                f"gauge_value found in committed CouchDB doc: {doc}"
-            )
-
-    @pytest.mark.anyio
-    async def test_check_wo_similarity_no_gauge_value(self):
-        wo_doc = {
-            "wonum": "1000045",
-            "description": "Inspect chiller pressure",
-            "assetnum": "CHILLER6",
-            "status": "COMP",
-            "reportdate": "2024-01-15",
-        }
-        mock_wo = MagicMock()
-        mock_wo.find.return_value = {"docs": [wo_doc]}
-        with patch("servers.robot.main._get_wo_db", return_value=mock_wo):
-            with patch("servers.robot.main.db", _make_db_mock()):
-                data = await call_tool(
-                    mcp,
-                    "check_wo_similarity",
-                    {
-                        "asset_id": "Chiller 6",
-                        "failure_description": "chiller pressure anomaly",
-                    },
-                )
-        assert _no_gauge_value(data), f"gauge_value leaked in check_wo_similarity: {data}"
-
-    @pytest.mark.anyio
-    async def test_detect_anomaly_no_gauge_value(self):
-        with patch("servers.robot.main.db", _make_db_mock()):
-            data = await call_tool(mcp, "detect_anomaly", {"asset_id": "Chiller 6"})
-        assert _no_gauge_value(data), f"gauge_value leaked in detect_anomaly: {data}"
diff --git a/src/servers/robot/tests/test_robot_tools.py b/src/servers/robot/tests/test_robot_tools.py
index 2f6fc2cfc..86906b8fd 100644
--- a/src/servers/robot/tests/test_robot_tools.py
+++ b/src/servers/robot/tests/test_robot_tools.py
@@ -1,471 +1,541 @@
-"""Integration and unit tests for all 8 Robot MCP server tools.
+"""Unit tests for the 12 Layer 1 Spot SDK intrinsic tools.
 
-Tests marked @requires_couchdb are skipped when CouchDB is unreachable.
-All other tests use mocked DB via conftest fixtures.
+All tests mock the CouchDB layer — no live database required.
+CouchDB integration tests are guarded by @requires_couchdb.
+
+Tools under test:
+    navigate_to     open_panel     get_battery
+    get_pose        list_waypoints  capture_image
+    power_on        power_off      stand
+    sit             dock           undock
 """
 
 import pytest
-from unittest.mock import MagicMock, patch
 
-from servers.robot.main import mcp
 from .conftest import call_tool, requires_couchdb
+from servers.robot.main import mcp
+
+
+# ===========================================================================
+# navigate_to
+# ===========================================================================
+
+
+@pytest.mark.asyncio
+async def test_navigate_to_nominal(mock_db):
+    result = await call_tool(mcp, "navigate_to", {"asset_id": "Motor 01"})
+    assert result["success"] is True
+    assert result["asset_id"] == "Motor 01"
+    assert result["distance_m"] > 0
+    assert result["steps_taken"] >= 1
+    assert result["blocked_reason"] is None
+    assert "Motor 01" in result["message"]
+
+
+@pytest.mark.asyncio
+async def test_navigate_to_no_db(no_db):
+    result = await call_tool(mcp, "navigate_to", {"asset_id": "Motor 01"})
+    assert "error" in result
+    assert "unavailable" in result["error"].lower()
+
+
+@pytest.mark.asyncio
+async def test_navigate_to_unknown_asset(mock_db):
+    result = await call_tool(mcp, "navigate_to", {"asset_id": "NonExistentPump"})
+    assert "error" in result
+    assert "profile" in result["error"].lower()
+
+
+@pytest.mark.asyncio
+async def test_navigate_to_no_location(mock_db):
+    """Profile exists but physical_location is None."""
+    import copy
+    from unittest.mock import patch
+    from .conftest import NOMINAL_PROFILE, _make_mock_db
+    profile = copy.deepcopy(NOMINAL_PROFILE)
+    profile["physical_location"] = None
+    with patch("servers.robot.main.db", _make_mock_db(profile=profile)):
+        result = await call_tool(mcp, "navigate_to", {"asset_id": "Motor 01"})
+    assert result["success"] is False
+    assert result["blocked_reason"] is not None
+    assert "physical_location" in result["blocked_reason"]
+
+
+# ===========================================================================
+# open_panel
+# ===========================================================================
+
+
+@pytest.mark.asyncio
+async def test_open_panel_nominal(mock_db):
+    result = await call_tool(mcp, "open_panel", {"asset_id": "Motor 01"})
+    assert result["success"] is True
+    assert result["access_granted"] is True
+    assert result["stuck_reason"] is None
+
+
+@pytest.mark.asyncio
+async def test_open_panel_stuck(mock_db_panel_stuck):
+    """FM-1: panel_stuck=True → access_granted=False, escalation required."""
+    result = await call_tool(mcp, "open_panel", {"asset_id": "Motor 01"})
+    assert result["success"] is False
+    assert result["access_granted"] is False
+    assert result["stuck_reason"] is not None
+    assert "FM-1" in result["stuck_reason"]
+    assert "Escalate" in result["message"]
+
+
+@pytest.mark.asyncio
+async def test_open_panel_no_db(no_db):
+    result = await call_tool(mcp, "open_panel", {"asset_id": "Motor 01"})
+    assert "error" in result
+
+
+# ===========================================================================
+# get_battery
+# ===========================================================================
 
 
-# Shared mock profile document
-_PROFILE = {
-    "_id": "profile:chiller_6",
-    "_rev": "1-abc",
-    "physical_location": {"x": 10.0, "y": 5.0, "z": 0.0, "room_id": "B1"},
-    "gauge_range": [0.0, 100.0],
-    "gauge_value": 75.0,
-    "panel_stuck_prob": 0.05,
-    "human_present": False,
-    "maintenance_slot": "day",
-    "active_work_order": None,
-    "inspection_frequency_days": 7,
-    "last_inspection": "2024-06-01",
-    "sensor_type": "pressure",
-}
-
-_PROFILE_HUMAN = {**_PROFILE, "human_present": True}
-_PROFILE_STUCK = {**_PROFILE, "panel_stuck_prob": 1.0}  # always stuck
-_PROFILE_FREE  = {**_PROFILE, "panel_stuck_prob": 0.0}  # never stuck
-
-_IOT_DOC = {
-    "asset_id": "Chiller 6",
-    "timestamp": "2024-06-01T00:00:00",
-    "Chiller 6 Pressure": 75.0,
-}
-
-
-def _db_for(profile):
+@pytest.mark.asyncio
+async def test_get_battery_nominal(mock_db):
+    result = await call_tool(mcp, "get_battery", {})
+    assert result["low_battery"] is False
+    assert result["battery_charge_pct"] == 85.0
+    assert result["battery_low_threshold"] == 20.0
+    assert result["battery_estimated_runtime_s"] == 5400.0
+    assert "OK" in result["message"]
+
+
+@pytest.mark.asyncio
+async def test_get_battery_low(mock_db_low_battery):
+    """FM-9: battery below threshold → low_battery=True, abort instruction."""
+    result = await call_tool(mcp, "get_battery", {})
+    assert result["low_battery"] is True
+    assert result["battery_charge_pct"] == 18.0
+    assert "LOW BATTERY" in result["message"]
+    assert "Abort" in result["message"]
+
+
+@pytest.mark.asyncio
+async def test_get_battery_no_db(no_db):
+    result = await call_tool(mcp, "get_battery", {})
+    assert "error" in result
+
+
+@pytest.mark.asyncio
+async def test_get_battery_missing_state_doc(mock_db):
+    """robot_state doc not found → error with helpful message."""
+    from unittest.mock import MagicMock, patch
     mock = MagicMock()
-    mock.get.side_effect = lambda doc_id: profile if "profile:" in doc_id else None
-    mock.find.return_value = {"docs": [_IOT_DOC]}
-    mock.save.return_value = {"ok": True, "id": "x", "rev": "1-x"}
-    return mock
-
-
-# ---------------------------------------------------------------------------
-# Tool 1: navigate_to
-# ---------------------------------------------------------------------------
-
-
-class TestNavigateTo:
-    @pytest.mark.anyio
-    async def test_returns_success_for_known_asset(self):
-        with patch("servers.robot.main.db", _db_for(_PROFILE)):
-            data = await call_tool(mcp, "navigate_to", {"asset_id": "Chiller 6"})
-        assert data["success"] is True
-        assert data["distance_m"] > 0
-        assert data["steps_taken"] >= 1
-
-    @pytest.mark.anyio
-    async def test_blocked_when_no_location(self):
-        profile_no_loc = {k: v for k, v in _PROFILE.items() if k != "physical_location"}
-        with patch("servers.robot.main.db", _db_for(profile_no_loc)):
-            data = await call_tool(mcp, "navigate_to", {"asset_id": "Chiller 6"})
-        assert data["success"] is False
-        assert data["blocked_reason"] is not None
-
-    @pytest.mark.anyio
-    async def test_error_when_db_none(self, no_db):
-        data = await call_tool(mcp, "navigate_to", {"asset_id": "Chiller 6"})
-        assert "error" in data
-
-    @pytest.mark.anyio
-    async def test_error_when_profile_not_found(self):
-        mock = MagicMock()
-        mock.get.return_value = None
-        with patch("servers.robot.main.db", mock):
-            data = await call_tool(mcp, "navigate_to", {"asset_id": "Unknown Asset"})
-        assert "error" in data
-
-    @requires_couchdb
-    @pytest.mark.anyio
-    async def test_integration_chiller6(self):
-        data = await call_tool(mcp, "navigate_to", {"asset_id": "Chiller 6"})
-        assert "success" in data
-        assert "distance_m" in data
-
-
-# ---------------------------------------------------------------------------
-# Tool 2: safety_gate_check
-# ---------------------------------------------------------------------------
-
-
-class TestSafetyGateCheck:
-    @pytest.mark.anyio
-    async def test_clearance_true_when_no_human_no_wo(self):
-        with patch("servers.robot.main.db", _db_for(_PROFILE)):
-            data = await call_tool(mcp, "safety_gate_check", {"asset_id": "Chiller 6"})
-        assert data["safety_clearance"] is True
-        assert data["human_present"] is False
-        assert data["active_work_order"] is None
-
-    @pytest.mark.anyio
-    async def test_clearance_false_when_human_present(self):
-        with patch("servers.robot.main.db", _db_for(_PROFILE_HUMAN)):
-            data = await call_tool(mcp, "safety_gate_check", {"asset_id": "Chiller 6"})
-        assert data["safety_clearance"] is False
-        assert data["human_present"] is True
-
-    @pytest.mark.anyio
-    async def test_missing_slot_defaults_to_day(self):
-        profile_no_slot = {k: v for k, v in _PROFILE.items() if k != "maintenance_slot"}
-        with patch("servers.robot.main.db", _db_for(profile_no_slot)):
-            data = await call_tool(mcp, "safety_gate_check", {"asset_id": "Chiller 6"})
-        assert data["slot"] == "day"
-
-    @pytest.mark.anyio
-    async def test_missing_active_wo_defaults_to_none(self):
-        profile_no_wo = {k: v for k, v in _PROFILE.items() if k != "active_work_order"}
-        with patch("servers.robot.main.db", _db_for(profile_no_wo)):
-            data = await call_tool(mcp, "safety_gate_check", {"asset_id": "Chiller 6"})
-        assert data["active_work_order"] is None
-
-    @pytest.mark.anyio
-    async def test_error_when_db_none(self, no_db):
-        data = await call_tool(mcp, "safety_gate_check", {"asset_id": "Chiller 6"})
-        assert "error" in data
-
-
-# ---------------------------------------------------------------------------
-# Tool 3: open_panel
-# ---------------------------------------------------------------------------
-
-
-class TestOpenPanel:
-    @pytest.mark.anyio
-    async def test_panel_opens_with_zero_stuck_prob(self):
-        with patch("servers.robot.main.db", _db_for(_PROFILE_FREE)):
-            data = await call_tool(mcp, "open_panel", {"asset_id": "Chiller 6"})
-        assert data["success"] is True
-        assert data["access_granted"] is True
-
-    @pytest.mark.anyio
-    async def test_panel_stuck_with_certain_prob(self):
-        with patch("servers.robot.main.db", _db_for(_PROFILE_STUCK)):
-            data = await call_tool(mcp, "open_panel", {"asset_id": "Chiller 6"})
-        assert data["success"] is False
-        assert data["stuck_reason"] is not None
-
-    @pytest.mark.anyio
-    async def test_rng_deterministic_after_reset(self):
-        with patch("servers.robot.main.db", _db_for(_PROFILE)):
-            result1 = await call_tool(mcp, "open_panel", {"asset_id": "Chiller 6"})
-
-        import random
-        import servers.robot.main as robot_main
-        robot_main._simulator._rng = random.Random(42)
-
-        with patch("servers.robot.main.db", _db_for(_PROFILE)):
-            result2 = await call_tool(mcp, "open_panel", {"asset_id": "Chiller 6"})
-
-        assert result1["success"] == result2["success"]
-        assert result1["access_granted"] == result2["access_granted"]
-
-    @pytest.mark.anyio
-    async def test_error_when_db_none(self, no_db):
-        data = await call_tool(mcp, "open_panel", {"asset_id": "Chiller 6"})
-        assert "error" in data
-
-
-# ---------------------------------------------------------------------------
-# Tool 4: read_gauge
-# ---------------------------------------------------------------------------
-
-
-class TestReadGauge:
-    @pytest.mark.anyio
-    async def test_reading_within_range(self):
-        import servers.robot.main as robot_main
-        robot_main._simulator.generate_scenario("chiller_6", [0.0, 100.0], "normal")
-        with patch("servers.robot.main.db", _db_for(_PROFILE)):
-            data = await call_tool(
-                mcp, "read_gauge", {"asset_id": "Chiller 6", "attempt_n": 1}
-            )
-        assert 0.0 <= data["reading"] <= 100.0
-        assert 0.0 <= data["confidence"] <= 1.0
-
-    @pytest.mark.anyio
-    async def test_no_gauge_value_in_response(self):
-        import servers.robot.main as robot_main
-        robot_main._simulator.generate_scenario("chiller_6", [0.0, 100.0], "normal")
-        with patch("servers.robot.main.db", _db_for(_PROFILE)):
-            data = await call_tool(
-                mcp, "read_gauge", {"asset_id": "Chiller 6", "attempt_n": 1}
-            )
-        assert "gauge_value" not in data
-
-    @pytest.mark.anyio
-    async def test_attempt_n_reflected_in_response(self):
-        with patch("servers.robot.main.db", _db_for(_PROFILE)):
-            data = await call_tool(
-                mcp, "read_gauge", {"asset_id": "Chiller 6", "attempt_n": 3}
-            )
-        assert data["attempt_n"] == 3
-
-    @pytest.mark.anyio
-    async def test_gauge_range_present(self):
-        with patch("servers.robot.main.db", _db_for(_PROFILE)):
-            data = await call_tool(
-                mcp, "read_gauge", {"asset_id": "Chiller 6", "attempt_n": 1}
-            )
-        assert "gauge_range" in data
-
-    @pytest.mark.anyio
-    async def test_error_when_db_none(self, no_db):
-        data = await call_tool(
-            mcp, "read_gauge", {"asset_id": "Chiller 6", "attempt_n": 1}
-        )
-        assert "error" in data
-
-
-# ---------------------------------------------------------------------------
-# Tool 5: check_human_presence
-# ---------------------------------------------------------------------------
-
-
-class TestCheckHumanPresence:
-    @pytest.mark.anyio
-    async def test_no_human(self):
-        with patch("servers.robot.main.db", _db_for(_PROFILE)):
-            data = await call_tool(
-                mcp, "check_human_presence", {"asset_id": "Chiller 6"}
-            )
-        assert data["human_present"] is False
-
-    @pytest.mark.anyio
-    async def test_human_present(self):
-        with patch("servers.robot.main.db", _db_for(_PROFILE_HUMAN)):
-            data = await call_tool(
-                mcp, "check_human_presence", {"asset_id": "Chiller 6"}
-            )
-        assert data["human_present"] is True
-
-    @pytest.mark.anyio
-    async def test_slot_default(self):
-        profile_no_slot = {k: v for k, v in _PROFILE.items() if k != "maintenance_slot"}
-        with patch("servers.robot.main.db", _db_for(profile_no_slot)):
-            data = await call_tool(
-                mcp, "check_human_presence", {"asset_id": "Chiller 6"}
-            )
-        assert data["slot"] == "day"
-
-    @pytest.mark.anyio
-    async def test_error_when_db_none(self, no_db):
-        data = await call_tool(
-            mcp, "check_human_presence", {"asset_id": "Chiller 6"}
-        )
-        assert "error" in data
-
-
-# ---------------------------------------------------------------------------
-# Tool 6: commit_reading
-# ---------------------------------------------------------------------------
-
-
-class TestCommitReading:
-    @pytest.mark.anyio
-    async def test_blocked_when_n_lt_3(self):
-        with patch("servers.robot.main.db", _db_for(_PROFILE)):
-            data = await call_tool(
-                mcp,
-                "commit_reading",
-                {
-                    "asset_id": "Chiller 6",
-                    "readings": [74.0, 76.0],
-                    "decision": "close_normal",
-                },
-            )
-        assert data["status"] == "BLOCKED"
-        assert data["fm_flag"] == "FM-7b"
-
-    @pytest.mark.anyio
-    async def test_status_field_present(self):
-        with patch("servers.robot.main.db", _db_for(_PROFILE)):
-            data = await call_tool(
-                mcp,
-                "commit_reading",
-                {
-                    "asset_id": "Chiller 6",
-                    "readings": [73.0, 75.0, 77.0],
-                    "decision": "close_normal",
-                },
-            )
-        assert data["status"] in {"COMMIT", "BLOCKED", "ESCALATE", "OOD_FLAG", "PANEL_RECHECK"}
-
-    @pytest.mark.anyio
-    async def test_score_present(self):
-        with patch("servers.robot.main.db", _db_for(_PROFILE)):
-            data = await call_tool(
-                mcp,
-                "commit_reading",
-                {
-                    "asset_id": "Chiller 6",
-                    "readings": [73.0, 75.0, 77.0],
-                    "decision": "close_normal",
-                },
-            )
-        assert "score" in data
-        assert isinstance(data["score"], float)
-
-    @pytest.mark.anyio
-    async def test_error_when_db_none(self, no_db):
-        data = await call_tool(
-            mcp,
-            "commit_reading",
-            {
-                "asset_id": "Chiller 6",
-                "readings": [73.0, 75.0, 77.0],
-                "decision": "close_normal",
-            },
-        )
-        assert "error" in data
-
-    @requires_couchdb
-    @pytest.mark.anyio
-    async def test_integration_commit_or_escalate(self):
-        data = await call_tool(
-            mcp,
-            "commit_reading",
-            {
-                "asset_id": "Chiller 6",
-                "readings": [49.5, 50.0, 50.5],
-                "decision": "close_normal",
-            },
-        )
-        assert data["status"] in {"COMMIT", "ESCALATE", "OOD_FLAG", "PANEL_RECHECK"}
-
-
-# ---------------------------------------------------------------------------
-# Tool 7: check_wo_similarity
-# ---------------------------------------------------------------------------
-
-
-class TestCheckWoSimilarity:
-    def _wo_mock(self, docs):
-        mock = MagicMock()
-        mock.find.return_value = {"docs": docs}
-        return mock
-
-    @pytest.mark.anyio
-    async def test_error_when_wo_db_none(self, no_wo_db):
-        with patch("servers.robot.main.db", _db_for(_PROFILE)):
-            data = await call_tool(
-                mcp,
-                "check_wo_similarity",
-                {
-                    "asset_id": "Chiller 6",
-                    "failure_description": "water leak near chiller",
-                },
-            )
-        assert "error" in data
-
-    @pytest.mark.anyio
-    async def test_proceed_when_no_similar_wos(self):
-        wo_doc = {
-            "wonum": "1000045",
-            "description": "completely unrelated electrical work",
-            "assetnum": "CHILLER6",
-            "status": "COMP",
-        }
-        with patch("servers.robot.main._get_wo_db", return_value=self._wo_mock([wo_doc])):
-            with patch("servers.robot.main.db", _db_for(_PROFILE)):
-                data = await call_tool(
-                    mcp,
-                    "check_wo_similarity",
-                    {
-                        "asset_id": "Chiller 6",
-                        "failure_description": "water leak near chiller",
-                    },
-                )
-        assert data["recommendation"] in {"proceed", "review", "consolidate"}
-        assert "similar_wos" in data
-        assert "scores" in data
-
-    @pytest.mark.anyio
-    async def test_consolidate_for_identical_description(self):
-        wo_doc = {
-            "wonum": "1000046",
-            "description": "water leak near chiller unit",
-            "assetnum": "CHILLER6",
-            "status": "WAPPR",
-        }
-        with patch("servers.robot.main._get_wo_db", return_value=self._wo_mock([wo_doc])):
-            with patch("servers.robot.main.db", _db_for(_PROFILE)):
-                data = await call_tool(
-                    mcp,
-                    "check_wo_similarity",
-                    {
-                        "asset_id": "Chiller 6",
-                        "failure_description": "water leak near chiller unit",
-                    },
-                )
-        assert data["recommendation"] == "consolidate"
-        assert data["duplicate_risk"] is True
-
-    @requires_couchdb
-    @pytest.mark.anyio
-    async def test_integration_wo_similarity(self):
-        data = await call_tool(
-            mcp,
-            "check_wo_similarity",
-            {
-                "asset_id": "Chiller 6",
-                "failure_description": "anomaly on chiller condenser",
-            },
+    mock.get.return_value = None
+    with patch("servers.robot.main.db", mock):
+        result = await call_tool(mcp, "get_battery", {})
+    assert "error" in result
+    assert "robot_state" in result["error"]
+
+
+# ===========================================================================
+# get_pose
+# ===========================================================================
+
+
+@pytest.mark.asyncio
+async def test_get_pose_nominal(mock_db):
+    result = await call_tool(mcp, "get_pose", {})
+    assert result["localization_ok"] is True
+    assert result["pose_drift_m"] == 0.0
+    assert result["fault_state"] is None
+    assert "OK" in result["message"]
+
+
+@pytest.mark.asyncio
+async def test_get_pose_localization_failure(mock_db_loc_failure):
+    """FM-10: localization_ok=False, drift=1.8 m → abort instruction."""
+    result = await call_tool(mcp, "get_pose", {})
+    assert result["localization_ok"] is False
+    assert result["pose_drift_m"] == 1.8
+    assert "LOCALIZATION FAILURE" in result["message"]
+    assert "Abort" in result["message"]
+
+
+@pytest.mark.asyncio
+async def test_get_pose_no_db(no_db):
+    result = await call_tool(mcp, "get_pose", {})
+    assert "error" in result
+
+
+# ===========================================================================
+# list_waypoints
+# ===========================================================================
+
+
+@pytest.mark.asyncio
+async def test_list_waypoints_all(mock_db):
+    result = await call_tool(mcp, "list_waypoints", {})
+    assert result["total"] == 3
+    assert result["active_count"] == 3
+    assert all(wp["active"] for wp in result["waypoints"])
+    assert "all active" in result["message"]
+
+
+@pytest.mark.asyncio
+async def test_list_waypoints_filtered(mock_db):
+    result = await call_tool(mcp, "list_waypoints", {"asset_id": "motor_01"})
+    assert result["total"] == 1
+    assert result["waypoints"][0]["waypoint_id"] == "wp_motor_01_panel"
+
+
+@pytest.mark.asyncio
+async def test_list_waypoints_missing(mock_db_waypoint_missing):
+    """FM-11: motor_01 waypoint is inactive → escalation instruction."""
+    result = await call_tool(mcp, "list_waypoints", {"asset_id": "motor_01"})
+    assert result["active_count"] == 0
+    inactive = result["waypoints"][0]
+    assert inactive["active"] is False
+    assert "INACTIVE" in result["message"]
+    assert "FM-11" in result["message"]
+
+
+@pytest.mark.asyncio
+async def test_list_waypoints_no_db(no_db):
+    result = await call_tool(mcp, "list_waypoints", {})
+    assert "error" in result
+
+
+@pytest.mark.asyncio
+async def test_list_waypoints_no_doc(mock_db):
+    """waypoints doc returns None → error with helpful message."""
+    from unittest.mock import MagicMock, patch
+    mock = MagicMock()
+    mock.get.return_value = None
+    with patch("servers.robot.main.db", mock):
+        result = await call_tool(mcp, "list_waypoints", {})
+    assert "error" in result
+    assert "waypoints" in result["error"]
+
+
+# ===========================================================================
+# capture_image
+# ===========================================================================
+
+
+@pytest.mark.asyncio
+async def test_capture_image_no_gauge_path(mock_db):
+    """Nominal profile: gauge_path=None → image_available=False."""
+    result = await call_tool(mcp, "capture_image", {"asset_id": "Motor 01"})
+    assert result["image_available"] is False
+    assert result["occlusion_flag"] is False
+    assert result["gauge_path"] is None
+    assert result["gauge_range"] == [0, 200]
+    assert "pending" in result["message"]
+
+
+@pytest.mark.asyncio
+async def test_capture_image_with_gauge_path(mock_db_with_gauge_path):
+    """gauge_path set → image_available=True, vlm_hint populated."""
+    result = await call_tool(mcp, "capture_image", {"asset_id": "Motor 01"})
+    assert result["image_available"] is True
+    assert result["occlusion_flag"] is False
+    assert result["gauge_path"] == "/data/gauges/motor_01/gauge_001.jpg"
+    assert "vlm_hint" in result
+    assert "0" in result["vlm_hint"]    # range low
+    assert "200" in result["vlm_hint"]  # range high
+    assert "Pass to VLM" in result["message"]
+
+
+@pytest.mark.asyncio
+async def test_capture_image_panel_stuck(mock_db_panel_stuck):
+    """panel_stuck=True → occlusion_flag=True, image_available=False."""
+    result = await call_tool(mcp, "capture_image", {"asset_id": "Motor 01"})
+    assert result["occlusion_flag"] is True
+    assert result["image_available"] is False
+    assert "BLOCKED" in result["message"]
+    assert "FM-2" in result["message"]
+
+
+@pytest.mark.asyncio
+async def test_capture_image_no_db(no_db):
+    result = await call_tool(mcp, "capture_image", {"asset_id": "Motor 01"})
+    assert "error" in result
+
+
+@pytest.mark.asyncio
+async def test_capture_image_unknown_asset(mock_db):
+    result = await call_tool(mcp, "capture_image", {"asset_id": "GhostPump"})
+    assert "error" in result
+
+
+# ===========================================================================
+# gauge_value isolation — no tool must return gauge_value
+# ===========================================================================
+
+
+@pytest.mark.asyncio
+async def test_no_tool_returns_gauge_value(mock_db_with_gauge_path):
+    """None of the 12 tools should return a gauge_value field."""
+    tools_and_args = [
+        ("navigate_to",    {"asset_id": "Motor 01"}),
+        ("open_panel",     {"asset_id": "Motor 01"}),
+        ("get_battery",    {}),
+        ("get_pose",       {}),
+        ("list_waypoints", {}),
+        ("capture_image",  {"asset_id": "Motor 01"}),
+        ("power_on",       {}),
+        ("power_off",      {}),
+        ("stand",          {}),
+        ("sit",            {}),
+        ("dock",           {}),
+        ("undock",         {}),
+    ]
+    for tool_name, args in tools_and_args:
+        result = await call_tool(mcp, tool_name, args)
+        assert "gauge_value" not in result, (
+            f"Tool '{tool_name}' leaked gauge_value field: {result}"
         )
-        assert "recommendation" in data
-        assert data["recommendation"] in {"proceed", "review", "consolidate"}
-
-
-# ---------------------------------------------------------------------------
-# Tool 8: detect_anomaly
-# ---------------------------------------------------------------------------
-
-
-class TestDetectAnomaly:
-    @pytest.mark.anyio
-    async def test_returns_all_expected_fields(self):
-        with patch("servers.robot.main.db", _db_for(_PROFILE)):
-            data = await call_tool(mcp, "detect_anomaly", {"asset_id": "Chiller 6"})
-        for field in (
-            "spill_detected",
-            "leakage_detected",
-            "pipe_damage_detected",
-            "pooled_liquid_detected",
-            "anomaly_confidence",
-        ):
-            assert field in data, f"Missing field '{field}' in detect_anomaly response"
-
-    @pytest.mark.anyio
-    async def test_spill_scenario_detected(self):
-        import servers.robot.main as robot_main
-        robot_main._simulator.generate_scenario("chiller_6", [0.0, 100.0], "spill")
-        with patch("servers.robot.main.db", _db_for(_PROFILE)):
-            data = await call_tool(mcp, "detect_anomaly", {"asset_id": "Chiller 6"})
-        assert data["spill_detected"] is True
-        assert data["leakage_detected"] is True
-
-    @pytest.mark.anyio
-    async def test_normal_scenario_no_spill(self):
-        import servers.robot.main as robot_main
-        robot_main._simulator.generate_scenario("chiller_6", [0.0, 100.0], "normal")
-        with patch("servers.robot.main.db", _db_for(_PROFILE)):
-            data = await call_tool(mcp, "detect_anomaly", {"asset_id": "Chiller 6"})
-        assert data["spill_detected"] is False
-        assert data["leakage_detected"] is False
-
-    @pytest.mark.anyio
-    async def test_error_when_db_none(self, no_db):
-        data = await call_tool(mcp, "detect_anomaly", {"asset_id": "Chiller 6"})
-        assert "error" in data
-
-    @requires_couchdb
-    @pytest.mark.anyio
-    async def test_integration_anomaly_fields(self):
-        data = await call_tool(mcp, "detect_anomaly", {"asset_id": "Chiller 6"})
-        assert "spill_detected" in data
-        assert isinstance(data["anomaly_confidence"], float)
+
+
+# ===========================================================================
+# power_on
+# ===========================================================================
+
+
+@pytest.mark.asyncio
+async def test_power_on_nominal(mock_db):
+    result = await call_tool(mcp, "power_on", {})
+    assert result["success"] is True
+    assert result["power_state"] == "POWERED_ON"
+    assert result["transition"] == "power_on"
+    assert result["robot_id"] == "spot_1"
+
+
+@pytest.mark.asyncio
+async def test_power_on_already_on(mock_db):
+    """Calling power_on when already powered on returns success (idempotent)."""
+    result = await call_tool(mcp, "power_on", {})
+    assert result["success"] is True
+    assert "already" in result["message"].lower()
+
+
+@pytest.mark.asyncio
+async def test_power_on_from_off(mock_db_powered_off):
+    """power_on transitions from POWERED_OFF to POWERED_ON."""
+    result = await call_tool(mcp, "power_on", {})
+    assert result["success"] is True
+    assert result["power_state"] == "POWERED_ON"
+    assert "powered on" in result["message"].lower()
+
+
+@pytest.mark.asyncio
+async def test_power_on_no_db(no_db):
+    result = await call_tool(mcp, "power_on", {})
+    assert "error" in result
+
+
+# ===========================================================================
+# power_off
+# ===========================================================================
+
+
+@pytest.mark.asyncio
+async def test_power_off_sitting(mock_db_sitting):
+    """Sitting + powered on → power_off succeeds."""
+    result = await call_tool(mcp, "power_off", {})
+    assert result["success"] is True
+    assert result["power_state"] == "POWERED_OFF"
+    assert result["transition"] == "power_off"
+
+
+@pytest.mark.asyncio
+async def test_power_off_while_standing(mock_db):
+    """Robot is STANDING → power_off must refuse."""
+    result = await call_tool(mcp, "power_off", {})
+    assert result["success"] is False
+    assert "STANDING" in result["message"]
+    assert "sit()" in result["message"]
+
+
+@pytest.mark.asyncio
+async def test_power_off_already_off(mock_db_powered_off):
+    """Already powered off → idempotent success."""
+    result = await call_tool(mcp, "power_off", {})
+    assert result["success"] is True
+    assert "already" in result["message"].lower()
+
+
+@pytest.mark.asyncio
+async def test_power_off_no_db(no_db):
+    result = await call_tool(mcp, "power_off", {})
+    assert "error" in result
+
+
+# ===========================================================================
+# stand
+# ===========================================================================
+
+
+@pytest.mark.asyncio
+async def test_stand_nominal(mock_db_sitting):
+    """Powered on and sitting → stand succeeds."""
+    result = await call_tool(mcp, "stand", {})
+    assert result["success"] is True
+    assert result["stance_state"] == "STANDING"
+    assert result["power_state"] == "POWERED_ON"
+    assert result["transition"] == "stand"
+
+
+@pytest.mark.asyncio
+async def test_stand_already_standing(mock_db):
+    """Already standing → idempotent success."""
+    result = await call_tool(mcp, "stand", {})
+    assert result["success"] is True
+    assert "already" in result["message"].lower()
+
+
+@pytest.mark.asyncio
+async def test_stand_powered_off(mock_db_powered_off):
+    """Power off → stand must refuse."""
+    result = await call_tool(mcp, "stand", {})
+    assert result["success"] is False
+    assert "not powered on" in result["message"].lower()
+    assert "power_on()" in result["message"]
+
+
+@pytest.mark.asyncio
+async def test_stand_no_db(no_db):
+    result = await call_tool(mcp, "stand", {})
+    assert "error" in result
+
+
+# ===========================================================================
+# sit
+# ===========================================================================
+
+
+@pytest.mark.asyncio
+async def test_sit_nominal(mock_db):
+    """Powered on and standing → sit succeeds."""
+    result = await call_tool(mcp, "sit", {})
+    assert result["success"] is True
+    assert result["stance_state"] == "SITTING"
+    assert result["transition"] == "sit"
+
+
+@pytest.mark.asyncio
+async def test_sit_already_sitting(mock_db_sitting):
+    """Already sitting → idempotent success."""
+    result = await call_tool(mcp, "sit", {})
+    assert result["success"] is True
+    assert "already" in result["message"].lower()
+
+
+@pytest.mark.asyncio
+async def test_sit_powered_off(mock_db_powered_off):
+    """Power off → sit must refuse."""
+    result = await call_tool(mcp, "sit", {})
+    assert result["success"] is False
+    assert "not powered on" in result["message"].lower()
+
+
+@pytest.mark.asyncio
+async def test_sit_no_db(no_db):
+    result = await call_tool(mcp, "sit", {})
+    assert "error" in result
+
+
+# ===========================================================================
+# dock
+# ===========================================================================
+
+
+@pytest.mark.asyncio
+async def test_dock_nominal(mock_db):
+    """Nominal state with dock waypoint active → dock succeeds."""
+    result = await call_tool(mcp, "dock", {})
+    assert result["docked"] is True
+    assert result["at_charge_station"] is True
+    assert result["dock_waypoint_id"] == "wp_dock_main"
+    assert result["battery_charge_pct"] == 85.0
+
+
+@pytest.mark.asyncio
+async def test_dock_no_db(no_db):
+    result = await call_tool(mcp, "dock", {})
+    assert "error" in result
+
+
+@pytest.mark.asyncio
+async def test_dock_no_dock_waypoint(mock_db):
+    """Waypoints doc has no dock waypoint → dock fails gracefully."""
+    import copy
+    from unittest.mock import patch
+    from .conftest import NOMINAL_ROBOT_STATE, NOMINAL_PROFILE, _make_mock_db
+    wps_no_dock = {
+        "_id":      "waypoints",
+        "doc_type": "waypoints",
+        "waypoints": [
+            {"waypoint_id": "wp_motor_01_panel", "waypoint_name": "Motor 01",
+             "asset_id": "motor_01", "location_description": "Plant A",
+             "x": 7.2, "y": 44.8, "active": True},
+        ],
+    }
+    with patch("servers.robot.main.db", _make_mock_db(waypoints=wps_no_dock)):
+        result = await call_tool(mcp, "dock", {})
+    assert result["docked"] is False
+    assert result["at_charge_station"] is False
+    assert "not found" in result["message"].lower()
+
+
+# ===========================================================================
+# undock
+# ===========================================================================
+
+
+@pytest.mark.asyncio
+async def test_undock_nominal(mock_db):
+    """Nominal battery 85% → undock succeeds."""
+    result = await call_tool(mcp, "undock", {})
+    assert result["docked"] is False
+    assert result["at_charge_station"] is False
+    assert result["battery_charge_pct"] == 85.0
+
+
+@pytest.mark.asyncio
+async def test_undock_low_battery(mock_db_low_battery):
+    """Battery 18% (below threshold 20%) → undock refused."""
+    result = await call_tool(mcp, "undock", {})
+    assert result["docked"] is True
+    assert result["at_charge_station"] is True
+    assert "UNDOCK REFUSED" in result["message"]
+
+
+@pytest.mark.asyncio
+async def test_undock_no_db(no_db):
+    result = await call_tool(mcp, "undock", {})
+    assert "error" in result
+
+
+# ===========================================================================
+# Integration (live CouchDB required)
+# ===========================================================================
+
+
+@requires_couchdb
+def test_get_battery_live():
+    """Live CouchDB: get_battery returns a valid result or a clear 'not seeded' error."""
+    from servers.robot.main import get_battery
+    result = get_battery()
+    if hasattr(result, "error"):
+        assert "robot_state" in result.error
+    else:
+        assert result.battery_charge_pct >= 0
+
+
+@requires_couchdb
+def test_list_waypoints_live():
+    """Live CouchDB: list_waypoints returns waypoints or a clear 'not seeded' error."""
+    from servers.robot.main import list_waypoints
+    result = list_waypoints()
+    if hasattr(result, "error"):
+        assert "waypoints" in result.error
+    else:
+        assert result.total >= 0
diff --git a/src/servers/robot/tests/test_verifier.py b/src/servers/robot/tests/test_verifier.py
deleted file mode 100644
index 32437a1e4..000000000
--- a/src/servers/robot/tests/test_verifier.py
+++ /dev/null
@@ -1,135 +0,0 @@
-"""Unit tests for MultiReadingVerifier — no CouchDB required."""
-
-import pytest
-from servers.robot.verifier import MultiReadingVerifier, VerifierResult
-
-
-@pytest.fixture
-def verifier():
-    return MultiReadingVerifier()
-
-
-class TestBlockedGate:
-    def test_blocked_n_1(self, verifier):
-        result = verifier.verify(
-            readings=[50.0],
-            iot_value=50.0,
-            gauge_range=[0, 100],
-        )
-        assert result.status == "BLOCKED"
-        assert result.fm_flag == "FM-7b"
-        assert result.score == 0.0
-
-    def test_blocked_n_2(self, verifier):
-        result = verifier.verify(
-            readings=[48.0, 52.0],
-            iot_value=50.0,
-            gauge_range=[0, 100],
-        )
-        assert result.status == "BLOCKED"
-        assert result.fm_flag == "FM-7b"
-
-    def test_fm7b_flag_in_blocked(self, verifier):
-        result = verifier.verify(readings=[], iot_value=0.0, gauge_range=[0, 100])
-        assert result.fm_flag == "FM-7b"
-        # insufficient readings flag appears in fm_annotations
-        assert any("FM-7b" in ann for ann in result.fm_annotations)
-
-
-class TestFreezeGate:
-    def test_zero_variance_triggers_panel_recheck(self, verifier):
-        # Three identical readings → std=0.0 → PANEL_RECHECK
-        result = verifier.verify(
-            readings=[50.0, 50.0, 50.0],
-            iot_value=50.0,
-            gauge_range=[0, 100],
-        )
-        assert result.status == "PANEL_RECHECK"
-        assert result.fm_flag == "FM-1"
-
-    def test_tiny_variance_still_freezes(self, verifier):
-        # std = 0.0001 < 0.001 * 100 = 0.1 → PANEL_RECHECK
-        result = verifier.verify(
-            readings=[50.0, 50.0001, 50.0002],
-            iot_value=50.0,
-            gauge_range=[0, 100],
-        )
-        assert result.status == "PANEL_RECHECK"
-
-
-class TestCommit:
-    def test_commit_consistent_readings(self, verifier):
-        # Tight cluster near IoT value → high C, high A → COMMIT
-        result = verifier.verify(
-            readings=[49.5, 50.0, 50.5],
-            iot_value=50.0,
-            gauge_range=[0, 100],
-        )
-        assert result.status == "COMMIT"
-        assert result.score >= 0.82
-
-    def test_historical_signal_neutral_when_absent(self, verifier):
-        result = verifier.verify(
-            readings=[49.5, 50.0, 50.5],
-            iot_value=50.0,
-            gauge_range=[0, 100],
-            historical_baseline=None,
-        )
-        assert result.H == 0.5
-        assert result.status == "COMMIT"
-
-
-class TestEscalateAndOOD:
-    def test_escalate_moderate_contradiction(self, verifier):
-        # Mean reading 80, IoT says 20 — large gap → low A
-        result = verifier.verify(
-            readings=[78.0, 80.0, 82.0],
-            iot_value=20.0,
-            gauge_range=[0, 100],
-        )
-        # A = 1 - |80 - 20| / 100 = 0.40 → score roughly 0.35*C + 0.35*0.40 + 0.30*H
-        assert result.status in {"ESCALATE", "OOD_FLAG"}
-
-    def test_ood_very_low_score(self, verifier):
-        # Readings near top, IoT near bottom, historical near bottom
-        result = verifier.verify(
-            readings=[88.0, 90.0, 92.0],
-            iot_value=5.0,
-            gauge_range=[0, 100],
-            historical_baseline=5.0,
-        )
-        # A = 1 - |90-5|/100 = 0.15; H = 1 - |90-5|/100 = 0.15 → score ≈ 0.35*C + 0.35*0.15 + 0.30*0.15
-        assert result.status == "OOD_FLAG"
-
-
-class TestFMAnnotations:
-    def test_fm7_annotation_when_a_lt_015(self, verifier):
-        # A = 1 - |90 - 3| / 100 = 0.13 < 0.15 → sensor-physical contradiction annotation fires
-        result = verifier.verify(
-            readings=[88.0, 90.0, 92.0],
-            iot_value=3.0,
-            gauge_range=[0, 100],
-        )
-        assert any("FM-7" in ann for ann in result.fm_annotations)
-
-    def test_fm7c_annotation_when_h_lt_015(self, verifier):
-        # H = 1 - |90 - 3| / 100 = 0.13 < 0.15 → historical outlier annotation fires; IoT agrees (A fine)
-        result = verifier.verify(
-            readings=[88.0, 90.0, 92.0],
-            iot_value=90.0,
-            gauge_range=[0, 100],
-            historical_baseline=3.0,
-        )
-        assert any("FM-7c" in ann for ann in result.fm_annotations)
-
-    def test_no_fm_annotations_for_clean_commit(self, verifier):
-        result = verifier.verify(
-            readings=[49.5, 50.0, 50.5],
-            iot_value=50.0,
-            gauge_range=[0, 100],
-            historical_baseline=50.0,
-        )
-        assert result.fm_annotations == []
-        assert result.status == "COMMIT"
-
-
diff --git a/src/servers/robot/verifier.py b/src/servers/robot/verifier.py
deleted file mode 100644
index afe98a1e1..000000000
--- a/src/servers/robot/verifier.py
+++ /dev/null
@@ -1,133 +0,0 @@
-"""MultiReadingVerifier — CP-calibrated commit gate.
-
-Formula (updated from research analysis):
-    score = 0.35*C + 0.35*A + 0.30*H
-
-    C: multi-read consistency  = 1 - std(readings) / gauge_range_span
-    A: gauge-vs-IoT agreement  = 1 - |mean(readings) - iot_value| / span
-    H: historical consistency  = 1 - |mean(readings) - hist_baseline| / span
-       (H = 0.50 neutral when no history is available)
-
-Hard gates (applied before scoring):
-    N < 3                        → BLOCKED       (FM-7b)
-    std(readings) < 0.1% range   → PANEL_RECHECK (FM-1: sensor freeze)
-
-Thresholds (placeholder until field-visit calibration):
-    score ≥ 0.82  → COMMIT
-    score ≥ 0.65  → ESCALATE
-    else          → OOD_FLAG
-
-Note on Q (agent self-confidence):
-    Q was removed from the formula because LLM self-confidence is poorly
-    calibrated and creating a gaming surface. Q is recorded diagnostically
-    in commit documents but does not influence the gate.
-"""
-
-import statistics
-from dataclasses import dataclass, field
-from typing import Optional
-
-
-@dataclass
-class VerifierResult:
-    status: str          # COMMIT | BLOCKED | ESCALATE | OOD_FLAG | PANEL_RECHECK
-    score: float
-    C: float
-    A: float
-    H: float
-    fm_flag: Optional[str]
-    fm_annotations: list
-    reason: str
-
-
-class MultiReadingVerifier:
-    TAU_COMMIT = 0.82
-    TAU_ESCALATE = 0.65
-    FREEZE_EPSILON = 0.001   # std < 0.1% of range → sensor freeze
-
-    def verify(
-        self,
-        readings: list,
-        iot_value: float,
-        gauge_range: list,
-        historical_baseline: Optional[float] = None,
-    ) -> VerifierResult:
-        range_span = float(gauge_range[1]) - float(gauge_range[0])
-        if range_span <= 0:
-            range_span = 1.0
-
-        # Hard gate: insufficient readings
-        if len(readings) < 3:
-            return VerifierResult(
-                status="BLOCKED",
-                score=0.0,
-                C=0.0, A=0.0, H=0.5,
-                fm_flag="FM-7b",
-                fm_annotations=["FM-7b: fewer than 3 readings before commit"],
-                reason=(
-                    f"N={len(readings)} readings supplied; "
-                    "minimum 3 required before commit"
-                ),
-            )
-
-        # Hard gate: sensor freeze (zero variance → stuck gauge or panel)
-        std_val = statistics.stdev(readings) if len(readings) > 1 else 0.0
-        if std_val < self.FREEZE_EPSILON * range_span:
-            return VerifierResult(
-                status="PANEL_RECHECK",
-                score=0.0,
-                C=0.0, A=0.0, H=0.5,
-                fm_flag="FM-1",
-                fm_annotations=[
-                    "FM-1: sensor freeze — readings show no variance across attempts"
-                ],
-                reason="Zero variance across readings; panel may be stuck or gauge frozen",
-            )
-
-        mean_r = statistics.mean(readings)
-
-        C = max(0.0, 1.0 - std_val / range_span)
-        A = max(0.0, 1.0 - abs(mean_r - iot_value) / range_span)
-        H = (
-            max(0.0, 1.0 - abs(mean_r - historical_baseline) / range_span)
-            if historical_baseline is not None
-            else 0.5
-        )
-
-        score = round(0.35 * C + 0.35 * A + 0.30 * H, 4)
-
-        fm_annotations = []
-        if A < 0.15:
-            fm_annotations.append(
-                "FM-7: sensor-physical contradiction (reading vs IoT sensor)"
-            )
-        if historical_baseline is not None and H < 0.15:
-            fm_annotations.append(
-                "FM-7c: historical outlier (reading contradicts asset baseline)"
-            )
-
-        fm_flag = fm_annotations[0].split(":")[0] if fm_annotations else None
-
-        if score >= self.TAU_COMMIT:
-            status = "COMMIT"
-        elif score >= self.TAU_ESCALATE:
-            status = "ESCALATE"
-        else:
-            status = "OOD_FLAG"
-            if not fm_flag:
-                fm_flag = "FM-7"
-
-        reason = f"score={score:.3f} (C={C:.2f}, A={A:.2f}, H={H:.2f})"
-        if fm_annotations:
-            reason += "; " + "; ".join(fm_annotations)
-
-        return VerifierResult(
-            status=status,
-            score=score,
-            C=round(C, 4),
-            A=round(A, 4),
-            H=round(H, 4),
-            fm_flag=fm_flag,
-            fm_annotations=fm_annotations,
-            reason=reason,
-        )