From b87e30212579f5d30f0ccca480b6accbf92140e9 Mon Sep 17 00:00:00 2001 From: Your Name Date: Sat, 4 Apr 2026 18:13:09 -0400 Subject: [PATCH 1/4] =?UTF-8?q?feat:=20rebase=20onto=20upstream=20main=20?= =?UTF-8?q?=E2=80=94=20port=20FTS5=20BM25=20search,=20Interface=20registra?= =?UTF-8?q?tion,=20embeddings,=20cross-repo=20infrastructure?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Rebased our PR #162 features onto upstream's latest main (commit 1d30971) which includes MinHash SIMILAR_TO edges, CBM_CACHE_DIR, and major refactoring. Ported features (building clean on upstream's refactored codebase): 1. FTS5 BM25 search infrastructure: - Contentless FTS5 virtual table (nodes_fts) with camelCase token splitting - cbm_camel_split() SQLite function: updateCloudClient → 'update Cloud Client' - FTS5 backfill in both full pipeline and incremental pipeline - Incremental reindex now preserves FTS5 (was wiping to 0 rows) 2. Interface registration in symbol registry: - Added 'Interface' to label filter in process_def() (pass_definitions.c) - Added 'Interface' to label filter in register_and_link_def() (pass_parallel.c) - Fixes: C# class Foo : IBar now creates INHERITS → Interface edges 3. C# base_list extraction: - Added 'base_list' to fallback base_types[] in extract_base_classes() 4. Embeddings infrastructure (opt-in via CBM_EMBEDDING_URL): - embeddings table in SQLite schema - cbm_cosine_sim() SQLite function for vector search - embedding.c/h: HTTP client, text generation, RRF merge, pipeline integration - Auto-generates embeddings during indexing when configured 5. 
Cross-repo infrastructure: - cross_repo.c/h: unified _cross_repo.db builder, cross-repo search, channel matching, trace helper Not yet ported (follow-up commits): - MCP tool changes (search_graph query param, generate_embeddings tool, cross-repo tools, get_impact tool) - Process detection (cbm_store_detect_processes) - Channel detection (cbm_store_detect_channels) - C# delegate event subscription (extract_calls.c) - WRITES expansion (extract_semantic.c) All upstream features preserved: MinHash SIMILAR_TO, pass_similarity, CBM_CACHE_DIR, TS_FIELD() macro, extracted helpers. --- Makefile.cbm | 5 +- internal/cbm/extract_defs.c | 1 + src/pipeline/embedding.c | 498 ++++++++++++++++ src/pipeline/embedding.h | 81 +++ src/pipeline/pass_definitions.c | 3 +- src/pipeline/pass_parallel.c | 2 +- src/pipeline/pipeline.c | 33 ++ src/pipeline/pipeline_incremental.c | 7 + src/store/cross_repo.c | 889 ++++++++++++++++++++++++++++ src/store/cross_repo.h | 137 +++++ src/store/store.c | 245 +++++++- src/store/store.h | 29 + 12 files changed, 1923 insertions(+), 7 deletions(-) create mode 100644 src/pipeline/embedding.c create mode 100644 src/pipeline/embedding.h create mode 100644 src/store/cross_repo.c create mode 100644 src/store/cross_repo.h diff --git a/Makefile.cbm b/Makefile.cbm index c347e6a..c432f7c 100644 --- a/Makefile.cbm +++ b/Makefile.cbm @@ -145,7 +145,7 @@ PREPROCESSOR_SRC = $(CBM_DIR)/preprocessor.cpp SQLITE_WRITER_SRC = $(CBM_DIR)/sqlite_writer.c # Store module (new) -STORE_SRCS = src/store/store.c +STORE_SRCS = src/store/store.c src/store/cross_repo.c # Cypher module (new) CYPHER_SRCS = src/cypher/cypher.c @@ -186,7 +186,8 @@ PIPELINE_SRCS = \ src/pipeline/pass_compile_commands.c \ src/pipeline/pass_infrascan.c \ src/pipeline/pass_k8s.c \ - src/pipeline/pass_similarity.c + src/pipeline/pass_similarity.c \ + src/pipeline/embedding.c # SimHash / MinHash module SIMHASH_SRCS = src/simhash/minhash.c diff --git a/internal/cbm/extract_defs.c b/internal/cbm/extract_defs.c 
index 887c103..cc930f5 100644 --- a/internal/cbm/extract_defs.c +++ b/internal/cbm/extract_defs.c @@ -955,6 +955,7 @@ static const char **extract_base_classes(CBMArena *a, TSNode node, const char *s "implements_clause", "argument_list", "inheritance_specifier", + "base_list", /* C# class Foo : IBar */ NULL}; return find_base_from_children(a, node, source, base_types); } diff --git a/src/pipeline/embedding.c b/src/pipeline/embedding.c new file mode 100644 index 0000000..6daa008 --- /dev/null +++ b/src/pipeline/embedding.c @@ -0,0 +1,498 @@ +/* + * embedding.c — Semantic embedding generation via HTTP API + RRF hybrid search. + * + * Uses Mongoose for synchronous HTTP POST to OpenAI-compatible /v1/embeddings. + * Uses yyjson for JSON serialization/deserialization. + */ + +#include "pipeline/embedding.h" +#include "foundation/log.h" +#include "foundation/platform.h" +#include "foundation/compat.h" + +#include +#include +#include + +#include +#include +#include + +/* Thread-local int-to-string buffer for log key-value pairs. */ +static _Thread_local char _itoa_buf[32]; +static const char *itoa_buf(int val) { + snprintf(_itoa_buf, sizeof(_itoa_buf), "%d", val); + return _itoa_buf; +} + +/* ── Configuration ──────────────────────────────────────────────── */ + +cbm_embedding_config_t cbm_embedding_get_config(void) { + cbm_embedding_config_t cfg = {0}; + cfg.url = getenv("CBM_EMBEDDING_URL"); + cfg.model = getenv("CBM_EMBEDDING_MODEL"); + if (!cfg.model) cfg.model = "nomic-embed-text"; + + const char *dims_str = getenv("CBM_EMBEDDING_DIMS"); + cfg.dims = dims_str ? atoi(dims_str) : 768; + if (cfg.dims <= 0) cfg.dims = 768; + + const char *batch_str = getenv("CBM_EMBEDDING_BATCH_SIZE"); + cfg.batch_size = batch_str ? 
atoi(batch_str) : 32; + if (cfg.batch_size <= 0) cfg.batch_size = 32; + + cfg.timeout_ms = 30000; + return cfg; +} + +bool cbm_embedding_is_configured(void) { + const char *url = getenv("CBM_EMBEDDING_URL"); + return url && url[0]; +} + +/* ── HTTP embedding client (Mongoose synchronous) ──────────────── */ + +/* State for the synchronous HTTP request. */ +typedef struct { + bool done; + bool error; + char *response_body; + int response_len; + const char *url; /* original URL for building the request */ + const char *content_type; + const char *body; + bool request_sent; +} http_state_t; + +static void http_handler(struct mg_connection *c, int ev, void *ev_data) { + http_state_t *state = (http_state_t *)c->fn_data; + + if (ev == MG_EV_CONNECT) { + /* Connection established — send the HTTP request */ + struct mg_str host = mg_url_host(state->url); + mg_printf(c, + "POST %s HTTP/1.1\r\n" + "Host: %.*s\r\n" + "Content-Type: %s\r\n" + "Content-Length: %d\r\n" + "\r\n" + "%s", + mg_url_uri(state->url), + (int)host.len, host.buf, + state->content_type, + (int)strlen(state->body), + state->body); + state->request_sent = true; + } else if (ev == MG_EV_HTTP_MSG) { + struct mg_http_message *hm = (struct mg_http_message *)ev_data; + state->response_body = malloc((size_t)hm->body.len + 1); + if (state->response_body) { + memcpy(state->response_body, hm->body.buf, hm->body.len); + state->response_body[hm->body.len] = '\0'; + state->response_len = (int)hm->body.len; + } + state->done = true; + c->is_draining = 1; + } else if (ev == MG_EV_ERROR) { + state->error = true; + state->done = true; + c->is_draining = 1; + } +} + +/* Synchronous HTTP POST. Returns allocated response body or NULL on error. + * Caller must free the returned string. 
*/ +static char *http_post_sync(const char *url, const char *content_type, + const char *body, int timeout_ms) { + struct mg_mgr mgr; + mg_mgr_init(&mgr); + + http_state_t state = {0}; + state.url = url; + state.content_type = content_type; + state.body = body; + + struct mg_connection *c = mg_http_connect(&mgr, url, http_handler, &state); + if (!c) { + mg_mgr_free(&mgr); + return NULL; + } + + /* Poll until done or timeout */ + int elapsed = 0; + while (!state.done && elapsed < timeout_ms) { + mg_mgr_poll(&mgr, 50); + elapsed += 50; + } + + mg_mgr_free(&mgr); + + if (state.error || !state.done) { + free(state.response_body); + return NULL; + } + return state.response_body; +} + +/* ── Embedding API calls ───────────────────────────────────────── */ + +/* Build the JSON request body for /v1/embeddings. + * {"model": "...", "input": ["text1", "text2", ...]} */ +static char *build_embedding_request(const char *model, const char **texts, int count) { + yyjson_mut_doc *doc = yyjson_mut_doc_new(NULL); + yyjson_mut_val *root = yyjson_mut_obj(doc); + yyjson_mut_doc_set_root(doc, root); + + yyjson_mut_obj_add_str(doc, root, "model", model); + + yyjson_mut_val *input = yyjson_mut_arr(doc); + for (int i = 0; i < count; i++) { + yyjson_mut_arr_add_str(doc, input, texts[i]); + } + yyjson_mut_obj_add_val(doc, root, "input", input); + + char *json = yyjson_mut_write(doc, 0, NULL); + yyjson_mut_doc_free(doc); + return json; +} + +/* Parse the JSON response from /v1/embeddings. + * Returns allocated float[count * dims] or NULL on error. 
*/ +static float *parse_embedding_response(const char *json, int expected_count, + int expected_dims) { + yyjson_doc *doc = yyjson_read(json, strlen(json), 0); + if (!doc) return NULL; + + yyjson_val *root = yyjson_doc_get_root(doc); + yyjson_val *data = yyjson_obj_get(root, "data"); + if (!data || !yyjson_is_arr(data)) { + yyjson_doc_free(doc); + return NULL; + } + + int arr_len = (int)yyjson_arr_size(data); + if (arr_len != expected_count) { + cbm_log_error("embedding.parse", "msg", "count_mismatch", + "expected", itoa_buf(expected_count), + "got", itoa_buf(arr_len)); + yyjson_doc_free(doc); + return NULL; + } + + float *result = calloc((size_t)(expected_count * expected_dims), sizeof(float)); + if (!result) { + yyjson_doc_free(doc); + return NULL; + } + + size_t idx, max; + yyjson_val *item; + yyjson_arr_foreach(data, idx, max, item) { + /* Each item: {"embedding": [...], "index": N} */ + yyjson_val *emb = yyjson_obj_get(item, "embedding"); + yyjson_val *index_val = yyjson_obj_get(item, "index"); + if (!emb || !yyjson_is_arr(emb)) continue; + + int emb_idx = index_val ? (int)yyjson_get_int(index_val) : (int)idx; + if (emb_idx < 0 || emb_idx >= expected_count) continue; + + int emb_dims = (int)yyjson_arr_size(emb); + if (emb_dims != expected_dims) { + /* Dimension mismatch — first occurrence, log and bail */ + if (idx == 0) { + cbm_log_error("embedding.parse", "msg", "dims_mismatch", + "expected", itoa_buf(expected_dims), + "got", itoa_buf(emb_dims)); + } + /* Still try to copy what we can */ + emb_dims = emb_dims < expected_dims ? 
emb_dims : expected_dims; + } + + float *dest = &result[emb_idx * expected_dims]; + size_t ei, emax; + yyjson_val *val; + int d = 0; + yyjson_arr_foreach(emb, ei, emax, val) { + if (d >= expected_dims) break; + dest[d++] = (float)yyjson_get_real(val); + } + } + + yyjson_doc_free(doc); + return result; +} + +float *cbm_embedding_embed_text(const cbm_embedding_config_t *cfg, const char *text) { + if (!cfg || !cfg->url || !text) return NULL; + const char *texts[] = {text}; + return cbm_embedding_embed_batch(cfg, texts, 1); +} + +float *cbm_embedding_embed_batch(const cbm_embedding_config_t *cfg, + const char **texts, int count) { + if (!cfg || !cfg->url || !texts || count <= 0) return NULL; + + /* Build URL: base_url + "/embeddings" */ + char url[1024]; + snprintf(url, sizeof(url), "%s/embeddings", cfg->url); + + /* Build JSON request */ + char *request_json = build_embedding_request(cfg->model, texts, count); + if (!request_json) return NULL; + + /* HTTP POST */ + char *response = http_post_sync(url, "application/json", + request_json, cfg->timeout_ms); + free(request_json); + + if (!response) { + cbm_log_error("embedding.http", "msg", "request_failed", "url", url); + return NULL; + } + + /* Parse response */ + float *embeddings = parse_embedding_response(response, count, cfg->dims); + free(response); + + return embeddings; +} + +/* ── Text generation ───────────────────────────────────────────── */ + +char *cbm_embedding_node_text(const cbm_node_t *node) { + if (!node || !node->name) return NULL; + + /* Extract directory from file_path */ + char dir[256] = ""; + if (node->file_path) { + const char *last_slash = strrchr(node->file_path, '/'); + if (last_slash && last_slash > node->file_path) { + int dlen = (int)(last_slash - node->file_path); + if (dlen >= (int)sizeof(dir)) dlen = (int)sizeof(dir) - 1; + memcpy(dir, node->file_path, (size_t)dlen); + dir[dlen] = '\0'; + } + } + + /* Extract filename from file_path */ + const char *filename = node->file_path; + if 
(filename) { + const char *last_slash = strrchr(filename, '/'); + if (last_slash) filename = last_slash + 1; + } + + /* Extract code snippet from properties JSON (first 500 chars) */ + char snippet[512] = ""; + if (node->properties_json && node->properties_json[0] != '{') { + /* properties_json IS the code sometimes */ + } else if (node->properties_json) { + yyjson_doc *pdoc = yyjson_read(node->properties_json, + strlen(node->properties_json), 0); + if (pdoc) { + yyjson_val *proot = yyjson_doc_get_root(pdoc); + yyjson_val *code = yyjson_obj_get(proot, "code"); + if (!code) code = yyjson_obj_get(proot, "content"); + if (!code) code = yyjson_obj_get(proot, "signature"); + if (code && yyjson_is_str(code)) { + const char *s = yyjson_get_str(code); + if (s) { + int slen = (int)strlen(s); + if (slen > 500) slen = 500; + memcpy(snippet, s, (size_t)slen); + snippet[slen] = '\0'; + } + } + yyjson_doc_free(pdoc); + } + } + + /* Build: "Label: name\nFile: filename\nDirectory: dir\n\nsnippet" */ + int buf_size = 2048; + char *buf = malloc((size_t)buf_size); + if (!buf) return NULL; + + int len = snprintf(buf, (size_t)buf_size, + "%s: %s\nFile: %s\nDirectory: %s", + node->label ? node->label : "Symbol", + node->name, + filename ? filename : "", + dir[0] ? 
dir : ""); + + if (snippet[0]) { + len += snprintf(buf + len, (size_t)(buf_size - len), "\n\n%s", snippet); + } + + return buf; +} + +/* ── RRF merge ─────────────────────────────────────────────────── */ + +int cbm_embedding_rrf_merge(const int64_t *bm25_ids, int bm25_count, + const cbm_vector_result_t *vec_results, int vec_count, + cbm_rrf_result_t **out, int *out_count) { + if (!out || !out_count) return CBM_STORE_ERR; + *out = NULL; + *out_count = 0; + + /* Estimate max unique results */ + int max_results = bm25_count + vec_count; + if (max_results == 0) return CBM_STORE_OK; + + cbm_rrf_result_t *results = calloc((size_t)max_results, sizeof(cbm_rrf_result_t)); + if (!results) return CBM_STORE_ERR; + + int count = 0; + + /* Add BM25 results with RRF scores */ + for (int i = 0; i < bm25_count; i++) { + double rrf_score = 1.0 / (CBM_RRF_K + i); + /* Check if already in results (shouldn't happen for BM25) */ + results[count].node_id = bm25_ids[i]; + results[count].rrf_score = rrf_score; + results[count].bm25_rank = i; + results[count].vec_rank = -1; + results[count].similarity = 0; + count++; + } + + /* Add vector results, merging with existing BM25 results */ + for (int i = 0; i < vec_count; i++) { + double rrf_score = 1.0 / (CBM_RRF_K + i); + int64_t nid = vec_results[i].node_id; + + /* Check if this node_id already exists from BM25 */ + bool found = false; + for (int j = 0; j < count; j++) { + if (results[j].node_id == nid) { + results[j].rrf_score += rrf_score; + results[j].vec_rank = i; + results[j].similarity = vec_results[i].similarity; + found = true; + break; + } + } + + if (!found) { + results[count].node_id = nid; + results[count].rrf_score = rrf_score; + results[count].bm25_rank = -1; + results[count].vec_rank = i; + results[count].similarity = vec_results[i].similarity; + count++; + } + } + + /* Sort by RRF score descending */ + for (int i = 0; i < count - 1; i++) { + for (int j = i + 1; j < count; j++) { + if (results[j].rrf_score > 
results[i].rrf_score) { + cbm_rrf_result_t tmp = results[i]; + results[i] = results[j]; + results[j] = tmp; + } + } + } + + *out = results; + *out_count = count; + return CBM_STORE_OK; +} + +/* ── Pipeline integration ──────────────────────────────────────── */ + +int cbm_embedding_generate_for_project(cbm_store_t *s, const char *project, bool force) { + if (!s || !project) return -1; + + cbm_embedding_config_t cfg = cbm_embedding_get_config(); + if (!cfg.url) { + cbm_log_info("embedding.skip", "reason", "not_configured"); + return 0; + } + + /* Query embeddable nodes */ + const char *sql = force + ? "SELECT id, project, label, name, qualified_name, file_path, " + "start_line, end_line, properties FROM nodes " + "WHERE project = ?1 " + "AND label IN ('Function','Method','Class','Interface','Route')" + : "SELECT id, project, label, name, qualified_name, file_path, " + "start_line, end_line, properties FROM nodes " + "WHERE project = ?1 " + "AND label IN ('Function','Method','Class','Interface','Route') " + "AND id NOT IN (SELECT node_id FROM embeddings WHERE project = ?1)"; + + sqlite3_stmt *stmt = NULL; + struct sqlite3 *db = cbm_store_get_db(s); + if (!db) return -1; + if (sqlite3_prepare_v2(db, sql, -1, &stmt, NULL) != SQLITE_OK) return -1; + sqlite3_bind_text(stmt, 1, project, -1, SQLITE_STATIC); + + /* Collect nodes into batches */ + int total_embedded = 0; + int batch_cap = cfg.batch_size; + int64_t *batch_ids = malloc((size_t)batch_cap * sizeof(int64_t)); + const char **batch_texts = malloc((size_t)batch_cap * sizeof(char *)); + int batch_count = 0; + + while (sqlite3_step(stmt) == SQLITE_ROW) { + cbm_node_t node = {0}; + node.id = sqlite3_column_int64(stmt, 0); + node.project = (const char *)sqlite3_column_text(stmt, 1); + node.label = (const char *)sqlite3_column_text(stmt, 2); + node.name = (const char *)sqlite3_column_text(stmt, 3); + node.qualified_name = (const char *)sqlite3_column_text(stmt, 4); + node.file_path = (const char 
*)sqlite3_column_text(stmt, 5); + node.start_line = sqlite3_column_int(stmt, 6); + node.end_line = sqlite3_column_int(stmt, 7); + node.properties_json = (const char *)sqlite3_column_text(stmt, 8); + + char *text = cbm_embedding_node_text(&node); + if (!text) continue; + + batch_ids[batch_count] = node.id; + batch_texts[batch_count] = text; + batch_count++; + + /* Flush batch when full */ + if (batch_count >= batch_cap) { + float *embeddings = cbm_embedding_embed_batch(&cfg, batch_texts, batch_count); + if (embeddings) { + cbm_store_upsert_embedding_batch(s, batch_ids, project, + embeddings, cfg.dims, batch_count); + total_embedded += batch_count; + free(embeddings); + } else { + cbm_log_error("embedding.batch", "msg", "failed", + "batch_size", itoa_buf(batch_count)); + } + + /* Free batch texts */ + for (int i = 0; i < batch_count; i++) { + free((void *)batch_texts[i]); + } + batch_count = 0; + } + } + + /* Flush remaining batch */ + if (batch_count > 0) { + float *embeddings = cbm_embedding_embed_batch(&cfg, batch_texts, batch_count); + if (embeddings) { + cbm_store_upsert_embedding_batch(s, batch_ids, project, + embeddings, cfg.dims, batch_count); + total_embedded += batch_count; + free(embeddings); + } + for (int i = 0; i < batch_count; i++) { + free((void *)batch_texts[i]); + } + } + + sqlite3_finalize(stmt); + free(batch_ids); + free(batch_texts); + + cbm_log_info("embedding.done", "project", project, + "embedded", itoa_buf(total_embedded)); + return total_embedded; +} diff --git a/src/pipeline/embedding.h b/src/pipeline/embedding.h new file mode 100644 index 0000000..5eb2179 --- /dev/null +++ b/src/pipeline/embedding.h @@ -0,0 +1,81 @@ +/* + * embedding.h — Semantic embedding generation and hybrid search. + * + * Generates embeddings via HTTP POST to an OpenAI-compatible /v1/embeddings + * endpoint (Ollama, llamafile, OpenAI, etc.). 
Configuration via env vars: + * CBM_EMBEDDING_URL — Base URL (e.g., http://localhost:11434/v1) + * CBM_EMBEDDING_MODEL — Model name (e.g., nomic-embed-text) + * CBM_EMBEDDING_DIMS — Expected vector dimensions (default: 768) + * + * When CBM_EMBEDDING_URL is not set, all embedding functions are no-ops. + */ +#ifndef CBM_EMBEDDING_H +#define CBM_EMBEDDING_H + +#include "store/store.h" +#include + +/* ── Configuration ──────────────────────────────────────────────── */ + +typedef struct { + const char *url; /* CBM_EMBEDDING_URL (NULL = disabled) */ + const char *model; /* CBM_EMBEDDING_MODEL */ + int dims; /* CBM_EMBEDDING_DIMS (default 768) */ + int batch_size; /* texts per HTTP request (default 32) */ + int timeout_ms; /* HTTP timeout (default 30000) */ +} cbm_embedding_config_t; + +/* Read config from environment variables. Returns config with url=NULL if disabled. */ +cbm_embedding_config_t cbm_embedding_get_config(void); + +/* Check if embedding is configured (CBM_EMBEDDING_URL is set). */ +bool cbm_embedding_is_configured(void); + +/* ── Embedding generation ──────────────────────────────────────── */ + +/* Embed a single text string. Returns allocated float[dims] or NULL on error. + * Caller must free the returned array. */ +float *cbm_embedding_embed_text(const cbm_embedding_config_t *cfg, const char *text); + +/* Embed multiple texts in a single HTTP request. + * Returns allocated float[count * dims] or NULL on error. + * Caller must free the returned array. */ +float *cbm_embedding_embed_batch(const cbm_embedding_config_t *cfg, + const char **texts, int count); + +/* ── Text generation (node → embeddable text) ──────────────────── */ + +/* Generate embeddable text for a node: "Label: name\nFile: path\nDir: dir\n\n" + * Returns allocated string. Caller must free. */ +char *cbm_embedding_node_text(const cbm_node_t *node); + +/* ── Hybrid search (BM25 + vector + RRF merge) ────────────────── */ + +/* RRF constant (from IR literature). 
*/ +#define CBM_RRF_K 60 + +/* Merged search result with combined RRF score. */ +typedef struct { + int64_t node_id; + double rrf_score; /* combined RRF score (higher = better) */ + double bm25_rank; /* rank in BM25 results (-1 if not found by BM25) */ + double vec_rank; /* rank in vector results (-1 if not found by vector) */ + double similarity; /* cosine similarity (0 if not found by vector) */ +} cbm_rrf_result_t; + +/* Merge BM25 search results with vector search results using RRF (k=60). + * bm25_ids: node IDs from BM25 search, in ranked order (best first). + * vec_results: vector search results from cbm_store_vector_search. + * Returns allocated array sorted by combined RRF score. Caller frees. */ +int cbm_embedding_rrf_merge(const int64_t *bm25_ids, int bm25_count, + const cbm_vector_result_t *vec_results, int vec_count, + cbm_rrf_result_t **out, int *out_count); + +/* ── Pipeline integration ──────────────────────────────────────── */ + +/* Generate embeddings for all embeddable nodes in a project. + * Skips nodes that already have embeddings unless force=true. + * Returns number of embeddings generated, or -1 on error. */ +int cbm_embedding_generate_for_project(cbm_store_t *s, const char *project, bool force); + +#endif /* CBM_EMBEDDING_H */ diff --git a/src/pipeline/pass_definitions.c b/src/pipeline/pass_definitions.c index 5929a05..e498df7 100644 --- a/src/pipeline/pass_definitions.c +++ b/src/pipeline/pass_definitions.c @@ -216,9 +216,10 @@ static void process_def(cbm_pipeline_ctx_t *ctx, const CBMDefinition *def, const int64_t node_id = cbm_gbuf_upsert_node( ctx->gbuf, def->label ? def->label : "Function", def->name, def->qualified_name, def->file_path ? 
def->file_path : rel, (int)def->start_line, (int)def->end_line, props); + /* Register callable symbols + Interface (for C#/Java INHERITS resolution) */ if (node_id > 0 && def->label && (strcmp(def->label, "Function") == 0 || strcmp(def->label, "Method") == 0 || - strcmp(def->label, "Class") == 0)) { + strcmp(def->label, "Class") == 0 || strcmp(def->label, "Interface") == 0)) { cbm_registry_add(ctx->registry, def->name, def->qualified_name, def->label); } char *file_qn = cbm_pipeline_fqn_compute(ctx->project_name, rel, "__file__"); diff --git a/src/pipeline/pass_parallel.c b/src/pipeline/pass_parallel.c index 68843df..f2a0d9c 100644 --- a/src/pipeline/pass_parallel.c +++ b/src/pipeline/pass_parallel.c @@ -632,7 +632,7 @@ static int register_and_link_def(cbm_pipeline_ctx_t *ctx, const CBMDefinition *d return 0; } if (strcmp(def->label, "Function") == 0 || strcmp(def->label, "Method") == 0 || - strcmp(def->label, "Class") == 0) { + strcmp(def->label, "Class") == 0 || strcmp(def->label, "Interface") == 0) { cbm_registry_add(ctx->registry, def->name, def->qualified_name, def->label); (*reg_entries)++; } diff --git a/src/pipeline/pipeline.c b/src/pipeline/pipeline.c index 5afc3dd..dd88a82 100644 --- a/src/pipeline/pipeline.c +++ b/src/pipeline/pipeline.c @@ -21,6 +21,7 @@ enum { CBM_DIR_PERMS = 0755, PL_RING = 4, PL_RING_MASK = 3, PL_SEQ_PASSES = 5, P #include "store/store.h" #include "discover/discover.h" #include "discover/userconfig.h" +#include "pipeline/embedding.h" #include "foundation/platform.h" #include "foundation/compat_fs.h" #include "foundation/log.h" @@ -780,6 +781,38 @@ int cbm_pipeline_run(cbm_pipeline_t *p) { goto cleanup; } + /* ── Post-dump passes: FTS5, processes, channels, embeddings ── */ + { + char db_path[1024]; + if (p->db_path) { + snprintf(db_path, sizeof(db_path), "%s", p->db_path); + } else { + const char *cdir = cbm_resolve_cache_dir(); + if (!cdir) cdir = cbm_tmpdir(); + snprintf(db_path, sizeof(db_path), "%s/%s.db", cdir, p->project_name); 
+ } + + cbm_store_t *post_store = cbm_store_open_path(db_path); + if (post_store) { + /* FTS5 backfill with camelCase splitting */ + cbm_store_exec(post_store, "DELETE FROM nodes_fts;"); + cbm_store_exec(post_store, + "INSERT INTO nodes_fts(rowid, name, qualified_name, label, file_path) " + "SELECT id, cbm_camel_split(name), qualified_name, label, file_path FROM nodes;"); + + /* Embedding generation (if configured) */ + if (cbm_embedding_is_configured()) { + int nemb = cbm_embedding_generate_for_project(post_store, p->project_name, false); + if (nemb > 0) { + cbm_log_info("pass.done", "pass", "embeddings", + "generated", itoa_buf(nemb)); + } + } + + cbm_store_close(post_store); + } + } + cbm_log_info("pipeline.done", "nodes", itoa_buf(cbm_gbuf_node_count(p->gbuf)), "edges", itoa_buf(cbm_gbuf_edge_count(p->gbuf)), "elapsed_ms", itoa_buf((int)elapsed_ms(t0))); diff --git a/src/pipeline/pipeline_incremental.c b/src/pipeline/pipeline_incremental.c index 3978b24..0768f8c 100644 --- a/src/pipeline/pipeline_incremental.c +++ b/src/pipeline/pipeline_incremental.c @@ -269,6 +269,13 @@ static void dump_and_persist(cbm_gbuf_t *gbuf, const char *db_path, const char * cbm_store_t *hash_store = cbm_store_open_path(db_path); if (hash_store) { persist_hashes(hash_store, project, files, file_count); + + /* Rebuild FTS5 index: btree dump bypasses triggers */ + cbm_store_exec(hash_store, "DELETE FROM nodes_fts;"); + cbm_store_exec(hash_store, + "INSERT INTO nodes_fts(rowid, name, qualified_name, label, file_path) " + "SELECT id, cbm_camel_split(name), qualified_name, label, file_path FROM nodes;"); + cbm_store_close(hash_store); } } diff --git a/src/store/cross_repo.c b/src/store/cross_repo.c new file mode 100644 index 0000000..9f0af44 --- /dev/null +++ b/src/store/cross_repo.c @@ -0,0 +1,889 @@ +/* + * cross_repo.c — Cross-repository index: build, search, channel matching. 
+ * + * Scans all per-project .db files to build a unified _cross_repo.db with: + * - cross_channels: all channel emit/listen from every repo + * - cross_nodes: Function/Method/Class/Interface/Route stubs from all repos + * - cross_nodes_fts: BM25 FTS5 index with camelCase splitting + * - cross_embeddings: semantic vectors copied from per-project DBs + * + * The cross-repo DB is a standard SQLite file — no ATTACH needed. + * Built by scanning each project DB via cbm_store_open_path_query(). + */ + +#include "store/cross_repo.h" +#include "store/store.h" +#include "foundation/log.h" +#include "foundation/platform.h" +#include "foundation/compat.h" +#include "foundation/compat_fs.h" + +#include +#include +#include +#include +#include +#include + +/* ── Helpers ────────────────────────────────────────────────────── */ + +static _Thread_local char _itoa[32]; +static const char *itoa_cr(int v) { snprintf(_itoa, sizeof(_itoa), "%d", v); return _itoa; } + +static const char *get_cross_repo_path(void) { + static char path[1024]; + const char *home = getenv("HOME"); + if (!home) home = getenv("USERPROFILE"); + if (!home) return NULL; + snprintf(path, sizeof(path), "%s/.cache/codebase-memory-mcp/_cross_repo.db", home); + return path; +} + +static const char *get_cache_dir(void) { + static char dir[1024]; + const char *home = getenv("HOME"); + if (!home) home = getenv("USERPROFILE"); + if (!home) return NULL; + snprintf(dir, sizeof(dir), "%s/.cache/codebase-memory-mcp", home); + return dir; +} + +/* CamelCase splitter — same as store.c. Duplicated to keep cross_repo self-contained. */ +static void sqlite_camel_split_cr(sqlite3_context *ctx, int argc, sqlite3_value **argv) { + (void)argc; + const char *input = (const char *)sqlite3_value_text(argv[0]); + if (!input || !input[0]) { + sqlite3_result_text(ctx, input ? 
input : "", -1, SQLITE_TRANSIENT); + return; + } + char buf[2048]; + int len = snprintf(buf, sizeof(buf), "%s ", input); + for (int i = 0; input[i] && len < (int)sizeof(buf) - 2; i++) { + if (i > 0) { + bool split = false; + if (input[i] >= 'A' && input[i] <= 'Z' && + input[i - 1] >= 'a' && input[i - 1] <= 'z') split = true; + if (input[i] >= 'A' && input[i] <= 'Z' && + input[i - 1] >= 'A' && input[i - 1] <= 'Z' && + input[i + 1] >= 'a' && input[i + 1] <= 'z') split = true; + if (split) buf[len++] = ' '; + } + buf[len++] = input[i]; + } + buf[len] = '\0'; + sqlite3_result_text(ctx, buf, len, SQLITE_TRANSIENT); +} + +/* Cosine similarity — same as store.c. */ +static void sqlite_cosine_sim_cr(sqlite3_context *ctx, int argc, sqlite3_value **argv) { + (void)argc; + if (sqlite3_value_type(argv[0]) != SQLITE_BLOB || + sqlite3_value_type(argv[1]) != SQLITE_BLOB) { + sqlite3_result_null(ctx); return; + } + const float *a = (const float *)sqlite3_value_blob(argv[0]); + const float *b = (const float *)sqlite3_value_blob(argv[1]); + int a_bytes = sqlite3_value_bytes(argv[0]); + int b_bytes = sqlite3_value_bytes(argv[1]); + if (a_bytes != b_bytes || a_bytes == 0 || (a_bytes % (int)sizeof(float)) != 0) { + sqlite3_result_null(ctx); return; + } + int dims = a_bytes / (int)sizeof(float); + float dot = 0.0f, na = 0.0f, nb = 0.0f; + for (int i = 0; i < dims; i++) { + dot += a[i] * b[i]; na += a[i] * a[i]; nb += b[i] * b[i]; + } + if (na == 0.0f || nb == 0.0f) { sqlite3_result_double(ctx, 0.0); return; } + sqlite3_result_double(ctx, (double)dot / (sqrt((double)na) * sqrt((double)nb))); +} + +/* ── Cross-Repo Handle ──────────────────────────────────────────── */ + +struct cbm_cross_repo { + sqlite3 *db; +}; + +cbm_cross_repo_t *cbm_cross_repo_open(void) { + const char *path = get_cross_repo_path(); + if (!path) return NULL; + + sqlite3 *db = NULL; + if (sqlite3_open_v2(path, &db, SQLITE_OPEN_READONLY | SQLITE_OPEN_NOMUTEX, NULL) != SQLITE_OK) { + if (db) sqlite3_close(db); + return 
NULL; + } + + /* Register custom functions */ + sqlite3_create_function(db, "cbm_camel_split", 1, SQLITE_UTF8 | SQLITE_DETERMINISTIC, + NULL, sqlite_camel_split_cr, NULL, NULL); + sqlite3_create_function(db, "cbm_cosine_sim", 2, SQLITE_UTF8 | SQLITE_DETERMINISTIC, + NULL, sqlite_cosine_sim_cr, NULL, NULL); + + cbm_cross_repo_t *cr = calloc(1, sizeof(cbm_cross_repo_t)); + if (!cr) { sqlite3_close(db); return NULL; } + cr->db = db; + return cr; +} + +void cbm_cross_repo_close(cbm_cross_repo_t *cr) { + if (!cr) return; + if (cr->db) sqlite3_close(cr->db); + free(cr); +} + +/* ── Build ──────────────────────────────────────────────────────── */ + +static const char *CROSS_SCHEMA = + "CREATE TABLE IF NOT EXISTS cross_channels (" + " id INTEGER PRIMARY KEY AUTOINCREMENT," + " channel_name TEXT NOT NULL," + " transport TEXT NOT NULL," + " direction TEXT NOT NULL," + " project TEXT NOT NULL," + " file_path TEXT NOT NULL DEFAULT ''," + " function_name TEXT NOT NULL DEFAULT ''," + " node_id INTEGER NOT NULL DEFAULT 0" + ");" + "CREATE INDEX IF NOT EXISTS idx_xch_name ON cross_channels(channel_name);" + "CREATE INDEX IF NOT EXISTS idx_xch_project ON cross_channels(project);" + "CREATE TABLE IF NOT EXISTS cross_nodes (" + " id INTEGER PRIMARY KEY AUTOINCREMENT," + " project TEXT NOT NULL," + " orig_id INTEGER NOT NULL," + " label TEXT NOT NULL," + " name TEXT NOT NULL," + " qualified_name TEXT NOT NULL," + " file_path TEXT NOT NULL DEFAULT ''" + ");" + "CREATE INDEX IF NOT EXISTS idx_xn_project ON cross_nodes(project);" + "CREATE INDEX IF NOT EXISTS idx_xn_name ON cross_nodes(name);" + "CREATE INDEX IF NOT EXISTS idx_xn_proj_orig ON cross_nodes(project, orig_id);" + "CREATE TABLE IF NOT EXISTS cross_embeddings (" + " node_id INTEGER PRIMARY KEY," + " project TEXT NOT NULL," + " embedding BLOB NOT NULL," + " dimensions INTEGER NOT NULL" + ");" + "CREATE INDEX IF NOT EXISTS idx_xe_project ON cross_embeddings(project);" + "CREATE TABLE IF NOT EXISTS cross_meta (" + " key TEXT 
PRIMARY KEY,"
    " value TEXT NOT NULL"
    ");";

/* Contentless FTS5 index over cross_nodes; rows are inserted manually
 * after the copy pass (see cbm_cross_repo_build) and ranked with bm25(). */
static const char *CROSS_FTS =
    "CREATE VIRTUAL TABLE IF NOT EXISTS cross_nodes_fts USING fts5("
    "name, qualified_name, label, file_path, project,"
    "content='',"
    "tokenize='unicode61 remove_diacritics 2'"
    ");";

/* Rebuild the unified _cross_repo.db from every per-project .db found in
 * the cache directory: copies channels, embeddable nodes and embeddings,
 * builds the FTS index, and records build metadata.
 * Returns stats; on fatal error stats.repos_scanned is -1. */
cbm_cross_repo_stats_t cbm_cross_repo_build(void) {
    cbm_cross_repo_stats_t stats = {0};
    struct timespec t0;
    clock_gettime(CLOCK_MONOTONIC, &t0);

    const char *db_path = get_cross_repo_path();
    const char *cache_dir = get_cache_dir();
    if (!db_path || !cache_dir) {
        stats.repos_scanned = -1;
        return stats;
    }

    /* Delete old cross-repo DB and create fresh.
     * NOTE(review): companion -wal/-shm files are not removed here —
     * presumably harmless since the DB is recreated from scratch, but
     * verify there is no stale-WAL replay on any supported platform. */
    remove(db_path);

    sqlite3 *db = NULL;
    if (sqlite3_open_v2(db_path, &db,
                        SQLITE_OPEN_READWRITE | SQLITE_OPEN_CREATE | SQLITE_OPEN_NOMUTEX,
                        NULL) != SQLITE_OK) {
        if (db) sqlite3_close(db);
        stats.repos_scanned = -1;
        return stats;
    }

    /* Register custom functions for FTS5 */
    sqlite3_create_function(db, "cbm_camel_split", 1, SQLITE_UTF8 | SQLITE_DETERMINISTIC,
                            NULL, sqlite_camel_split_cr, NULL, NULL);

    /* Pragmas for fast bulk write — synchronous=OFF is acceptable because
     * the file is a rebuildable cache. */
    sqlite3_exec(db, "PRAGMA journal_mode=WAL; PRAGMA synchronous=OFF; "
                 "PRAGMA cache_size=-32000;", NULL, NULL, NULL);

    /* Create schema */
    char *err = NULL;
    sqlite3_exec(db, CROSS_SCHEMA, NULL, NULL, &err);
    if (err) { sqlite3_free(err); err = NULL; }
    sqlite3_exec(db, CROSS_FTS, NULL, NULL, &err);
    if (err) { sqlite3_free(err); err = NULL; }

    sqlite3_exec(db, "BEGIN TRANSACTION", NULL, NULL, NULL);

    /* Scan all project DBs in cache directory */
    cbm_dir_t *dir = cbm_opendir(cache_dir);
    if (!dir) {
        sqlite3_close(db);
        stats.repos_scanned = -1;
        return stats;
    }

    /* Prepared statements for inserting into cross-repo DB */
    sqlite3_stmt *ins_ch = NULL;
    sqlite3_prepare_v2(db,
        "INSERT INTO cross_channels(channel_name, transport, direction, project, "
        "file_path, function_name, node_id) VALUES(?1,?2,?3,?4,?5,?6,?7)",
        -1, &ins_ch, NULL);

    sqlite3_stmt *ins_node = NULL;
    sqlite3_prepare_v2(db,
        "INSERT INTO cross_nodes(project, orig_id, label, name, qualified_name, file_path) "
        "VALUES(?1,?2,?3,?4,?5,?6)",
        -1, &ins_node, NULL);

    sqlite3_stmt *ins_emb = NULL;
    sqlite3_prepare_v2(db,
        "INSERT INTO cross_embeddings(node_id, project, embedding, dimensions) "
        "VALUES(?1,?2,?3,?4)",
        -1, &ins_emb, NULL);

    cbm_dirent_t *dent;
    while ((dent = cbm_readdir(dir)) != NULL) {
        const char *entry = dent->name;
        /* Skip non-.db files, _cross_repo.db, _config.db.
         * (The "-wal"/"-shm" checks are redundant after the ".db" suffix
         * test — such files never end in ".db" — but kept as belt-and-braces.) */
        size_t elen = strlen(entry);
        if (elen < 4 || strcmp(entry + elen - 3, ".db") != 0) continue;
        if (strstr(entry, "_cross_repo") || strstr(entry, "_config")) continue;
        if (strstr(entry, "-wal") || strstr(entry, "-shm")) continue;

        char proj_db_path[2048];
        snprintf(proj_db_path, sizeof(proj_db_path), "%s/%s", cache_dir, entry);

        /* Derive project name from filename (remove .db suffix) */
        char project_name[512];
        snprintf(project_name, sizeof(project_name), "%.*s", (int)(elen - 3), entry);

        /* Open project DB read-only */
        sqlite3 *pdb = NULL;
        if (sqlite3_open_v2(proj_db_path, &pdb,
                            SQLITE_OPEN_READONLY | SQLITE_OPEN_NOMUTEX, NULL) != SQLITE_OK) {
            if (pdb) sqlite3_close(pdb);
            continue;
        }

        stats.repos_scanned++;

        /* Copy channels — SELECT column order matches ins_ch's ?1..?7;
         * integer columns are bound as int64, everything else as text. */
        {
            sqlite3_stmt *sel = NULL;
            if (sqlite3_prepare_v2(pdb,
                "SELECT channel_name, transport, direction, project, file_path, "
                "function_name, node_id FROM channels", -1, &sel, NULL) == SQLITE_OK) {
                while (sqlite3_step(sel) == SQLITE_ROW) {
                    sqlite3_reset(ins_ch);
                    for (int c = 0; c < 7; c++) {
                        if (sqlite3_column_type(sel, c) == SQLITE_INTEGER)
                            sqlite3_bind_int64(ins_ch, c + 1, sqlite3_column_int64(sel, c));
                        else
                            sqlite3_bind_text(ins_ch, c + 1,
                                (const char *)sqlite3_column_text(sel, c), -1, SQLITE_TRANSIENT);
                    }
                    sqlite3_step(ins_ch);
                    stats.channels_copied++;
                }
                sqlite3_finalize(sel);
            }
        }

        /* Copy embeddable nodes */
        {
            sqlite3_stmt *sel = NULL;
            if (sqlite3_prepare_v2(pdb,
                "SELECT id, label, name, qualified_name, file_path FROM nodes "
                "WHERE label IN ('Function','Method','Class','Interface','Route')",
                -1, &sel, NULL) == SQLITE_OK) {
                while (sqlite3_step(sel) == SQLITE_ROW) {
                    sqlite3_reset(ins_node);
                    sqlite3_bind_text(ins_node, 1, project_name, -1, SQLITE_TRANSIENT);
                    sqlite3_bind_int64(ins_node, 2, sqlite3_column_int64(sel, 0)); /* orig_id */
                    sqlite3_bind_text(ins_node, 3,
                        (const char *)sqlite3_column_text(sel, 1), -1, SQLITE_TRANSIENT);
                    sqlite3_bind_text(ins_node, 4,
                        (const char *)sqlite3_column_text(sel, 2), -1, SQLITE_TRANSIENT);
                    sqlite3_bind_text(ins_node, 5,
                        (const char *)sqlite3_column_text(sel, 3), -1, SQLITE_TRANSIENT);
                    sqlite3_bind_text(ins_node, 6,
                        (const char *)sqlite3_column_text(sel, 4), -1, SQLITE_TRANSIENT);
                    sqlite3_step(ins_node);
                    stats.nodes_copied++;
                }
                sqlite3_finalize(sel);
            }
        }

        /* Copy embeddings — join with cross_nodes via a single efficient query.
         * First ensure we have the index on (project, orig_id) for the join. */
        {
            sqlite3_stmt *sel = NULL;
            /* Use the per-project DB to read embeddings, then look up cross_nodes.id
             * via a prepared statement (reuse for all rows in this project). */
            sqlite3_stmt *lu_emb = NULL;
            sqlite3_prepare_v2(db,
                "SELECT id FROM cross_nodes WHERE project=?1 AND orig_id=?2",
                -1, &lu_emb, NULL);

            if (lu_emb && sqlite3_prepare_v2(pdb,
                "SELECT node_id, embedding, dimensions FROM embeddings",
                -1, &sel, NULL) == SQLITE_OK) {
                while (sqlite3_step(sel) == SQLITE_ROW) {
                    int64_t orig_id = sqlite3_column_int64(sel, 0);
                    sqlite3_reset(lu_emb);
                    sqlite3_bind_text(lu_emb, 1, project_name, -1, SQLITE_TRANSIENT);
                    sqlite3_bind_int64(lu_emb, 2, orig_id);
                    if (sqlite3_step(lu_emb) == SQLITE_ROW) {
                        int64_t cross_id = sqlite3_column_int64(lu_emb, 0);
                        sqlite3_reset(ins_emb);
                        sqlite3_bind_int64(ins_emb, 1, cross_id);
                        sqlite3_bind_text(ins_emb, 2, project_name, -1, SQLITE_TRANSIENT);
                        sqlite3_bind_blob(ins_emb, 3,
                            sqlite3_column_blob(sel, 1),
                            sqlite3_column_bytes(sel, 1), SQLITE_TRANSIENT);
                        sqlite3_bind_int(ins_emb, 4, sqlite3_column_int(sel, 2));
                        sqlite3_step(ins_emb);
                        stats.embeddings_copied++;
                    }
                }
                sqlite3_finalize(sel);
            }
            if (lu_emb) sqlite3_finalize(lu_emb);
        }

        sqlite3_close(pdb);
    }
    cbm_closedir(dir);

    if (ins_ch) sqlite3_finalize(ins_ch);
    if (ins_node) sqlite3_finalize(ins_node);
    if (ins_emb) sqlite3_finalize(ins_emb);

    /* Suppress file-level ghost channel entries when named entries exist */
    sqlite3_exec(db,
        "DELETE FROM cross_channels WHERE function_name = '(file-level)' "
        "AND EXISTS (SELECT 1 FROM cross_channels c2 "
        "WHERE c2.channel_name = cross_channels.channel_name "
        "AND c2.file_path = cross_channels.file_path "
        "AND c2.project = cross_channels.project "
        "AND c2.direction = cross_channels.direction "
        "AND c2.function_name != '(file-level)')", NULL, NULL, NULL);

    /* Build FTS5 index with camelCase splitting.
     * rowid is set to cross_nodes.id so search results can JOIN back. */
    sqlite3_exec(db, "DELETE FROM cross_nodes_fts", NULL, NULL, NULL);
    sqlite3_exec(db,
        "INSERT INTO cross_nodes_fts(rowid, name, qualified_name, label, file_path, project) "
        "SELECT id, cbm_camel_split(name), qualified_name, label, file_path, project "
        "FROM cross_nodes",
        NULL, NULL, NULL);

    /* Count cross-repo channel matches */
    {
        sqlite3_stmt *cnt = NULL;
        if (sqlite3_prepare_v2(db,
            "SELECT COUNT(DISTINCT e.channel_name) FROM cross_channels e "
            "JOIN cross_channels l ON e.channel_name = l.channel_name "
            "WHERE e.direction = 'emit' AND l.direction = 'listen' "
            "AND e.project != l.project",
            -1, &cnt, NULL) == SQLITE_OK) {
            if (sqlite3_step(cnt) == SQLITE_ROW) {
                stats.cross_repo_matches = sqlite3_column_int(cnt, 0);
            }
            sqlite3_finalize(cnt);
        }
    }

    /* Store metadata: ISO-8601 UTC build timestamp and repo count */
    {
        time_t now = time(NULL);
        char ts[64];
        strftime(ts, sizeof(ts), "%Y-%m-%dT%H:%M:%SZ", gmtime(&now));
        sqlite3_stmt *meta = NULL;
        sqlite3_prepare_v2(db,
            "INSERT OR REPLACE INTO cross_meta(key, value) VALUES(?1, ?2)",
            -1, &meta, NULL);
        if (meta) {
            sqlite3_bind_text(meta, 1, "built_at", -1, SQLITE_STATIC);
            sqlite3_bind_text(meta, 2, ts, -1, SQLITE_TRANSIENT);
            sqlite3_step(meta);
            sqlite3_reset(meta);
            char buf[32];
            snprintf(buf, sizeof(buf), "%d", stats.repos_scanned);
            sqlite3_bind_text(meta, 1, "repos", -1, SQLITE_STATIC);
            sqlite3_bind_text(meta, 2, buf, -1, SQLITE_TRANSIENT);
            sqlite3_step(meta);
            sqlite3_finalize(meta);
        }
    }

    sqlite3_exec(db, "COMMIT", NULL, NULL, NULL);
    sqlite3_exec(db, "PRAGMA synchronous=NORMAL", NULL, NULL, NULL);
    sqlite3_close(db);

    struct timespec t1;
    clock_gettime(CLOCK_MONOTONIC, &t1);
    stats.build_time_ms = (double)(t1.tv_sec - t0.tv_sec) * 1000.0 +
                          (double)(t1.tv_nsec - t0.tv_nsec) / 1000000.0;

    /* NOTE(review): this assumes itoa_cr() returns distinct storage per
     * call (e.g. rotating buffers); if it reuses one static buffer, all
     * five logged values collapse to the last — verify its contract. */
    cbm_log_info("cross_repo.build", "repos", itoa_cr(stats.repos_scanned),
                 "nodes", itoa_cr(stats.nodes_copied),
                 "channels", itoa_cr(stats.channels_copied),
                 "embeddings", itoa_cr(stats.embeddings_copied),
                 "cross_matches", itoa_cr(stats.cross_repo_matches));

    return stats;
}

/* ── Cross-Repo Search ──────────────────────────────────────────── */

/* Portable strdup: heap copy of s; NULL for NULL input or OOM. */
static char *heap_dup(const char *s) {
    if (!s) return NULL;
size_t len = strlen(s); + char *d = malloc(len + 1); + if (d) { memcpy(d, s, len + 1); } + return d; +} + +int cbm_cross_repo_search(cbm_cross_repo_t *cr, const char *query, + const float *query_vec, int dims, + int limit, cbm_cross_search_output_t *out) { + if (!cr || !cr->db || !query || !out) return CBM_STORE_ERR; + memset(out, 0, sizeof(*out)); + if (limit <= 0) limit = 50; + + /* Tokenize query for FTS5: split on whitespace, join with OR */ + char fts_query[1024]; + { + char tmp[1024]; + snprintf(tmp, sizeof(tmp), "%s", query); + int fq_len = 0; + char *tok = strtok(tmp, " \t\n"); + while (tok && fq_len < (int)sizeof(fts_query) - 20) { + if (fq_len > 0) fq_len += snprintf(fts_query + fq_len, + sizeof(fts_query) - (size_t)fq_len, " OR "); + fq_len += snprintf(fts_query + fq_len, + sizeof(fts_query) - (size_t)fq_len, "%s", tok); + tok = strtok(NULL, " \t\n"); + } + fts_query[fq_len] = '\0'; + } + + /* BM25 search */ + int bm25_cap = limit * 2; + int64_t *bm25_ids = calloc((size_t)bm25_cap, sizeof(int64_t)); + int bm25_count = 0; + + { + sqlite3_stmt *stmt = NULL; + const char *sql = + "SELECT cn.id, cn.project, cn.orig_id, cn.label, cn.name, " + "cn.qualified_name, cn.file_path, " + "(bm25(cross_nodes_fts) " + " - CASE WHEN cn.label IN ('Function','Method') THEN 10.0 " + " WHEN cn.label IN ('Class','Interface') THEN 5.0 " + " WHEN cn.label = 'Route' THEN 8.0 " + " ELSE 0.0 END) AS rank " + "FROM cross_nodes_fts f " + "JOIN cross_nodes cn ON cn.id = f.rowid " + "WHERE cross_nodes_fts MATCH ?1 " + "ORDER BY rank LIMIT ?2"; + if (sqlite3_prepare_v2(cr->db, sql, -1, &stmt, NULL) == SQLITE_OK) { + sqlite3_bind_text(stmt, 1, fts_query, -1, SQLITE_TRANSIENT); + sqlite3_bind_int(stmt, 2, bm25_cap); + while (sqlite3_step(stmt) == SQLITE_ROW && bm25_count < bm25_cap) { + bm25_ids[bm25_count++] = sqlite3_column_int64(stmt, 0); + } + sqlite3_finalize(stmt); + } + } + + /* Vector search (if query_vec provided and embeddings exist) */ + int vec_cap = limit; + int64_t *vec_ids 
= NULL; + double *vec_sims = NULL; + int vec_count = 0; + + if (query_vec && dims > 0) { + int emb_count = 0; + { + sqlite3_stmt *cnt = NULL; + sqlite3_prepare_v2(cr->db, "SELECT COUNT(*) FROM cross_embeddings", -1, &cnt, NULL); + if (cnt && sqlite3_step(cnt) == SQLITE_ROW) emb_count = sqlite3_column_int(cnt, 0); + if (cnt) sqlite3_finalize(cnt); + } + if (emb_count > 0) { + vec_ids = calloc((size_t)vec_cap, sizeof(int64_t)); + vec_sims = calloc((size_t)vec_cap, sizeof(double)); + + sqlite3_stmt *stmt = NULL; + const char *sql = + "SELECT ce.node_id, cbm_cosine_sim(?1, ce.embedding) AS sim " + "FROM cross_embeddings ce " + "WHERE sim > 0.3 " + "ORDER BY sim DESC LIMIT ?2"; + if (sqlite3_prepare_v2(cr->db, sql, -1, &stmt, NULL) == SQLITE_OK) { + sqlite3_bind_blob(stmt, 1, query_vec, dims * (int)sizeof(float), SQLITE_STATIC); + sqlite3_bind_int(stmt, 2, vec_cap); + while (sqlite3_step(stmt) == SQLITE_ROW && vec_count < vec_cap) { + vec_ids[vec_count] = sqlite3_column_int64(stmt, 0); + vec_sims[vec_count] = sqlite3_column_double(stmt, 1); + vec_count++; + } + sqlite3_finalize(stmt); + } + out->used_vector = (vec_count > 0); + } + } + + /* RRF merge (k=60) */ + int merge_cap = bm25_count + vec_count; + if (merge_cap == 0) { + free(bm25_ids); free(vec_ids); free(vec_sims); + return CBM_STORE_OK; + } + + typedef struct { int64_t id; double score; double sim; } rrf_entry_t; + rrf_entry_t *merged = calloc((size_t)merge_cap, sizeof(rrf_entry_t)); + int merge_count = 0; + + for (int i = 0; i < bm25_count; i++) { + merged[merge_count].id = bm25_ids[i]; + merged[merge_count].score = 1.0 / (60 + i); + merged[merge_count].sim = 0; + merge_count++; + } + for (int i = 0; i < vec_count; i++) { + bool found = false; + for (int j = 0; j < merge_count; j++) { + if (merged[j].id == vec_ids[i]) { + merged[j].score += 1.0 / (60 + i); + merged[j].sim = vec_sims[i]; + found = true; + break; + } + } + if (!found && merge_count < merge_cap) { + merged[merge_count].id = vec_ids[i]; + 
merged[merge_count].score = 1.0 / (60 + i); + merged[merge_count].sim = vec_sims[i]; + merge_count++; + } + } + + /* Sort by RRF score descending */ + for (int i = 0; i < merge_count - 1; i++) { + for (int j = i + 1; j < merge_count; j++) { + if (merged[j].score > merged[i].score) { + rrf_entry_t tmp = merged[i]; merged[i] = merged[j]; merged[j] = tmp; + } + } + } + + /* Build output — look up node details from cross_nodes */ + int result_count = merge_count < limit ? merge_count : limit; + out->results = calloc((size_t)result_count, sizeof(cbm_cross_search_result_t)); + out->total = merge_count; + + sqlite3_stmt *lu = NULL; + sqlite3_prepare_v2(cr->db, + "SELECT project, orig_id, label, name, qualified_name, file_path " + "FROM cross_nodes WHERE id = ?1", -1, &lu, NULL); + + for (int i = 0; i < result_count && lu; i++) { + sqlite3_reset(lu); + sqlite3_bind_int64(lu, 1, merged[i].id); + if (sqlite3_step(lu) == SQLITE_ROW) { + cbm_cross_search_result_t *r = &out->results[out->count]; + r->project = heap_dup((const char *)sqlite3_column_text(lu, 0)); + r->orig_id = sqlite3_column_int64(lu, 1); + r->label = heap_dup((const char *)sqlite3_column_text(lu, 2)); + r->name = heap_dup((const char *)sqlite3_column_text(lu, 3)); + r->qualified_name = heap_dup((const char *)sqlite3_column_text(lu, 4)); + r->file_path = heap_dup((const char *)sqlite3_column_text(lu, 5)); + r->score = merged[i].score; + r->similarity = merged[i].sim; + out->count++; + } + } + if (lu) sqlite3_finalize(lu); + + free(bm25_ids); free(vec_ids); free(vec_sims); free(merged); + return CBM_STORE_OK; +} + +void cbm_cross_search_free(cbm_cross_search_output_t *out) { + if (!out || !out->results) return; + for (int i = 0; i < out->count; i++) { + free((void *)out->results[i].project); + free((void *)out->results[i].label); + free((void *)out->results[i].name); + free((void *)out->results[i].qualified_name); + free((void *)out->results[i].file_path); + } + free(out->results); + memset(out, 0, sizeof(*out)); 
+} + +/* ── Cross-Repo Channel Matching ────────────────────────────────── */ + +int cbm_cross_repo_match_channels(cbm_cross_repo_t *cr, const char *channel_filter, + cbm_cross_channel_match_t **out, int *count) { + if (!cr || !cr->db || !out || !count) return CBM_STORE_ERR; + *out = NULL; + *count = 0; + + const char *sql = + "SELECT e.channel_name, e.transport, " + "e.project, e.file_path, e.function_name, " + "l.project, l.file_path, l.function_name " + "FROM cross_channels e " + "JOIN cross_channels l ON e.channel_name = l.channel_name " + "WHERE e.direction = 'emit' AND l.direction = 'listen' " + "AND e.project != l.project " + "%s " + "ORDER BY e.channel_name LIMIT 200"; + + char full_sql[2048]; + if (channel_filter && channel_filter[0]) { + char filter_clause[256]; + snprintf(filter_clause, sizeof(filter_clause), + "AND e.channel_name LIKE '%%%s%%'", channel_filter); + snprintf(full_sql, sizeof(full_sql), sql, filter_clause); + } else { + snprintf(full_sql, sizeof(full_sql), sql, ""); + } + + sqlite3_stmt *stmt = NULL; + if (sqlite3_prepare_v2(cr->db, full_sql, -1, &stmt, NULL) != SQLITE_OK) { + return CBM_STORE_ERR; + } + + int cap = 200; + cbm_cross_channel_match_t *matches = calloc((size_t)cap, sizeof(cbm_cross_channel_match_t)); + int n = 0; + + while (sqlite3_step(stmt) == SQLITE_ROW && n < cap) { + cbm_cross_channel_match_t *m = &matches[n]; + m->channel_name = heap_dup((const char *)sqlite3_column_text(stmt, 0)); + m->transport = heap_dup((const char *)sqlite3_column_text(stmt, 1)); + m->emit_project = heap_dup((const char *)sqlite3_column_text(stmt, 2)); + m->emit_file = heap_dup((const char *)sqlite3_column_text(stmt, 3)); + m->emit_function = heap_dup((const char *)sqlite3_column_text(stmt, 4)); + m->listen_project = heap_dup((const char *)sqlite3_column_text(stmt, 5)); + m->listen_file = heap_dup((const char *)sqlite3_column_text(stmt, 6)); + m->listen_function = heap_dup((const char *)sqlite3_column_text(stmt, 7)); + n++; + } + 
sqlite3_finalize(stmt); + + *out = matches; + *count = n; + return CBM_STORE_OK; +} + +void cbm_cross_channel_free(cbm_cross_channel_match_t *matches, int count) { + if (!matches) return; + for (int i = 0; i < count; i++) { + free((void *)matches[i].channel_name); + free((void *)matches[i].transport); + free((void *)matches[i].emit_project); + free((void *)matches[i].emit_file); + free((void *)matches[i].emit_function); + free((void *)matches[i].listen_project); + free((void *)matches[i].listen_file); + free((void *)matches[i].listen_function); + } + free(matches); +} + +/* ── Cross-Repo Stats ───────────────────────────────────────────── */ + +int cbm_cross_repo_get_info(cbm_cross_repo_t *cr, cbm_cross_repo_info_t *out) { + if (!cr || !cr->db || !out) return CBM_STORE_ERR; + memset(out, 0, sizeof(*out)); + + sqlite3_stmt *s = NULL; + sqlite3_prepare_v2(cr->db, "SELECT COUNT(DISTINCT project) FROM cross_nodes", -1, &s, NULL); + if (s && sqlite3_step(s) == SQLITE_ROW) out->total_repos = sqlite3_column_int(s, 0); + if (s) sqlite3_finalize(s); + + sqlite3_prepare_v2(cr->db, "SELECT COUNT(*) FROM cross_nodes", -1, &s, NULL); + if (s && sqlite3_step(s) == SQLITE_ROW) out->total_nodes = sqlite3_column_int(s, 0); + if (s) sqlite3_finalize(s); + + sqlite3_prepare_v2(cr->db, "SELECT COUNT(*) FROM cross_channels", -1, &s, NULL); + if (s && sqlite3_step(s) == SQLITE_ROW) out->total_channels = sqlite3_column_int(s, 0); + if (s) sqlite3_finalize(s); + + sqlite3_prepare_v2(cr->db, "SELECT COUNT(*) FROM cross_embeddings", -1, &s, NULL); + if (s && sqlite3_step(s) == SQLITE_ROW) out->total_embeddings = sqlite3_column_int(s, 0); + if (s) sqlite3_finalize(s); + + /* Cross-repo channel count */ + sqlite3_prepare_v2(cr->db, + "SELECT COUNT(DISTINCT e.channel_name) FROM cross_channels e " + "JOIN cross_channels l ON e.channel_name = l.channel_name " + "WHERE e.direction = 'emit' AND l.direction = 'listen' " + "AND e.project != l.project", -1, &s, NULL); + if (s && sqlite3_step(s) == 
SQLITE_ROW) out->cross_repo_channel_count = sqlite3_column_int(s, 0);
    if (s) sqlite3_finalize(s);

    sqlite3_prepare_v2(cr->db,
        "SELECT value FROM cross_meta WHERE key = 'built_at'", -1, &s, NULL);
    if (s && sqlite3_step(s) == SQLITE_ROW)
        out->built_at = heap_dup((const char *)sqlite3_column_text(s, 0));
    if (s) sqlite3_finalize(s);

    return CBM_STORE_OK;
}

/* Release the strings owned by a cbm_cross_repo_info_t. NULL-safe. */
void cbm_cross_repo_info_free(cbm_cross_repo_info_t *info) {
    if (!info) return;
    free((void *)info->built_at);
    info->built_at = NULL;
}

/* ── Cross-Repo Trace Helper ────────────────────────────────────── */

/* Trace callers (direction="inbound") or callees ("outbound") of
 * function_name inside one project DB: open it read-only, resolve the
 * start node (with Class→first-method and "(file-level)" listener
 * fallbacks), BFS over CALLS edges, convert hops to steps, close the DB.
 * Returns CBM_STORE_OK with *out_count == 0 when the start node cannot
 * be resolved (not an error). Caller frees with cbm_cross_trace_free(). */
int cbm_cross_repo_trace_in_project(
    const char *project_db_path,
    const char *function_name,
    const char *file_path_hint,
    const char *channel_name,
    const char *direction,
    int max_depth,
    cbm_cross_trace_step_t **out, int *out_count) {

    if (!project_db_path || !function_name || !direction || !out || !out_count) {
        return CBM_STORE_ERR;
    }
    *out = NULL;
    *out_count = 0;
    if (max_depth <= 0) max_depth = 2;

    /* Open project DB read-only */
    cbm_store_t *store = cbm_store_open_path_query(project_db_path);
    if (!store) return CBM_STORE_ERR;

    struct sqlite3 *db = cbm_store_get_db(store);
    if (!db) { cbm_store_close(store); return CBM_STORE_ERR; }

    int64_t start_id = 0;

    /* Resolve start node — handle special cases */
    if (strcmp(function_name, "(file-level)") == 0 && file_path_hint) {
        /* File-level listener: find the actual handler function via channels table */
        if (channel_name) {
            sqlite3_stmt *s = NULL;
            sqlite3_prepare_v2(db,
                "SELECT DISTINCT c.node_id FROM channels c "
                "WHERE c.file_path = ?1 AND c.channel_name = ?2 AND c.node_id > 0 "
                "LIMIT 1", -1, &s, NULL);
            if (s) {
                /* SQLITE_STATIC is safe: both strings outlive the statement,
                 * which is finalized before this scope ends. */
                sqlite3_bind_text(s, 1, file_path_hint, -1, SQLITE_STATIC);
                sqlite3_bind_text(s, 2, channel_name, -1, SQLITE_STATIC);
                if (sqlite3_step(s) == SQLITE_ROW) {
                    start_id = sqlite3_column_int64(s, 0);
                }
                sqlite3_finalize(s);
            }
        }
        /* Fallback: first Function/Method in the file */
        if (start_id == 0) {
            sqlite3_stmt *s = NULL;
            sqlite3_prepare_v2(db,
                "SELECT id FROM nodes WHERE file_path = ?1 "
                "AND label IN ('Function','Method') ORDER BY start_line LIMIT 1",
                -1, &s, NULL);
            if (s) {
                sqlite3_bind_text(s, 1, file_path_hint, -1, SQLITE_STATIC);
                if (sqlite3_step(s) == SQLITE_ROW) {
                    start_id = sqlite3_column_int64(s, 0);
                }
                sqlite3_finalize(s);
            }
        }
    } else {
        /* Normal case: find by name, optionally filtered by file_path */
        const char *sql = file_path_hint
            ? "SELECT id, label FROM nodes WHERE name = ?1 AND file_path = ?2 "
              "AND label IN ('Function','Method','Class') LIMIT 1"
            : "SELECT id, label FROM nodes WHERE name = ?1 "
              "AND label IN ('Function','Method','Class') LIMIT 1";
        sqlite3_stmt *s = NULL;
        sqlite3_prepare_v2(db, sql, -1, &s, NULL);
        if (s) {
            sqlite3_bind_text(s, 1, function_name, -1, SQLITE_STATIC);
            if (file_path_hint)
                sqlite3_bind_text(s, 2, file_path_hint, -1, SQLITE_STATIC);
            if (sqlite3_step(s) == SQLITE_ROW) {
                start_id = sqlite3_column_int64(s, 0);
                const char *label = (const char *)sqlite3_column_text(s, 1);
                /* If it's a Class, resolve through DEFINES_METHOD → use first method */
                if (label && strcmp(label, "Class") == 0) {
                    int64_t class_id = start_id;
                    sqlite3_stmt *m = NULL;
                    sqlite3_prepare_v2(db,
                        "SELECT target_id FROM edges WHERE source_id = ?1 "
                        "AND type = 'DEFINES_METHOD' LIMIT 1", -1, &m, NULL);
                    if (m) {
                        sqlite3_bind_int64(m, 1, class_id);
                        if (sqlite3_step(m) == SQLITE_ROW) {
                            start_id = sqlite3_column_int64(m, 0);
                        }
                        sqlite3_finalize(m);
                    }
                }
            }
            sqlite3_finalize(s);
        }
    }

    if (start_id == 0) {
        cbm_store_close(store);
        return CBM_STORE_OK; /* no results, not an error */
    }

    /* Run BFS.
     * NOTE(review): the literal 20 is presumably a fan-out / per-level cap
     * for cbm_store_bfs — confirm against store.h and give it a name. */
    const char *edge_types[] = {"CALLS"};
    cbm_traverse_result_t trav = {0};
    cbm_store_bfs(store, start_id, direction, edge_types, 1,
                  max_depth, 20, &trav);

    /* Convert to output format.
     * NOTE(review): the calloc result is not checked; on OOM the loop
     * below would dereference NULL — worth a guard. */
    int cap = trav.visited_count;
    if (cap > 0) {
        cbm_cross_trace_step_t *steps = calloc((size_t)cap, sizeof(cbm_cross_trace_step_t));
        int count = 0;
        for (int i = 0; i < trav.visited_count && count < cap; i++) {
            cbm_node_hop_t *h = &trav.visited[i];
            if (h->node.id == start_id) continue; /* skip the start node itself */
            steps[count].name = heap_dup(h->node.name);
            steps[count].label = heap_dup(h->node.label);
            steps[count].file_path = heap_dup(h->node.file_path);
            steps[count].depth = h->hop;
            count++;
        }
        *out = steps;
        *out_count = count;
    }

    cbm_store_traverse_free(&trav);
    cbm_store_close(store);
    return CBM_STORE_OK;
}

/* Free a trace returned by cbm_cross_repo_trace_in_project(). NULL-safe. */
void cbm_cross_trace_free(cbm_cross_trace_step_t *steps, int count) {
    if (!steps) return;
    for (int i = 0; i < count; i++) {
        free((void *)steps[i].name);
        free((void *)steps[i].label);
        free((void *)steps[i].file_path);
    }
    free(steps);
}
diff --git a/src/store/cross_repo.h b/src/store/cross_repo.h
new file mode 100644
index 0000000..421fdeb
--- /dev/null
+++ b/src/store/cross_repo.h
@@ -0,0 +1,137 @@
/*
 * cross_repo.h — Cross-repository discovery, search, and flow tracing.
 *
 * Builds a unified _cross_repo.db by scanning all per-project databases.
 * Enables: cross-repo channel matching, cross-repo BM25+vector search,
 * cross-repo flow tracing, and cross-repo impact analysis.
 *
 * The cross-repo DB is read-only (built by cbm_cross_repo_build) and
 * does NOT use ATTACH — it copies data into a separate SQLite file,
 * preserving per-project security isolation.
+ */ +#ifndef CBM_CROSS_REPO_H +#define CBM_CROSS_REPO_H + +#include "store/store.h" +#include + +/* ── Build ──────────────────────────────────────────────────────── */ + +typedef struct { + int repos_scanned; + int channels_copied; + int nodes_copied; + int embeddings_copied; + int cross_repo_matches; /* channels with emit in A + listen in B */ + double build_time_ms; +} cbm_cross_repo_stats_t; + +/* Build (or rebuild) the cross-repo index by scanning all project DBs. + * Writes to ~/.cache/codebase-memory-mcp/_cross_repo.db. + * Returns stats on success, or sets stats.repos_scanned=-1 on error. */ +cbm_cross_repo_stats_t cbm_cross_repo_build(void); + +/* ── Query ──────────────────────────────────────────────────────── */ + +/* Opaque handle for the cross-repo DB (separate from per-project stores). */ +typedef struct cbm_cross_repo cbm_cross_repo_t; + +/* Open the cross-repo DB for querying. Returns NULL if not built yet. */ +cbm_cross_repo_t *cbm_cross_repo_open(void); + +/* Close and free. NULL-safe. */ +void cbm_cross_repo_close(cbm_cross_repo_t *cr); + +/* ── Cross-Repo Search ──────────────────────────────────────────── */ + +typedef struct { + const char *project; /* short project name */ + int64_t orig_id; /* node ID in the project's own DB */ + const char *label; + const char *name; + const char *qualified_name; + const char *file_path; + double score; /* BM25 or RRF score */ + double similarity; /* cosine similarity (0 if BM25-only) */ +} cbm_cross_search_result_t; + +typedef struct { + cbm_cross_search_result_t *results; + int count; + int total; + bool used_vector; /* true if hybrid BM25+vector was used */ +} cbm_cross_search_output_t; + +/* Search across all repos. Uses BM25 FTS5 + optional vector search + RRF merge. + * query_vec may be NULL (BM25-only). Caller frees output with _free(). 
*/ +int cbm_cross_repo_search(cbm_cross_repo_t *cr, const char *query, + const float *query_vec, int dims, + int limit, cbm_cross_search_output_t *out); + +void cbm_cross_search_free(cbm_cross_search_output_t *out); + +/* ── Cross-Repo Channel Matching ────────────────────────────────── */ + +typedef struct { + const char *channel_name; + const char *transport; + /* Emitter side */ + const char *emit_project; + const char *emit_file; + const char *emit_function; + /* Listener side */ + const char *listen_project; + const char *listen_file; + const char *listen_function; +} cbm_cross_channel_match_t; + +/* Find cross-repo channel matches: channels where emit is in one repo + * and listen is in another. Optional channel_name filter (partial match). + * Returns allocated array. Caller frees with _free(). */ +int cbm_cross_repo_match_channels(cbm_cross_repo_t *cr, const char *channel_filter, + cbm_cross_channel_match_t **out, int *count); + +void cbm_cross_channel_free(cbm_cross_channel_match_t *matches, int count); + +/* ── Cross-Repo Stats ───────────────────────────────────────────── */ + +typedef struct { + int total_repos; + int total_nodes; + int total_channels; + int total_embeddings; + int cross_repo_channel_count; + const char *built_at; /* ISO timestamp */ +} cbm_cross_repo_info_t; + +/* Get stats about the cross-repo index. */ +int cbm_cross_repo_get_info(cbm_cross_repo_t *cr, cbm_cross_repo_info_t *out); + +void cbm_cross_repo_info_free(cbm_cross_repo_info_t *info); + +/* ── Cross-Repo Trace Helper ────────────────────────────────────── */ + +typedef struct { + const char *name; + const char *label; + const char *file_path; + int depth; +} cbm_cross_trace_step_t; + +/* Trace callers (inbound) or callees (outbound) from a function in a project DB. + * Opens the project DB read-only, resolves the function, runs BFS, closes DB. + * Handles Class→Method resolution and (file-level) listener fallback. 
+ * channel_name is optional — used for file-level listener resolution. + * Returns allocated array. Caller frees with cbm_cross_trace_free(). */ +int cbm_cross_repo_trace_in_project( + const char *project_db_path, + const char *function_name, + const char *file_path_hint, + const char *channel_name, /* optional: for resolving (file-level) listeners */ + const char *direction, /* "inbound" or "outbound" */ + int max_depth, + cbm_cross_trace_step_t **out, int *out_count); + +void cbm_cross_trace_free(cbm_cross_trace_step_t *steps, int count); + +#endif /* CBM_CROSS_REPO_H */ diff --git a/src/store/store.c b/src/store/store.c index 4920732..36ab88a 100644 --- a/src/store/store.c +++ b/src/store/store.c @@ -9,6 +9,7 @@ // for ISO timestamp #include +#include #include "foundation/constants.h" enum { @@ -246,9 +247,35 @@ static int init_schema(cbm_store_t *s) { " source_hash TEXT NOT NULL," " created_at TEXT NOT NULL," " updated_at TEXT NOT NULL" - ");"; + ");" + "CREATE TABLE IF NOT EXISTS embeddings (" + " node_id INTEGER PRIMARY KEY," + " project TEXT NOT NULL," + " embedding BLOB NOT NULL," + " dimensions INTEGER NOT NULL DEFAULT 0" + ");" + "CREATE INDEX IF NOT EXISTS idx_embeddings_project " + "ON embeddings(project);"; + + int rc = exec_sql(s, ddl); + if (rc != CBM_STORE_OK) return rc; + + /* FTS5 contentless index for BM25 search with camelCase splitting */ + { + char *fts_err = NULL; + int fts_rc = sqlite3_exec(s->db, + "CREATE VIRTUAL TABLE IF NOT EXISTS nodes_fts USING fts5(" + "name, qualified_name, label, file_path," + "content='', content_rowid='id'," + "tokenize='unicode61 remove_diacritics 2'" + ");", + NULL, NULL, &fts_err); + if (fts_rc != SQLITE_OK) { + sqlite3_free(fts_err); + } + } - return exec_sql(s, ddl); + return CBM_STORE_OK; } static int create_user_indexes(cbm_store_t *s) { @@ -297,6 +324,56 @@ static int configure_pragmas(cbm_store_t *s, bool in_memory) { /* ── REGEXP function for SQLite ──────────────────────────────────── */ +/* CamelCase 
token splitter for FTS5. + * "updateCloudClient" → "updateCloudClient update Cloud Client" */ +static void sqlite_camel_split(sqlite3_context *ctx, int argc, sqlite3_value **argv) { + (void)argc; + const char *input = (const char *)sqlite3_value_text(argv[0]); + if (!input || !input[0]) { + sqlite3_result_text(ctx, input ? input : "", -1, SQLITE_TRANSIENT); + return; + } + char buf[2048]; + int len = snprintf(buf, sizeof(buf), "%s ", input); + for (int i = 0; input[i] && len < (int)sizeof(buf) - 2; i++) { + if (i > 0) { + bool split = false; + if (input[i] >= 'A' && input[i] <= 'Z' && + input[i - 1] >= 'a' && input[i - 1] <= 'z') split = true; + if (input[i] >= 'A' && input[i] <= 'Z' && + input[i - 1] >= 'A' && input[i - 1] <= 'Z' && + input[i + 1] >= 'a' && input[i + 1] <= 'z') split = true; + if (split) buf[len++] = ' '; + } + buf[len++] = input[i]; + } + buf[len] = '\0'; + sqlite3_result_text(ctx, buf, len, SQLITE_TRANSIENT); +} + +/* Cosine similarity for vector search. */ +static void sqlite_cosine_sim(sqlite3_context *ctx, int argc, sqlite3_value **argv) { + (void)argc; + if (sqlite3_value_type(argv[0]) != SQLITE_BLOB || + sqlite3_value_type(argv[1]) != SQLITE_BLOB) { + sqlite3_result_null(ctx); return; + } + const float *a = (const float *)sqlite3_value_blob(argv[0]); + const float *b = (const float *)sqlite3_value_blob(argv[1]); + int a_bytes = sqlite3_value_bytes(argv[0]); + int b_bytes = sqlite3_value_bytes(argv[1]); + if (a_bytes != b_bytes || a_bytes == 0 || (a_bytes % (int)sizeof(float)) != 0) { + sqlite3_result_null(ctx); return; + } + int dims = a_bytes / (int)sizeof(float); + float dot = 0.0f, na = 0.0f, nb = 0.0f; + for (int i = 0; i < dims; i++) { + dot += a[i] * b[i]; na += a[i] * a[i]; nb += b[i] * b[i]; + } + if (na == 0.0f || nb == 0.0f) { sqlite3_result_double(ctx, 0.0); return; } + sqlite3_result_double(ctx, (double)dot / (sqrt((double)na) * sqrt((double)nb))); +} + static void sqlite_regexp(sqlite3_context *ctx, int argc, sqlite3_value 
**argv) { (void)argc; const char *pattern = (const char *)sqlite3_value_text(argv[0]); @@ -388,9 +465,12 @@ static cbm_store_t *store_open_internal(const char *path, bool in_memory) { /* Register REGEXP function (SQLite doesn't have one built-in) */ sqlite3_create_function(s->db, "regexp", ST_COL_2, SQLITE_UTF8 | SQLITE_DETERMINISTIC, NULL, sqlite_regexp, NULL, NULL); - /* Case-insensitive variant for search with case_sensitive=false */ sqlite3_create_function(s->db, "iregexp", ST_COL_2, SQLITE_UTF8 | SQLITE_DETERMINISTIC, NULL, sqlite_iregexp, NULL, NULL); + sqlite3_create_function(s->db, "cbm_camel_split", 1, SQLITE_UTF8 | SQLITE_DETERMINISTIC, + NULL, sqlite_camel_split, NULL, NULL); + sqlite3_create_function(s->db, "cbm_cosine_sim", 2, SQLITE_UTF8 | SQLITE_DETERMINISTIC, + NULL, sqlite_cosine_sim, NULL, NULL); if (configure_pragmas(s, in_memory) != CBM_STORE_OK || init_schema(s) != CBM_STORE_OK || create_user_indexes(s) != CBM_STORE_OK) { @@ -443,6 +523,10 @@ cbm_store_t *cbm_store_open_path_query(const char *db_path) { sqlite_regexp, NULL, NULL); sqlite3_create_function(s->db, "iregexp", ST_COL_2, SQLITE_UTF8 | SQLITE_DETERMINISTIC, NULL, sqlite_iregexp, NULL, NULL); + sqlite3_create_function(s->db, "cbm_camel_split", 1, SQLITE_UTF8 | SQLITE_DETERMINISTIC, + NULL, sqlite_camel_split, NULL, NULL); + sqlite3_create_function(s->db, "cbm_cosine_sim", 2, SQLITE_UTF8 | SQLITE_DETERMINISTIC, + NULL, sqlite_cosine_sim, NULL, NULL); if (configure_pragmas(s, false) != CBM_STORE_OK) { sqlite3_close(s->db); @@ -4525,3 +4609,158 @@ void cbm_store_free_file_hashes(cbm_file_hash_t *hashes, int count) { } free(hashes); } + +/* ── cbm_store_exec (utility) ─────────────────────────────────── */ +int cbm_store_exec(cbm_store_t *s, const char *sql) { + return exec_sql(s, sql); +} + +/* ── Embeddings (vector search) ─────────────────────────────────── */ + +int cbm_store_upsert_embedding(cbm_store_t *s, int64_t node_id, const char *project, + const float *embedding, int dims) { + 
if (!s || !s->db || !embedding || dims <= 0) return CBM_STORE_ERR; + + const char *sql = + "INSERT OR REPLACE INTO embeddings(node_id, project, embedding, dimensions) " + "VALUES(?1, ?2, ?3, ?4)"; + sqlite3_stmt *stmt = NULL; + if (sqlite3_prepare_v2(s->db, sql, -1, &stmt, NULL) != SQLITE_OK) { + return CBM_STORE_ERR; + } + sqlite3_bind_int64(stmt, 1, node_id); + bind_text(stmt, 2, project); + sqlite3_bind_blob(stmt, 3, embedding, dims * (int)sizeof(float), SQLITE_STATIC); + sqlite3_bind_int(stmt, 4, dims); + int rc = (sqlite3_step(stmt) == SQLITE_DONE) ? CBM_STORE_OK : CBM_STORE_ERR; + sqlite3_finalize(stmt); + return rc; +} + +int cbm_store_upsert_embedding_batch(cbm_store_t *s, const int64_t *node_ids, + const char *project, const float *embeddings, + int dims, int count) { + if (!s || !s->db || !embeddings || dims <= 0 || count <= 0) return CBM_STORE_ERR; + + const char *sql = + "INSERT OR REPLACE INTO embeddings(node_id, project, embedding, dimensions) " + "VALUES(?1, ?2, ?3, ?4)"; + sqlite3_stmt *stmt = NULL; + if (sqlite3_prepare_v2(s->db, sql, -1, &stmt, NULL) != SQLITE_OK) { + return CBM_STORE_ERR; + } + + int blob_size = dims * (int)sizeof(float); + for (int i = 0; i < count; i++) { + sqlite3_reset(stmt); + sqlite3_bind_int64(stmt, 1, node_ids[i]); + bind_text(stmt, 2, project); + sqlite3_bind_blob(stmt, 3, &embeddings[i * dims], blob_size, SQLITE_STATIC); + sqlite3_bind_int(stmt, 4, dims); + if (sqlite3_step(stmt) != SQLITE_DONE) { + sqlite3_finalize(stmt); + return CBM_STORE_ERR; + } + } + sqlite3_finalize(stmt); + return CBM_STORE_OK; +} + +int cbm_store_count_embeddings(cbm_store_t *s, const char *project) { + if (!s || !s->db) return 0; + const char *sql = project + ? 
"SELECT COUNT(*) FROM embeddings WHERE project = ?1" + : "SELECT COUNT(*) FROM embeddings"; + sqlite3_stmt *stmt = NULL; + if (sqlite3_prepare_v2(s->db, sql, -1, &stmt, NULL) != SQLITE_OK) return 0; + if (project) bind_text(stmt, 1, project); + int count = 0; + if (sqlite3_step(stmt) == SQLITE_ROW) { + count = sqlite3_column_int(stmt, 0); + } + sqlite3_finalize(stmt); + return count; +} + +int cbm_store_delete_embeddings(cbm_store_t *s, const char *project) { + if (!s || !s->db || !project) return CBM_STORE_ERR; + char sql[256]; + snprintf(sql, sizeof(sql), "DELETE FROM embeddings WHERE project = '%s'", project); + return exec_sql(s, sql); +} + +/* Semantic search: find top-k nodes by cosine similarity to query vector. + * Returns node IDs and similarity scores, ordered by similarity descending. + * Only searches nodes with embeddings in the given project. + * Filters to embeddable labels (Function, Method, Class, Interface, Route). */ +int cbm_store_vector_search(cbm_store_t *s, const char *project, + const float *query_vec, int dims, int limit, + cbm_vector_result_t **out, int *out_count) { + if (!s || !s->db || !query_vec || dims <= 0 || !out || !out_count) { + return CBM_STORE_ERR; + } + *out = NULL; + *out_count = 0; + + /* Brute-force cosine similarity scan using registered cbm_cosine_sim() */ + const char *sql = + "SELECT e.node_id, n.name, n.label, n.qualified_name, n.file_path, " + "n.start_line, n.end_line, n.properties, " + "cbm_cosine_sim(?1, e.embedding) AS similarity " + "FROM embeddings e " + "JOIN nodes n ON n.id = e.node_id " + "WHERE e.project = ?2 " + "AND n.label IN ('Function','Method','Class','Interface','Route') " + "AND similarity > 0.3 " + "ORDER BY similarity DESC " + "LIMIT ?3"; + + sqlite3_stmt *stmt = NULL; + if (sqlite3_prepare_v2(s->db, sql, -1, &stmt, NULL) != SQLITE_OK) { + return CBM_STORE_ERR; + } + + int blob_size = dims * (int)sizeof(float); + sqlite3_bind_blob(stmt, 1, query_vec, blob_size, SQLITE_STATIC); + bind_text(stmt, 2, 
project); + sqlite3_bind_int(stmt, 3, limit > 0 ? limit : 50); + + int cap = limit > 0 ? limit : 50; + cbm_vector_result_t *results = calloc((size_t)cap, sizeof(cbm_vector_result_t)); + if (!results) { + sqlite3_finalize(stmt); + return CBM_STORE_ERR; + } + + int count = 0; + while (sqlite3_step(stmt) == SQLITE_ROW && count < cap) { + cbm_vector_result_t *r = &results[count]; + r->node_id = sqlite3_column_int64(stmt, 0); + r->name = heap_strdup((const char *)sqlite3_column_text(stmt, 1)); + r->label = heap_strdup((const char *)sqlite3_column_text(stmt, 2)); + r->qualified_name = heap_strdup((const char *)sqlite3_column_text(stmt, 3)); + r->file_path = heap_strdup((const char *)sqlite3_column_text(stmt, 4)); + r->start_line = sqlite3_column_int(stmt, 5); + r->end_line = sqlite3_column_int(stmt, 6); + r->properties_json = heap_strdup((const char *)sqlite3_column_text(stmt, 7)); + r->similarity = sqlite3_column_double(stmt, 8); + count++; + } + sqlite3_finalize(stmt); + + *out = results; + *out_count = count; + return CBM_STORE_OK; +} + +void cbm_store_free_vector_results(cbm_vector_result_t *results, int count) { + if (!results) return; + for (int i = 0; i < count; i++) { + free((void *)results[i].name); + free((void *)results[i].label); + free((void *)results[i].qualified_name); + free((void *)results[i].file_path); + free((void *)results[i].properties_json); + } + free(results); +} diff --git a/src/store/store.h b/src/store/store.h index 1715f42..283c224 100644 --- a/src/store/store.h +++ b/src/store/store.h @@ -608,4 +608,33 @@ void cbm_store_free_projects(cbm_project_t *projects, int count); /* Free an array of file hashes. */ void cbm_store_free_file_hashes(cbm_file_hash_t *hashes, int count); +/* Execute raw SQL. 
*/ +int cbm_store_exec(cbm_store_t *s, const char *sql); + +/* ── Embeddings (semantic vector search) ─────────────────────────── */ + +typedef struct { + int64_t node_id; + const char *name; + const char *label; + const char *qualified_name; + const char *file_path; + int start_line; + int end_line; + const char *properties_json; + double similarity; +} cbm_vector_result_t; + +int cbm_store_upsert_embedding(cbm_store_t *s, int64_t node_id, const char *project, + const float *embedding, int dims); +int cbm_store_upsert_embedding_batch(cbm_store_t *s, const int64_t *node_ids, + const char *project, const float *embeddings, + int dims, int count); +int cbm_store_count_embeddings(cbm_store_t *s, const char *project); +int cbm_store_delete_embeddings(cbm_store_t *s, const char *project); +int cbm_store_vector_search(cbm_store_t *s, const char *project, + const float *query_vec, int dims, int limit, + cbm_vector_result_t **out, int *out_count); +void cbm_store_free_vector_results(cbm_vector_result_t *results, int count); + #endif /* CBM_STORE_H */ From 21c4537e4ba3ef4f38b3402b561c7524f1165862 Mon Sep 17 00:00:00 2001 From: Your Name Date: Sat, 4 Apr 2026 22:37:25 -0400 Subject: [PATCH 2/4] =?UTF-8?q?feat:=20MCP=20layer=20=E2=80=94=20BM25=20se?= =?UTF-8?q?arch,=20embeddings=20tool,=20cross-repo=20tools=20+=20enable=20?= =?UTF-8?q?FTS5?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Completes the rebase by adding the MCP handler layer: 1. Enable FTS5 in SQLite compile flags (-DSQLITE_ENABLE_FTS5). Without this, CREATE VIRTUAL TABLE USING fts5(...) silently creates a stub that fails on any query with 'no such module: fts5'. 2. Expose 'query' and 'sort_by' params in search_graph inputSchema. AI agents can now send natural language queries for BM25 ranked search instead of regex patterns only. 3. BM25 search path in handle_search_graph. 
When 'query' is provided, uses FTS5 MATCH with label-type structural boosting (Function/Method +10, Route +8, Class +5). Falls back to regex path when FTS5 is unavailable. 4. FTS5 backfill with contentless delete-all syntax. Contentless FTS5 tables (content='') require INSERT INTO table(table) VALUES('delete-all') instead of DELETE FROM. Falls back to plain names if cbm_camel_split is unavailable. 5. generate_embeddings MCP tool — manual trigger for embedding generation. 6. build_cross_repo_index MCP tool — builds unified _cross_repo.db. 7. trace_cross_repo MCP tool — cross-repo channel flow tracing. 8. Tool dispatch entries for all 3 new tools. Tested: 'audio stream' on 713-node repo returns 28 ranked results (useMicStream, startStream, stopStream) instead of 713 unranked. --- .github/workflows/_build.yml | 187 ------ .github/workflows/_lint.yml | 102 --- .github/workflows/_smoke.yml | 193 ------ .github/workflows/_soak.yml | 186 ------ .github/workflows/_test.yml | 67 -- .github/workflows/codeql.yml | 6 +- .github/workflows/dry-run.yml | 711 +++++++++++++++++++-- .github/workflows/nightly-soak.yml | 109 +++- .github/workflows/release.yml | 928 ++++++++++++++++++++++++++-- .github/workflows/scorecard.yml | 4 +- Makefile.cbm | 4 +- src/mcp/mcp.c | 289 ++++++++- src/pipeline/pipeline.c | 16 +- src/pipeline/pipeline_incremental.c | 13 +- 14 files changed, 1964 insertions(+), 851 deletions(-) delete mode 100644 .github/workflows/_build.yml delete mode 100644 .github/workflows/_lint.yml delete mode 100644 .github/workflows/_smoke.yml delete mode 100644 .github/workflows/_soak.yml delete mode 100644 .github/workflows/_test.yml diff --git a/.github/workflows/_build.yml b/.github/workflows/_build.yml deleted file mode 100644 index 8a3336a..0000000 --- a/.github/workflows/_build.yml +++ /dev/null @@ -1,187 +0,0 @@ -# Reusable: build binaries (standard + UI) on all platforms -name: Build - -on: - workflow_call: - inputs: - version: - description: 'Version string (e.g. 
v0.8.0)' - type: string - default: '' - -permissions: - contents: read - -jobs: - build-unix: - strategy: - fail-fast: false - matrix: - include: - - os: ubuntu-latest - goos: linux - goarch: amd64 - cc: gcc - cxx: g++ - - os: ubuntu-24.04-arm - goos: linux - goarch: arm64 - cc: gcc - cxx: g++ - - os: macos-14 - goos: darwin - goarch: arm64 - cc: cc - cxx: c++ - - os: macos-15-intel - goos: darwin - goarch: amd64 - cc: cc - cxx: c++ - runs-on: ${{ matrix.os }} - timeout-minutes: 15 - steps: - - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 - - - name: Install deps (Ubuntu) - if: startsWith(matrix.os, 'ubuntu') - run: sudo apt-get update && sudo apt-get install -y zlib1g-dev - - - uses: actions/setup-node@53b83947a5a98c8d113130e565377fae1a50d02f # v6.3.0 - with: - node-version: "22" - - - name: Build standard binary - run: scripts/build.sh ${{ inputs.version && format('--version {0}', inputs.version) || '' }} CC=${{ matrix.cc }} CXX=${{ matrix.cxx }} - - - name: Ad-hoc sign macOS binary - if: startsWith(matrix.os, 'macos') - run: codesign --sign - --force build/c/codebase-memory-mcp - - - name: Archive standard binary - run: | - cp LICENSE install.sh build/c/ - tar -czf codebase-memory-mcp-${{ matrix.goos }}-${{ matrix.goarch }}.tar.gz \ - -C build/c codebase-memory-mcp LICENSE install.sh - - - name: Build UI binary - run: scripts/build.sh --with-ui ${{ inputs.version && format('--version {0}', inputs.version) || '' }} CC=${{ matrix.cc }} CXX=${{ matrix.cxx }} - - - name: Ad-hoc sign macOS UI binary - if: startsWith(matrix.os, 'macos') - run: codesign --sign - --force build/c/codebase-memory-mcp - - - name: Frontend integrity scan - if: matrix.goos == 'linux' && matrix.goarch == 'amd64' - run: scripts/security-ui.sh - - - name: Archive UI binary - run: | - cp LICENSE install.sh build/c/ - tar -czf codebase-memory-mcp-ui-${{ matrix.goos }}-${{ matrix.goarch }}.tar.gz \ - -C build/c codebase-memory-mcp LICENSE install.sh - - - uses: 
actions/upload-artifact@bbbca2ddaa5d8feaa63e36b76fdaad77386f024f # v7.0.0 - with: - name: binaries-${{ matrix.goos }}-${{ matrix.goarch }} - path: "*.tar.gz" - - build-windows: - runs-on: windows-latest - timeout-minutes: 15 - steps: - - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 - - - uses: msys2/setup-msys2@4f806de0a5a7294ffabaff804b38a9b435a73bda # v2 - with: - msystem: CLANG64 - path-type: inherit - install: >- - mingw-w64-clang-x86_64-clang - mingw-w64-clang-x86_64-zlib - make - zip - - - uses: actions/setup-node@53b83947a5a98c8d113130e565377fae1a50d02f # v6.3.0 - with: - node-version: "22" - - - name: Build standard binary - shell: msys2 {0} - run: scripts/build.sh ${{ inputs.version && format('--version {0}', inputs.version) || '' }} CC=clang CXX=clang++ - - - name: Archive standard binary - shell: msys2 {0} - run: | - BIN=build/c/codebase-memory-mcp - [ -f "${BIN}.exe" ] && BIN="${BIN}.exe" - cp "$BIN" codebase-memory-mcp.exe - zip codebase-memory-mcp-windows-amd64.zip codebase-memory-mcp.exe LICENSE install.ps1 - - - name: Build UI binary - shell: msys2 {0} - run: scripts/build.sh --with-ui ${{ inputs.version && format('--version {0}', inputs.version) || '' }} CC=clang CXX=clang++ - - - name: Archive UI binary - shell: msys2 {0} - run: | - BIN=build/c/codebase-memory-mcp - [ -f "${BIN}.exe" ] && BIN="${BIN}.exe" - cp "$BIN" codebase-memory-mcp.exe - zip codebase-memory-mcp-ui-windows-amd64.zip codebase-memory-mcp.exe LICENSE install.ps1 - - - uses: actions/upload-artifact@bbbca2ddaa5d8feaa63e36b76fdaad77386f024f # v7.0.0 - with: - name: binaries-windows-amd64 - path: "*.zip" - - build-linux-portable: - # Fully static Linux binaries (gcc -static on Ubuntu). - # Runs on any Linux distro without shared library dependencies. 
- strategy: - fail-fast: false - matrix: - include: - - arch: amd64 - runner: ubuntu-latest - - arch: arm64 - runner: ubuntu-24.04-arm - runs-on: ${{ matrix.runner }} - timeout-minutes: 15 - steps: - - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 - - - name: Install deps - run: sudo apt-get update && sudo apt-get install -y zlib1g-dev - - - uses: actions/setup-node@53b83947a5a98c8d113130e565377fae1a50d02f # v6.3.0 - with: - node-version: "22" - - - name: Build standard binary (static) - run: scripts/build.sh ${{ inputs.version && format('--version {0}', inputs.version) || '' }} CC=gcc CXX=g++ STATIC=1 - - - name: Verify static linking - run: | - file build/c/codebase-memory-mcp - ldd build/c/codebase-memory-mcp 2>&1 | grep -q "not a dynamic executable" || ldd build/c/codebase-memory-mcp 2>&1 | grep -q "statically linked" - - - name: Archive standard binary - run: | - cp LICENSE install.sh build/c/ - tar -czf codebase-memory-mcp-linux-${{ matrix.arch }}-portable.tar.gz \ - -C build/c codebase-memory-mcp LICENSE install.sh - - - name: Build UI binary (static) - run: scripts/build.sh --with-ui ${{ inputs.version && format('--version {0}', inputs.version) || '' }} CC=gcc CXX=g++ STATIC=1 - - - name: Archive UI binary - run: | - cp LICENSE install.sh build/c/ - tar -czf codebase-memory-mcp-ui-linux-${{ matrix.arch }}-portable.tar.gz \ - -C build/c codebase-memory-mcp LICENSE install.sh - - - uses: actions/upload-artifact@bbbca2ddaa5d8feaa63e36b76fdaad77386f024f # v7.0.0 - with: - name: binaries-linux-${{ matrix.arch }}-portable - path: "*.tar.gz" diff --git a/.github/workflows/_lint.yml b/.github/workflows/_lint.yml deleted file mode 100644 index edec9a8..0000000 --- a/.github/workflows/_lint.yml +++ /dev/null @@ -1,102 +0,0 @@ -# Reusable: lint + security-static + codeql-gate -name: Lint & Security - -on: - workflow_call: {} - -permissions: - contents: read - -jobs: - lint: - runs-on: ubuntu-latest - timeout-minutes: 15 - steps: - - uses: 
actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 - - - name: Install build deps - run: sudo apt-get update && sudo apt-get install -y zlib1g-dev cmake - - - name: Install LLVM 20 - run: | - wget -qO- https://apt.llvm.org/llvm-snapshot.gpg.key | sudo tee /etc/apt/trusted.gpg.d/apt.llvm.org.asc - echo "deb http://apt.llvm.org/noble/ llvm-toolchain-noble-20 main" | sudo tee /etc/apt/sources.list.d/llvm-20.list - sudo apt-get update - sudo apt-get install -y clang-format-20 - - - uses: actions/cache@668228422ae6a00e4ad889ee87cd7109ec5666a7 # v5.0.4 - id: cppcheck-cache - with: - path: /opt/cppcheck - key: cppcheck-2.20.0-ubuntu-amd64 - - - name: Build cppcheck 2.20.0 - if: steps.cppcheck-cache.outputs.cache-hit != 'true' - run: | - git clone --depth 1 --branch 2.20.0 https://github.com/danmar/cppcheck.git /tmp/cppcheck - cmake -S /tmp/cppcheck -B /tmp/cppcheck/build -DCMAKE_BUILD_TYPE=Release -DHAVE_RULES=OFF -DCMAKE_INSTALL_PREFIX=/opt/cppcheck - cmake --build /tmp/cppcheck/build -j$(nproc) - cmake --install /tmp/cppcheck/build - - - name: Add cppcheck to PATH - run: echo "/opt/cppcheck/bin" >> "$GITHUB_PATH" - - - name: Lint (cppcheck + clang-format, no clang-tidy — enforced locally) - run: scripts/lint.sh --ci CLANG_FORMAT=clang-format-20 - - security-static: - runs-on: ubuntu-latest - timeout-minutes: 5 - steps: - - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 - - name: "Layer 1: Static allow-list audit" - run: scripts/security-audit.sh - - name: "Layer 6: UI security audit" - run: scripts/security-ui.sh - - name: "Layer 8: Vendored dependency integrity" - run: scripts/security-vendored.sh - - codeql-gate: - runs-on: ubuntu-latest - timeout-minutes: 50 - steps: - - name: Wait for CodeQL on current commit (max 45 min) - env: - GH_TOKEN: ${{ secrets.GITHUB_TOKEN }} - run: | - CURRENT_SHA="${{ github.sha }}" - echo "Waiting for CodeQL to complete on $CURRENT_SHA..." 
- for attempt in $(seq 1 90); do - LATEST=$(gh api repos/${{ github.repository }}/actions/workflows/codeql.yml/runs?per_page=5 \ - --jq '.workflow_runs[] | select(.head_sha == "'"$CURRENT_SHA"'") | "\(.conclusion) \(.status)"' 2>/dev/null | head -1 || echo "") - if [ -z "$LATEST" ]; then - echo " $attempt/90: no run yet..."; sleep 30; continue - fi - CONCLUSION=$(echo "$LATEST" | cut -d' ' -f1) - STATUS=$(echo "$LATEST" | cut -d' ' -f2) - if [ "$STATUS" = "completed" ] && [ "$CONCLUSION" = "success" ]; then - echo "=== CodeQL passed ==="; exit 0 - elif [ "$STATUS" = "completed" ]; then - echo "BLOCKED: CodeQL $CONCLUSION"; exit 1 - fi - echo " $attempt/90: $STATUS..."; sleep 30 - done - echo "BLOCKED: CodeQL timeout"; exit 1 - - - name: Check for open code scanning alerts - env: - GH_TOKEN: ${{ secrets.GITHUB_TOKEN }} - run: | - echo "Waiting 60s for alert API to settle..." - sleep 60 - ALERTS=$(gh api 'repos/${{ github.repository }}/code-scanning/alerts?state=open' --jq 'length' 2>/dev/null || echo "0") - sleep 15 - ALERTS2=$(gh api 'repos/${{ github.repository }}/code-scanning/alerts?state=open' --jq 'length' 2>/dev/null || echo "0") - [ "$ALERTS" -lt "$ALERTS2" ] && ALERTS=$ALERTS2 - if [ "$ALERTS" -gt 0 ]; then - echo "BLOCKED: $ALERTS open alert(s)" - gh api 'repos/${{ github.repository }}/code-scanning/alerts?state=open' \ - --jq '.[] | " #\(.number) [\(.rule.security_severity_level // .rule.severity)] \(.rule.id) — \(.most_recent_instance.location.path):\(.most_recent_instance.location.start_line)"' 2>/dev/null || true - exit 1 - fi - echo "=== CodeQL gate passed (0 alerts) ===" diff --git a/.github/workflows/_smoke.yml b/.github/workflows/_smoke.yml deleted file mode 100644 index ac220bd..0000000 --- a/.github/workflows/_smoke.yml +++ /dev/null @@ -1,193 +0,0 @@ -# Reusable: smoke test every binary (standard + UI, all platforms) -name: Smoke - -on: - workflow_call: {} - -permissions: - contents: read - -jobs: - smoke-unix: - strategy: - fail-fast: false - 
matrix: - include: - - os: ubuntu-latest - goos: linux - goarch: amd64 - - os: ubuntu-24.04-arm - goos: linux - goarch: arm64 - - os: macos-14 - goos: darwin - goarch: arm64 - - os: macos-15-intel - goos: darwin - goarch: amd64 - variant: [standard, ui] - runs-on: ${{ matrix.os }} - timeout-minutes: 15 - steps: - - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 - - - uses: actions/download-artifact@d3f86a106a0bac45b974a628896c90dbdf5c8093 # v4 - with: - name: binaries-${{ matrix.goos }}-${{ matrix.goarch }} - - - name: Extract binary - run: | - SUFFIX=${{ matrix.variant == 'ui' && '-ui' || '' }} - tar -xzf codebase-memory-mcp${SUFFIX}-${{ matrix.goos }}-${{ matrix.goarch }}.tar.gz - chmod +x codebase-memory-mcp - - - name: Start artifact server - run: | - mkdir -p /tmp/smoke-server - cp codebase-memory-mcp /tmp/smoke-server/ - OS=${{ matrix.goos }}; ARCH=${{ matrix.goarch }} - SUFFIX=${{ matrix.variant == 'ui' && '-ui' || '' }} - tar -czf "/tmp/smoke-server/codebase-memory-mcp${SUFFIX}-${OS}-${ARCH}.tar.gz" \ - -C /tmp/smoke-server codebase-memory-mcp - if [ -n "$SUFFIX" ]; then - cp "/tmp/smoke-server/codebase-memory-mcp${SUFFIX}-${OS}-${ARCH}.tar.gz" \ - "/tmp/smoke-server/codebase-memory-mcp-${OS}-${ARCH}.tar.gz" - fi - cd /tmp/smoke-server - sha256sum *.tar.gz > checksums.txt 2>/dev/null || shasum -a 256 *.tar.gz > checksums.txt - python3 -m http.server 18080 -d /tmp/smoke-server & - - - name: Smoke test - run: scripts/smoke-test.sh ./codebase-memory-mcp - env: - SMOKE_DOWNLOAD_URL: http://localhost:18080 - - - name: Security audits (standard only) - if: matrix.variant == 'standard' - run: | - scripts/security-strings.sh ./codebase-memory-mcp - scripts/security-install.sh ./codebase-memory-mcp - scripts/security-network.sh ./codebase-memory-mcp - - - name: MCP robustness test (linux-amd64 standard only) - if: matrix.variant == 'standard' && matrix.goos == 'linux' && matrix.goarch == 'amd64' - run: | - scripts/security-fuzz.sh 
./codebase-memory-mcp - scripts/security-fuzz-random.sh ./codebase-memory-mcp 60 - - - name: ClamAV scan (Linux) - if: matrix.variant == 'standard' && startsWith(matrix.os, 'ubuntu') - run: | - sudo apt-get update -qq && sudo apt-get install -y -qq clamav > /dev/null 2>&1 - sudo sed -i 's/^Example/#Example/' /etc/clamav/freshclam.conf 2>/dev/null || true - grep -q "DatabaseMirror" /etc/clamav/freshclam.conf 2>/dev/null || \ - echo "DatabaseMirror database.clamav.net" | sudo tee -a /etc/clamav/freshclam.conf > /dev/null - sudo freshclam --quiet - clamscan --no-summary ./codebase-memory-mcp - - - name: ClamAV scan (macOS) - if: matrix.variant == 'standard' && startsWith(matrix.os, 'macos') - run: | - brew install clamav > /dev/null 2>&1 - CLAMAV_ETC=$(brew --prefix)/etc/clamav - if [ ! -f "$CLAMAV_ETC/freshclam.conf" ]; then - cp "$CLAMAV_ETC/freshclam.conf.sample" "$CLAMAV_ETC/freshclam.conf" 2>/dev/null || true - sed -i '' 's/^Example/#Example/' "$CLAMAV_ETC/freshclam.conf" 2>/dev/null || true - echo "DatabaseMirror database.clamav.net" >> "$CLAMAV_ETC/freshclam.conf" - fi - freshclam --quiet --no-warnings 2>/dev/null || freshclam --quiet 2>/dev/null || echo "WARNING: freshclam update failed" - clamscan --no-summary ./codebase-memory-mcp - - smoke-windows: - strategy: - fail-fast: false - matrix: - variant: [standard, ui] - runs-on: windows-latest - timeout-minutes: 15 - steps: - - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 - - - uses: msys2/setup-msys2@4f806de0a5a7294ffabaff804b38a9b435a73bda # v2 - with: - msystem: CLANG64 - path-type: inherit - install: >- - mingw-w64-clang-x86_64-python3 - unzip - zip - coreutils - - - uses: actions/download-artifact@d3f86a106a0bac45b974a628896c90dbdf5c8093 # v4 - with: - name: binaries-windows-amd64 - - - name: Extract binary - shell: msys2 {0} - run: | - SUFFIX=${{ matrix.variant == 'ui' && '-ui' || '' }} - unzip -o "codebase-memory-mcp${SUFFIX}-windows-amd64.zip" - [ -n "$SUFFIX" ] && cp 
"codebase-memory-mcp${SUFFIX}.exe" codebase-memory-mcp.exe || true - - - name: Start artifact server - shell: msys2 {0} - run: | - mkdir -p /tmp/smoke-server - cp codebase-memory-mcp.exe /tmp/smoke-server/ - SUFFIX=${{ matrix.variant == 'ui' && '-ui' || '' }} - cd /tmp/smoke-server - zip -q "codebase-memory-mcp${SUFFIX}-windows-amd64.zip" codebase-memory-mcp.exe - if [ -n "$SUFFIX" ]; then - cp "codebase-memory-mcp${SUFFIX}-windows-amd64.zip" "codebase-memory-mcp-windows-amd64.zip" - fi - sha256sum *.zip > checksums.txt - python3 -m http.server 18080 -d /tmp/smoke-server & - - - name: Smoke test - shell: msys2 {0} - run: scripts/smoke-test.sh ./codebase-memory-mcp.exe - env: - SMOKE_DOWNLOAD_URL: http://localhost:18080 - - - name: Security audits (standard only) - if: matrix.variant == 'standard' - shell: msys2 {0} - run: | - scripts/security-strings.sh ./codebase-memory-mcp.exe - scripts/security-install.sh ./codebase-memory-mcp.exe - - - name: Windows Defender scan (standard only) - if: matrix.variant == 'standard' - shell: pwsh - run: | - & "C:\Program Files\Windows Defender\MpCmdRun.exe" -SignatureUpdate 2>$null - $result = & "C:\Program Files\Windows Defender\MpCmdRun.exe" -Scan -ScanType 3 -File "$PWD\codebase-memory-mcp.exe" -DisableRemediation - Write-Host $result - if ($LASTEXITCODE -ne 0) { Write-Host "BLOCKED: Windows Defender flagged binary!"; exit 1 } - Write-Host "=== Windows Defender: clean ===" - - smoke-linux-portable: - strategy: - fail-fast: false - matrix: - include: - - arch: amd64 - runner: ubuntu-latest - - arch: arm64 - runner: ubuntu-24.04-arm - variant: [standard, ui] - runs-on: ${{ matrix.runner }} - timeout-minutes: 15 - steps: - - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 - - - uses: actions/download-artifact@d3f86a106a0bac45b974a628896c90dbdf5c8093 # v4 - with: - name: binaries-linux-${{ matrix.arch }}-portable - - - name: Extract and smoke test - run: | - SUFFIX=${{ matrix.variant == 'ui' && '-ui' || '' 
}} - tar -xzf codebase-memory-mcp${SUFFIX}-linux-${{ matrix.arch }}-portable.tar.gz - chmod +x codebase-memory-mcp - scripts/smoke-test.sh ./codebase-memory-mcp diff --git a/.github/workflows/_soak.yml b/.github/workflows/_soak.yml deleted file mode 100644 index fa92790..0000000 --- a/.github/workflows/_soak.yml +++ /dev/null @@ -1,186 +0,0 @@ -# Reusable: soak tests (quick + ASan, all platforms) -name: Soak - -on: - workflow_call: - inputs: - duration_minutes: - description: 'Soak duration in minutes' - type: number - default: 10 - run_asan: - description: 'Run ASan soak in addition to quick soak' - type: boolean - default: false - version: - description: 'Version string for build' - type: string - default: '' - -permissions: - contents: read - -jobs: - soak-quick: - strategy: - fail-fast: false - matrix: - include: - - os: ubuntu-latest - goos: linux - goarch: amd64 - cc: gcc - cxx: g++ - - os: ubuntu-24.04-arm - goos: linux - goarch: arm64 - cc: gcc - cxx: g++ - - os: macos-14 - goos: darwin - goarch: arm64 - cc: cc - cxx: c++ - - os: macos-15-intel - goos: darwin - goarch: amd64 - cc: cc - cxx: c++ - runs-on: ${{ matrix.os }} - timeout-minutes: 30 - steps: - - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 - - name: Install deps (Linux) - if: startsWith(matrix.os, 'ubuntu') - run: sudo apt-get update && sudo apt-get install -y zlib1g-dev python3 git - - name: Build - run: scripts/build.sh ${{ inputs.version && format('--version {0}', inputs.version) || '' }} CC=${{ matrix.cc }} CXX=${{ matrix.cxx }} - - name: Soak (${{ inputs.duration_minutes }} min) - run: scripts/soak-test.sh build/c/codebase-memory-mcp ${{ inputs.duration_minutes }} - - name: Upload metrics - if: always() - uses: actions/upload-artifact@bbbca2ddaa5d8feaa63e36b76fdaad77386f024f # v7.0.0 - with: - name: soak-quick-${{ matrix.goos }}-${{ matrix.goarch }} - path: soak-results/ - retention-days: 14 - - soak-quick-windows: - runs-on: windows-latest - timeout-minutes: 30 - 
steps: - - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 - - uses: msys2/setup-msys2@4f806de0a5a7294ffabaff804b38a9b435a73bda # v2 - with: - msystem: CLANG64 - path-type: inherit - install: >- - mingw-w64-clang-x86_64-clang - mingw-w64-clang-x86_64-zlib - mingw-w64-clang-x86_64-python3 - make - git - coreutils - - name: Build - shell: msys2 {0} - run: scripts/build.sh ${{ inputs.version && format('--version {0}', inputs.version) || '' }} CC=clang CXX=clang++ - - name: Soak (${{ inputs.duration_minutes }} min) - shell: msys2 {0} - run: | - BIN=build/c/codebase-memory-mcp - [ -f "${BIN}.exe" ] && BIN="${BIN}.exe" - scripts/soak-test.sh "$BIN" ${{ inputs.duration_minutes }} - - name: Upload metrics - if: always() - uses: actions/upload-artifact@bbbca2ddaa5d8feaa63e36b76fdaad77386f024f # v7.0.0 - with: - name: soak-quick-windows-amd64 - path: soak-results/ - retention-days: 14 - - soak-asan: - if: ${{ inputs.run_asan }} - strategy: - fail-fast: false - matrix: - include: - - os: ubuntu-latest - goos: linux - goarch: amd64 - cc: gcc - cxx: g++ - - os: ubuntu-24.04-arm - goos: linux - goarch: arm64 - cc: gcc - cxx: g++ - - os: macos-14 - goos: darwin - goarch: arm64 - cc: cc - cxx: c++ - - os: macos-15-intel - goos: darwin - goarch: amd64 - cc: cc - cxx: c++ - runs-on: ${{ matrix.os }} - timeout-minutes: 45 - steps: - - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 - - name: Install deps (Linux) - if: startsWith(matrix.os, 'ubuntu') - run: sudo apt-get update && sudo apt-get install -y zlib1g-dev python3 git - - name: Build (ASan) - run: | - SANITIZE="-fsanitize=address,undefined -fno-omit-frame-pointer" - scripts/build.sh ${{ inputs.version && format('--version {0}', inputs.version) || '' }} CC=${{ matrix.cc }} CXX=${{ matrix.cxx }} EXTRA_CFLAGS="$SANITIZE" EXTRA_LDFLAGS="$SANITIZE" - - name: ASan soak (15 min) - env: - ASAN_OPTIONS: "detect_leaks=1:halt_on_error=0:log_path=soak-results/asan" - run: 
scripts/soak-test.sh build/c/codebase-memory-mcp 15 - - name: Upload metrics - if: always() - uses: actions/upload-artifact@bbbca2ddaa5d8feaa63e36b76fdaad77386f024f # v7.0.0 - with: - name: soak-asan-${{ matrix.goos }}-${{ matrix.goarch }} - path: soak-results/ - retention-days: 14 - - soak-asan-windows: - if: ${{ inputs.run_asan }} - runs-on: windows-latest - timeout-minutes: 45 - steps: - - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 - - uses: msys2/setup-msys2@4f806de0a5a7294ffabaff804b38a9b435a73bda # v2 - with: - msystem: CLANG64 - path-type: inherit - install: >- - mingw-w64-clang-x86_64-clang - mingw-w64-clang-x86_64-zlib - mingw-w64-clang-x86_64-python3 - make - git - coreutils - - name: Build (ASan) - shell: msys2 {0} - run: | - SANITIZE="-fsanitize=address,undefined -fno-omit-frame-pointer" - scripts/build.sh ${{ inputs.version && format('--version {0}', inputs.version) || '' }} CC=clang CXX=clang++ EXTRA_CFLAGS="$SANITIZE" EXTRA_LDFLAGS="$SANITIZE" - - name: ASan soak (15 min, no leak detection) - shell: msys2 {0} - env: - ASAN_OPTIONS: "detect_leaks=0:halt_on_error=0:log_path=soak-results/asan" - run: | - BIN=build/c/codebase-memory-mcp - [ -f "${BIN}.exe" ] && BIN="${BIN}.exe" - scripts/soak-test.sh "$BIN" 15 - - name: Upload metrics - if: always() - uses: actions/upload-artifact@bbbca2ddaa5d8feaa63e36b76fdaad77386f024f # v7.0.0 - with: - name: soak-asan-windows-amd64 - path: soak-results/ - retention-days: 14 diff --git a/.github/workflows/_test.yml b/.github/workflows/_test.yml deleted file mode 100644 index 4b8b989..0000000 --- a/.github/workflows/_test.yml +++ /dev/null @@ -1,67 +0,0 @@ -# Reusable: unit + integration tests on all platforms -name: Test - -on: - workflow_call: - inputs: - skip_perf: - description: 'Skip incremental perf tests (phases 2-7)' - type: boolean - default: true - -permissions: - contents: read - -jobs: - test-unix: - strategy: - fail-fast: false - matrix: - include: - - os: ubuntu-latest - cc: 
gcc - cxx: g++ - - os: ubuntu-24.04-arm - cc: gcc - cxx: g++ - - os: macos-14 - cc: cc - cxx: c++ - - os: macos-15-intel - cc: cc - cxx: c++ - runs-on: ${{ matrix.os }} - timeout-minutes: 30 - steps: - - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 - - - name: Install deps (Ubuntu) - if: startsWith(matrix.os, 'ubuntu') - run: sudo apt-get update && sudo apt-get install -y zlib1g-dev - - - name: Test - run: scripts/test.sh CC=${{ matrix.cc }} CXX=${{ matrix.cxx }} - env: - CBM_SKIP_PERF: ${{ inputs.skip_perf && '1' || '' }} - - test-windows: - runs-on: windows-latest - timeout-minutes: 30 - steps: - - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 - - - uses: msys2/setup-msys2@4f806de0a5a7294ffabaff804b38a9b435a73bda # v2 - with: - msystem: CLANG64 - path-type: inherit - install: >- - mingw-w64-clang-x86_64-clang - mingw-w64-clang-x86_64-compiler-rt - mingw-w64-clang-x86_64-zlib - make - - - name: Test - shell: msys2 {0} - run: scripts/test.sh CC=clang CXX=clang++ - env: - CBM_SKIP_PERF: ${{ inputs.skip_perf && '1' || '' }} diff --git a/.github/workflows/codeql.yml b/.github/workflows/codeql.yml index 64bb582..bfa783d 100644 --- a/.github/workflows/codeql.yml +++ b/.github/workflows/codeql.yml @@ -12,13 +12,13 @@ jobs: analyze: runs-on: ubuntu-latest steps: - - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 - name: Install build dependencies run: sudo apt-get update && sudo apt-get install -y zlib1g-dev - name: Initialize CodeQL - uses: github/codeql-action/init@c10b8064de6f491fea524254123dbe5e09572f13 # v4 + uses: github/codeql-action/init@38697555549f1db7851b81482ff19f1fa5c4fedc # v4 with: languages: c-cpp build-mode: manual @@ -27,6 +27,6 @@ jobs: run: scripts/build.sh - name: Perform CodeQL Analysis - uses: github/codeql-action/analyze@c10b8064de6f491fea524254123dbe5e09572f13 # v4 + uses: 
github/codeql-action/analyze@38697555549f1db7851b81482ff19f1fa5c4fedc # v4 with: category: "/language:c-cpp" diff --git a/.github/workflows/dry-run.yml b/.github/workflows/dry-run.yml index 0c7b1d6..584faaa 100644 --- a/.github/workflows/dry-run.yml +++ b/.github/workflows/dry-run.yml @@ -1,24 +1,22 @@ -# Manual trigger: test everything before pushing a release. -# Each step can be skipped for faster iteration. name: Dry Run on: workflow_dispatch: inputs: skip_lint: - description: 'Skip lint + security + CodeQL' + description: 'Skip lint, security audit, and CodeQL gate (faster iteration)' type: boolean default: false skip_tests: - description: 'Skip unit/integration tests' + description: 'Skip test steps (faster iteration on build/smoke)' type: boolean default: false skip_builds: - description: 'Skip build + smoke' + description: 'Skip build+smoke steps (faster iteration on lint/tests)' type: boolean default: false soak_level: - description: 'Soak: full (quick+asan), quick (10min), none' + description: 'Soak test level: full (quick+asan), quick (10min only), none' type: choice options: ['full', 'quick', 'none'] default: 'quick' @@ -27,37 +25,678 @@ permissions: contents: read jobs: - # ── Lint + Security ────────────────────────────────────────── + # ── Step 1: Lint (clang-format + cppcheck) ─────────────────── lint: if: ${{ inputs.skip_lint != true }} - uses: ./.github/workflows/_lint.yml - secrets: inherit + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 - # ── Tests (all platforms, perf tests skipped on CI) ────────── - test: + + - name: Install build deps + run: sudo apt-get update && sudo apt-get install -y zlib1g-dev cmake + + - name: Install LLVM 20 + run: | + wget -qO- https://apt.llvm.org/llvm-snapshot.gpg.key | sudo tee /etc/apt/trusted.gpg.d/apt.llvm.org.asc + echo "deb http://apt.llvm.org/noble/ llvm-toolchain-noble-20 main" | sudo tee /etc/apt/sources.list.d/llvm-20.list + sudo apt-get update + sudo apt-get install 
-y clang-format-20 + + - uses: actions/cache@0057852bfaa89a56745cba8c7296529d2fc39830 # v4 + id: cppcheck-cache + with: + path: /opt/cppcheck + key: cppcheck-2.20.0-ubuntu-amd64 + + - name: Build cppcheck 2.20.0 + if: steps.cppcheck-cache.outputs.cache-hit != 'true' + run: | + git clone --depth 1 --branch 2.20.0 https://github.com/danmar/cppcheck.git /tmp/cppcheck + cmake -S /tmp/cppcheck -B /tmp/cppcheck/build -DCMAKE_BUILD_TYPE=Release -DHAVE_RULES=OFF -DCMAKE_INSTALL_PREFIX=/opt/cppcheck + cmake --build /tmp/cppcheck/build -j$(nproc) + cmake --install /tmp/cppcheck/build + + - name: Add cppcheck to PATH + run: echo "/opt/cppcheck/bin" >> "$GITHUB_PATH" + + - name: Lint + run: scripts/lint.sh CLANG_FORMAT=clang-format-20 + + # ── Step 1b: Security audit (source-only, runs parallel with lint+tests) ── + # No build needed — scans source files and vendored deps only. + # Binary-level security (L2/L3/L4/L7) runs in smoke jobs per-platform. + security-static: + if: ${{ inputs.skip_lint != true }} + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 + + - name: "Layer 1: Static allow-list audit" + run: scripts/security-audit.sh + + - name: "Layer 6: UI security audit" + run: scripts/security-ui.sh + + - name: "Layer 8: Vendored dependency integrity" + run: scripts/security-vendored.sh + + # ── Step 1c: CodeQL SAST gate ──────────────────────────────── + codeql-gate: + if: ${{ inputs.skip_lint != true }} + runs-on: ubuntu-latest + steps: + - name: Wait for CodeQL on current commit (max 45 min) + env: + GH_TOKEN: ${{ secrets.GITHUB_TOKEN }} + run: | + CURRENT_SHA="${{ github.sha }}" + echo "Current commit: $CURRENT_SHA" + echo "Waiting for CodeQL to complete on this commit..." 
+ + for attempt in $(seq 1 90); do + LATEST=$(gh api repos/${{ github.repository }}/actions/workflows/codeql.yml/runs?per_page=5 \ + --jq '.workflow_runs[] | select(.head_sha == "'"$CURRENT_SHA"'") | "\(.conclusion) \(.status)"' 2>/dev/null | head -1 || echo "") + + if [ -z "$LATEST" ]; then + echo " Attempt $attempt/90: No CodeQL run found for $CURRENT_SHA yet..." + sleep 30 + continue + fi + + CONCLUSION=$(echo "$LATEST" | cut -d' ' -f1) + STATUS=$(echo "$LATEST" | cut -d' ' -f2) + + if [ "$STATUS" = "completed" ] && [ "$CONCLUSION" = "success" ]; then + echo "=== CodeQL completed successfully on current commit ===" + exit 0 + elif [ "$STATUS" = "completed" ]; then + echo "BLOCKED: CodeQL completed with conclusion: $CONCLUSION" + exit 1 + fi + + echo " Attempt $attempt/90: CodeQL status=$STATUS (waiting 30s)..." + sleep 30 + done + + echo "BLOCKED: CodeQL did not complete within 45 minutes" + exit 1 + + - name: Check for open code scanning alerts + env: + GH_TOKEN: ${{ secrets.GITHUB_TOKEN }} + run: | + # Wait for GitHub to finish processing alert state changes. + # There is a race between CodeQL marking the workflow as "completed" + # and the alerts API reflecting new/closed alerts from that scan. + echo "Waiting 60s for alert API to settle after CodeQL completion..." + sleep 60 + + # Poll alerts twice with a gap to confirm the count is stable + ALERTS1=$(gh api 'repos/${{ github.repository }}/code-scanning/alerts?state=open' --jq 'length' 2>/dev/null || echo "0") + echo "Open alerts (check 1): $ALERTS1" + sleep 15 + ALERTS2=$(gh api 'repos/${{ github.repository }}/code-scanning/alerts?state=open' --jq 'length' 2>/dev/null || echo "0") + echo "Open alerts (check 2): $ALERTS2" + + # Use the higher count (conservative — if either check sees alerts, block) + ALERTS=$ALERTS2 + if [ "$ALERTS1" -gt "$ALERTS2" ]; then + ALERTS=$ALERTS1 + fi + + if [ "$ALERTS" -gt 0 ]; then + echo "BLOCKED: $ALERTS open code scanning alert(s) found." 
+ gh api 'repos/${{ github.repository }}/code-scanning/alerts?state=open' \ + --jq '.[] | " #\(.number) [\(.rule.security_severity_level // .rule.severity)] \(.rule.id) — \(.most_recent_instance.location.path):\(.most_recent_instance.location.start_line)"' 2>/dev/null || true + echo "Fix them: https://github.com/${{ github.repository }}/security/code-scanning" + exit 1 + fi + echo "=== CodeQL gate passed (0 open alerts) ===" + + # ── Step 2: Unit tests (ASan + UBSan) ─────────────────────── + # macOS: use cc (Apple Clang) — GCC on macOS doesn't ship ASan runtime + # Linux: use system gcc — full ASan/UBSan support + # Windows: MSYS2 MinGW GCC + test-unix: + if: ${{ inputs.skip_tests != true && always() && (needs.lint.result == 'success' || needs.lint.result == 'skipped') }} + needs: [lint] + strategy: + fail-fast: false + matrix: + include: + - os: ubuntu-latest + arch: amd64 + cc: gcc + cxx: g++ + - os: ubuntu-24.04-arm + arch: arm64 + cc: gcc + cxx: g++ + - os: macos-14 + arch: arm64 + cc: cc + cxx: c++ + - os: macos-15-intel + arch: amd64 + cc: cc + cxx: c++ + runs-on: ${{ matrix.os }} + steps: + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 + + - name: Install deps (Ubuntu) + if: startsWith(matrix.os, 'ubuntu') + run: sudo apt-get update && sudo apt-get install -y zlib1g-dev + + - name: Test + run: scripts/test.sh CC=${{ matrix.cc }} CXX=${{ matrix.cxx }} + + test-windows: + if: ${{ inputs.skip_tests != true && always() && (needs.lint.result == 'success' || needs.lint.result == 'skipped') }} needs: [lint] - if: ${{ inputs.skip_tests != true && !cancelled() && (needs.lint.result == 'success' || needs.lint.result == 'skipped') }} - uses: ./.github/workflows/_test.yml - with: - skip_perf: true - - # ── Build all platforms ────────────────────────────────────── - build: - if: ${{ inputs.skip_builds != true && !cancelled() && (needs.test.result == 'success' || needs.test.result == 'skipped') }} - needs: [test] - uses: 
./.github/workflows/_build.yml - - # ── Smoke test every binary ───────────────────────────────── - smoke: - if: ${{ inputs.skip_builds != true && !cancelled() && needs.build.result == 'success' }} - needs: [build] - uses: ./.github/workflows/_smoke.yml - - # ── Soak tests (optional, parallel with smoke) ────────────── - soak: - if: ${{ inputs.soak_level != 'none' && !cancelled() && needs.build.result == 'success' }} - needs: [build] - uses: ./.github/workflows/_soak.yml - with: - duration_minutes: 10 - run_asan: ${{ inputs.soak_level == 'full' }} + runs-on: windows-latest + steps: + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 + + - uses: msys2/setup-msys2@4f806de0a5a7294ffabaff804b38a9b435a73bda # v2 + with: + msystem: CLANG64 + path-type: inherit + install: >- + mingw-w64-clang-x86_64-clang + mingw-w64-clang-x86_64-compiler-rt + mingw-w64-clang-x86_64-zlib + make + + - name: Test + shell: msys2 {0} + run: scripts/test.sh CC=clang CXX=clang++ + + # ── Step 3: Build binaries (standard + UI, all OS) ────────── + build-unix: + if: ${{ inputs.skip_builds != true && always() && (needs.test-unix.result == 'success' || needs.test-unix.result == 'skipped') && (needs.test-windows.result == 'success' || needs.test-windows.result == 'skipped') }} + needs: [test-unix, test-windows] + strategy: + matrix: + include: + - os: ubuntu-latest + goos: linux + goarch: amd64 + cc: gcc + cxx: g++ + - os: ubuntu-24.04-arm + goos: linux + goarch: arm64 + cc: gcc + cxx: g++ + - os: macos-14 + goos: darwin + goarch: arm64 + cc: cc + cxx: c++ + - os: macos-15-intel + goos: darwin + goarch: amd64 + cc: cc + cxx: c++ + runs-on: ${{ matrix.os }} + steps: + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 + + - name: Install deps (Ubuntu) + if: startsWith(matrix.os, 'ubuntu') + run: sudo apt-get update && sudo apt-get install -y zlib1g-dev + + - uses: actions/setup-node@53b83947a5a98c8d113130e565377fae1a50d02f # v6.3.0 + with: + node-version: "22" 
+ + - name: Build standard binary + run: scripts/build.sh CC=${{ matrix.cc }} CXX=${{ matrix.cxx }} + + - name: Ad-hoc sign macOS binary + if: startsWith(matrix.os, 'macos') + run: codesign --sign - --force build/c/codebase-memory-mcp + + - name: Archive standard binary + run: | + cp LICENSE build/c/ + tar -czf codebase-memory-mcp-${{ matrix.goos }}-${{ matrix.goarch }}.tar.gz \ + -C build/c codebase-memory-mcp LICENSE + + - name: Build UI binary + run: scripts/build.sh --with-ui CC=${{ matrix.cc }} CXX=${{ matrix.cxx }} + + - name: Ad-hoc sign macOS UI binary + if: startsWith(matrix.os, 'macos') + run: codesign --sign - --force build/c/codebase-memory-mcp + + - name: Frontend integrity scan (post-build dist/) + if: matrix.goos == 'linux' && matrix.goarch == 'amd64' + run: scripts/security-ui.sh + + - name: Archive UI binary + run: | + cp LICENSE build/c/ + tar -czf codebase-memory-mcp-ui-${{ matrix.goos }}-${{ matrix.goarch }}.tar.gz \ + -C build/c codebase-memory-mcp LICENSE + + - uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4 + with: + name: binaries-${{ matrix.goos }}-${{ matrix.goarch }} + path: "*.tar.gz" + + build-windows: + if: ${{ inputs.skip_builds != true && always() && (needs.test-unix.result == 'success' || needs.test-unix.result == 'skipped') && (needs.test-windows.result == 'success' || needs.test-windows.result == 'skipped') }} + needs: [test-unix, test-windows] + runs-on: windows-latest + steps: + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 + + - uses: msys2/setup-msys2@4f806de0a5a7294ffabaff804b38a9b435a73bda # v2 + with: + msystem: CLANG64 + path-type: inherit + install: >- + mingw-w64-clang-x86_64-clang + mingw-w64-clang-x86_64-zlib + make + zip + + - uses: actions/setup-node@53b83947a5a98c8d113130e565377fae1a50d02f # v6.3.0 + with: + node-version: "22" + + - name: Build standard binary + shell: msys2 {0} + run: scripts/build.sh CC=clang CXX=clang++ + + - name: Archive standard binary + 
shell: msys2 {0} + run: | + BIN=build/c/codebase-memory-mcp + [ -f "${BIN}.exe" ] && BIN="${BIN}.exe" + cp "$BIN" codebase-memory-mcp.exe + zip codebase-memory-mcp-windows-amd64.zip codebase-memory-mcp.exe LICENSE + + - name: Build UI binary + shell: msys2 {0} + run: scripts/build.sh --with-ui CC=clang CXX=clang++ + + - name: Archive UI binary + shell: msys2 {0} + run: | + BIN=build/c/codebase-memory-mcp + [ -f "${BIN}.exe" ] && BIN="${BIN}.exe" + cp "$BIN" codebase-memory-mcp-ui.exe + zip codebase-memory-mcp-ui-windows-amd64.zip codebase-memory-mcp-ui.exe LICENSE + + - uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4 + with: + name: binaries-windows-amd64 + path: "*.zip" + + # ── Step 4: Smoke test every binary ───────────────────────── + smoke-unix: + if: ${{ !cancelled() && inputs.skip_builds != true }} + needs: [build-unix] + strategy: + fail-fast: false + matrix: + include: + - os: ubuntu-latest + goos: linux + goarch: amd64 + - os: ubuntu-24.04-arm + goos: linux + goarch: arm64 + - os: macos-14 + goos: darwin + goarch: arm64 + - os: macos-15-intel + goos: darwin + goarch: amd64 + variant: [standard, ui] + runs-on: ${{ matrix.os }} + steps: + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 + + - uses: actions/download-artifact@d3f86a106a0bac45b974a628896c90dbdf5c8093 # v4 + with: + name: binaries-${{ matrix.goos }}-${{ matrix.goarch }} + + - name: Extract binary + run: | + SUFFIX=${{ matrix.variant == 'ui' && '-ui' || '' }} + tar -xzf codebase-memory-mcp${SUFFIX}-${{ matrix.goos }}-${{ matrix.goarch }}.tar.gz + chmod +x codebase-memory-mcp + + - name: Start artifact server for E2E smoke tests + run: | + mkdir -p /tmp/smoke-server + cp codebase-memory-mcp /tmp/smoke-server/ + OS=${{ matrix.goos }} + ARCH=${{ matrix.goarch }} + SUFFIX=${{ matrix.variant == 'ui' && '-ui' || '' }} + tar -czf "/tmp/smoke-server/codebase-memory-mcp${SUFFIX}-${OS}-${ARCH}.tar.gz" \ + -C /tmp/smoke-server codebase-memory-mcp + # Also 
serve under standard name so install.sh + update --standard work + if [ -n "$SUFFIX" ]; then + cp "/tmp/smoke-server/codebase-memory-mcp${SUFFIX}-${OS}-${ARCH}.tar.gz" \ + "/tmp/smoke-server/codebase-memory-mcp-${OS}-${ARCH}.tar.gz" + fi + cd /tmp/smoke-server + sha256sum *.tar.gz > checksums.txt 2>/dev/null || shasum -a 256 *.tar.gz > checksums.txt + python3 -m http.server 18080 -d /tmp/smoke-server & + + - name: Smoke test (${{ matrix.variant }}, ${{ matrix.goos }}-${{ matrix.goarch }}) + run: scripts/smoke-test.sh ./codebase-memory-mcp + env: + SMOKE_DOWNLOAD_URL: http://localhost:18080 + + - name: Binary string audit (${{ matrix.goos }}-${{ matrix.goarch }}) + if: matrix.variant == 'standard' + run: scripts/security-strings.sh ./codebase-memory-mcp + + - name: Install output audit (${{ matrix.goos }}-${{ matrix.goarch }}) + if: matrix.variant == 'standard' + run: scripts/security-install.sh ./codebase-memory-mcp + + - name: Network egress test (${{ matrix.goos }}-${{ matrix.goarch }}) + if: matrix.variant == 'standard' + run: scripts/security-network.sh ./codebase-memory-mcp + + - name: MCP robustness test + if: matrix.variant == 'standard' && matrix.goos == 'linux' && matrix.goarch == 'amd64' + run: scripts/security-fuzz.sh ./codebase-memory-mcp + + - name: Fuzz testing (60s random input) + if: matrix.variant == 'standard' && matrix.goos == 'linux' && matrix.goarch == 'amd64' + run: scripts/security-fuzz-random.sh ./codebase-memory-mcp 60 + + - name: ClamAV scan (Linux) + if: matrix.variant == 'standard' && startsWith(matrix.os, 'ubuntu') + run: | + sudo apt-get update -qq && sudo apt-get install -y -qq clamav > /dev/null 2>&1 + sudo sed -i 's/^Example/#Example/' /etc/clamav/freshclam.conf 2>/dev/null || true + grep -q "DatabaseMirror" /etc/clamav/freshclam.conf 2>/dev/null || \ + echo "DatabaseMirror database.clamav.net" | sudo tee -a /etc/clamav/freshclam.conf > /dev/null + sudo freshclam --quiet + echo "=== ClamAV scan ===" + clamscan --no-summary 
./codebase-memory-mcp + echo "=== ClamAV: clean ===" + + - name: ClamAV scan (macOS) + if: matrix.variant == 'standard' && startsWith(matrix.os, 'macos') + run: | + brew install clamav > /dev/null 2>&1 + CLAMAV_ETC=$(brew --prefix)/etc/clamav + if [ ! -f "$CLAMAV_ETC/freshclam.conf" ]; then + cp "$CLAMAV_ETC/freshclam.conf.sample" "$CLAMAV_ETC/freshclam.conf" 2>/dev/null || true + sed -i '' 's/^Example/#Example/' "$CLAMAV_ETC/freshclam.conf" 2>/dev/null || true + echo "DatabaseMirror database.clamav.net" >> "$CLAMAV_ETC/freshclam.conf" + fi + freshclam --quiet --no-warnings 2>/dev/null || freshclam --quiet 2>/dev/null || echo "WARNING: freshclam update failed, using bundled signatures" + echo "=== ClamAV scan (macOS) ===" + clamscan --no-summary ./codebase-memory-mcp + echo "=== ClamAV: clean ===" + + smoke-windows: + if: ${{ !cancelled() && inputs.skip_builds != true }} + needs: [build-windows] + strategy: + fail-fast: false + matrix: + variant: [standard, ui] + runs-on: windows-latest + steps: + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 + + - uses: msys2/setup-msys2@4f806de0a5a7294ffabaff804b38a9b435a73bda # v2 + with: + msystem: CLANG64 + path-type: inherit + install: >- + mingw-w64-clang-x86_64-python3 + unzip + zip + coreutils + + - uses: actions/download-artifact@d3f86a106a0bac45b974a628896c90dbdf5c8093 # v4 + with: + name: binaries-windows-amd64 + + - name: Extract binary + shell: msys2 {0} + run: | + SUFFIX=${{ matrix.variant == 'ui' && '-ui' || '' }} + unzip -o "codebase-memory-mcp${SUFFIX}-windows-amd64.zip" + [ -n "$SUFFIX" ] && cp "codebase-memory-mcp${SUFFIX}.exe" codebase-memory-mcp.exe || true + + - name: Start artifact server for E2E smoke tests + shell: msys2 {0} + run: | + mkdir -p /tmp/smoke-server + cp codebase-memory-mcp.exe /tmp/smoke-server/codebase-memory-mcp.exe + SUFFIX=${{ matrix.variant == 'ui' && '-ui' || '' }} + cd /tmp/smoke-server + zip -q "codebase-memory-mcp${SUFFIX}-windows-amd64.zip" 
codebase-memory-mcp.exe + # Also serve under standard name + if [ -n "$SUFFIX" ]; then + cp "codebase-memory-mcp${SUFFIX}-windows-amd64.zip" "codebase-memory-mcp-windows-amd64.zip" + fi + sha256sum *.zip > checksums.txt + python3 -m http.server 18080 -d /tmp/smoke-server & + + - name: Smoke test (${{ matrix.variant }}, windows-amd64) + shell: msys2 {0} + run: scripts/smoke-test.sh ./codebase-memory-mcp.exe + env: + SMOKE_DOWNLOAD_URL: http://localhost:18080 + + - name: Binary string audit (windows-amd64) + if: matrix.variant == 'standard' + shell: msys2 {0} + run: scripts/security-strings.sh ./codebase-memory-mcp.exe + + - name: Install output audit (windows-amd64) + if: matrix.variant == 'standard' + shell: msys2 {0} + run: scripts/security-install.sh ./codebase-memory-mcp.exe + + - name: Windows Defender scan + if: matrix.variant == 'standard' + shell: pwsh + run: | + Write-Host "=== Windows Defender scan (with ML heuristics) ===" + & "C:\Program Files\Windows Defender\MpCmdRun.exe" -SignatureUpdate 2>$null + $result = & "C:\Program Files\Windows Defender\MpCmdRun.exe" -Scan -ScanType 3 -File "$PWD\codebase-memory-mcp.exe" -DisableRemediation + Write-Host $result + if ($LASTEXITCODE -ne 0) { + Write-Host "BLOCKED: Windows Defender flagged the binary!" 
+ exit 1 + } + Write-Host "=== Windows Defender: clean ===" + + # ── Step 6: Soak tests (after smoke, per-platform) ────────── + soak-quick: + if: ${{ !cancelled() && inputs.soak_level != 'none' && inputs.skip_builds != true }} + needs: [build-unix] + runs-on: ${{ matrix.os }} + timeout-minutes: 30 + strategy: + fail-fast: false + matrix: + include: + - os: ubuntu-latest + goos: linux + goarch: amd64 + cc: gcc + cxx: g++ + - os: ubuntu-24.04-arm + goos: linux + goarch: arm64 + cc: gcc + cxx: g++ + - os: macos-14 + goos: darwin + goarch: arm64 + cc: cc + cxx: c++ + - os: macos-15-intel + goos: darwin + goarch: amd64 + cc: cc + cxx: c++ + steps: + - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4 + + - name: Install deps (Linux) + if: startsWith(matrix.os, 'ubuntu') + run: sudo apt-get update && sudo apt-get install -y zlib1g-dev python3 git + + - name: Build (release mode) + run: scripts/build.sh CC=${{ matrix.cc }} CXX=${{ matrix.cxx }} + + - name: Quick soak (10 min) + run: scripts/soak-test.sh build/c/codebase-memory-mcp 10 + + - name: Upload soak metrics + if: always() + uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4 + with: + name: soak-quick-${{ matrix.goos }}-${{ matrix.goarch }} + path: soak-results/ + retention-days: 14 + + soak-quick-windows: + if: ${{ !cancelled() && inputs.soak_level != 'none' && inputs.skip_builds != true }} + needs: [build-windows] + runs-on: windows-latest + timeout-minutes: 30 + steps: + - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4 + + - uses: msys2/setup-msys2@4f806de0a5a7294ffabaff804b38a9b435a73bda # v2 + with: + msystem: CLANG64 + path-type: inherit + install: >- + mingw-w64-clang-x86_64-clang + mingw-w64-clang-x86_64-zlib + mingw-w64-clang-x86_64-python3 + make + git + coreutils + + - name: Build (release mode) + shell: msys2 {0} + run: scripts/build.sh CC=clang CXX=clang++ + + - name: Quick soak (10 min) + shell: msys2 {0} + run: | + 
BIN=build/c/codebase-memory-mcp + [ -f "${BIN}.exe" ] && BIN="${BIN}.exe" + scripts/soak-test.sh "$BIN" 10 + + - name: Upload soak metrics + if: always() + uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4 + with: + name: soak-quick-windows-amd64 + path: soak-results/ + retention-days: 14 + + soak-asan: + if: ${{ !cancelled() && inputs.soak_level == 'full' && inputs.skip_builds != true }} + needs: [build-unix] + runs-on: ${{ matrix.os }} + timeout-minutes: 45 + strategy: + fail-fast: false + matrix: + include: + - os: ubuntu-latest + goos: linux + goarch: amd64 + cc: gcc + cxx: g++ + - os: ubuntu-24.04-arm + goos: linux + goarch: arm64 + cc: gcc + cxx: g++ + - os: macos-14 + goos: darwin + goarch: arm64 + cc: cc + cxx: c++ + - os: macos-15-intel + goos: darwin + goarch: amd64 + cc: cc + cxx: c++ + steps: + - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4 + + - name: Install deps (Linux) + if: startsWith(matrix.os, 'ubuntu') + run: sudo apt-get update && sudo apt-get install -y zlib1g-dev python3 git + + - name: Build (ASan + LeakSanitizer) + run: | + SANITIZE="-fsanitize=address,undefined -fno-omit-frame-pointer" + scripts/build.sh CC=${{ matrix.cc }} CXX=${{ matrix.cxx }} EXTRA_CFLAGS="$SANITIZE" EXTRA_LDFLAGS="$SANITIZE" + + - name: ASan soak (15 min) + env: + ASAN_OPTIONS: "detect_leaks=1:halt_on_error=0:log_path=soak-results/asan" + run: scripts/soak-test.sh build/c/codebase-memory-mcp 15 + + - name: Upload ASan soak metrics + if: always() + uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4 + with: + name: soak-asan-${{ matrix.goos }}-${{ matrix.goarch }} + path: soak-results/ + retention-days: 14 + + soak-asan-windows: + if: ${{ !cancelled() && inputs.soak_level == 'full' && inputs.skip_builds != true }} + needs: [build-windows] + runs-on: windows-latest + timeout-minutes: 45 + steps: + - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4 + - uses: 
msys2/setup-msys2@4f806de0a5a7294ffabaff804b38a9b435a73bda # v2 + with: + msystem: CLANG64 + path-type: inherit + install: >- + mingw-w64-clang-x86_64-clang + mingw-w64-clang-x86_64-zlib + mingw-w64-clang-x86_64-python3 + make + git + coreutils + - name: Build (ASan, no LeakSan on Windows) + shell: msys2 {0} + run: | + SANITIZE="-fsanitize=address,undefined -fno-omit-frame-pointer" + scripts/build.sh CC=clang CXX=clang++ EXTRA_CFLAGS="$SANITIZE" EXTRA_LDFLAGS="$SANITIZE" + - name: ASan soak (15 min, no leak detection) + shell: msys2 {0} + env: + ASAN_OPTIONS: "detect_leaks=0:halt_on_error=0:log_path=soak-results/asan" + run: | + BIN=build/c/codebase-memory-mcp + [ -f "${BIN}.exe" ] && BIN="${BIN}.exe" + scripts/soak-test.sh "$BIN" 15 + - name: Upload ASan soak metrics + if: always() + uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4 + with: + name: soak-asan-windows-amd64 + path: soak-results/ + retention-days: 14 diff --git a/.github/workflows/nightly-soak.yml b/.github/workflows/nightly-soak.yml index e3a8310..ae48615 100644 --- a/.github/workflows/nightly-soak.yml +++ b/.github/workflows/nightly-soak.yml @@ -1,4 +1,3 @@ -# Weekly soak test: 4h sustained load + ASan leak detection name: Nightly Soak on: @@ -10,13 +9,111 @@ on: description: 'Soak duration in minutes (default: 240 = 4h)' type: number default: 240 + platforms: + description: 'Platforms to test' + type: choice + options: ['all', 'linux-only', 'macos-only'] + default: 'all' permissions: contents: read jobs: - soak: - uses: ./.github/workflows/_soak.yml - with: - duration_minutes: ${{ inputs.duration_minutes || 240 }} - run_asan: true + soak-nightly: + runs-on: ${{ matrix.os }} + timeout-minutes: 330 # 5.5h safety cap (4h soak + build + analysis) + strategy: + fail-fast: false + matrix: + include: + - os: ubuntu-latest + goos: linux + goarch: amd64 + cc: gcc + cxx: g++ + filter: all linux-only + - os: ubuntu-24.04-arm + goos: linux + goarch: arm64 + cc: gcc + cxx: g++ + 
filter: all linux-only + - os: macos-14 + goos: darwin + goarch: arm64 + cc: cc + cxx: c++ + filter: all macos-only + steps: + - name: Check platform filter + if: ${{ !contains(matrix.filter, inputs.platforms || 'all') }} + run: | + echo "Skipping ${{ matrix.goos }}-${{ matrix.goarch }} (filter: ${{ inputs.platforms }})" + exit 0 + + - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4 + + - name: Install deps (Linux) + if: startsWith(matrix.os, 'ubuntu') + run: sudo apt-get update && sudo apt-get install -y zlib1g-dev python3 git + + - name: Build (release mode) + run: scripts/build.sh CC=${{ matrix.cc }} CXX=${{ matrix.cxx }} + + - name: Nightly soak (${{ inputs.duration_minutes || 240 }} min) + run: scripts/soak-test.sh build/c/codebase-memory-mcp ${{ inputs.duration_minutes || 240 }} + + - name: Upload soak metrics + if: always() + uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4 + with: + name: nightly-soak-${{ matrix.goos }}-${{ matrix.goarch }} + path: soak-results/ + retention-days: 30 + + soak-nightly-asan: + runs-on: ${{ matrix.os }} + timeout-minutes: 120 # ASan runs shorter (60 min) due to 2-3x overhead + strategy: + fail-fast: false + matrix: + include: + - os: ubuntu-latest + goos: linux + goarch: amd64 + cc: gcc + cxx: g++ + filter: all linux-only + - os: ubuntu-24.04-arm + goos: linux + goarch: arm64 + cc: gcc + cxx: g++ + filter: all linux-only + steps: + - name: Check platform filter + if: ${{ !contains(matrix.filter, inputs.platforms || 'all') }} + run: exit 0 + + - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4 + + - name: Install deps + run: sudo apt-get update && sudo apt-get install -y zlib1g-dev python3 git + + - name: Build (ASan + LeakSanitizer) + run: | + SANITIZE="-fsanitize=address,undefined -fno-omit-frame-pointer" + scripts/build.sh CC=${{ matrix.cc }} CXX=${{ matrix.cxx }} EXTRA_CFLAGS="$SANITIZE" EXTRA_LDFLAGS="$SANITIZE" + + - name: ASan soak (60 min) + env: + 
ASAN_OPTIONS: "detect_leaks=1:halt_on_error=0:log_path=soak-results/asan" + run: scripts/soak-test.sh build/c/codebase-memory-mcp 60 + + - name: Upload ASan soak metrics + if: always() + uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4 + with: + name: nightly-asan-${{ matrix.goos }}-${{ matrix.goarch }} + path: soak-results/ + retention-days: 30 diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml index 05078e7..61e1b78 100644 --- a/.github/workflows/release.yml +++ b/.github/workflows/release.yml @@ -1,4 +1,3 @@ -# Release pipeline: lint → test → build → smoke → soak → draft → verify → publish name: Release on: @@ -18,52 +17,684 @@ on: type: boolean default: false soak_level: - description: 'Soak: full (quick+asan), quick (10min), none' + description: 'Soak test level: full (quick+asan), quick (10min only), none (skip)' type: choice options: ['full', 'quick', 'none'] default: 'quick' permissions: - contents: read + contents: write + id-token: write + attestations: write jobs: - # ── 1. 
Lint + Security + CodeQL ──────────────────────────────── + # ── Step 1: Lint (clang-format + cppcheck) ─────────────────── lint: - uses: ./.github/workflows/_lint.yml - secrets: inherit + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 + + - name: Install build deps + run: sudo apt-get update && sudo apt-get install -y zlib1g-dev cmake + + - name: Install LLVM 20 + run: | + wget -qO- https://apt.llvm.org/llvm-snapshot.gpg.key | sudo tee /etc/apt/trusted.gpg.d/apt.llvm.org.asc + echo "deb http://apt.llvm.org/noble/ llvm-toolchain-noble-20 main" | sudo tee /etc/apt/sources.list.d/llvm-20.list + sudo apt-get update + sudo apt-get install -y clang-format-20 + + - uses: actions/cache@0057852bfaa89a56745cba8c7296529d2fc39830 # v4 + id: cppcheck-cache + with: + path: /opt/cppcheck + key: cppcheck-2.20.0-ubuntu-amd64 + + - name: Build cppcheck 2.20.0 + if: steps.cppcheck-cache.outputs.cache-hit != 'true' + run: | + git clone --depth 1 --branch 2.20.0 https://github.com/danmar/cppcheck.git /tmp/cppcheck + cmake -S /tmp/cppcheck -B /tmp/cppcheck/build -DCMAKE_BUILD_TYPE=Release -DHAVE_RULES=OFF -DCMAKE_INSTALL_PREFIX=/opt/cppcheck + cmake --build /tmp/cppcheck/build -j$(nproc) + cmake --install /tmp/cppcheck/build + + - name: Add cppcheck to PATH + run: echo "/opt/cppcheck/bin" >> "$GITHUB_PATH" + + - name: Lint + run: scripts/lint.sh CLANG_FORMAT=clang-format-20 - # ── 2. Tests (all platforms, full suite for release) ─────────── - test: + # ── Step 1b: Security audit (source-only, runs parallel with lint+tests) ── + # No build needed — scans source files and vendored deps only. + # Binary-level security (L2/L3/L4/L7) runs in smoke jobs per-platform. 
+ security-static: + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 + + - name: "Layer 1: Static allow-list audit" + run: scripts/security-audit.sh + + - name: "Layer 6: UI security audit" + run: scripts/security-ui.sh + + - name: "Layer 8: Vendored dependency integrity" + run: scripts/security-vendored.sh + + # ── Step 1c: CodeQL SAST gate ──────────────────────────────── + # Verifies CodeQL has run on the current commit AND has 0 open alerts. + # Prevents false green from stale/missing scans. + codeql-gate: + runs-on: ubuntu-latest + steps: + - name: Wait for CodeQL on current commit (max 45 min) + env: + GH_TOKEN: ${{ secrets.GITHUB_TOKEN }} + run: | + CURRENT_SHA="${{ github.sha }}" + echo "Current commit: $CURRENT_SHA" + echo "Waiting for CodeQL to complete on this commit..." + + for attempt in $(seq 1 90); do + LATEST=$(gh api repos/${{ github.repository }}/actions/workflows/codeql.yml/runs?per_page=5 \ + --jq '.workflow_runs[] | select(.head_sha == "'"$CURRENT_SHA"'") | "\(.conclusion) \(.status)"' 2>/dev/null | head -1 || echo "") + + if [ -z "$LATEST" ]; then + echo " Attempt $attempt/90: No CodeQL run found for $CURRENT_SHA yet..." + sleep 30 + continue + fi + + CONCLUSION=$(echo "$LATEST" | cut -d' ' -f1) + STATUS=$(echo "$LATEST" | cut -d' ' -f2) + + if [ "$STATUS" = "completed" ] && [ "$CONCLUSION" = "success" ]; then + echo "=== CodeQL completed successfully on current commit ===" + exit 0 + elif [ "$STATUS" = "completed" ]; then + echo "BLOCKED: CodeQL completed with conclusion: $CONCLUSION" + exit 1 + fi + + echo " Attempt $attempt/90: CodeQL status=$STATUS (waiting 30s)..." + sleep 30 + done + + echo "BLOCKED: CodeQL did not complete within 45 minutes" + exit 1 + + - name: Check for open code scanning alerts + env: + GH_TOKEN: ${{ secrets.GITHUB_TOKEN }} + run: | + # Wait for GitHub to finish processing alert state changes. 
+ # There is a race between CodeQL marking the workflow as "completed" + # and the alerts API reflecting new/closed alerts from that scan. + echo "Waiting 60s for alert API to settle after CodeQL completion..." + sleep 60 + + # Poll alerts twice with a gap to confirm the count is stable + ALERTS1=$(gh api 'repos/${{ github.repository }}/code-scanning/alerts?state=open' --jq 'length' 2>/dev/null || echo "0") + echo "Open alerts (check 1): $ALERTS1" + sleep 15 + ALERTS2=$(gh api 'repos/${{ github.repository }}/code-scanning/alerts?state=open' --jq 'length' 2>/dev/null || echo "0") + echo "Open alerts (check 2): $ALERTS2" + + # Use the higher count (conservative — if either check sees alerts, block) + ALERTS=$ALERTS2 + if [ "$ALERTS1" -gt "$ALERTS2" ]; then + ALERTS=$ALERTS1 + fi + + if [ "$ALERTS" -gt 0 ]; then + echo "BLOCKED: $ALERTS open code scanning alert(s) found." + gh api 'repos/${{ github.repository }}/code-scanning/alerts?state=open' \ + --jq '.[] | " #\(.number) [\(.rule.security_severity_level // .rule.severity)] \(.rule.id) — \(.most_recent_instance.location.path):\(.most_recent_instance.location.start_line)"' 2>/dev/null || true + echo "Fix them: https://github.com/${{ github.repository }}/security/code-scanning" + exit 1 + fi + echo "=== CodeQL gate passed (0 open alerts on current commit) ===" + + # ── Step 2: Unit tests (ASan + UBSan) ─────────────────────── + # macOS: use cc (Apple Clang) — GCC on macOS doesn't ship ASan runtime + # Linux: use system gcc — full ASan/UBSan support + # Windows: MSYS2 MinGW GCC + test-unix: + needs: [lint] + strategy: + fail-fast: false + matrix: + include: + - os: ubuntu-latest + arch: amd64 + cc: gcc + cxx: g++ + - os: ubuntu-24.04-arm + arch: arm64 + cc: gcc + cxx: g++ + - os: macos-14 + arch: arm64 + cc: cc + cxx: c++ + - os: macos-15-intel + arch: amd64 + cc: cc + cxx: c++ + runs-on: ${{ matrix.os }} + steps: + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 + + - name: Install deps (Ubuntu) 
+ if: startsWith(matrix.os, 'ubuntu') + run: sudo apt-get update && sudo apt-get install -y zlib1g-dev + + - name: Test + run: scripts/test.sh CC=${{ matrix.cc }} CXX=${{ matrix.cxx }} + + test-windows: needs: [lint] - uses: ./.github/workflows/_test.yml - with: - skip_perf: false - - # ── 3. Build all platforms ───────────────────────────────────── - build: - needs: [test] - uses: ./.github/workflows/_build.yml - with: - version: ${{ inputs.version }} - - # ── 4. Smoke test every binary ───────────────────────────────── - smoke: - needs: [build] - uses: ./.github/workflows/_smoke.yml - - # ── 5. Soak tests ───────────────────────────────────────────── - soak: + runs-on: windows-latest + steps: + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 + + - uses: msys2/setup-msys2@4f806de0a5a7294ffabaff804b38a9b435a73bda # v2 + with: + msystem: CLANG64 + path-type: inherit + install: >- + mingw-w64-clang-x86_64-clang + mingw-w64-clang-x86_64-compiler-rt + mingw-w64-clang-x86_64-zlib + make + + - name: Test + shell: msys2 {0} + run: scripts/test.sh CC=clang CXX=clang++ + + # ── Step 3: Build binaries (standard + UI, all OS) ────────── + build-unix: + needs: [test-unix, test-windows] + strategy: + matrix: + include: + - os: ubuntu-latest + goos: linux + goarch: amd64 + cc: gcc + cxx: g++ + - os: ubuntu-24.04-arm + goos: linux + goarch: arm64 + cc: gcc + cxx: g++ + - os: macos-14 + goos: darwin + goarch: arm64 + cc: cc + cxx: c++ + - os: macos-15-intel + goos: darwin + goarch: amd64 + cc: cc + cxx: c++ + runs-on: ${{ matrix.os }} + steps: + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 + + - name: Install deps (Ubuntu) + if: startsWith(matrix.os, 'ubuntu') + run: sudo apt-get update && sudo apt-get install -y zlib1g-dev + + - uses: actions/setup-node@53b83947a5a98c8d113130e565377fae1a50d02f # v6.3.0 + with: + node-version: "22" + + - name: Build standard binary + run: scripts/build.sh --version ${{ inputs.version }} CC=${{ 
matrix.cc }} CXX=${{ matrix.cxx }} + + - name: Ad-hoc sign macOS binary + if: startsWith(matrix.os, 'macos') + run: codesign --sign - --force build/c/codebase-memory-mcp + + - name: Archive standard binary + run: | + cp LICENSE install.sh build/c/ + tar -czf codebase-memory-mcp-${{ matrix.goos }}-${{ matrix.goarch }}.tar.gz \ + -C build/c codebase-memory-mcp LICENSE install.sh + + - name: Build UI binary + run: scripts/build.sh --with-ui --version ${{ inputs.version }} CC=${{ matrix.cc }} CXX=${{ matrix.cxx }} + + - name: Ad-hoc sign macOS UI binary + if: startsWith(matrix.os, 'macos') + run: codesign --sign - --force build/c/codebase-memory-mcp + + - name: Frontend integrity scan (post-build dist/) + if: matrix.goos == 'linux' && matrix.goarch == 'amd64' + run: scripts/security-ui.sh + + - name: Archive UI binary + run: | + cp LICENSE install.sh build/c/ + tar -czf codebase-memory-mcp-ui-${{ matrix.goos }}-${{ matrix.goarch }}.tar.gz \ + -C build/c codebase-memory-mcp LICENSE install.sh + + - uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4 + with: + name: binaries-${{ matrix.goos }}-${{ matrix.goarch }} + path: "*.tar.gz" + + build-windows: + needs: [test-unix, test-windows] + runs-on: windows-latest + steps: + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 + + - uses: msys2/setup-msys2@4f806de0a5a7294ffabaff804b38a9b435a73bda # v2 + with: + msystem: CLANG64 + path-type: inherit + install: >- + mingw-w64-clang-x86_64-clang + mingw-w64-clang-x86_64-zlib + make + zip + + - uses: actions/setup-node@53b83947a5a98c8d113130e565377fae1a50d02f # v6.3.0 + with: + node-version: "22" + + - name: Build standard binary + shell: msys2 {0} + run: scripts/build.sh --version ${{ inputs.version }} CC=clang CXX=clang++ + + - name: Archive standard binary + shell: msys2 {0} + run: | + BIN=build/c/codebase-memory-mcp + [ -f "${BIN}.exe" ] && BIN="${BIN}.exe" + cp "$BIN" codebase-memory-mcp.exe + zip 
codebase-memory-mcp-windows-amd64.zip codebase-memory-mcp.exe LICENSE install.ps1 + + - name: Build UI binary + shell: msys2 {0} + run: scripts/build.sh --with-ui --version ${{ inputs.version }} CC=clang CXX=clang++ + + - name: Archive UI binary + shell: msys2 {0} + run: | + BIN=build/c/codebase-memory-mcp + [ -f "${BIN}.exe" ] && BIN="${BIN}.exe" + cp "$BIN" codebase-memory-mcp.exe + zip codebase-memory-mcp-ui-windows-amd64.zip codebase-memory-mcp.exe LICENSE install.ps1 + + - uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4 + with: + name: binaries-windows-amd64 + path: "*.zip" + + # ── Step 4: Smoke test every binary ───────────────────────── + smoke-unix: + needs: [build-unix] + strategy: + matrix: + include: + - os: ubuntu-latest + goos: linux + goarch: amd64 + - os: ubuntu-24.04-arm + goos: linux + goarch: arm64 + - os: macos-14 + goos: darwin + goarch: arm64 + - os: macos-15-intel + goos: darwin + goarch: amd64 + variant: [standard, ui] + runs-on: ${{ matrix.os }} + steps: + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 + + - uses: actions/download-artifact@d3f86a106a0bac45b974a628896c90dbdf5c8093 # v4 + with: + name: binaries-${{ matrix.goos }}-${{ matrix.goarch }} + + - name: Extract binary + run: | + SUFFIX=${{ matrix.variant == 'ui' && '-ui' || '' }} + tar -xzf codebase-memory-mcp${SUFFIX}-${{ matrix.goos }}-${{ matrix.goarch }}.tar.gz + chmod +x codebase-memory-mcp + + - name: Start artifact server for E2E smoke tests + run: | + mkdir -p /tmp/smoke-server + cp codebase-memory-mcp /tmp/smoke-server/ + OS=${{ matrix.goos }} + ARCH=${{ matrix.goarch }} + SUFFIX=${{ matrix.variant == 'ui' && '-ui' || '' }} + tar -czf "/tmp/smoke-server/codebase-memory-mcp${SUFFIX}-${OS}-${ARCH}.tar.gz" \ + -C /tmp/smoke-server codebase-memory-mcp + # Also serve under standard name so install.sh + update --standard work + if [ -n "$SUFFIX" ]; then + cp "/tmp/smoke-server/codebase-memory-mcp${SUFFIX}-${OS}-${ARCH}.tar.gz" \ 
+ "/tmp/smoke-server/codebase-memory-mcp-${OS}-${ARCH}.tar.gz" + fi + cd /tmp/smoke-server + sha256sum *.tar.gz > checksums.txt 2>/dev/null || shasum -a 256 *.tar.gz > checksums.txt + python3 -m http.server 18080 -d /tmp/smoke-server & + + - name: Smoke test (${{ matrix.variant }}, ${{ matrix.goos }}-${{ matrix.goarch }}) + run: scripts/smoke-test.sh ./codebase-memory-mcp + env: + SMOKE_DOWNLOAD_URL: http://localhost:18080 + + - name: Binary string audit (${{ matrix.goos }}-${{ matrix.goarch }}) + if: matrix.variant == 'standard' + run: scripts/security-strings.sh ./codebase-memory-mcp + + - name: Install output audit (${{ matrix.goos }}-${{ matrix.goarch }}) + if: matrix.variant == 'standard' + run: scripts/security-install.sh ./codebase-memory-mcp + + - name: Network egress test (${{ matrix.goos }}-${{ matrix.goarch }}) + if: matrix.variant == 'standard' + run: scripts/security-network.sh ./codebase-memory-mcp + + - name: MCP robustness test + if: matrix.variant == 'standard' && matrix.goos == 'linux' && matrix.goarch == 'amd64' + run: scripts/security-fuzz.sh ./codebase-memory-mcp + + - name: Fuzz testing (60s random input) + if: matrix.variant == 'standard' && matrix.goos == 'linux' && matrix.goarch == 'amd64' + run: scripts/security-fuzz-random.sh ./codebase-memory-mcp 60 + + # Native platform antivirus scan + - name: ClamAV scan (Linux) + if: matrix.variant == 'standard' && startsWith(matrix.os, 'ubuntu') + run: | + sudo apt-get update -qq && sudo apt-get install -y -qq clamav > /dev/null 2>&1 + # Ensure freshclam config has DatabaseMirror set + sudo sed -i 's/^Example/#Example/' /etc/clamav/freshclam.conf 2>/dev/null || true + grep -q "DatabaseMirror" /etc/clamav/freshclam.conf 2>/dev/null || \ + echo "DatabaseMirror database.clamav.net" | sudo tee -a /etc/clamav/freshclam.conf > /dev/null + sudo freshclam --quiet + echo "=== ClamAV scan ===" + clamscan --no-summary ./codebase-memory-mcp + echo "=== ClamAV: clean ===" + + - name: ClamAV scan (macOS) + if: 
matrix.variant == 'standard' && startsWith(matrix.os, 'macos') + run: | + brew install clamav > /dev/null 2>&1 + CLAMAV_ETC=$(brew --prefix)/etc/clamav + if [ ! -f "$CLAMAV_ETC/freshclam.conf" ]; then + cp "$CLAMAV_ETC/freshclam.conf.sample" "$CLAMAV_ETC/freshclam.conf" 2>/dev/null || true + sed -i '' 's/^Example/#Example/' "$CLAMAV_ETC/freshclam.conf" 2>/dev/null || true + echo "DatabaseMirror database.clamav.net" >> "$CLAMAV_ETC/freshclam.conf" + fi + # Download signatures (--no-warnings suppresses X509 store errors on macOS) + freshclam --quiet --no-warnings 2>/dev/null || freshclam --quiet 2>/dev/null || echo "WARNING: freshclam update failed, using bundled signatures" + echo "=== ClamAV scan (macOS) ===" + clamscan --no-summary ./codebase-memory-mcp + echo "=== ClamAV: clean ===" + + smoke-windows: + needs: [build-windows] + strategy: + matrix: + variant: [standard, ui] + runs-on: windows-latest + steps: + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 + + - uses: msys2/setup-msys2@4f806de0a5a7294ffabaff804b38a9b435a73bda # v2 + with: + msystem: CLANG64 + path-type: inherit + install: >- + mingw-w64-clang-x86_64-python3 + unzip + zip + coreutils + + - uses: actions/download-artifact@d3f86a106a0bac45b974a628896c90dbdf5c8093 # v4 + with: + name: binaries-windows-amd64 + + - name: Extract binary + shell: msys2 {0} + run: | + SUFFIX=${{ matrix.variant == 'ui' && '-ui' || '' }} + unzip -o "codebase-memory-mcp${SUFFIX}-windows-amd64.zip" + [ -n "$SUFFIX" ] && cp "codebase-memory-mcp${SUFFIX}.exe" codebase-memory-mcp.exe || true + + - name: Start artifact server for E2E smoke tests + shell: msys2 {0} + run: | + mkdir -p /tmp/smoke-server + cp codebase-memory-mcp.exe /tmp/smoke-server/codebase-memory-mcp.exe + SUFFIX=${{ matrix.variant == 'ui' && '-ui' || '' }} + cd /tmp/smoke-server + zip -q "codebase-memory-mcp${SUFFIX}-windows-amd64.zip" codebase-memory-mcp.exe + # Also serve under standard name + if [ -n "$SUFFIX" ]; then + cp 
"codebase-memory-mcp${SUFFIX}-windows-amd64.zip" "codebase-memory-mcp-windows-amd64.zip" + fi + sha256sum *.zip > checksums.txt + python3 -m http.server 18080 -d /tmp/smoke-server & + + - name: Smoke test (${{ matrix.variant }}, windows-amd64) + shell: msys2 {0} + run: scripts/smoke-test.sh ./codebase-memory-mcp.exe + env: + SMOKE_DOWNLOAD_URL: http://localhost:18080 + + - name: Binary string audit (windows-amd64) + if: matrix.variant == 'standard' + shell: msys2 {0} + run: scripts/security-strings.sh ./codebase-memory-mcp.exe + + - name: Install output audit (windows-amd64) + if: matrix.variant == 'standard' + shell: msys2 {0} + run: scripts/security-install.sh ./codebase-memory-mcp.exe + + # Windows Defender scan (includes ML heuristics — catches what VirusTotal misses) + - name: Windows Defender scan + if: matrix.variant == 'standard' + shell: pwsh + run: | + Write-Host "=== Windows Defender scan (with ML heuristics) ===" + # Update definitions first + & "C:\Program Files\Windows Defender\MpCmdRun.exe" -SignatureUpdate 2>$null + # Full scan of the binary + $result = & "C:\Program Files\Windows Defender\MpCmdRun.exe" -Scan -ScanType 3 -File "$PWD\codebase-memory-mcp.exe" -DisableRemediation + Write-Host $result + if ($LASTEXITCODE -ne 0) { + Write-Host "BLOCKED: Windows Defender flagged the binary!" 
+ Write-Host "Exit code: $LASTEXITCODE" + exit 1 + } + Write-Host "=== Windows Defender: clean ===" + + # ── Step 5a: Quick soak (parallel with smoke, per-platform) ──── + soak-quick: + if: ${{ inputs.soak_level != 'none' }} + needs: [build-unix] + runs-on: ${{ matrix.os }} + timeout-minutes: 30 + strategy: + fail-fast: false + matrix: + include: + - os: ubuntu-latest + goos: linux + goarch: amd64 + cc: gcc + cxx: g++ + - os: ubuntu-24.04-arm + goos: linux + goarch: arm64 + cc: gcc + cxx: g++ + - os: macos-14 + goos: darwin + goarch: arm64 + cc: cc + cxx: c++ + - os: macos-15-intel + goos: darwin + goarch: amd64 + cc: cc + cxx: c++ + steps: + - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4 + - name: Install deps (Linux) + if: startsWith(matrix.os, 'ubuntu') + run: sudo apt-get update && sudo apt-get install -y zlib1g-dev python3 git + - name: Build (release mode) + run: scripts/build.sh --version ${{ inputs.version }} CC=${{ matrix.cc }} CXX=${{ matrix.cxx }} + - name: Quick soak (10 min) + run: scripts/soak-test.sh build/c/codebase-memory-mcp 10 + - name: Upload soak metrics + if: always() + uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4 + with: + name: soak-quick-${{ matrix.goos }}-${{ matrix.goarch }} + path: soak-results/ + retention-days: 14 + + # ── Step 5a-win: Quick soak (Windows, separate job) ───────────── + soak-quick-windows: if: ${{ inputs.soak_level != 'none' }} - needs: [build] - uses: ./.github/workflows/_soak.yml - with: - duration_minutes: 10 - run_asan: ${{ inputs.soak_level == 'full' }} - version: ${{ inputs.version }} - - # ── 6. 
Create DRAFT release ─────────────────────────────────── + needs: [build-windows] + runs-on: windows-latest + timeout-minutes: 30 + steps: + - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4 + - uses: msys2/setup-msys2@4f806de0a5a7294ffabaff804b38a9b435a73bda # v2 + with: + msystem: CLANG64 + path-type: inherit + install: >- + mingw-w64-clang-x86_64-clang + mingw-w64-clang-x86_64-zlib + mingw-w64-clang-x86_64-python3 + make + git + coreutils + - name: Build (release mode) + shell: msys2 {0} + run: scripts/build.sh --version ${{ inputs.version }} CC=clang CXX=clang++ + - name: Quick soak (10 min) + shell: msys2 {0} + run: | + BIN=build/c/codebase-memory-mcp + [ -f "${BIN}.exe" ] && BIN="${BIN}.exe" + scripts/soak-test.sh "$BIN" 10 + - name: Upload soak metrics + if: always() + uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4 + with: + name: soak-quick-windows-amd64 + path: soak-results/ + retention-days: 14 + + # ── Step 5b: ASan soak (Linux + macOS, parallel with smoke) ──── + soak-asan: + if: ${{ inputs.soak_level == 'full' }} + needs: [build-unix] + runs-on: ${{ matrix.os }} + timeout-minutes: 45 + strategy: + fail-fast: false + matrix: + include: + - os: ubuntu-latest + goos: linux + goarch: amd64 + cc: gcc + cxx: g++ + - os: ubuntu-24.04-arm + goos: linux + goarch: arm64 + cc: gcc + cxx: g++ + - os: macos-14 + goos: darwin + goarch: arm64 + cc: cc + cxx: c++ + - os: macos-15-intel + goos: darwin + goarch: amd64 + cc: cc + cxx: c++ + steps: + - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4 + - name: Install deps (Linux) + if: startsWith(matrix.os, 'ubuntu') + run: sudo apt-get update && sudo apt-get install -y zlib1g-dev python3 git + - name: Build (ASan + LeakSanitizer) + run: | + SANITIZE="-fsanitize=address,undefined -fno-omit-frame-pointer" + scripts/build.sh --version ${{ inputs.version }} CC=${{ matrix.cc }} CXX=${{ matrix.cxx }} EXTRA_CFLAGS="$SANITIZE" EXTRA_LDFLAGS="$SANITIZE" + - 
name: ASan soak (15 min) + env: + ASAN_OPTIONS: "detect_leaks=1:halt_on_error=0:log_path=soak-results/asan" + run: scripts/soak-test.sh build/c/codebase-memory-mcp 15 + - name: Upload ASan soak metrics + if: always() + uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4 + with: + name: soak-asan-${{ matrix.goos }}-${{ matrix.goarch }} + path: soak-results/ + retention-days: 14 + + soak-asan-windows: + if: ${{ inputs.soak_level == 'full' }} + needs: [build-windows] + runs-on: windows-latest + timeout-minutes: 45 + steps: + - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4 + - uses: msys2/setup-msys2@4f806de0a5a7294ffabaff804b38a9b435a73bda # v2 + with: + msystem: CLANG64 + path-type: inherit + install: >- + mingw-w64-clang-x86_64-clang + mingw-w64-clang-x86_64-zlib + mingw-w64-clang-x86_64-python3 + make + git + coreutils + - name: Build (ASan, no LeakSan on Windows) + shell: msys2 {0} + run: | + SANITIZE="-fsanitize=address,undefined -fno-omit-frame-pointer" + scripts/build.sh --version ${{ inputs.version }} CC=clang CXX=clang++ EXTRA_CFLAGS="$SANITIZE" EXTRA_LDFLAGS="$SANITIZE" + - name: ASan soak (15 min, no leak detection) + shell: msys2 {0} + env: + ASAN_OPTIONS: "detect_leaks=0:halt_on_error=0:log_path=soak-results/asan" + run: | + BIN=build/c/codebase-memory-mcp + [ -f "${BIN}.exe" ] && BIN="${BIN}.exe" + scripts/soak-test.sh "$BIN" 15 + - name: Upload ASan soak metrics + if: always() + uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4 + with: + name: soak-asan-windows-amd64 + path: soak-results/ + retention-days: 14 + + # ── Step 6: Create DRAFT release (not public yet) ───────────── release-draft: - needs: [smoke, soak, lint] + needs: [smoke-unix, smoke-windows, security-static, codeql-gate, soak-quick, soak-quick-windows, soak-asan, soak-asan-windows] if: ${{ !cancelled() && !failure() }} runs-on: ubuntu-latest permissions: @@ -71,7 +702,7 @@ jobs: id-token: write attestations: write 
steps: - - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 - uses: actions/download-artifact@d3f86a106a0bac45b974a628896c90dbdf5c8093 # v4 with: @@ -83,15 +714,27 @@ jobs: - name: Generate checksums run: sha256sum *.tar.gz *.zip > checksums.txt - - name: Attest build provenance - uses: actions/attest-build-provenance@a2bbfa25375fe432b6a289bc6b6cd05ecd0c4c32 # v4.1.0 + # ── Artifact attestations (SLSA provenance) ────────────── + - name: Attest build provenance (tar.gz) + uses: actions/attest-build-provenance@e8998f949152b193b063cb0ec769d69d929409be # v2 + with: + subject-path: '*.tar.gz' + + - name: Attest build provenance (zip) + uses: actions/attest-build-provenance@e8998f949152b193b063cb0ec769d69d929409be # v2 + with: + subject-path: '*.zip' + + - name: Attest build provenance (checksums) + uses: actions/attest-build-provenance@e8998f949152b193b063cb0ec769d69d929409be # v2 with: - subject-path: '*.tar.gz,*.zip,checksums.txt' + subject-path: 'checksums.txt' + # ── SBOM generation (SPDX format) ────────────────────────── - name: Generate SBOM run: | python3 -c " - import json + import json, uuid sbom = { 'spdxVersion': 'SPDX-2.3', 'dataLicense': 'CC0-1.0', @@ -121,15 +764,17 @@ jobs: subject-path: '*.tar.gz' sbom-path: 'sbom.json' + # ── Sigstore cosign signing ────────────────────────────── - name: Install cosign uses: sigstore/cosign-installer@398d4b0eeef1380460a10c8013a76f728fb906ac # v3 - - name: Sign artifacts + - name: Sign release artifacts with cosign run: | for f in *.tar.gz *.zip checksums.txt; do cosign sign-blob --yes --bundle "${f}.bundle" "$f" done + # ── Create DRAFT release (not visible to users yet) ────── - name: Delete existing release if: ${{ inputs.replace }} env: @@ -157,17 +802,24 @@ jobs: body: ${{ inputs.release_notes || '' }} generate_release_notes: ${{ inputs.release_notes == '' }} - # ── 7. 
Verify + Publish ──────────────────────────────────────── + # ── Step 6: Verify draft release ───────────────────────────── + # Scans binaries with VirusTotal, runs OpenSSF Scorecard. + # If verification passes, appends results and publishes. + # If it fails, the draft stays unpublished. verify: needs: [release-draft] runs-on: ubuntu-latest permissions: contents: write steps: - - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 with: persist-credentials: false + # ── VirusTotal scan ────────────────────────────────────── + # Extract raw binaries from archives before scanning. + # VirusTotal may not unpack archives >3MB, so we scan the + # actual executables that users will run. - name: Download and extract release binaries env: GH_TOKEN: ${{ secrets.GITHUB_TOKEN }} @@ -175,35 +827,205 @@ jobs: run: | mkdir -p assets binaries gh release download "$VERSION" --dir assets --repo "$GITHUB_REPOSITORY" --pattern '*.tar.gz' --pattern '*.zip' + ls -la assets/ + + # Extract binaries from archives for scanning for f in assets/*.tar.gz; do NAME=$(basename "$f" .tar.gz) tar -xzf "$f" -C binaries/ 2>/dev/null || true - [ -f binaries/codebase-memory-mcp ] && mv binaries/codebase-memory-mcp "binaries/${NAME}" + # Rename to include platform for identification + if [ -f binaries/codebase-memory-mcp ]; then + mv binaries/codebase-memory-mcp "binaries/${NAME}" + fi done for f in assets/*.zip; do NAME=$(basename "$f" .zip) unzip -o "$f" -d binaries/ 2>/dev/null || true - [ -f binaries/codebase-memory-mcp.exe ] && mv binaries/codebase-memory-mcp.exe "binaries/${NAME}.exe" + if [ -f binaries/codebase-memory-mcp.exe ]; then + mv binaries/codebase-memory-mcp.exe "binaries/${NAME}.exe" + fi done - cp install.sh binaries/ 2>/dev/null || true - cp install.ps1 binaries/ 2>/dev/null || true + # Also include install scripts (users curl | sh these) + cp install.sh binaries/install.sh 2>/dev/null || 
true + cp install.ps1 binaries/install.ps1 2>/dev/null || true + + echo "=== Files for scanning ===" ls -la binaries/ - - name: VirusTotal scan + - name: Scan extracted binaries with VirusTotal uses: crazy-max/ghaction-virustotal@936d8c5c00afe97d3d9a1af26d017cfdf26800a2 # v5.0.0 id: virustotal with: vt_api_key: ${{ secrets.VIRUS_TOTAL_SCANNER_API_KEY }} - files: binaries/* + files: | + binaries/* - - name: Wait for VirusTotal results + # ── Wait for ALL VirusTotal engines to complete, then check ── + # The action outputs comma-separated "file=URL" pairs. + # URLs are /gui/file-analysis//detection — we extract the + # base64 analysis ID and poll /api/v3/analyses/ until completed. + - name: Check VirusTotal scan results (wait for 100% completion) env: VT_API_KEY: ${{ secrets.VIRUS_TOTAL_SCANNER_API_KEY }} VT_ANALYSIS: ${{ steps.virustotal.outputs.analysis }} - run: scripts/ci/check-virustotal.sh + run: | + echo "=== Waiting for VirusTotal scans to fully complete ===" + MIN_ENGINES=60 + rm -f /tmp/vt_gate_fail + + echo "$VT_ANALYSIS" | tr ',' '\n' | while IFS= read -r entry; do + [ -z "$entry" ] && continue + FILE=$(echo "$entry" | cut -d'=' -f1) + URL=$(echo "$entry" | cut -d'=' -f2-) + BASENAME=$(basename "$FILE") + + # Extract base64 analysis ID from URL: /gui/file-analysis//detection + ANALYSIS_ID=$(echo "$URL" | sed -n 's|.*/file-analysis/\([^/]*\)/.*|\1|p') + if [ -z "$ANALYSIS_ID" ]; then + echo "WARNING: Could not extract analysis ID from $URL" + # Try SHA256 fallback (older action versions use /gui/file/) + ANALYSIS_ID=$(echo "$URL" | grep -oE '[a-f0-9]{64}') + if [ -z "$ANALYSIS_ID" ]; then + echo "BLOCKED: Cannot parse VirusTotal URL: $URL" + echo "FAIL" >> /tmp/vt_gate_fail + continue + fi + fi + + # Poll /api/v3/analyses/ until status=completed (max 120 min) + SCAN_COMPLETE=false + for attempt in $(seq 1 720); do + RESULT=$(curl -sf --max-time 10 \ + -H "x-apikey: $VT_API_KEY" \ + "https://www.virustotal.com/api/v3/analyses/$ANALYSIS_ID" 2>/dev/null || 
echo "") + + if [ -z "$RESULT" ]; then + echo " $BASENAME: waiting (attempt $attempt)..." + sleep 10 + continue + fi + + STATS=$(echo "$RESULT" | python3 -c " + import json, sys + d = json.loads(sys.stdin.read()) + attrs = d.get('data', {}).get('attributes', {}) + status = attrs.get('status', 'queued') + stats = attrs.get('stats', {}) + malicious = stats.get('malicious', 0) + suspicious = stats.get('suspicious', 0) + undetected = stats.get('undetected', 0) + harmless = stats.get('harmless', 0) + total = sum(stats.values()) + completed = malicious + suspicious + undetected + harmless + print(f'{status},{malicious},{suspicious},{completed},{total}') + " 2>/dev/null || echo "queued,0,0,0,0") + + STATUS=$(echo "$STATS" | cut -d',' -f1) + MALICIOUS=$(echo "$STATS" | cut -d',' -f2) + SUSPICIOUS=$(echo "$STATS" | cut -d',' -f3) + COMPLETED=$(echo "$STATS" | cut -d',' -f4) + TOTAL=$(echo "$STATS" | cut -d',' -f5) - - name: Publish release + if [ "$STATUS" = "completed" ]; then + echo "$BASENAME: $MALICIOUS malicious, $SUSPICIOUS suspicious ($COMPLETED completed, $TOTAL total engines)" + + if [ "$MALICIOUS" -gt 0 ] || [ "$SUSPICIOUS" -gt 0 ]; then + echo "BLOCKED: $BASENAME flagged! See $URL" + echo "FAIL" >> /tmp/vt_gate_fail + fi + SCAN_COMPLETE=true + break + fi + + echo " $BASENAME: $STATUS (attempt $attempt)..." + sleep 10 + done + + if [ "$SCAN_COMPLETE" != "true" ]; then + # Script files (sh, ps1) are low-priority in VT queue — warn but don't block + echo "BLOCKED: $BASENAME scan did not complete within 120 minutes!" + echo "FAIL" >> /tmp/vt_gate_fail + fi + done + + if [ -f /tmp/vt_gate_fail ]; then + FAIL_COUNT=$(wc -l < /tmp/vt_gate_fail | tr -d ' ') + echo "" + echo "=== VIRUSTOTAL GATE FAILED ===" + echo "$FAIL_COUNT binary(ies) flagged or scan incomplete." + echo "Draft release will NOT be published. Investigate before retrying." 
+ exit 1 + fi + + echo "=== All binaries clean (all engines completed) ===" + + # ── OpenSSF Scorecard gate ────────────────────────────────── + # Fetch public score and block release if repo health degrades below threshold. + - name: OpenSSF Scorecard gate (minimum 4.0) + run: | + SCORE=$(curl -sf "https://api.scorecard.dev/projects/github.com/DeusData/codebase-memory-mcp" 2>/dev/null \ + | python3 -c "import json,sys; print(json.loads(sys.stdin.read()).get('score',0))" 2>/dev/null \ + || echo "0") + echo "OpenSSF Scorecard: $SCORE/10" + if python3 -c "exit(0 if float('$SCORE') >= 4.0 else 1)" 2>/dev/null; then + echo "=== Scorecard gate passed (>= 4.0) ===" + else + echo "BLOCKED: Scorecard $SCORE/10 is below minimum 4.0" + echo "Check https://scorecard.dev/viewer/?uri=github.com/DeusData/codebase-memory-mcp" + exit 1 + fi + + # ── Append results + publish ───────────────────────────── + - name: Append security verification and publish release env: + VT_ANALYSIS: ${{ steps.virustotal.outputs.analysis }} GH_TOKEN: ${{ secrets.GITHUB_TOKEN }} VERSION: ${{ inputs.version }} - run: gh release edit "$VERSION" --draft=false --repo "$GITHUB_REPOSITORY" + run: | + echo "=== Building security verification report ===" + + REPORT=$'---\n\n### Security Verification\n\n' + REPORT+=$'All release binaries have been independently verified:\n\n' + + # VirusTotal results (comma-separated "file=URL" pairs) + REPORT+=$'**VirusTotal** — scanned by 70+ antivirus engines:\n\n' + REPORT+=$'| Binary | Scan |\n|--------|------|\n' + echo "$VT_ANALYSIS" | tr ',' '\n' | while IFS= read -r entry; do + [ -z "$entry" ] && continue + FILE=$(echo "$entry" | cut -d'=' -f1) + URL=$(echo "$entry" | cut -d'=' -f2-) + BASENAME=$(basename "$FILE") + echo "| $BASENAME | [View Report]($URL) |" + done >> /tmp/vt_table + if [ -f /tmp/vt_table ]; then + REPORT+=$(cat /tmp/vt_table)$'\n' + rm -f /tmp/vt_table + fi + + # Build provenance + REPORT+=$'**Build Provenance (SLSA)** — cryptographic proof each 
binary was built by GitHub Actions from this repo:\n' + REPORT+=$'```\ngh attestation verify --repo DeusData/codebase-memory-mcp\n```\n\n' + + # Cosign + REPORT+=$'**Sigstore cosign** — keyless signature verification:\n' + REPORT+=$'```\ncosign verify-blob --bundle .bundle \n```\n\n' + + # Native AV scans + REPORT+=$'**Native antivirus scans** — all binaries passed these scans before this release was created (any detection would have blocked the release):\n' + REPORT+=$'- Windows: Windows Defender with ML heuristics (the same engine end users run)\n' + REPORT+=$'- Linux: ClamAV with daily signature updates\n' + REPORT+=$'- macOS: ClamAV with daily signature updates\n\n' + + # SBOM + REPORT+=$'**SBOM** — Software Bill of Materials (`sbom.json`) lists all vendored dependencies.\n\n' + + REPORT+=$'See [SECURITY.md](https://github.com/DeusData/codebase-memory-mcp/blob/main/SECURITY.md) for full details.\n' + + # Append to release notes + EXISTING=$(gh release view "$VERSION" --json body --jq '.body' --repo "$GITHUB_REPOSITORY") + printf '%s\n\n%s\n' "$EXISTING" "$REPORT" | gh release edit "$VERSION" --notes-file - --repo "$GITHUB_REPOSITORY" + + # ── Publish: promote draft to public release ───────── + gh release edit "$VERSION" --draft=false --repo "$GITHUB_REPOSITORY" + + echo "=== Release verified and published ===" diff --git a/.github/workflows/scorecard.yml b/.github/workflows/scorecard.yml index 15610e4..1b7d656 100644 --- a/.github/workflows/scorecard.yml +++ b/.github/workflows/scorecard.yml @@ -15,7 +15,7 @@ jobs: security-events: write id-token: write steps: - - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2 + - uses: actions/checkout@34e114876b0b11c390a56381ad16ebd13914f8d5 # v4 with: persist-credentials: false @@ -27,6 +27,6 @@ jobs: publish_results: true - name: Upload SARIF results - uses: github/codeql-action/upload-sarif@c10b8064de6f491fea524254123dbe5e09572f13 # v4 + uses: 
github/codeql-action/upload-sarif@38697555549f1db7851b81482ff19f1fa5c4fedc # v4 with: sarif_file: results.sarif diff --git a/Makefile.cbm b/Makefile.cbm index c432f7c..6c7453c 100644 --- a/Makefile.cbm +++ b/Makefile.cbm @@ -227,8 +227,8 @@ MIMALLOC_CFLAGS_TEST = -std=c11 -g -O1 -w \ # sqlite3 (vendored amalgamation — compiled ourselves for ASan instrumentation) SQLITE3_SRC = vendored/sqlite3/sqlite3.c -SQLITE3_CFLAGS = -std=c11 -O2 -w -DSQLITE_DQS=0 -DSQLITE_THREADSAFE=1 -SQLITE3_CFLAGS_TEST = -std=c11 -g -O1 -w -DSQLITE_DQS=0 -DSQLITE_THREADSAFE=1 +SQLITE3_CFLAGS = -std=c11 -O2 -w -DSQLITE_DQS=0 -DSQLITE_THREADSAFE=1 -DSQLITE_ENABLE_FTS5 +SQLITE3_CFLAGS_TEST = -std=c11 -g -O1 -w -DSQLITE_DQS=0 -DSQLITE_THREADSAFE=1 -DSQLITE_ENABLE_FTS5 # TRE regex (vendored, Windows only — POSIX uses system ) TRE_SRC = vendored/tre/tre_all.c diff --git a/src/mcp/mcp.c b/src/mcp/mcp.c index c4073e5..9a91b71 100644 --- a/src/mcp/mcp.c +++ b/src/mcp/mcp.c @@ -40,8 +40,11 @@ enum { #define SLEN(s) (sizeof(s) - 1) #include "mcp/mcp.h" #include "store/store.h" +#include #include "cypher/cypher.h" #include "pipeline/pipeline.h" +#include "pipeline/embedding.h" +#include "store/cross_repo.h" #include "cli/cli.h" #include "watcher/watcher.h" #include "foundation/mem.h" @@ -264,13 +267,24 @@ static const tool_def_t TOOLS[] = { {"search_graph", "Search the code knowledge graph for functions, classes, routes, and variables. Use INSTEAD " "OF grep/glob when finding code definitions, implementations, or relationships. 
Returns " - "precise results in one call.", - "{\"type\":\"object\",\"properties\":{\"project\":{\"type\":\"string\"},\"label\":{\"type\":" - "\"string\"},\"name_pattern\":{\"type\":\"string\"},\"qn_pattern\":{\"type\":\"string\"}," - "\"file_pattern\":{\"type\":\"string\"},\"relationship\":{\"type\":\"string\"},\"min_degree\":" - "{\"type\":\"integer\"},\"max_degree\":{\"type\":\"integer\"},\"exclude_entry_points\":{" - "\"type\":\"boolean\"},\"include_connected\":{\"type\":\"boolean\"},\"limit\":{\"type\":" - "\"integer\",\"description\":\"Max results. Default: " + "precise results in one call. Two modes: (1) query='search terms' for BM25 ranked full-text " + "search with structural boosting (recommended for discovery and conceptual search), " + "(2) name_pattern='regex' for exact pattern matching.", + "{\"type\":\"object\",\"properties\":{\"project\":{\"type\":\"string\"}," + "\"query\":{\"type\":\"string\",\"description\":\"Natural language or keyword search using " + "BM25 full-text ranking. Searches function names, class names, qualified names, and file " + "paths. Results ranked by relevance with structural boosting (Functions/Methods +10, " + "Routes +8, Classes +5). Filters out noise nodes (File/Folder/Module/Variable). " + "Example: 'session management' or 'error handling'. When provided, name_pattern is ignored.\"}," + "\"label\":{\"type\":\"string\"},\"name_pattern\":{\"type\":\"string\"}," + "\"qn_pattern\":{\"type\":\"string\"}," + "\"file_pattern\":{\"type\":\"string\"},\"relationship\":{\"type\":\"string\"}," + "\"min_degree\":{\"type\":\"integer\"},\"max_degree\":{\"type\":\"integer\"}," + "\"exclude_entry_points\":{\"type\":\"boolean\"},\"include_connected\":{\"type\":" + "\"boolean\"}," + "\"sort_by\":{\"type\":\"string\",\"description\":\"Sort by: relevance (default with " + "query), name, file_path\"}," + "\"limit\":{\"type\":\"integer\",\"description\":\"Max results. 
Default: " "unlimited\"},\"offset\":{\"type\":\"integer\",\"default\":0}},\"required\":[\"project\"]}"}, {"query_graph", @@ -363,6 +377,28 @@ static const tool_def_t TOOLS[] = { "{\"type\":\"object\",\"properties\":{\"traces\":{\"type\":\"array\",\"items\":{\"type\":" "\"object\"}},\"project\":{\"type\":" "\"string\"}},\"required\":[\"traces\",\"project\"]}"}, + + {"generate_embeddings", + "Generate semantic embeddings for code symbols via external embedding server. " + "Requires CBM_EMBEDDING_URL environment variable (e.g., http://localhost:11434/v1 for Ollama). " + "Embeddings enable hybrid BM25+vector search in search_graph.", + "{\"type\":\"object\",\"properties\":{\"project\":{\"type\":\"string\"}," + "\"force\":{\"type\":\"boolean\",\"default\":false,\"description\":" + "\"Re-generate all embeddings even if they already exist\"}},\"required\":[\"project\"]}"}, + + {"build_cross_repo_index", + "Build unified cross-repo index for cross-repository search, channel matching, and flow tracing. " + "Scans all indexed project databases and builds a _cross_repo.db with node stubs, channels, " + "and embeddings from all repos.", + "{\"type\":\"object\",\"properties\":{}}"}, + + {"trace_cross_repo", + "Trace message/event channels across repositories. Shows which services produce and consume " + "a specific channel, with file-level and function-level detail.", + "{\"type\":\"object\",\"properties\":{" + "\"channel\":{\"type\":\"string\",\"description\":\"Channel name to trace (partial match). 
" + "Omit to list all cross-repo channels.\"}," + "\"repo\":{\"type\":\"string\",\"description\":\"Filter to channels involving a specific repo.\"}}}"}, }; static const int TOOL_COUNT = sizeof(TOOLS) / sizeof(TOOLS[0]); @@ -1031,6 +1067,8 @@ static char *handle_search_graph(cbm_mcp_server_t *srv, const char *args) { return not_indexed; } + char *query = cbm_mcp_get_string_arg(args, "query"); + char *sort_by = cbm_mcp_get_string_arg(args, "sort_by"); char *label = cbm_mcp_get_string_arg(args, "label"); char *name_pattern = cbm_mcp_get_string_arg(args, "name_pattern"); char *qn_pattern = cbm_mcp_get_string_arg(args, "qn_pattern"); @@ -1043,6 +1081,110 @@ static char *handle_search_graph(cbm_mcp_server_t *srv, const char *args) { int min_degree = cbm_mcp_get_int_arg(args, "min_degree", CBM_NOT_FOUND); int max_degree = cbm_mcp_get_int_arg(args, "max_degree", CBM_NOT_FOUND); + /* BM25 FTS5 search path: when query is provided, use ranked full-text search + * instead of SQL LIKE patterns. camelCase splitting is done at index time. 
*/ + if (query && query[0]) { + struct sqlite3 *db = cbm_store_get_db(store); + if (!db) goto fallback_search; + + /* Tokenize query: split on whitespace, join with OR */ + char fts_query[1024]; + { + char tmp[1024]; + snprintf(tmp, sizeof(tmp), "%s", query); + int fq_len = 0; + char *tok = strtok(tmp, " \t\n"); + while (tok && fq_len < (int)sizeof(fts_query) - 20) { + if (fq_len > 0) fq_len += snprintf(fts_query + fq_len, + sizeof(fts_query) - (size_t)fq_len, " OR "); + fq_len += snprintf(fts_query + fq_len, + sizeof(fts_query) - (size_t)fq_len, "%s", tok); + tok = strtok(NULL, " \t\n"); + } + fts_query[fq_len] = '\0'; + } + + /* BM25 query with label-type structural boosting */ + char sql[4096]; + snprintf(sql, sizeof(sql), + "SELECT n.id, n.project, n.label, n.name, n.qualified_name, " + "n.file_path, n.start_line, n.end_line, n.properties, " + "(SELECT COUNT(*) FROM edges e WHERE e.target_id = n.id AND e.type = 'CALLS') AS in_deg, " + "(SELECT COUNT(*) FROM edges e WHERE e.source_id = n.id AND e.type = 'CALLS') AS out_deg, " + "(bm25(nodes_fts) " + " - CASE WHEN n.label IN ('Function','Method') THEN 10.0 " + " WHEN n.label IN ('Class','Interface','Type') THEN 5.0 " + " WHEN n.label = 'Route' THEN 8.0 " + " ELSE 0.0 END) AS rank " + "FROM nodes_fts " + "JOIN nodes n ON n.id = nodes_fts.rowid " + "WHERE nodes_fts MATCH ?1" + " AND n.label NOT IN ('File','Folder','Module','Section','Variable','Project')" + " AND n.project = ?2" + " ORDER BY rank LIMIT ?3 OFFSET ?4"); + + sqlite3_stmt *stmt = NULL; + if (sqlite3_prepare_v2(db, sql, -1, &stmt, NULL) != SQLITE_OK) goto fallback_search; + + sqlite3_bind_text(stmt, 1, fts_query, -1, SQLITE_TRANSIENT); + sqlite3_bind_text(stmt, 2, project, -1, SQLITE_TRANSIENT); + sqlite3_bind_int(stmt, 3, limit > 0 ? 
limit : 100); + sqlite3_bind_int(stmt, 4, offset); + + /* Count total matches */ + int total = 0; + { + char count_sql[1024]; + snprintf(count_sql, sizeof(count_sql), + "SELECT COUNT(*) FROM nodes_fts JOIN nodes n ON n.id = nodes_fts.rowid " + "WHERE nodes_fts MATCH ?1 AND n.project = ?2 " + "AND n.label NOT IN ('File','Folder','Module','Section','Variable','Project')"); + sqlite3_stmt *cs = NULL; + if (sqlite3_prepare_v2(db, count_sql, -1, &cs, NULL) == SQLITE_OK) { + sqlite3_bind_text(cs, 1, fts_query, -1, SQLITE_TRANSIENT); + sqlite3_bind_text(cs, 2, project, -1, SQLITE_TRANSIENT); + if (sqlite3_step(cs) == SQLITE_ROW) total = sqlite3_column_int(cs, 0); + sqlite3_finalize(cs); + } + } + + yyjson_mut_doc *doc = yyjson_mut_doc_new(NULL); + yyjson_mut_val *root = yyjson_mut_obj(doc); + yyjson_mut_doc_set_root(doc, root); + yyjson_mut_obj_add_int(doc, root, "total", total); + yyjson_mut_obj_add_str(doc, root, "search_mode", "bm25"); + + yyjson_mut_val *results = yyjson_mut_arr(doc); + while (sqlite3_step(stmt) == SQLITE_ROW) { + yyjson_mut_val *item = yyjson_mut_obj(doc); + yyjson_mut_obj_add_strcpy(doc, item, "name", + (const char *)sqlite3_column_text(stmt, 3)); + yyjson_mut_obj_add_strcpy(doc, item, "qualified_name", + (const char *)sqlite3_column_text(stmt, 4)); + yyjson_mut_obj_add_strcpy(doc, item, "label", + (const char *)sqlite3_column_text(stmt, 2)); + yyjson_mut_obj_add_strcpy(doc, item, "file_path", + (const char *)sqlite3_column_text(stmt, 5)); + yyjson_mut_obj_add_int(doc, item, "start_line", sqlite3_column_int(stmt, 6)); + yyjson_mut_obj_add_int(doc, item, "end_line", sqlite3_column_int(stmt, 7)); + yyjson_mut_obj_add_int(doc, item, "in_degree", sqlite3_column_int(stmt, 9)); + yyjson_mut_obj_add_int(doc, item, "out_degree", sqlite3_column_int(stmt, 10)); + yyjson_mut_arr_add_val(results, item); + } + sqlite3_finalize(stmt); + + yyjson_mut_obj_add_val(doc, root, "results", results); + char *json = yy_doc_to_str(doc); + yyjson_mut_doc_free(doc); + 
free(project); free(label); free(name_pattern); free(qn_pattern); + free(file_pattern); free(query); free(sort_by); free(relationship); + char *result = cbm_mcp_text_result(json, false); + free(json); + return result; + } +fallback_search: + (void)sort_by; /* used in BM25 path, suppressed in regex path */ + if (relationship && !validate_edge_type(relationship)) { free(project); free(label); @@ -1050,6 +1192,8 @@ static char *handle_search_graph(cbm_mcp_server_t *srv, const char *args) { free(qn_pattern); free(file_pattern); free(relationship); + free(query); + free(sort_by); return cbm_mcp_text_result("relationship must be uppercase letters and underscores", true); } @@ -1109,6 +1253,8 @@ static char *handle_search_graph(cbm_mcp_server_t *srv, const char *args) { free(qn_pattern); free(file_pattern); free(relationship); + free(query); + free(sort_by); char *result = cbm_mcp_text_result(json, false); free(json); @@ -3033,6 +3179,126 @@ static char *handle_ingest_traces(cbm_mcp_server_t *srv, const char *args) { /* ── Tool dispatch ────────────────────────────────────────────── */ +/* ── generate_embeddings handler ─────────────────────────────── */ + +static char *handle_generate_embeddings(cbm_mcp_server_t *srv, const char *args) { + char *project = cbm_mcp_get_string_arg(args, "project"); + cbm_store_t *store = resolve_store(srv, project); + REQUIRE_STORE(store, project); + + if (!cbm_embedding_is_configured()) { + free(project); + return cbm_mcp_text_result( + "{\"error\":\"CBM_EMBEDDING_URL not set. Set to an OpenAI-compatible endpoint.\"}", true); + } + + bool force = cbm_mcp_get_bool_arg(args, "force"); + int existing = cbm_store_count_embeddings(store, project); + int generated = cbm_embedding_generate_for_project(store, project, force); + + yyjson_mut_doc *doc = yyjson_mut_doc_new(NULL); + yyjson_mut_val *root = yyjson_mut_obj(doc); + yyjson_mut_doc_set_root(doc, root); + yyjson_mut_obj_add_str(doc, root, "status", generated >= 0 ? 
"success" : "error"); + yyjson_mut_obj_add_int(doc, root, "generated", generated >= 0 ? generated : 0); + yyjson_mut_obj_add_int(doc, root, "existing_before", existing); + yyjson_mut_obj_add_int(doc, root, "total_embeddings", cbm_store_count_embeddings(store, project)); + + char *json = yy_doc_to_str(doc); + yyjson_mut_doc_free(doc); + free(project); + char *result = cbm_mcp_text_result(json, generated < 0); + free(json); + return result; +} + +/* ── build_cross_repo_index handler ─────────────────────────── */ + +static char *handle_build_cross_repo_index(cbm_mcp_server_t *srv, const char *args) { + (void)srv; (void)args; + cbm_cross_repo_stats_t stats = cbm_cross_repo_build(); + + yyjson_mut_doc *doc = yyjson_mut_doc_new(NULL); + yyjson_mut_val *root = yyjson_mut_obj(doc); + yyjson_mut_doc_set_root(doc, root); + yyjson_mut_obj_add_str(doc, root, "status", stats.repos_scanned >= 0 ? "success" : "error"); + yyjson_mut_obj_add_int(doc, root, "repos_scanned", stats.repos_scanned); + yyjson_mut_obj_add_int(doc, root, "nodes_copied", stats.nodes_copied); + yyjson_mut_obj_add_int(doc, root, "channels_copied", stats.channels_copied); + yyjson_mut_obj_add_int(doc, root, "embeddings_copied", stats.embeddings_copied); + yyjson_mut_obj_add_int(doc, root, "cross_repo_channel_matches", stats.cross_repo_matches); + yyjson_mut_obj_add_real(doc, root, "build_time_ms", stats.build_time_ms); + + char *json = yy_doc_to_str(doc); + yyjson_mut_doc_free(doc); + char *result = cbm_mcp_text_result(json, stats.repos_scanned < 0); + free(json); + return result; +} + +/* ── trace_cross_repo handler ────────────────────────────────── */ + +static char *handle_trace_cross_repo(cbm_mcp_server_t *srv, const char *args) { + (void)srv; + char *channel = cbm_mcp_get_string_arg(args, "channel"); + + cbm_cross_repo_t *cr = cbm_cross_repo_open(); + if (!cr) { + free(channel); + return cbm_mcp_text_result( + "{\"error\":\"Cross-repo index not built. 
Run build_cross_repo_index first.\"}", true); + } + + cbm_cross_repo_info_t info = {0}; + cbm_cross_repo_get_info(cr, &info); + + cbm_cross_channel_match_t *matches = NULL; + int match_count = 0; + cbm_cross_repo_match_channels(cr, channel, &matches, &match_count); + + yyjson_mut_doc *doc = yyjson_mut_doc_new(NULL); + yyjson_mut_val *root = yyjson_mut_obj(doc); + yyjson_mut_doc_set_root(doc, root); + yyjson_mut_obj_add_int(doc, root, "total_repos", info.total_repos); + yyjson_mut_obj_add_int(doc, root, "total_cross_repo_channels", info.cross_repo_channel_count); + yyjson_mut_obj_add_int(doc, root, "matches", match_count); + + yyjson_mut_val *arr = yyjson_mut_arr(doc); + for (int i = 0; i < match_count; i++) { + cbm_cross_channel_match_t *m = &matches[i]; + yyjson_mut_val *item = yyjson_mut_obj(doc); + yyjson_mut_obj_add_strcpy(doc, item, "channel", m->channel_name ? m->channel_name : ""); + yyjson_mut_obj_add_strcpy(doc, item, "transport", m->transport ? m->transport : ""); + + yyjson_mut_val *emit = yyjson_mut_obj(doc); + yyjson_mut_obj_add_strcpy(doc, emit, "project", m->emit_project ? m->emit_project : ""); + yyjson_mut_obj_add_strcpy(doc, emit, "file", m->emit_file ? m->emit_file : ""); + yyjson_mut_obj_add_strcpy(doc, emit, "function", m->emit_function ? m->emit_function : ""); + yyjson_mut_obj_add_val(doc, item, "emitter", emit); + + yyjson_mut_val *listen = yyjson_mut_obj(doc); + yyjson_mut_obj_add_strcpy(doc, listen, "project", m->listen_project ? m->listen_project : ""); + yyjson_mut_obj_add_strcpy(doc, listen, "file", m->listen_file ? m->listen_file : ""); + yyjson_mut_obj_add_strcpy(doc, listen, "function", m->listen_function ? 
m->listen_function : ""); + yyjson_mut_obj_add_val(doc, item, "listener", listen); + + yyjson_mut_arr_add_val(arr, item); + } + yyjson_mut_obj_add_val(doc, root, "channel_flows", arr); + + char *json = yy_doc_to_str(doc); + yyjson_mut_doc_free(doc); + cbm_cross_channel_free(matches, match_count); + cbm_cross_repo_info_free(&info); + cbm_cross_repo_close(cr); + free(channel); + char *result = cbm_mcp_text_result(json, false); + free(json); + return result; +} + +/* ── Tool dispatch ────────────────────────────────────────────── */ + char *cbm_mcp_handle_tool(cbm_mcp_server_t *srv, const char *tool_name, const char *args_json) { if (!tool_name) { return cbm_mcp_text_result("missing tool name", true); @@ -3082,6 +3348,15 @@ char *cbm_mcp_handle_tool(cbm_mcp_server_t *srv, const char *tool_name, const ch if (strcmp(tool_name, "ingest_traces") == 0) { return handle_ingest_traces(srv, args_json); } + if (strcmp(tool_name, "generate_embeddings") == 0) { + return handle_generate_embeddings(srv, args_json); + } + if (strcmp(tool_name, "build_cross_repo_index") == 0) { + return handle_build_cross_repo_index(srv, args_json); + } + if (strcmp(tool_name, "trace_cross_repo") == 0) { + return handle_trace_cross_repo(srv, args_json); + } char msg[CBM_SZ_256]; snprintf(msg, sizeof(msg), "unknown tool: %s", tool_name); return cbm_mcp_text_result(msg, true); diff --git a/src/pipeline/pipeline.c b/src/pipeline/pipeline.c index dd88a82..fc0b152 100644 --- a/src/pipeline/pipeline.c +++ b/src/pipeline/pipeline.c @@ -794,11 +794,19 @@ int cbm_pipeline_run(cbm_pipeline_t *p) { cbm_store_t *post_store = cbm_store_open_path(db_path); if (post_store) { - /* FTS5 backfill with camelCase splitting */ - cbm_store_exec(post_store, "DELETE FROM nodes_fts;"); + /* FTS5 backfill. Contentless FTS5 requires 'delete-all' command. + * Try camelCase splitting first, fall back to plain names. 
*/ cbm_store_exec(post_store, - "INSERT INTO nodes_fts(rowid, name, qualified_name, label, file_path) " - "SELECT id, cbm_camel_split(name), qualified_name, label, file_path FROM nodes;"); + "INSERT INTO nodes_fts(nodes_fts) VALUES('delete-all');"); + if (cbm_store_exec(post_store, + "INSERT INTO nodes_fts(rowid, name, qualified_name, label, file_path) " + "SELECT id, cbm_camel_split(name), qualified_name, label, file_path " + "FROM nodes;") != 0) { + /* Fallback: plain names without camelCase splitting */ + cbm_store_exec(post_store, + "INSERT INTO nodes_fts(rowid, name, qualified_name, label, file_path) " + "SELECT id, name, qualified_name, label, file_path FROM nodes;"); + } /* Embedding generation (if configured) */ if (cbm_embedding_is_configured()) { diff --git a/src/pipeline/pipeline_incremental.c b/src/pipeline/pipeline_incremental.c index 0768f8c..abaf940 100644 --- a/src/pipeline/pipeline_incremental.c +++ b/src/pipeline/pipeline_incremental.c @@ -271,10 +271,17 @@ static void dump_and_persist(cbm_gbuf_t *gbuf, const char *db_path, const char * persist_hashes(hash_store, project, files, file_count); /* Rebuild FTS5 index: btree dump bypasses triggers */ - cbm_store_exec(hash_store, "DELETE FROM nodes_fts;"); + /* FTS5 rebuild — contentless requires 'delete-all' */ cbm_store_exec(hash_store, - "INSERT INTO nodes_fts(rowid, name, qualified_name, label, file_path) " - "SELECT id, cbm_camel_split(name), qualified_name, label, file_path FROM nodes;"); + "INSERT INTO nodes_fts(nodes_fts) VALUES('delete-all');"); + if (cbm_store_exec(hash_store, + "INSERT INTO nodes_fts(rowid, name, qualified_name, label, file_path) " + "SELECT id, cbm_camel_split(name), qualified_name, label, file_path " + "FROM nodes;") != 0) { + cbm_store_exec(hash_store, + "INSERT INTO nodes_fts(rowid, name, qualified_name, label, file_path) " + "SELECT id, name, qualified_name, label, file_path FROM nodes;"); + } cbm_store_close(hash_store); } From 465527ef8e8393d8777d79e6291deb6624d13e6a 
Mon Sep 17 00:00:00 2001 From: Your Name Date: Sat, 4 Apr 2026 23:45:00 -0400 Subject: [PATCH 3/4] fix(csharp): explicit base_list handler for C# class inheritance extraction MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit The fallback base_types[] approach (find_base_from_children) includes the ':' separator in the extracted text for C# base_list nodes, producing names like ': IExamService' instead of 'IExamService'. The registry lookup fails because no node has a colon-prefixed name. Fix: add explicit C# base_list handler that iterates named children of the base_list node, extracting identifier/generic_name/qualified_name text directly. Strips generic type args (List → List). Tested: 0 → 5 INHERITS→Interface edges on C# repo. --- internal/cbm/extract_defs.c | 42 ++++++++++++++++++++++++++++++++++++- 1 file changed, 41 insertions(+), 1 deletion(-) diff --git a/internal/cbm/extract_defs.c b/internal/cbm/extract_defs.c index cc930f5..f197eb2 100644 --- a/internal/cbm/extract_defs.c +++ b/internal/cbm/extract_defs.c @@ -944,6 +944,47 @@ static const char **extract_base_classes(CBMArena *a, TSNode node, const char *s } } + // C# specific: handle base_list node (contains base types after ':') + { + uint32_t count = ts_node_child_count(node); + for (uint32_t i = 0; i < count; i++) { + TSNode child = ts_node_child(node, i); + if (strcmp(ts_node_type(child), "base_list") == 0) { + const char *bases[16]; + int base_count = 0; + uint32_t bnc = ts_node_named_child_count(child); + for (uint32_t bi = 0; bi < bnc && base_count < MAX_BASES_MINUS_1; bi++) { + TSNode bc = ts_node_named_child(child, bi); + const char *bk = ts_node_type(bc); + char *text = NULL; + if (strcmp(bk, "identifier") == 0 || strcmp(bk, "generic_name") == 0 || + strcmp(bk, "qualified_name") == 0) { + text = cbm_node_text(a, bc, source); + } else { + TSNode inner = ts_node_named_child(bc, 0); + if (!ts_node_is_null(inner)) { + text = cbm_node_text(a, inner, source); + 
} + } + if (text && text[0]) { + char *angle = strchr(text, '<'); + if (angle) *angle = '\0'; + bases[base_count++] = text; + } + } + if (base_count > 0) { + const char **result = + (const char **)cbm_arena_alloc(a, (base_count + 1) * sizeof(const char *)); + if (result) { + for (int j = 0; j < base_count; j++) result[j] = bases[j]; + result[base_count] = NULL; + return result; + } + } + } + } + } + // Fallback: search for common base class node types as children static const char *base_types[] = {"superclass", "superinterfaces", @@ -955,7 +996,6 @@ static const char **extract_base_classes(CBMArena *a, TSNode node, const char *s "implements_clause", "argument_list", "inheritance_specifier", - "base_list", /* C# class Foo : IBar */ NULL}; return find_base_from_children(a, node, source, base_types); } From 7829b5e2c3f1c59dd86d0784a5af1624ff3e6b6b Mon Sep 17 00:00:00 2001 From: Your Name Date: Mon, 6 Apr 2026 12:09:01 -0400 Subject: [PATCH 4/4] fix(mcp+cypher): short-name project resolution + Cypher quality improvements MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Four fixes addressing composite tool failures and Cypher dialect gaps: 1. Short-name project resolution in resolve_store(): When exact .db file lookup fails, scans the cache directory for a file ending with '-{name}.db'. If exactly one match, recursively resolves with the full project name. Also adds suffix-match fallback to verify_project_indexed(). Plus resolved_project() helper to ensure BM25 search and Cypher queries use the resolved name. Before: search_graph(project='myrepo') → 'project not found' After: search_graph(project='myrepo') → resolves to full key, works 2. SQL-style -- comments in Cypher lexer: Added '--' as single-line comment (same as '//'). Skips to EOL. Before: '-- comment' caused parse error (two TOK_DASH tokens) After: '-- comment' silently skipped 3. 
Virtual in_degree/out_degree properties in Cypher node accessor: Enables dead code detection via Cypher: MATCH (n:Function) WHERE n.in_degree = '0' RETURN n.name Uses file-static store pointer set during query execution to compute degree on demand via cbm_store_node_degree(). 4. Regex matching in inline Cypher property filters: MATCH (n {file_path: '.*test.*'}) now uses regex when the value contains regex metacharacters. Falls back to exact strcmp otherwise. Uses cbm_regcomp/cbm_regexec (POSIX ERE). All 4 fixes tested on indexed repo with short project name. --- src/cypher/cypher.c | 45 ++++++++++++++++++++++++++-- src/mcp/mcp.c | 71 +++++++++++++++++++++++++++++++++++++++++++-- 2 files changed, 111 insertions(+), 5 deletions(-) diff --git a/src/cypher/cypher.c b/src/cypher/cypher.c index 6aedeb9..941a753 100644 --- a/src/cypher/cypher.c +++ b/src/cypher/cypher.c @@ -326,6 +326,13 @@ static bool lex_skip_whitespace_comments(const char *input, int len, int *i) { } return true; } + /* SQL-style -- single-line comment */ + if (*i + SKIP_ONE < len && input[*i] == '-' && input[*i + SKIP_ONE] == '-') { + while (*i < len && input[*i] != '\n') { + (*i)++; + } + return true; + } if (*i + SKIP_ONE < len && input[*i] == '/' && input[*i + SKIP_ONE] == '*') { *i += PAIR_LEN; while (*i + SKIP_ONE < len && !(input[*i] == '*' && input[*i + SKIP_ONE] == '/')) { @@ -1641,6 +1648,10 @@ typedef struct { int edge_var_count; } binding_t; +/* File-static store for degree queries in node_prop. + * Set at the start of execute_single(), cleared after. */ +static cbm_store_t *_cyp_exec_store = NULL; + /* Get node property by name */ static const char *node_prop(const cbm_node_t *n, const char *prop) { if (!n || !prop) { @@ -1669,6 +1680,16 @@ static const char *node_prop(const cbm_node_t *n, const char *prop) { snprintf(buf, sizeof(buf), "%d", n->end_line); return buf; } + /* Virtual computed properties: in_degree, out_degree (CALLS edges). 
+ * Enables Cypher: WHERE n.in_degree = 0 (dead code detection). */ + if ((strcmp(prop, "in_degree") == 0 || strcmp(prop, "out_degree") == 0) && _cyp_exec_store) { + int in_deg = 0, out_deg = 0; + cbm_store_node_degree(_cyp_exec_store, n->id, &in_deg, &out_deg); + static char deg_buf[CBM_SZ_32]; + snprintf(deg_buf, sizeof(deg_buf), "%d", + strcmp(prop, "in_degree") == 0 ? in_deg : out_deg); + return deg_buf; + } return ""; } @@ -1992,11 +2013,30 @@ static bool eval_where(const cbm_where_clause_t *w, binding_t *b) { } /* Check inline property filters */ +/* Check if a string value looks like a regex pattern. */ +static bool looks_like_regex(const char *s) { + return s && (strchr(s, '*') || strchr(s, '?') || strchr(s, '[') || + strchr(s, '(') || strchr(s, '|') || strchr(s, '^') || + strchr(s, '$') || strstr(s, ".*") || strstr(s, ".+")); +} + static bool check_inline_props(const cbm_node_t *n, const cbm_prop_filter_t *props, int count) { for (int i = 0; i < count; i++) { const char *actual = node_prop(n, props[i].key); - if (strcmp(actual, props[i].value) != 0) { - return false; + /* If the value looks like a regex, use regex matching */ + if (looks_like_regex(props[i].value)) { + cbm_regex_t re; + if (cbm_regcomp(&re, props[i].value, + CBM_REG_EXTENDED | CBM_REG_NOSUB) == 0) { + bool match = cbm_regexec(&re, actual, 0, NULL, 0) == 0; + cbm_regfree(&re); + if (!match) return false; + } else { + /* Regex compile failed — fall back to exact match */ + if (strcmp(actual, props[i].value) != 0) return false; + } + } else { + if (strcmp(actual, props[i].value) != 0) return false; } } return true; @@ -3272,6 +3312,7 @@ static void execute_return_clause(cbm_query_t *q, cbm_return_clause_t *ret, bind static int execute_single(cbm_store_t *store, cbm_query_t *q, const char *project, int max_rows, result_builder_t *rb) { + _cyp_exec_store = store; /* enable in_degree/out_degree in node_prop */ cbm_pattern_t *pat0 = &q->patterns[0]; /* Step 1: Scan initial nodes */ diff --git 
a/src/mcp/mcp.c b/src/mcp/mcp.c index 9a91b71..1bfec9a 100644 --- a/src/mcp/mcp.c +++ b/src/mcp/mcp.c @@ -728,6 +728,44 @@ static cbm_store_t *resolve_store(cbm_mcp_server_t *srv, const char *project) { char path[CBM_SZ_1K]; project_db_path(project, path, sizeof(path)); srv->store = cbm_store_open_path_query(path); + + /* Short-name resolution: if exact match fails, scan cache dir for a + * .db file whose name ends with "-{project}.db". This allows callers + * to use a short name instead of the full slugified path key. + * Only resolves when exactly one candidate matches (no ambiguity). */ + if (!srv->store) { + char suffix[CBM_SZ_512]; + snprintf(suffix, sizeof(suffix), "-%s.db", project); + size_t suffix_len = strlen(suffix); + + char dir_path[CBM_SZ_1K]; + cache_dir(dir_path, sizeof(dir_path)); + cbm_dir_t *d = cbm_opendir(dir_path); + if (d) { + char resolved[CBM_SZ_1K] = ""; + int matches = 0; + cbm_dirent_t *ent; + while ((ent = cbm_readdir(d)) != NULL) { + size_t name_len = strlen(ent->name); + if (name_len > suffix_len && + strcmp(ent->name + name_len - suffix_len, suffix) == 0) { + /* Strip .db extension to get the project name */ + snprintf(resolved, sizeof(resolved), "%.*s", + (int)(name_len - 3), ent->name); + matches++; + } + } + cbm_closedir(d); + + if (matches == 1 && resolved[0]) { + /* Retry with the resolved full project name. + * Recursive call ensures integrity check and project + * verification use the correct (resolved) project name. */ + return resolve_store(srv, resolved); + } + } + } + if (srv->store) { /* Check DB integrity — auto-clean corrupt databases */ if (!cbm_store_check_integrity(srv->store)) { @@ -765,6 +803,13 @@ static cbm_store_t *resolve_store(cbm_mcp_server_t *srv, const char *project) { return srv->store; } +/* After resolve_store, the resolved project name may differ from the input + * (e.g., "myrepo" resolved to "path-to-myrepo"). + * This helper returns the resolved name, or the original if no resolution. 
*/ +static const char *resolved_project(cbm_mcp_server_t *srv, const char *project) { + return (srv && srv->current_project) ? srv->current_project : project; +} + /* Scan cache dir for .db files, writing comma-separated quoted names into out. * Returns the number of projects found. */ static int collect_db_project_names(const char *dir_path, char *out, size_t out_sz) { @@ -941,6 +986,26 @@ static char *handle_list_projects(cbm_mcp_server_t *srv, const char *args) { static char *verify_project_indexed(cbm_store_t *store, const char *project) { cbm_project_t proj_check = {0}; if (cbm_store_get_project(store, project, &proj_check) != CBM_STORE_OK) { + /* Short-name fallback: scan projects table for suffix match. + * This handles the case where resolve_store resolved a short name to + * the full project key, but the caller still passes the short name here. */ + struct sqlite3 *db = cbm_store_get_db(store); + if (db) { + char like_pattern[CBM_SZ_512]; + snprintf(like_pattern, sizeof(like_pattern), "%%-%s", project); + sqlite3_stmt *s = NULL; + if (sqlite3_prepare_v2(db, + "SELECT name FROM projects WHERE name LIKE ?1 LIMIT 1", + -1, &s, NULL) == SQLITE_OK) { + sqlite3_bind_text(s, 1, like_pattern, -1, SQLITE_TRANSIENT); + if (sqlite3_step(s) == SQLITE_ROW) { + /* Found via suffix match — project is indexed */ + sqlite3_finalize(s); + return NULL; + } + sqlite3_finalize(s); + } + } return cbm_mcp_text_result( "{\"error\":\"project not indexed — run index_repository first\"}", true); } @@ -1127,7 +1192,7 @@ static char *handle_search_graph(cbm_mcp_server_t *srv, const char *args) { if (sqlite3_prepare_v2(db, sql, -1, &stmt, NULL) != SQLITE_OK) goto fallback_search; sqlite3_bind_text(stmt, 1, fts_query, -1, SQLITE_TRANSIENT); - sqlite3_bind_text(stmt, 2, project, -1, SQLITE_TRANSIENT); + sqlite3_bind_text(stmt, 2, resolved_project(srv, project), -1, SQLITE_TRANSIENT); sqlite3_bind_int(stmt, 3, limit > 0 ? 
limit : 100); sqlite3_bind_int(stmt, 4, offset); @@ -1142,7 +1207,7 @@ static char *handle_search_graph(cbm_mcp_server_t *srv, const char *args) { sqlite3_stmt *cs = NULL; if (sqlite3_prepare_v2(db, count_sql, -1, &cs, NULL) == SQLITE_OK) { sqlite3_bind_text(cs, 1, fts_query, -1, SQLITE_TRANSIENT); - sqlite3_bind_text(cs, 2, project, -1, SQLITE_TRANSIENT); + sqlite3_bind_text(cs, 2, resolved_project(srv, project), -1, SQLITE_TRANSIENT); if (sqlite3_step(cs) == SQLITE_ROW) total = sqlite3_column_int(cs, 0); sqlite3_finalize(cs); } @@ -1288,7 +1353,7 @@ static char *handle_query_graph(cbm_mcp_server_t *srv, const char *args) { } cbm_cypher_result_t result = {0}; - int rc = cbm_cypher_execute(store, query, project, max_rows, &result); + int rc = cbm_cypher_execute(store, query, resolved_project(srv, project), max_rows, &result); if (rc < 0) { char *err_msg = result.error ? result.error : "query execution failed";