From 3e64560094b25411173b24355f29e50ea97538da Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Wed, 22 Apr 2026 18:15:46 +0000
Subject: [PATCH 01/30] feat(embeddings): add nomic daemon + IPC client +
 protocol
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Introduce a long-lived embedding daemon backed by @huggingface/transformers
(nomic-embed-text-v1.5) that plugin hooks and the virtual shell can call over
a per-user Unix socket. Hooks run as one-shot subprocesses, so loading the
model per invocation would add ~600 ms cold-start and ~200 MB RAM to every
tool call — the daemon keeps the model resident and replies in ~15 ms.

Components:
- protocol.ts: JSON-line request/response types, socket/pid path helpers
- nomic.ts: thin wrapper around the pipeline with Matryoshka-style truncation
  and the search_document / search_query prefix rules
- daemon.ts: net.createServer on /tmp/hivemind-embed-<uid>.sock, idle
  auto-shutdown (15 min default), warmup-on-start, graceful SIGINT/SIGTERM,
  pidfile overwritten early so the client's spawn-lock stays valid
- client.ts: fire-and-forget connect; first caller wins an O_EXCL pidfile
  lock and spawns the daemon detached, the rest just poll the socket.
  Writes its own pid first so concurrent clients see a live owner during
  the start-up window; the daemon overwrites it once it's listening.
  embed() returns null on any failure so hook callers can degrade to a
  no-embedding INSERT instead of blocking the write path
- sql.ts: embeddingSqlLiteral() emits ARRAY[...]::float4[] or NULL

Socket + pidfile under /tmp, 0600-perm so only the owning user can talk
to them. Kill-switches via HIVEMIND_EMBED_* env vars.
---
 claude-code/tests/embedding-sql.test.ts     |  42 ++++
 claude-code/tests/embeddings-client.test.ts | 118 ++++++++++
 src/embeddings/client.ts                    | 242 ++++++++++++++++++++
 src/embeddings/daemon.ts                    | 157 +++++++++++++
 src/embeddings/nomic.ts                     |  90 ++++++++
 src/embeddings/protocol.ts                  |  50 ++++
 src/embeddings/sql.ts                       |  16 ++
 7 files changed, 715 insertions(+)
 create mode 100644 claude-code/tests/embedding-sql.test.ts
 create mode 100644 claude-code/tests/embeddings-client.test.ts
 create mode 100644 src/embeddings/client.ts
 create mode 100644 src/embeddings/daemon.ts
 create mode 100644 src/embeddings/nomic.ts
 create mode 100644 src/embeddings/protocol.ts
 create mode 100644 src/embeddings/sql.ts
diff --git a/claude-code/tests/embedding-sql.test.ts b/claude-code/tests/embedding-sql.test.ts
new file mode 100644
index 0000000..a4d469f
--- /dev/null
+++ b/claude-code/tests/embedding-sql.test.ts
@@ -0,0 +1,42 @@
+import { describe, it, expect } from "vitest";
+import { embeddingSqlLiteral } from "../../src/embeddings/sql.js";
+
+describe("embeddingSqlLiteral", () => {
+  it("returns NULL for null input", () => {
+    expect(embeddingSqlLiteral(null)).toBe("NULL");
+  });
+
+  it("returns NULL for undefined", () => {
+    expect(embeddingSqlLiteral(undefined)).toBe("NULL");
+  });
+
+  it("returns NULL for empty array", () => {
+    expect(embeddingSqlLiteral([])).toBe("NULL");
+  });
+
+  it("returns ARRAY[...]::float4[] for a vector", () => {
+    expect(embeddingSqlLiteral([0.1, 0.2, -0.3])).toBe("ARRAY[0.1,0.2,-0.3]::float4[]");
+  });
+
+  it("returns NULL if any element is NaN / Infinity", () => {
+    expect(embeddingSqlLiteral([0.1, NaN, 0.3])).toBe("NULL");
+    expect(embeddingSqlLiteral([0.1, Infinity, 0.3])).toBe("NULL");
+    expect(embeddingSqlLiteral([-Infinity, 0.1])).toBe("NULL");
+  });
+
+  it("uses shortest round-trip representation (no toFixed truncation)", () => {
+    // A value that toFixed(6) would round is preserved
+    const vec = [0.123456789];
+    expect(embeddingSqlLiteral(vec)).toBe("ARRAY[0.123456789]::float4[]");
+  });
+
+  it("handles a realistic 768-dim vector without truncation", () => {
+    const vec = Array.from({ length: 768 }, (_, i) => i / 1000);
+    const sql = embeddingSqlLiteral(vec);
+    expect(sql.startsWith("ARRAY[")).toBe(true);
+    expect(sql.endsWith("]::float4[]")).toBe(true);
+    // Count commas → 767 separators → 768 elements
+    const commas = (sql.match(/,/g) ?? []).length;
+    expect(commas).toBe(767);
+  });
+});
diff --git a/claude-code/tests/embeddings-client.test.ts b/claude-code/tests/embeddings-client.test.ts
new file mode 100644
index 0000000..de13060
--- /dev/null
+++ b/claude-code/tests/embeddings-client.test.ts
@@ -0,0 +1,118 @@
+// Unit tests for the embedding client — avoid loading the model by spinning up
+// a tiny fake daemon that speaks the protocol.
+
+import { describe, it, expect, afterEach } from "vitest";
+import { createServer, type Server, type Socket } from "node:net";
+import { mkdtempSync, rmSync, existsSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import { EmbedClient } from "../../src/embeddings/client.js";
+import type { DaemonRequest, DaemonResponse } from "../../src/embeddings/protocol.js";
+
+let servers: Server[] = [];
+let tmpDirs: string[] = [];
+
+afterEach(() => {
+  for (const s of servers) try { s.close(); } catch { /* */ }
+  servers = [];
+  for (const d of tmpDirs) try { rmSync(d, { recursive: true, force: true }); } catch { /* */ }
+  tmpDirs = [];
+});
+
+function makeTmpDir(): string {
+  const d = mkdtempSync(join(tmpdir(), "hvm-embed-test-"));
+  tmpDirs.push(d);
+  return d;
+}
+
+async function startFakeDaemon(dir: string, handler: (req: DaemonRequest) => DaemonResponse): Promise<Server> {
+  const uid = String(process.getuid?.() ?? "test");
+  const sockPath = join(dir, `hivemind-embed-${uid}.sock`);
+  const srv = createServer((sock: Socket) => {
+    let buf = "";
+    sock.setEncoding("utf-8");
+    sock.on("data", (chunk: string) => {
+      buf += chunk;
+      let nl: number;
+      while ((nl = buf.indexOf("\n")) !== -1) {
+        const line = buf.slice(0, nl);
+        buf = buf.slice(nl + 1);
+        if (!line) continue;
+        const req = JSON.parse(line) as DaemonRequest;
+        const resp = handler(req);
+        sock.write(JSON.stringify(resp) + "\n");
+      }
+    });
+    sock.on("error", () => { /* */ });
+  });
+  servers.push(srv);
+  await new Promise<void>((resolve) => srv.listen(sockPath, resolve));
+  return srv;
+}
+
+describe("EmbedClient", () => {
+  it("returns the embedding vector when the daemon responds", async () => {
+    const dir = makeTmpDir();
+    await startFakeDaemon(dir, (req) => {
+      if (req.op === "embed") return { id: req.id, embedding: [0.1, 0.2, 0.3] };
+      return { id: req.id, ready: true };
+    });
+    const client = new EmbedClient({ socketDir: dir, timeoutMs: 500, autoSpawn: false });
+    const vec = await client.embed("hello", "document");
+    expect(vec).toEqual([0.1, 0.2, 0.3]);
+  });
+
+  it("returns null when the daemon returns an error", async () => {
+    const dir = makeTmpDir();
+    await startFakeDaemon(dir, (req) => ({ id: req.id, error: "boom" }));
+    const client = new EmbedClient({ socketDir: dir, timeoutMs: 500, autoSpawn: false });
+    const vec = await client.embed("hello");
+    expect(vec).toBeNull();
+  });
+
+  it("returns null when no daemon is running and autoSpawn is disabled", async () => {
+    const dir = makeTmpDir();
+    const client = new EmbedClient({ socketDir: dir, timeoutMs: 100, autoSpawn: false });
+    const vec = await client.embed("hello");
+    expect(vec).toBeNull();
+  });
+
+  it("does not create a duplicate pidfile under concurrent first-call race", async () => {
+    const dir = makeTmpDir();
+    const client1 = new EmbedClient({
+      socketDir: dir,
+      timeoutMs: 50,
+      autoSpawn: true,
+      daemonEntry: "/nonexistent/daemon.js", // guarantee spawn can't succeed
+    });
+    const client2 = new EmbedClient({
+      socketDir: dir,
+      timeoutMs: 50,
+      autoSpawn: true,
+      daemonEntry: "/nonexistent/daemon.js",
+    });
+    // Both clients see no socket, both try spawnDaemon. O_EXCL guarantees only
+    // one actually tries to spawn. Both return null because no daemon comes up.
+    const [a, b] = await Promise.all([
+      client1.embed("one"),
+      client2.embed("two"),
+    ]);
+    expect(a).toBeNull();
+    expect(b).toBeNull();
+    // pidfile should have been cleaned up when spawn couldn't find the entry.
+    const uid = String(process.getuid?.() ?? "test");
+    expect(existsSync(join(dir, `hivemind-embed-${uid}.pid`))).toBe(false);
+  });
+
+  it("round-trips multiple requests on the same client without leaking sockets", async () => {
+    const dir = makeTmpDir();
+    await startFakeDaemon(dir, (req) => ({ id: req.id, embedding: [Math.random()] }));
+    const client = new EmbedClient({ socketDir: dir, timeoutMs: 500, autoSpawn: false });
+    const results = await Promise.all([
+      client.embed("a"),
+      client.embed("b"),
+      client.embed("c"),
+    ]);
+    expect(results.every((r) => r !== null && r.length === 1)).toBe(true);
+  });
+});
diff --git a/src/embeddings/client.ts b/src/embeddings/client.ts
new file mode 100644
index 0000000..9798829
--- /dev/null
+++ b/src/embeddings/client.ts
@@ -0,0 +1,242 @@
+// Thin client used by hooks to request embeddings from the daemon.
+// Self-heals: if the socket is missing, the first caller spawns the daemon
+// under an O_EXCL pidfile lock so concurrent callers don't spawn duplicates.
+
+import { connect, type Socket } from "node:net";
+import { spawn } from "node:child_process";
+import { openSync, closeSync, writeSync, unlinkSync, existsSync, readFileSync } from "node:fs";
+import {
+  DEFAULT_CLIENT_TIMEOUT_MS,
+  pidPathFor,
+  socketPathFor,
+  type DaemonResponse,
+  type EmbedKind,
+  type EmbedRequest,
+} from "./protocol.js";
+import { log as _log } from "../utils/debug.js";
+
+const log = (m: string) => _log("embed-client", m);
+
+function getUid(): string {
+  const uid = typeof process.getuid === "function" ? process.getuid() : undefined;
+  return uid !== undefined ? String(uid) : (process.env.USER ?? "default");
+}
+
+export interface ClientOptions {
+  socketDir?: string;
+  timeoutMs?: number;
+  daemonEntry?: string; // path to bundled embed-daemon.js
+  autoSpawn?: boolean;
+  spawnWaitMs?: number;
+}
+
+export class EmbedClient {
+  private socketPath: string;
+  private pidPath: string;
+  private timeoutMs: number;
+  private daemonEntry: string | undefined;
+  private autoSpawn: boolean;
+  private spawnWaitMs: number;
+  private nextId = 0;
+
+  constructor(opts: ClientOptions = {}) {
+    const uid = getUid();
+    const dir = opts.socketDir ?? "/tmp";
+    this.socketPath = socketPathFor(uid, dir);
+    this.pidPath = pidPathFor(uid, dir);
+    this.timeoutMs = opts.timeoutMs ?? DEFAULT_CLIENT_TIMEOUT_MS;
+    this.daemonEntry = opts.daemonEntry ?? process.env.HIVEMIND_EMBED_DAEMON;
+    this.autoSpawn = opts.autoSpawn ?? true;
+    this.spawnWaitMs = opts.spawnWaitMs ?? 5000;
+  }
+
+  /**
+   * Returns an embedding vector, or null on timeout/failure. Hooks MUST treat
+   * null as "skip embedding column" — never block the write path on us.
+   *
+   * Fire-and-forget spawn on miss: if the daemon isn't up, this call returns
+   * null AND kicks off a background spawn. The next call finds a ready daemon.
+   */
+  async embed(text: string, kind: EmbedKind = "document"): Promise<number[] | null> {
+    let sock: Socket;
+    try {
+      sock = await this.connectOnce();
+    } catch {
+      if (this.autoSpawn) this.trySpawnDaemon();
+      return null;
+    }
+    try {
+      const id = String(++this.nextId);
+      const req: EmbedRequest = { op: "embed", id, kind, text };
+      const resp = await this.sendAndWait(sock, req);
+      if (resp.error || !("embedding" in resp) || !resp.embedding) {
+        log(`embed err: ${resp.error ?? "no embedding"}`);
+        return null;
+      }
+      return resp.embedding;
+    } catch (e: unknown) {
+      const err = e instanceof Error ? e.message : String(e);
+      log(`embed failed: ${err}`);
+      return null;
+    } finally {
+      try { sock.end(); } catch { /* best-effort */ }
+    }
+  }
+
+  /**
+   * Wait up to spawnWaitMs for the daemon to accept connections, spawning if
+   * necessary. Meant for SessionStart / long-running batches — not the hot path.
+   */
+  async warmup(): Promise<boolean> {
+    try {
+      const s = await this.connectOnce();
+      s.end();
+      return true;
+    } catch {
+      if (!this.autoSpawn) return false;
+      this.trySpawnDaemon();
+      try {
+        const s = await this.waitForSocket();
+        s.end();
+        return true;
+      } catch {
+        return false;
+      }
+    }
+  }
+
+  private connectOnce(): Promise<Socket> {
+    return new Promise((resolve, reject) => {
+      const sock = connect(this.socketPath);
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("connect timeout"));
+      }, this.timeoutMs);
+      sock.once("connect", () => {
+        clearTimeout(to);
+        resolve(sock);
+      });
+      sock.once("error", (e) => {
+        clearTimeout(to);
+        reject(e);
+      });
+    });
+  }
+
+  private trySpawnDaemon(): void {
+    // O_EXCL pidfile — only the first caller wins. Others find the pid file
+    // and wait for the socket to appear.
+    //
+    // Race subtlety: we IMMEDIATELY write our own PID into the file to close
+    // the window where another worker could see an empty pidfile and interpret
+    // it as "stale". The daemon itself overwrites the file with its own PID
+    // during startup (see daemon.ts start()).
+    let fd: number;
+    try {
+      fd = openSync(this.pidPath, "wx", 0o600);
+      writeSync(fd, String(process.pid));
+    } catch (e: unknown) {
+      // Someone else is spawning (EEXIST) — or pidfile is stale. If stale, clean up and retry.
+      if (this.isPidFileStale()) {
+        try { unlinkSync(this.pidPath); } catch { /* best-effort */ }
+        try {
+          fd = openSync(this.pidPath, "wx", 0o600);
+          writeSync(fd, String(process.pid));
+        } catch {
+          return; // someone else just claimed it; let waitForSocket handle it
+        }
+      } else {
+        return;
+      }
+    }
+
+    if (!this.daemonEntry || !existsSync(this.daemonEntry)) {
+      log(`daemonEntry not configured or missing: ${this.daemonEntry}`);
+      try { closeSync(fd); unlinkSync(this.pidPath); } catch { /* best-effort */ }
+      return;
+    }
+
+    try {
+      const child = spawn(process.execPath, [this.daemonEntry], {
+        detached: true,
+        stdio: "ignore",
+        env: process.env,
+      });
+      child.unref();
+      log(`spawned daemon pid=${child.pid}`);
+    } finally {
+      closeSync(fd);
+    }
+  }
+
+  private isPidFileStale(): boolean {
+    try {
+      const raw = readFileSync(this.pidPath, "utf-8").trim();
+      const pid = Number(raw);
+      if (!pid || Number.isNaN(pid)) return true;
+      // kill(pid, 0) throws if process is gone.
+      try {
+        process.kill(pid, 0);
+        // Process is alive — the daemon might just be loading the model and
+        // hasn't bound the socket yet. DON'T treat as stale; let waitForSocket
+        // poll. A hung daemon will eventually time out at the caller.
+        return false;
+      } catch {
+        return true;
+      }
+    } catch {
+      return true;
+    }
+  }
+
+  private async waitForSocket(): Promise<Socket> {
+    const deadline = Date.now() + this.spawnWaitMs;
+    let delay = 30;
+    while (Date.now() < deadline) {
+      await sleep(delay);
+      delay = Math.min(delay * 1.5, 300);
+      if (!existsSync(this.socketPath)) continue;
+      try {
+        return await this.connectOnce();
+      } catch {
+        // socket appeared but daemon not ready yet — keep waiting
+      }
+    }
+    throw new Error("daemon did not become ready within spawnWaitMs");
+  }
+
+  private sendAndWait(sock: Socket, req: EmbedRequest): Promise<DaemonResponse> {
+    return new Promise((resolve, reject) => {
+      let buf = "";
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("request timeout"));
+      }, this.timeoutMs);
+      sock.setEncoding("utf-8");
+      sock.on("data", (chunk: string) => {
+        buf += chunk;
+        const nl = buf.indexOf("\n");
+        if (nl === -1) return;
+        const line = buf.slice(0, nl);
+        clearTimeout(to);
+        try {
+          resolve(JSON.parse(line) as DaemonResponse);
+        } catch (e) {
+          reject(e as Error);
+        }
+      });
+      sock.on("error", (e) => { clearTimeout(to); reject(e); });
+      sock.write(JSON.stringify(req) + "\n");
+    });
+  }
+}
+
+function sleep(ms: number): Promise<void> {
+  return new Promise(r => setTimeout(r, ms));
+}
+
+let singleton: EmbedClient | null = null;
+export function getEmbedClient(): EmbedClient {
+  if (!singleton) singleton = new EmbedClient();
+  return singleton;
+}
diff --git a/src/embeddings/daemon.ts b/src/embeddings/daemon.ts
new file mode 100644
index 0000000..3a01899
--- /dev/null
+++ b/src/embeddings/daemon.ts
@@ -0,0 +1,157 @@
+#!/usr/bin/env node
+
+// Long-lived embedding daemon. Holds the nomic model in RAM and serves
+// embed requests over a per-user Unix socket. Exits after an idle window
+// so it doesn't sit around consuming ~200 MB of RAM forever.
+
+import { createServer, type Server, type Socket } from "node:net";
+import { unlinkSync, writeFileSync, existsSync, mkdirSync, chmodSync } from "node:fs";
+import { NomicEmbedder } from "./nomic.js";
+import {
+  DEFAULT_IDLE_TIMEOUT_MS,
+  pidPathFor,
+  socketPathFor,
+  type DaemonRequest,
+  type DaemonResponse,
+  type EmbedRequest,
+  type PingRequest,
+} from "./protocol.js";
+import { log as _log } from "../utils/debug.js";
+
+const log = (m: string) => _log("embed-daemon", m);
+
+function getUid(): string {
+  const uid = typeof process.getuid === "function" ? process.getuid() : undefined;
+  return uid !== undefined ? String(uid) : (process.env.USER ?? "default");
+}
+
+export interface DaemonOptions {
+  socketDir?: string;
+  idleTimeoutMs?: number;
+  dims?: number;
+  dtype?: string;
+  repo?: string;
+}
+
+export class EmbedDaemon {
+  private server: Server | null = null;
+  private embedder: NomicEmbedder;
+  private socketPath: string;
+  private pidPath: string;
+  private idleTimeoutMs: number;
+  private idleTimer: NodeJS.Timeout | null = null;
+
+  constructor(opts: DaemonOptions = {}) {
+    const uid = getUid();
+    const dir = opts.socketDir ?? "/tmp";
+    this.socketPath = socketPathFor(uid, dir);
+    this.pidPath = pidPathFor(uid, dir);
+    this.idleTimeoutMs = opts.idleTimeoutMs ?? DEFAULT_IDLE_TIMEOUT_MS;
+    this.embedder = new NomicEmbedder({ repo: opts.repo, dtype: opts.dtype, dims: opts.dims });
+  }
+
+  async start(): Promise<void> {
+    mkdirSync(this.socketPath.replace(/\/[^/]+$/, ""), { recursive: true });
+    // Overwrite pidfile FIRST — the client wrote its own (transient) pid as a
+    // placeholder during spawn to avoid a race; now that the daemon is live,
+    // replace it with ours so subsequent clients see the long-lived pid.
+    writeFileSync(this.pidPath, String(process.pid), { mode: 0o600 });
+    if (existsSync(this.socketPath)) {
+      // Stale from a previous crash. unlink so bind() can succeed.
+      try { unlinkSync(this.socketPath); } catch { /* best-effort */ }
+    }
+
+    // Warmup the model in the background so the first real request is fast.
+    this.embedder.load().then(() => log("model ready")).catch(e => log(`load err: ${e.message}`));
+
+    this.server = createServer((sock) => this.handleConnection(sock));
+    await new Promise<void>((resolve, reject) => {
+      this.server!.once("error", reject);
+      this.server!.listen(this.socketPath, () => {
+        try { chmodSync(this.socketPath, 0o600); } catch { /* best-effort */ }
+        log(`listening on ${this.socketPath}`);
+        resolve();
+      });
+    });
+
+    this.resetIdleTimer();
+    process.on("SIGINT", () => this.shutdown());
+    process.on("SIGTERM", () => this.shutdown());
+  }
+
+  private resetIdleTimer(): void {
+    if (this.idleTimer) clearTimeout(this.idleTimer);
+    this.idleTimer = setTimeout(() => {
+      log(`idle timeout ${this.idleTimeoutMs}ms reached, shutting down`);
+      this.shutdown();
+    }, this.idleTimeoutMs);
+    this.idleTimer.unref();
+  }
+
+  shutdown(): void {
+    try { this.server?.close(); } catch { /* best-effort */ }
+    try { if (existsSync(this.socketPath)) unlinkSync(this.socketPath); } catch { /* best-effort */ }
+    try { if (existsSync(this.pidPath)) unlinkSync(this.pidPath); } catch { /* best-effort */ }
+    process.exit(0);
+  }
+
+  private handleConnection(sock: Socket): void {
+    let buf = "";
+    sock.setEncoding("utf-8");
+    sock.on("data", (chunk: string) => {
+      buf += chunk;
+      let nl: number;
+      while ((nl = buf.indexOf("\n")) !== -1) {
+        const line = buf.slice(0, nl);
+        buf = buf.slice(nl + 1);
+        if (line.length === 0) continue;
+        this.handleLine(sock, line);
+      }
+    });
+    sock.on("error", () => { /* client disconnect is normal */ });
+  }
+
+  private async handleLine(sock: Socket, line: string): Promise<void> {
+    this.resetIdleTimer();
+    let req: DaemonRequest;
+    try {
+      req = JSON.parse(line);
+    } catch {
+      return;
+    }
+    try {
+      const resp = await this.dispatch(req);
+      sock.write(JSON.stringify(resp) + "\n");
+    } catch (e: unknown) {
+      const err = e instanceof Error ? e.message : String(e);
+      const resp: DaemonResponse = { id: req.id, error: err };
+      sock.write(JSON.stringify(resp) + "\n");
+    }
+  }
+
+  private async dispatch(req: DaemonRequest): Promise<DaemonResponse> {
+    if (req.op === "ping") {
+      const p = req as PingRequest;
+      return { id: p.id, ready: true, model: this.embedder.repo, dims: this.embedder.dims };
+    }
+    if (req.op === "embed") {
+      const e = req as EmbedRequest;
+      const vec = await this.embedder.embed(e.text, e.kind);
+      return { id: e.id, embedding: vec };
+    }
+    return { id: (req as { id: string }).id, error: "unknown op" };
+  }
+}
+
+const invokedDirectly = import.meta.url === `file://${process.argv[1]}`
+  || (process.argv[1] && import.meta.url.endsWith(process.argv[1].split("/").pop() ?? ""));
+
+if (invokedDirectly) {
+  const dims = process.env.HIVEMIND_EMBED_DIMS ? Number(process.env.HIVEMIND_EMBED_DIMS) : undefined;
+  const idleTimeoutMs = process.env.HIVEMIND_EMBED_IDLE_MS ? Number(process.env.HIVEMIND_EMBED_IDLE_MS) : undefined;
+  const d = new EmbedDaemon({ dims, idleTimeoutMs });
+  d.start().catch((e) => {
+    log(`fatal: ${e.message}`);
+    process.exit(1);
+  });
+}
diff --git a/src/embeddings/nomic.ts b/src/embeddings/nomic.ts
new file mode 100644
index 0000000..d9dd77d
--- /dev/null
+++ b/src/embeddings/nomic.ts
@@ -0,0 +1,90 @@
+// Thin wrapper around @huggingface/transformers. Only loaded inside the daemon
+// process — hooks never import this. Kept isolated so the heavyweight transformer
+// dependency is not pulled into every bundled hook.
+
+import {
+  DEFAULT_DIMS,
+  DEFAULT_DTYPE,
+  DEFAULT_MODEL_REPO,
+  DOC_PREFIX,
+  QUERY_PREFIX,
+  type EmbedKind,
+} from "./protocol.js";
+
+type Embedder = (input: string | string[], opts: Record<string, unknown>) => Promise<{ data: Float32Array | number[] }>;
+
+export interface NomicOptions {
+  repo?: string;
+  dtype?: string;
+  dims?: number;
+}
+
+export class NomicEmbedder {
+  private pipeline: Embedder | null = null;
+  private loading: Promise<void> | null = null;
+  readonly repo: string;
+  readonly dtype: string;
+  readonly dims: number;
+
+  constructor(opts: NomicOptions = {}) {
+    this.repo = opts.repo ?? DEFAULT_MODEL_REPO;
+    this.dtype = opts.dtype ?? DEFAULT_DTYPE;
+    this.dims = opts.dims ?? DEFAULT_DIMS;
+  }
+
+  async load(): Promise<void> {
+    if (this.pipeline) return;
+    if (this.loading) return this.loading;
+    this.loading = (async () => {
+      const mod = await import("@huggingface/transformers");
+      mod.env.allowLocalModels = false;
+      mod.env.useFSCache = true;
+      this.pipeline = (await mod.pipeline("feature-extraction", this.repo, { dtype: this.dtype as "fp32" | "q8" })) as unknown as Embedder;
+    })();
+    try {
+      await this.loading;
+    } finally {
+      this.loading = null;
+    }
+  }
+
+  private addPrefix(text: string, kind: EmbedKind): string {
+    return (kind === "query" ? QUERY_PREFIX : DOC_PREFIX) + text;
+  }
+
+  async embed(text: string, kind: EmbedKind = "document"): Promise<number[]> {
+    await this.load();
+    if (!this.pipeline) throw new Error("embedder not loaded");
+    const out = await this.pipeline(this.addPrefix(text, kind), { pooling: "mean", normalize: true });
+    const full = Array.from(out.data as ArrayLike<number>);
+    return this.truncate(full);
+  }
+
+  async embedBatch(texts: string[], kind: EmbedKind = "document"): Promise<number[][]> {
+    if (texts.length === 0) return [];
+    await this.load();
+    if (!this.pipeline) throw new Error("embedder not loaded");
+    const prefixed = texts.map(t => this.addPrefix(t, kind));
+    const out = await this.pipeline(prefixed, { pooling: "mean", normalize: true });
+    const flat = Array.from(out.data as ArrayLike<number>);
+    const total = flat.length;
+    const full = total / texts.length;
+    const batches: number[][] = [];
+    for (let i = 0; i < texts.length; i++) {
+      batches.push(this.truncate(flat.slice(i * full, (i + 1) * full)));
+    }
+    return batches;
+  }
+
+  private truncate(vec: number[]): number[] {
+    if (this.dims >= vec.length) return vec;
+    // Matryoshka: truncate then re-normalize.
+    const head = vec.slice(0, this.dims);
+    let norm = 0;
+    for (const v of head) norm += v * v;
+    norm = Math.sqrt(norm);
+    if (norm === 0) return head;
+    for (let i = 0; i < head.length; i++) head[i] /= norm;
+    return head;
+  }
+}
diff --git a/src/embeddings/protocol.ts b/src/embeddings/protocol.ts
new file mode 100644
index 0000000..9959ced
--- /dev/null
+++ b/src/embeddings/protocol.ts
@@ -0,0 +1,50 @@
+// Shared types for the embedding daemon <-> client IPC.
+// Newline-delimited JSON over Unix socket.
+
+export type EmbedKind = "document" | "query";
+
+export interface EmbedRequest {
+  op: "embed";
+  id: string;
+  kind: EmbedKind;
+  text: string;
+}
+
+export interface EmbedResponse {
+  id: string;
+  embedding?: number[];
+  error?: string;
+}
+
+export interface PingRequest {
+  op: "ping";
+  id: string;
+}
+
+export interface PingResponse {
+  id: string;
+  ready: boolean;
+  model?: string;
+  dims?: number;
+  error?: string;
+}
+
+export type DaemonRequest = EmbedRequest | PingRequest;
+export type DaemonResponse = EmbedResponse | PingResponse;
+
+export const DEFAULT_SOCKET_DIR = "/tmp";
+export const DEFAULT_MODEL_REPO = "nomic-ai/nomic-embed-text-v1.5";
+export const DEFAULT_DTYPE = "q8";
+export const DEFAULT_DIMS = 768;
+export const DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1000;
+export const DEFAULT_CLIENT_TIMEOUT_MS = 200;
+export const DOC_PREFIX = "search_document: ";
+export const QUERY_PREFIX = "search_query: ";
+
+export function socketPathFor(uid: number | string, dir = DEFAULT_SOCKET_DIR): string {
+  return `${dir}/hivemind-embed-${uid}.sock`;
+}
+
+export function pidPathFor(uid: number | string, dir = DEFAULT_SOCKET_DIR): string {
+  return `${dir}/hivemind-embed-${uid}.pid`;
+}
diff --git a/src/embeddings/sql.ts b/src/embeddings/sql.ts
new file mode 100644
index 0000000..4387f7e
--- /dev/null
+++ b/src/embeddings/sql.ts
@@ -0,0 +1,16 @@
+// Helpers for embedding values in SQL. Deeplake stores vectors as `FLOAT4[]`;
+// the literal form is `ARRAY[f1, f2, ...]::float4[]`. When the embedding is
+// missing (daemon unavailable, timeout, etc.) we emit `NULL`.
+
+export function embeddingSqlLiteral(vec: number[] | null | undefined): string {
+  if (!vec || vec.length === 0) return "NULL";
+  // FLOAT4 is IEEE-754 single-precision. `toFixed` would lose precision; use
+  // the raw JS Number → string conversion which yields the shortest round-trip.
+  // Safety: only allow finite numbers; otherwise NULL.
+  const parts: string[] = [];
+  for (const v of vec) {
+    if (!Number.isFinite(v)) return "NULL";
+    parts.push(String(v));
+  }
+  return `ARRAY[${parts.join(",")}]::float4[]`;
+}

From 8d375a3297df0cd4dc5ca7a37e3bda3981e9ba13 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Wed, 22 Apr 2026 18:16:01 +0000
Subject: [PATCH 02/30] chore(build): add @huggingface/transformers +
 embed-daemon bundle entry

Pins @huggingface/transformers ^3.0.0 (resolves to 3.8.1) in dependencies
and registers src/embeddings/daemon.ts as a new esbuild entry point for
both the Claude Code and Codex bundles, outputting to
bundle/embeddings/embed-daemon.js.

The daemon imports transformers + onnxruntime-node dynamically, so both
are marked external in the esbuild config (the native .node binaries
can't be inlined). Consumers of the plugin need these installed
alongside the bundle; without them the daemon fails to start and the
client gracefully degrades to no-embedding writes.
---
 esbuild.config.mjs |  32 +++-
 package-lock.json  | 440 ++++++++++++++++++++++++++++++++++++++++++++-
 package.json       |   1 +
 3 files changed, 460 insertions(+), 13 deletions(-)

diff --git a/esbuild.config.mjs b/esbuild.config.mjs
index 95b2490..a4c13a4 100644
--- a/esbuild.config.mjs
+++ b/esbuild.config.mjs
@@ -21,7 +21,11 @@ const ccCommands = [
   { entry: "dist/src/commands/auth-login.js", out: "commands/auth-login" },
 ];
 
-const ccAll = [...ccHooks, ...ccShell, ...ccCommands];
+const ccEmbed = [
+  { entry: "dist/src/embeddings/daemon.js", out: "embeddings/embed-daemon" },
+];
+
+const ccAll = [...ccHooks, ...ccShell, ...ccCommands, ...ccEmbed];
 
 await build({
   entryPoints: Object.fromEntries(ccAll.map(h => [h.out, h.entry])),
@@ -29,7 +33,15 @@ await build({
   platform: "node",
   format: "esm",
   outdir: "claude-code/bundle",
-  external: ["node:*", "node-liblzma", "@mongodb-js/zstd"],
+  external: [
+    "node:*",
+    "node-liblzma",
+    "@mongodb-js/zstd",
+    "@huggingface/transformers",
+    "onnxruntime-node",
+    "onnxruntime-common",
+    "sharp",
+  ],
 });
 
 for (const h of ccAll) {
@@ -55,7 +67,11 @@ const codexCommands = [
   { entry: "dist/src/commands/auth-login.js", out: "commands/auth-login" },
 ];
 
-const codexAll = [...codexHooks, ...codexShell, ...codexCommands];
+const codexEmbed = [
+  { entry: "dist/src/embeddings/daemon.js", out: "embeddings/embed-daemon" },
+];
+
+const codexAll = [...codexHooks, ...codexShell, ...codexCommands, ...codexEmbed];
 
 await build({
   entryPoints: Object.fromEntries(codexAll.map(h => [h.out, h.entry])),
@@ -63,7 +79,15 @@ await build({
   platform: "node",
   format: "esm",
   outdir: "codex/bundle",
-  external: ["node:*", "node-liblzma", "@mongodb-js/zstd"],
+  external: [
+    "node:*",
+    "node-liblzma",
+    "@mongodb-js/zstd",
+    "@huggingface/transformers",
+    "onnxruntime-node",
+    "onnxruntime-common",
+    "sharp",
+  ],
 });
 
 for (const h of codexAll) {
diff --git a/package-lock.json b/package-lock.json
index f0ebfcc..e742826 100644
--- a/package-lock.json
+++ b/package-lock.json
@@ -8,6 +8,7 @@
       "name": "hivemind",
       "version": "0.6.38",
       "dependencies": {
+        "@huggingface/transformers": "^3.0.0",
         "deeplake": "^0.3.30",
         "just-bash": "^2.14.0",
         "yargs-parser": "^22.0.0"
@@ -1544,12 +1545,32 @@
         "node": ">=18"
       }
     },
+    "node_modules/@huggingface/jinja": {
+      "version": "0.5.7",
+      "resolved": "https://registry.npmjs.org/@huggingface/jinja/-/jinja-0.5.7.tgz",
+      "integrity": "sha512-OosMEbF/R6zkKNNzqhI7kvKYCpo1F0UeIv46/h4D4UjVEKKd6k3TiV8sgu6fkreX4lbBiRI+lZG8UnXnqVQmEQ==",
+      "license": "MIT",
+      "engines": {
+        "node": ">=18"
+      }
+    },
+    "node_modules/@huggingface/transformers": {
+      "version": "3.8.1",
+      "resolved": "https://registry.npmjs.org/@huggingface/transformers/-/transformers-3.8.1.tgz",
+      "integrity": "sha512-tsTk4zVjImqdqjS8/AOZg2yNLd1z9S5v+7oUPpXaasDRwEDhB+xnglK1k5cad26lL5/ZIaeREgWWy0bs9y9pPA==",
+      "license": "Apache-2.0",
+      "dependencies": {
+        "@huggingface/jinja": "^0.5.3",
+        "onnxruntime-node": "1.21.0",
+        "onnxruntime-web": "1.22.0-dev.20250409-89f8206ba4",
+        "sharp": "^0.34.1"
+      }
+    },
     "node_modules/@img/colour": {
       "version": "1.1.0",
       "resolved": "https://registry.npmjs.org/@img/colour/-/colour-1.1.0.tgz",
       "integrity": "sha512-Td76q7j57o/tLVdgS746cYARfSyxk8iEfRxewL9h4OMzYhbW4TAcppl0mT4eyqXddh6L/jwoM75mo7ixa/pCeQ==",
       "license": "MIT",
-      "optional": true,
       "engines": {
         "node": ">=18"
       }
@@ -2010,6 +2031,18 @@
         "url": "https://opencollective.com/libvips"
       }
     },
+    "node_modules/@isaacs/fs-minipass": {
+      "version": "4.0.1",
+      "resolved": "https://registry.npmjs.org/@isaacs/fs-minipass/-/fs-minipass-4.0.1.tgz",
+      "integrity": "sha512-wgm9Ehl2jpeqP3zw/7mo3kRHFp5MEDhqAdwy1fTGkHAwnkGOVsgpvQhL8B5n1qlb01jV3n/bI0ZfZp5lWA1k4w==",
+      "license": "ISC",
+      "dependencies": {
+        "minipass": "^7.0.4"
+      },
+      "engines": {
+        "node": ">=18.0.0"
+      }
+    },
     "node_modules/@jitl/quickjs-ffi-types": {
       "version": "0.32.0",
       "resolved": "https://registry.npmjs.org/@jitl/quickjs-ffi-types/-/quickjs-ffi-types-0.32.0.tgz",
@@ -2233,6 +2266,70 @@
         "url": "https://github.com/sponsors/Boshen"
       }
     },
+    "node_modules/@protobufjs/aspromise": {
+      "version": "1.1.2",
+      "resolved": "https://registry.npmjs.org/@protobufjs/aspromise/-/aspromise-1.1.2.tgz",
+      "integrity": "sha512-j+gKExEuLmKwvz3OgROXtrJ2UG2x8Ch2YZUxahh+s1F2HZ+wAceUNLkvy6zKCPVRkU++ZWQrdxsUeQXmcg4uoQ==",
+      "license": "BSD-3-Clause"
+    },
+    "node_modules/@protobufjs/base64": {
+      "version": "1.1.2",
+      "resolved": "https://registry.npmjs.org/@protobufjs/base64/-/base64-1.1.2.tgz",
+      "integrity": "sha512-AZkcAA5vnN/v4PDqKyMR5lx7hZttPDgClv83E//FMNhR2TMcLUhfRUBHCmSl0oi9zMgDDqRUJkSxO3wm85+XLg==",
+      "license": "BSD-3-Clause"
+    },
+    "node_modules/@protobufjs/codegen": {
+      "version": "2.0.4",
+      "resolved": "https://registry.npmjs.org/@protobufjs/codegen/-/codegen-2.0.4.tgz",
+      "integrity": "sha512-YyFaikqM5sH0ziFZCN3xDC7zeGaB/d0IUb9CATugHWbd1FRFwWwt4ld4OYMPWu5a3Xe01mGAULCdqhMlPl29Jg==",
+      "license": "BSD-3-Clause"
+    },
+    "node_modules/@protobufjs/eventemitter": {
+      "version": "1.1.0",
+      "resolved": "https://registry.npmjs.org/@protobufjs/eventemitter/-/eventemitter-1.1.0.tgz",
+      "integrity": "sha512-j9ednRT81vYJ9OfVuXG6ERSTdEL1xVsNgqpkxMsbIabzSo3goCjDIveeGv5d03om39ML71RdmrGNjG5SReBP/Q==",
+      "license": "BSD-3-Clause"
+    },
+    "node_modules/@protobufjs/fetch": {
+      "version": "1.1.0",
+      "resolved": "https://registry.npmjs.org/@protobufjs/fetch/-/fetch-1.1.0.tgz",
+      "integrity": "sha512-lljVXpqXebpsijW71PZaCYeIcE5on1w5DlQy5WH6GLbFryLUrBD4932W/E2BSpfRJWseIL4v/KPgBFxDOIdKpQ==",
+      "license": "BSD-3-Clause",
+      "dependencies": {
+        "@protobufjs/aspromise": "^1.1.1",
+        "@protobufjs/inquire": "^1.1.0"
+      }
+    },
+    "node_modules/@protobufjs/float": {
+      "version": "1.0.2",
+      "resolved": "https://registry.npmjs.org/@protobufjs/float/-/float-1.0.2.tgz",
+      "integrity": "sha512-Ddb+kVXlXst9d+R9PfTIxh1EdNkgoRe5tOX6t01f1lYWOvJnSPDBlG241QLzcyPdoNTsblLUdujGSE4RzrTZGQ==",
+      "license": "BSD-3-Clause"
+    },
+    "node_modules/@protobufjs/inquire": {
+      "version": "1.1.0",
+      "resolved": "https://registry.npmjs.org/@protobufjs/inquire/-/inquire-1.1.0.tgz",
+      "integrity": "sha512-kdSefcPdruJiFMVSbn801t4vFK7KB/5gd2fYvrxhuJYg8ILrmn9SKSX2tZdV6V+ksulWqS7aXjBcRXl3wHoD9Q==",
+      "license": "BSD-3-Clause"
+    },
+    "node_modules/@protobufjs/path": {
+      "version": "1.1.2",
+      "resolved": "https://registry.npmjs.org/@protobufjs/path/-/path-1.1.2.tgz",
+      "integrity": "sha512-6JOcJ5Tm08dOHAbdR3GrvP+yUUfkjG5ePsHYczMFLq3ZmMkAD98cDgcT2iA1lJ9NVwFd4tH/iSSoe44YWkltEA==",
+      "license": "BSD-3-Clause"
+    },
+    "node_modules/@protobufjs/pool": {
+      "version": "1.1.0",
+      "resolved": "https://registry.npmjs.org/@protobufjs/pool/-/pool-1.1.0.tgz",
+      "integrity": "sha512-0kELaGSIDBKvcgS4zkjz1PeddatrjYcmMWOlAuAPwAeccUrPHdUqo/J6LiymHHEiJT5NrF1UVwxY14f+fy4WQw==",
+      "license": "BSD-3-Clause"
+    },
+    "node_modules/@protobufjs/utf8": {
+      "version": "1.1.0",
+      "resolved": "https://registry.npmjs.org/@protobufjs/utf8/-/utf8-1.1.0.tgz",
+      "integrity": "sha512-Vvn3zZrhQZkkBE8LSuW3em98c0FwgO4nxzv6OdSxPKJIEKY2bGbHn+mhGIPerzI4twdxaP8/0+06HBpwf345Lw==",
+      "license": "BSD-3-Clause"
+    },
     "node_modules/@rolldown/binding-android-arm64": {
       "version": "1.0.0-rc.13",
       "resolved": "https://registry.npmjs.org/@rolldown/binding-android-arm64/-/binding-android-arm64-1.0.0-rc.13.tgz",
@@ -3346,7 +3443,6 @@
       "version": "25.5.2",
       "resolved": "https://registry.npmjs.org/@types/node/-/node-25.5.2.tgz",
       "integrity": "sha512-tO4ZIRKNC+MDWV4qKVZe3Ql/woTnmHDr5JD8UI5hn2pwBrHEwOEMZK7WlNb5RKB6EoJ02gwmQS9OrjuFnZYdpg==",
-      "dev": true,
       "license": "MIT",
       "dependencies": {
         "undici-types": "~7.18.0"
@@ -3686,6 +3782,13 @@
         "node": ">=8.9"
       }
     },
+    "node_modules/boolean": {
+      "version": "3.2.0",
+      "resolved": "https://registry.npmjs.org/boolean/-/boolean-3.2.0.tgz",
+      "integrity": "sha512-d0II/GO9uf9lfUHH2BQsjxzRJZBdsjgsBiW4BvhWk/3qoKwQFjIDVN19PfX8F2D/r9PCMTtLWjYVCFrpeYUzsw==",
+      "deprecated": "Package no longer supported. Contact Support at https://www.npmjs.com/support for more info.",
+      "license": "MIT"
+    },
     "node_modules/bowser": {
       "version": "2.14.1",
       "resolved": "https://registry.npmjs.org/bowser/-/bowser-2.14.1.tgz",
@@ -4048,16 +4151,55 @@
         "sharp": "^0.34.5"
       }
     },
+    "node_modules/define-data-property": {
+      "version": "1.1.4",
+      "resolved": "https://registry.npmjs.org/define-data-property/-/define-data-property-1.1.4.tgz",
+      "integrity": "sha512-rBMvIzlpA8v6E+SJZoo++HAYqsLrkg7MSfIinMPFhmkorw7X+dOXVJQs+QT69zGkzMyfDnIMN2Wid1+NbL3T+A==",
+      "license": "MIT",
+      "dependencies": {
+        "es-define-property": "^1.0.0",
+        "es-errors": "^1.3.0",
+        "gopd": "^1.0.1"
+      },
+      "engines": {
+        "node": ">= 0.4"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/ljharb"
+      }
+    },
+    "node_modules/define-properties": {
+      "version": "1.2.1",
+      "resolved": "https://registry.npmjs.org/define-properties/-/define-properties-1.2.1.tgz",
+      "integrity": "sha512-8QmQKqEASLd5nx0U1B1okLElbUuuttJ/AnYmRXbbbGDWh6uS208EjD4Xqq/I9wK7u0v6O08XhTWnt5XtEbR6Dg==",
+      "license": "MIT",
+      "dependencies": {
+        "define-data-property": "^1.0.1",
+        "has-property-descriptors": "^1.0.0",
+        "object-keys": "^1.1.1"
+      },
+      "engines": {
+        "node": ">= 0.4"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/ljharb"
+      }
+    },
     "node_modules/detect-libc": {
       "version": "2.1.2",
       "resolved": "https://registry.npmjs.org/detect-libc/-/detect-libc-2.1.2.tgz",
       "integrity": "sha512-Btj2BOOO83o3WyH59e8MgXsxEQVcarkUOpEYrubB0urwnN10yQ364rsiByU11nZlqWYZm05i/of7io4mzihBtQ==",
-      "devOptional": true,
       "license": "Apache-2.0",
       "engines": {
         "node": ">=8"
       }
     },
+    "node_modules/detect-node": {
+      "version": "2.1.0",
+      "resolved": "https://registry.npmjs.org/detect-node/-/detect-node-2.1.0.tgz",
+      "integrity": "sha512-T0NIuQpnTvFDATNuHN5roPwSBG83rFsuO+MXXH9/3N1eFbn4wcPjttvjMLEPWJ0RGUYgQE7cGgS3tNxbqCGM7g==",
+      "license": "MIT"
+    },
     "node_modules/diff": {
       "version": "8.0.4",
       "resolved": "https://registry.npmjs.org/diff/-/diff-8.0.4.tgz",
@@ -4123,7 +4265,6 @@
       "version": "1.0.1",
       "resolved": "https://registry.npmjs.org/es-define-property/-/es-define-property-1.0.1.tgz",
       "integrity": "sha512-e3nRfgfUZ4rNGL232gUgX06QNyyez04KdjFrF+LTRoOXmrOgFKDg4BCdsjW8EnT69eqdYGmRpJwiPVYNrCaW3g==",
-      "dev": true,
       "license": "MIT",
       "engines": {
         "node": ">= 0.4"
@@ -4133,7 +4274,6 @@
       "version": "1.3.0",
       "resolved": "https://registry.npmjs.org/es-errors/-/es-errors-1.3.0.tgz",
       "integrity": "sha512-Zf5H2Kxt2xjTvbJvP2ZWLEICxA6j+hAmMzIlypy4xcBg1vKVnx89Wy0GbS+kf5cwCVFFzdCFh2XSCFNULS6csw==",
-      "dev": true,
       "license": "MIT",
       "engines": {
         "node": ">= 0.4"
@@ -4159,6 +4299,12 @@
         "node": ">= 0.4"
       }
     },
+    "node_modules/es6-error": {
+      "version": "4.1.1",
+      "resolved": "https://registry.npmjs.org/es6-error/-/es6-error-4.1.1.tgz",
+      "integrity": "sha512-Um/+FxMr9CISWh0bi5Zv0iOD+4cFh5qLeks1qhAopKVAJw3drgKbKySikp7wGhDL0HPeaja0P5ULZrxLkniUVg==",
+      "license": "MIT"
+    },
     "node_modules/esbuild": {
       "version": "0.28.0",
       "resolved": "https://registry.npmjs.org/esbuild/-/esbuild-0.28.0.tgz",
@@ -4201,6 +4347,18 @@
         "@esbuild/win32-x64": "0.28.0"
       }
     },
+    "node_modules/escape-string-regexp": {
+      "version": "4.0.0",
+      "resolved": "https://registry.npmjs.org/escape-string-regexp/-/escape-string-regexp-4.0.0.tgz",
+      "integrity": "sha512-TtpcNJ3XAzx3Gq8sWRzJaVajRs0uVxA2YAkdb1jm2YkPz4G6egUFAyA3n5vtEIZefPk5Wa4UXbKuS5fKkJWdgA==",
+      "license": "MIT",
+      "engines": {
+        "node": ">=10"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/sindresorhus"
+      }
+    },
     "node_modules/estree-walker": {
       "version": "3.0.3",
       "resolved": "https://registry.npmjs.org/estree-walker/-/estree-walker-3.0.3.tgz",
@@ -4396,6 +4554,12 @@
         "node": ">=8"
       }
     },
+    "node_modules/flatbuffers": {
+      "version": "25.9.23",
+      "resolved": "https://registry.npmjs.org/flatbuffers/-/flatbuffers-25.9.23.tgz",
+      "integrity": "sha512-MI1qs7Lo4Syw0EOzUl0xjs2lsoeqFku44KpngfIduHBYvzm8h2+7K8YMQh1JtVVVrUvhLpNwqVi4DERegUJhPQ==",
+      "license": "Apache-2.0"
+    },
     "node_modules/fs-constants": {
       "version": "1.0.0",
       "resolved": "https://registry.npmjs.org/fs-constants/-/fs-constants-1.0.0.tgz",
@@ -4544,11 +4708,43 @@
         "node": ">= 6"
       }
     },
+    "node_modules/global-agent": {
+      "version": "3.0.0",
+      "resolved": "https://registry.npmjs.org/global-agent/-/global-agent-3.0.0.tgz",
+      "integrity": "sha512-PT6XReJ+D07JvGoxQMkT6qji/jVNfX/h364XHZOWeRzy64sSFr+xJ5OX7LI3b4MPQzdL4H8Y8M0xzPpsVMwA8Q==",
+      "license": "BSD-3-Clause",
+      "dependencies": {
+        "boolean": "^3.0.1",
+        "es6-error": "^4.1.1",
+        "matcher": "^3.0.0",
+        "roarr": "^2.15.3",
+        "semver": "^7.3.2",
+        "serialize-error": "^7.0.1"
+      },
+      "engines": {
+        "node": ">=10.0"
+      }
+    },
+    "node_modules/globalthis": {
+      "version": "1.0.4",
+      "resolved": "https://registry.npmjs.org/globalthis/-/globalthis-1.0.4.tgz",
+      "integrity": "sha512-DpLKbNU4WylpxJykQujfCcwYWiV/Jhm50Goo0wrVILAv5jOr9d+H+UR3PhSCD2rCCEIg0uc+G+muBTwD54JhDQ==",
+      "license": "MIT",
+      "dependencies": {
+        "define-properties": "^1.2.1",
+        "gopd": "^1.0.1"
+      },
+      "engines": {
+        "node": ">= 0.4"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/ljharb"
+      }
+    },
     "node_modules/gopd": {
       "version": "1.2.0",
       "resolved": "https://registry.npmjs.org/gopd/-/gopd-1.2.0.tgz",
       "integrity": "sha512-ZUKRh6/kUFoAiTAtTYPZJ3hw9wNxx+BIBOijnlG9PnrJsCcSjs1wyyD6vJpaYtgnzDrKYRSqf3OO6Rfa93xsRg==",
-      "dev": true,
       "license": "MIT",
       "engines": {
         "node": ">= 0.4"
@@ -4570,6 +4766,12 @@
       "integrity": "sha512-8tLu60LgxF6XpdbK8OW3FA+IfTNBn1ZHGHKF4KQbEeSkajYw5PlYJcKluntgegDPTg8UkHjpet1T82vk6TQ68w==",
       "license": "MIT"
     },
+    "node_modules/guid-typescript": {
+      "version": "1.0.9",
+      "resolved": "https://registry.npmjs.org/guid-typescript/-/guid-typescript-1.0.9.tgz",
+      "integrity": "sha512-Y8T4vYhEfwJOTbouREvG+3XDsjr8E3kIr7uf+JZ0BYloFsttiHU0WfvANVsR7TxNUJa/WpCnw/Ino/p+DeBhBQ==",
+      "license": "ISC"
+    },
     "node_modules/has-flag": {
       "version": "4.0.0",
       "resolved": "https://registry.npmjs.org/has-flag/-/has-flag-4.0.0.tgz",
@@ -4580,6 +4782,18 @@
         "node": ">=8"
       }
     },
+    "node_modules/has-property-descriptors": {
+      "version": "1.0.2",
+      "resolved": "https://registry.npmjs.org/has-property-descriptors/-/has-property-descriptors-1.0.2.tgz",
+      "integrity": "sha512-55JNKuIW+vq4Ke1BjOTjM2YctQIvCT7GFzHwmfZPGo5wnrgkid0YQtnAleFSqumZm4az3n2BS+erby5ipJdgrg==",
+      "license": "MIT",
+      "dependencies": {
+        "es-define-property": "^1.0.0"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/ljharb"
+      }
+    },
     "node_modules/has-symbols": {
       "version": "1.1.0",
       "resolved": "https://registry.npmjs.org/has-symbols/-/has-symbols-1.1.0.tgz",
@@ -4909,6 +5123,12 @@
         "node": ">= 6"
       }
     },
+    "node_modules/json-stringify-safe": {
+      "version": "5.0.1",
+      "resolved": "https://registry.npmjs.org/json-stringify-safe/-/json-stringify-safe-5.0.1.tgz",
+      "integrity": "sha512-ZClg6AaYvamvYEE82d3Iyd3vSSIjQ+odgjaTzRuO3s7toCdFKczob2i0zCh7JE8kWn17yvAWhUVxvqGwUalsRA==",
+      "license": "ISC"
+    },
     "node_modules/jsonfile": {
       "version": "6.2.1",
       "resolved": "https://registry.npmjs.org/jsonfile/-/jsonfile-6.2.1.tgz",
@@ -5314,6 +5534,12 @@
         "url": "https://github.com/chalk/slice-ansi?sponsor=1"
       }
     },
+    "node_modules/long": {
+      "version": "5.3.2",
+      "resolved": "https://registry.npmjs.org/long/-/long-5.3.2.tgz",
+      "integrity": "sha512-mNAgZ1GmyNhD7AuqnTG3/VQ26o760+ZYBPKjPvugO8+nLbYfX6TVpJPseBvopbdY+qpZ/lKUnmEc1LeZYS3QAA==",
+      "license": "Apache-2.0"
+    },
     "node_modules/magic-string": {
       "version": "0.30.21",
       "resolved": "https://registry.npmjs.org/magic-string/-/magic-string-0.30.21.tgz",
@@ -5366,6 +5592,18 @@
         "url": "https://github.com/sponsors/wooorm"
       }
     },
+    "node_modules/matcher": {
+      "version": "3.0.0",
+      "resolved": "https://registry.npmjs.org/matcher/-/matcher-3.0.0.tgz",
+      "integrity": "sha512-OkeDaAZ/bQCxeFAozM55PKcKU0yJMPGifLwV4Qgjitu+5MoAfSQN4lsLJeXZ1b8w0x+/Emda6MZgXS1jvsapng==",
+      "license": "MIT",
+      "dependencies": {
+        "escape-string-regexp": "^4.0.0"
+      },
+      "engines": {
+        "node": ">=10"
+      }
+    },
     "node_modules/math-intrinsics": {
       "version": "1.1.0",
       "resolved": "https://registry.npmjs.org/math-intrinsics/-/math-intrinsics-1.1.0.tgz",
@@ -5481,6 +5719,27 @@
         "url": "https://github.com/sponsors/ljharb"
       }
     },
+    "node_modules/minipass": {
+      "version": "7.1.3",
+      "resolved": "https://registry.npmjs.org/minipass/-/minipass-7.1.3.tgz",
+      "integrity": "sha512-tEBHqDnIoM/1rXME1zgka9g6Q2lcoCkxHLuc7ODJ5BxbP5d4c2Z5cGgtXAku59200Cx7diuHTOYfSBD8n6mm8A==",
+      "license": "BlueOak-1.0.0",
+      "engines": {
+        "node": ">=16 || 14 >=14.17"
+      }
+    },
+    "node_modules/minizlib": {
+      "version": "3.1.0",
+      "resolved": "https://registry.npmjs.org/minizlib/-/minizlib-3.1.0.tgz",
+      "integrity": "sha512-KZxYo1BUkWD2TVFLr0MQoM8vUUigWD3LlD83a/75BqC+4qE0Hb1Vo5v1FgcfaNXvfXzr+5EhQ6ing/CaBijTlw==",
+      "license": "MIT",
+      "dependencies": {
+        "minipass": "^7.1.2"
+      },
+      "engines": {
+        "node": ">= 18"
+      }
+    },
     "node_modules/mkdirp-classic": {
       "version": "0.5.3",
       "resolved": "https://registry.npmjs.org/mkdirp-classic/-/mkdirp-classic-0.5.3.tgz",
@@ -5623,6 +5882,15 @@
         "node": ">=0.10.0"
       }
     },
+    "node_modules/object-keys": {
+      "version": "1.1.1",
+      "resolved": "https://registry.npmjs.org/object-keys/-/object-keys-1.1.1.tgz",
+      "integrity": "sha512-NuAESUOUMrlIXOfHKzD6bpPu3tYt3xvjNdRIQ+FeT0lNb4K8WR70CaDxhuNguS2XG+GjkyMwOzsN5ZktImfhLA==",
+      "license": "MIT",
+      "engines": {
+        "node": ">= 0.4"
+      }
+    },
     "node_modules/obug": {
       "version": "2.1.1",
       "resolved": "https://registry.npmjs.org/obug/-/obug-2.1.1.tgz",
@@ -5660,6 +5928,49 @@
         "url": "https://github.com/sponsors/sindresorhus"
       }
     },
+    "node_modules/onnxruntime-common": {
+      "version": "1.21.0",
+      "resolved": "https://registry.npmjs.org/onnxruntime-common/-/onnxruntime-common-1.21.0.tgz",
+      "integrity": "sha512-Q632iLLrtCAVOTO65dh2+mNbQir/QNTVBG3h/QdZBpns7mZ0RYbLRBgGABPbpU9351AgYy7SJf1WaeVwMrBFPQ==",
+      "license": "MIT"
+    },
+    "node_modules/onnxruntime-node": {
+      "version": "1.21.0",
+      "resolved": "https://registry.npmjs.org/onnxruntime-node/-/onnxruntime-node-1.21.0.tgz",
+      "integrity": "sha512-NeaCX6WW2L8cRCSqy3bInlo5ojjQqu2fD3D+9W5qb5irwxhEyWKXeH2vZ8W9r6VxaMPUan+4/7NDwZMtouZxEw==",
+      "hasInstallScript": true,
+      "license": "MIT",
+      "os": [
+        "win32",
+        "darwin",
+        "linux"
+      ],
+      "dependencies": {
+        "global-agent": "^3.0.0",
+        "onnxruntime-common": "1.21.0",
+        "tar": "^7.0.1"
+      }
+    },
+    "node_modules/onnxruntime-web": {
+      "version": "1.22.0-dev.20250409-89f8206ba4",
+      "resolved": "https://registry.npmjs.org/onnxruntime-web/-/onnxruntime-web-1.22.0-dev.20250409-89f8206ba4.tgz",
+      "integrity": "sha512-0uS76OPgH0hWCPrFKlL8kYVV7ckM7t/36HfbgoFw6Nd0CZVVbQC4PkrR8mBX8LtNUFZO25IQBqV2Hx2ho3FlbQ==",
+      "license": "MIT",
+      "dependencies": {
+        "flatbuffers": "^25.1.24",
+        "guid-typescript": "^1.0.9",
+        "long": "^5.2.3",
+        "onnxruntime-common": "1.22.0-dev.20250409-89f8206ba4",
+        "platform": "^1.3.6",
+        "protobufjs": "^7.2.4"
+      }
+    },
+    "node_modules/onnxruntime-web/node_modules/onnxruntime-common": {
+      "version": "1.22.0-dev.20250409-89f8206ba4",
+      "resolved": "https://registry.npmjs.org/onnxruntime-common/-/onnxruntime-common-1.22.0-dev.20250409-89f8206ba4.tgz",
+      "integrity": "sha512-vDJMkfCfb0b1A836rgHj+ORuZf4B4+cc2bASQtpeoJLueuFc5DuYwjIZUBrSvx/fO5IrLjLz+oTrB3pcGlhovQ==",
+      "license": "MIT"
+    },
     "node_modules/papaparse": {
       "version": "5.5.3",
       "resolved": "https://registry.npmjs.org/papaparse/-/papaparse-5.5.3.tgz",
@@ -5821,6 +6132,12 @@
         "url": "https://github.com/sponsors/jonschlinkert"
       }
     },
+    "node_modules/platform": {
+      "version": "1.3.6",
+      "resolved": "https://registry.npmjs.org/platform/-/platform-1.3.6.tgz",
+      "integrity": "sha512-fnWVljUchTro6RiCFvCXBbNhJc2NijN7oIQxbwsyL0buWJPG85v81ehlHI9fXrJsMNgTofEoWIQeClKpgxFLrg==",
+      "license": "MIT"
+    },
     "node_modules/postcss": {
       "version": "8.5.8",
       "resolved": "https://registry.npmjs.org/postcss/-/postcss-8.5.8.tgz",
@@ -5931,6 +6248,30 @@
         "asap": "~2.0.3"
       }
     },
+    "node_modules/protobufjs": {
+      "version": "7.5.5",
+      "resolved": "https://registry.npmjs.org/protobufjs/-/protobufjs-7.5.5.tgz",
+      "integrity": "sha512-3wY1AxV+VBNW8Yypfd1yQY9pXnqTAN+KwQxL8iYm3/BjKYMNg4i0owhEe26PWDOMaIrzeeF98Lqd5NGz4omiIg==",
+      "hasInstallScript": true,
+      "license": "BSD-3-Clause",
+      "dependencies": {
+        "@protobufjs/aspromise": "^1.1.2",
+        "@protobufjs/base64": "^1.1.2",
+        "@protobufjs/codegen": "^2.0.4",
+        "@protobufjs/eventemitter": "^1.1.0",
+        "@protobufjs/fetch": "^1.1.0",
+        "@protobufjs/float": "^1.0.2",
+        "@protobufjs/inquire": "^1.1.0",
+        "@protobufjs/path": "^1.1.2",
+        "@protobufjs/pool": "^1.1.0",
+        "@protobufjs/utf8": "^1.1.0",
+        "@types/node": ">=13.7.0",
+        "long": "^5.0.0"
+      },
+      "engines": {
+        "node": ">=12.0.0"
+      }
+    },
     "node_modules/pug": {
       "version": "3.0.4",
       "resolved": "https://registry.npmjs.org/pug/-/pug-3.0.4.tgz",
@@ -6252,6 +6593,23 @@
       "dev": true,
       "license": "MIT"
     },
+    "node_modules/roarr": {
+      "version": "2.15.4",
+      "resolved": "https://registry.npmjs.org/roarr/-/roarr-2.15.4.tgz",
+      "integrity": "sha512-CHhPh+UNHD2GTXNYhPWLnU8ONHdI+5DI+4EYIAOaiD63rHeYlZvyh8P+in5999TTSFgUYuKUAjzRI4mdh/p+2A==",
+      "license": "BSD-3-Clause",
+      "dependencies": {
+        "boolean": "^3.0.1",
+        "detect-node": "^2.0.4",
+        "globalthis": "^1.0.1",
+        "json-stringify-safe": "^5.0.1",
+        "semver-compare": "^1.0.0",
+        "sprintf-js": "^1.1.2"
+      },
+      "engines": {
+        "node": ">=8.0"
+      }
+    },
     "node_modules/rolldown": {
       "version": "1.0.0-rc.13",
       "resolved": "https://registry.npmjs.org/rolldown/-/rolldown-1.0.0-rc.13.tgz",
@@ -6335,7 +6693,6 @@
       "version": "7.7.4",
       "resolved": "https://registry.npmjs.org/semver/-/semver-7.7.4.tgz",
       "integrity": "sha512-vFKC2IEtQnVhpT78h1Yp8wzwrf8CM+MzKMHGJZfBtzhZNycRFnXsHk6E5TxIkkMsgNS7mdX3AGB7x2QM2di4lA==",
-      "devOptional": true,
       "license": "ISC",
       "bin": {
         "semver": "bin/semver.js"
@@ -6344,13 +6701,33 @@
         "node": ">=10"
       }
     },
+    "node_modules/semver-compare": {
+      "version": "1.0.0",
+      "resolved": "https://registry.npmjs.org/semver-compare/-/semver-compare-1.0.0.tgz",
+      "integrity": "sha512-YM3/ITh2MJ5MtzaM429anh+x2jiLVjqILF4m4oyQB18W7Ggea7BfqdH/wGMK7dDiMghv/6WG7znWMwUDzJiXow==",
+      "license": "MIT"
+    },
+    "node_modules/serialize-error": {
+      "version": "7.0.1",
+      "resolved": "https://registry.npmjs.org/serialize-error/-/serialize-error-7.0.1.tgz",
+      "integrity": "sha512-8I8TjW5KMOKsZQTvoxjuSIa7foAwPWGOts+6o7sgjz41/qMD9VQHEDxi6PBvK2l0MXUmqZyNpUK+T2tQaaElvw==",
+      "license": "MIT",
+      "dependencies": {
+        "type-fest": "^0.13.1"
+      },
+      "engines": {
+        "node": ">=10"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/sindresorhus"
+      }
+    },
     "node_modules/sharp": {
       "version": "0.34.5",
       "resolved": "https://registry.npmjs.org/sharp/-/sharp-0.34.5.tgz",
       "integrity": "sha512-Ou9I5Ft9WNcCbXrU9cMgPBcCK8LiwLqcbywW3t4oDV37n1pzpuNLsYiAV8eODnjbtQlSDwZ2cUEeQz4E54Hltg==",
       "hasInstallScript": true,
       "license": "Apache-2.0",
-      "optional": true,
       "dependencies": {
         "@img/colour": "^1.0.0",
         "detect-libc": "^2.1.2",
@@ -6688,6 +7065,22 @@
         "url": "https://github.com/sponsors/ljharb"
       }
     },
+    "node_modules/tar": {
+      "version": "7.5.13",
+      "resolved": "https://registry.npmjs.org/tar/-/tar-7.5.13.tgz",
+      "integrity": "sha512-tOG/7GyXpFevhXVh8jOPJrmtRpOTsYqUIkVdVooZYJS/z8WhfQUX8RJILmeuJNinGAMSu1veBr4asSHFt5/hng==",
+      "license": "BlueOak-1.0.0",
+      "dependencies": {
+        "@isaacs/fs-minipass": "^4.0.0",
+        "chownr": "^3.0.0",
+        "minipass": "^7.1.2",
+        "minizlib": "^3.1.0",
+        "yallist": "^5.0.0"
+      },
+      "engines": {
+        "node": ">=18"
+      }
+    },
     "node_modules/tar-fs": {
       "version": "2.1.4",
       "resolved": "https://registry.npmjs.org/tar-fs/-/tar-fs-2.1.4.tgz",
@@ -6718,6 +7111,15 @@
         "node": ">=6"
       }
     },
+    "node_modules/tar/node_modules/chownr": {
+      "version": "3.0.0",
+      "resolved": "https://registry.npmjs.org/chownr/-/chownr-3.0.0.tgz",
+      "integrity": "sha512-+IxzY9BZOQd/XuYPRmrvEVjF/nqj5kgT4kEq7VofrDoM1MxoRjEWkrCC3EtLi59TVawxTAn+orJwFQcrqEN1+g==",
+      "license": "BlueOak-1.0.0",
+      "engines": {
+        "node": ">=18"
+      }
+    },
     "node_modules/tinybench": {
       "version": "2.9.0",
       "resolved": "https://registry.npmjs.org/tinybench/-/tinybench-2.9.0.tgz",
@@ -7337,6 +7739,18 @@
         "npm": ">=9"
       }
     },
+    "node_modules/type-fest": {
+      "version": "0.13.1",
+      "resolved": "https://registry.npmjs.org/type-fest/-/type-fest-0.13.1.tgz",
+      "integrity": "sha512-34R7HTnG0XIJcBSn5XhDd7nNFPRcXYRZrBB2O2jdKqYODldSzBAqzsWoZYYvduky73toYS/ESqxPvkDf/F0XMg==",
+      "license": "(MIT OR CC0-1.0)",
+      "engines": {
+        "node": ">=10"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/sindresorhus"
+      }
+    },
     "node_modules/typescript": {
       "version": "6.0.2",
       "resolved": "https://registry.npmjs.org/typescript/-/typescript-6.0.2.tgz",
@@ -7367,7 +7781,6 @@
       "version": "7.18.2",
       "resolved": "https://registry.npmjs.org/undici-types/-/undici-types-7.18.2.tgz",
       "integrity": "sha512-AsuCzffGHJybSaRrmr5eHr81mwJU3kjw6M+uprWvCXiNeN9SOGwQ3Jn8jb8m3Z6izVgknn1R0FTCEAP2QrLY/w==",
-      "dev": true,
       "license": "MIT"
     },
     "node_modules/universalify": {
@@ -7667,6 +8080,15 @@
         "node": ">=0.4"
       }
     },
+    "node_modules/yallist": {
+      "version": "5.0.0",
+      "resolved": "https://registry.npmjs.org/yallist/-/yallist-5.0.0.tgz",
+      "integrity": "sha512-YgvUTfwqyc7UXVMrB+SImsVYSmTS8X/tSrtdNZMImM+n7+QTriRXyXim0mBrTXNeqzVF0KWGgHPeiyViFFrNDw==",
+      "license": "BlueOak-1.0.0",
+      "engines": {
+        "node": ">=18"
+      }
+    },
     "node_modules/yaml": {
       "version": "2.8.3",
       "resolved": "https://registry.npmjs.org/yaml/-/yaml-2.8.3.tgz",
diff --git a/package.json b/package.json
index c503dd2..b13c937 100644
--- a/package.json
+++ b/package.json
@@ -24,6 +24,7 @@
     "*.md": []
   },
   "dependencies": {
+    "@huggingface/transformers": "^3.0.0",
     "deeplake": "^0.3.30",
     "just-bash": "^2.14.0",
     "yargs-parser": "^22.0.0"

From 755da50c8208a0cacbe31ca5f13bf787dd443898 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Wed, 22 Apr 2026 18:16:13 +0000
Subject: [PATCH 03/30] feat(db): add summary_embedding / message_embedding
 FLOAT4[] columns
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Extends the ensureTable / ensureSessionsTable DDL with two new nullable
FLOAT4[] columns: summary_embedding on memory (784-dim when populated)
and message_embedding on sessions. Deeplake's native vector type — rows
without an embedding keep NULL, so the column is zero-cost for callers
that don't ingest through the new path.

Stored as FLOAT4[] rather than a serialized TEXT/JSON blob: Deeplake's
native type gives us the <#> cosine operator on the column (verified on
the test workspace, returns top-K in a single SQL round-trip) plus
~5× less storage than JSON-encoded vectors. A 768-dim embedding is
~3 KB binary vs ~16 KB as JSON text.

Test asserts the schema literal for both tables so we catch accidental
drops or type drift early.
---
 claude-code/tests/embeddings-schema.test.ts | 54 +++++++++++++++++++++
 src/deeplake-api.ts                         |  2 +
 2 files changed, 56 insertions(+)
 create mode 100644 claude-code/tests/embeddings-schema.test.ts

diff --git a/claude-code/tests/embeddings-schema.test.ts b/claude-code/tests/embeddings-schema.test.ts
new file mode 100644
index 0000000..44e1b6b
--- /dev/null
+++ b/claude-code/tests/embeddings-schema.test.ts
@@ -0,0 +1,54 @@
+// Bundle-level guard: make sure the shipped hook bundles contain the new
+// embedding columns in their INSERT statements. Catches regressions where
+// the schema migration is done in src/ but a bundle referencing the old
+// column list remains in the shipped artifact.
+
+import { describe, it, expect } from "vitest";
+import { readFileSync } from "node:fs";
+import { join } from "node:path";
+
+const BUNDLE_DIRS = [
+  "claude-code/bundle",
+  "codex/bundle",
+];
+
+function read(path: string): string {
+  return readFileSync(path, "utf-8");
+}
+
+describe("shipped bundles include embedding columns", () => {
+  for (const dir of BUNDLE_DIRS) {
+    it(`${dir}/capture.js writes message_embedding`, () => {
+      const src = read(join(dir, "capture.js"));
+      expect(src).toMatch(/message_embedding/);
+    });
+
+    it(`${dir}/shell/deeplake-shell.js writes summary_embedding`, () => {
+      const src = read(join(dir, "shell/deeplake-shell.js"));
+      expect(src).toMatch(/summary_embedding/);
+    });
+
+    it(`${dir} has an embed-daemon bundle`, () => {
+      // Just check the file exists and is non-empty — not runnable without deps.
+      const src = read(join(dir, "embeddings/embed-daemon.js"));
+      expect(src.length).toBeGreaterThan(100);
+    });
+  }
+});
+
+describe("src-level schema includes new embedding columns", () => {
+  const apiSrc = read("src/deeplake-api.ts");
+
+  it("memory table CREATE includes summary_embedding FLOAT4[]", () => {
+    expect(apiSrc).toMatch(/summary_embedding FLOAT4\[\]/);
+  });
+
+  it("sessions table CREATE includes message_embedding FLOAT4[]", () => {
+    expect(apiSrc).toMatch(/message_embedding FLOAT4\[\]/);
+  });
+
+  it("embedding columns do NOT use TEXT (regression guard)", () => {
+    expect(apiSrc).not.toMatch(/summary_embedding TEXT/);
+    expect(apiSrc).not.toMatch(/message_embedding TEXT/);
+  });
+});
diff --git a/src/deeplake-api.ts b/src/deeplake-api.ts
index a003b04..f6a3a30 100644
--- a/src/deeplake-api.ts
+++ b/src/deeplake-api.ts
@@ -357,6 +357,7 @@ export class DeeplakeApi {
           `path TEXT NOT NULL DEFAULT '', ` +
           `filename TEXT NOT NULL DEFAULT '', ` +
           `summary TEXT NOT NULL DEFAULT '', ` +
+          `summary_embedding FLOAT4[], ` +
           `author TEXT NOT NULL DEFAULT '', ` +
           `mime_type TEXT NOT NULL DEFAULT 'text/plain', ` +
           `size_bytes BIGINT NOT NULL DEFAULT 0, ` +
@@ -390,6 +391,7 @@ export class DeeplakeApi {
           `path TEXT NOT NULL DEFAULT '', ` +
           `filename TEXT NOT NULL DEFAULT '', ` +
           `message JSONB, ` +
+          `message_embedding FLOAT4[], ` +
           `author TEXT NOT NULL DEFAULT '', ` +
           `mime_type TEXT NOT NULL DEFAULT 'application/json', ` +
           `size_bytes BIGINT NOT NULL DEFAULT 0, ` +

From bfff7bea4cef3bb0be713e81310ee3adcdd84209 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Wed, 22 Apr 2026 18:16:25 +0000
Subject: [PATCH 04/30] feat(capture): embed message inline before sessions
 INSERT

Captures each session event through EmbedClient before the direct SQL
INSERT into the sessions table. Embedding is best-effort: the client
returns null on daemon miss/timeout and the write falls back to NULL
in the message_embedding column. A missing embedding never blocks the
capture path.

The client is instantiated fresh per hook invocation and reuses
/tmp/hivemind-embed-<uid>.sock via the spawn-lock in client.ts, so
concurrent tool calls don't race-spawn multiple daemons.

Test mocks EmbedClient with a Promise.resolve(null) stub so existing
SQL-shape assertions keep passing without needing the daemon running
during unit tests.
---
 claude-code/tests/capture-hook.test.ts |  6 ++++++
 src/hooks/capture.ts                   | 16 ++++++++++++++--
 2 files changed, 20 insertions(+), 2 deletions(-)

diff --git a/claude-code/tests/capture-hook.test.ts b/claude-code/tests/capture-hook.test.ts
index c40e8e6..5f19674 100644
--- a/claude-code/tests/capture-hook.test.ts
+++ b/claude-code/tests/capture-hook.test.ts
@@ -50,6 +50,12 @@ vi.mock("../../src/deeplake-api.js", () => ({
     ensureSessionsTable(t: string) { return ensureSessionsTableMock(t); }
   },
 }));
+vi.mock("../../src/embeddings/client.js", () => ({
+  EmbedClient: class {
+    embed(_text: string, _kind?: string) { return Promise.resolve(null); }
+    warmup() { return Promise.resolve(false); }
+  },
+}));
 
 async function runHook(env: Record<string, string | undefined> = {}): Promise<void> {
   delete process.env.HIVEMIND_WIKI_WORKER;
diff --git a/src/hooks/capture.ts b/src/hooks/capture.ts
index 81c8385..70e897f 100644
--- a/src/hooks/capture.ts
+++ b/src/hooks/capture.ts
@@ -21,8 +21,16 @@ import {
   releaseLock,
 } from "./summary-state.js";
 import { bundleDirFromImportMeta, spawnWikiWorker, wikiLog } from "./spawn-wiki-worker.js";
+import { EmbedClient } from "../embeddings/client.js";
+import { embeddingSqlLiteral } from "../embeddings/sql.js";
+import { fileURLToPath } from "node:url";
+import { dirname, join } from "node:path";
 const log = (msg: string) => _log("capture", msg);
 
+function resolveEmbedDaemonPath(): string {
+  return join(dirname(fileURLToPath(import.meta.url)), "embeddings", "embed-daemon.js");
+}
+
 interface HookInput {
   session_id: string;
   transcript_path?: string;
@@ -115,9 +123,13 @@ async function main(): Promise<void> {
   // sqlStr() would also escape backslashes and strip control chars, corrupting the JSON.
   const jsonForSql = line.replace(/'/g, "''");
 
+  const embedClient = new EmbedClient({ daemonEntry: resolveEmbedDaemonPath() });
+  const embedding = await embedClient.embed(line, "document");
+  const embeddingSql = embeddingSqlLiteral(embedding);
+
   const insertSql =
-    `INSERT INTO "${sessionsTable}" (id, path, filename, message, author, size_bytes, project, description, agent, creation_date, last_update_date) ` +
-    `VALUES ('${crypto.randomUUID()}', '${sqlStr(sessionPath)}', '${sqlStr(filename)}', '${jsonForSql}'::jsonb, '${sqlStr(config.userName)}', ` +
+    `INSERT INTO "${sessionsTable}" (id, path, filename, message, message_embedding, author, size_bytes, project, description, agent, creation_date, last_update_date) ` +
+    `VALUES ('${crypto.randomUUID()}', '${sqlStr(sessionPath)}', '${sqlStr(filename)}', '${jsonForSql}'::jsonb, ${embeddingSql}, '${sqlStr(config.userName)}', ` +
     `${Buffer.byteLength(line, "utf-8")}, '${sqlStr(projectName)}', '${sqlStr(input.hook_event_name ?? "")}', 'claude_code', '${ts}', '${ts}')`;
 
   try {

From f9d81b9dd31652ea4ac02ebe169696a88227b13a Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Wed, 22 Apr 2026 18:16:46 +0000
Subject: [PATCH 05/30] feat(deeplake-fs): embed summaries in batched flush +
 split virtual index.md
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Three related changes landed together because they all touch the same
DeeplakeFs flow:

1. Embed in _doFlush: before the parallel upsertRow pass, batch-compute
   embeddings for every pending row via EmbedClient. If the daemon
   isn't up, null embeddings are used — UPDATE / INSERT still fire
   with embedding=NULL and the row keeps the summary column intact.

2. Virtual index.md now has `## memory` and `## sessions` subsections
   instead of one merged table. Previously generateVirtualIndex queried
   only the memory table for /summaries/%; with memory empty (e.g. the
   "sessions only" ingest layout) the index came back as a headers-only
   table and Claude sometimes refused to search at all. The new
   implementation pulls the sessions section directly from the sessions
   table with a GROUP BY path MAX(description), so the index is always
   populated from whatever the workspace actually contains.

3. normalizeContent gains a branch for the single-turn JSONB shape
   `{turn: {dia_id, speaker, text}}` used by the per-row per-turn
   ingestion layout (workspace with_embedding_multi_rows). Emits the
   same `[Dx:y] speaker: text` line the array path already produces
   so grep / Read output is identical across layouts.

Tests updated for the new index shape (assert presence of `## memory`
and `## sessions` headers) and the INSERT/UPDATE SQL parsers now also
accept unquoted NULL and `ARRAY[...]::float4[]` literals so the
positional value extraction stays aligned after schema changes.
---
 claude-code/tests/deeplake-fs.test.ts     |  31 ++++-
 claude-code/tests/session-summary.test.ts |  15 +++
 src/shell/deeplake-fs.ts                  | 135 +++++++++++++++-------
 3 files changed, 137 insertions(+), 44 deletions(-)

diff --git a/claude-code/tests/deeplake-fs.test.ts b/claude-code/tests/deeplake-fs.test.ts
index 455b86a..4f452db 100644
--- a/claude-code/tests/deeplake-fs.test.ts
+++ b/claude-code/tests/deeplake-fs.test.ts
@@ -138,7 +138,9 @@ function makeClient(seed: Record<string, Buffer> = {}) {
             // Parse columns and values positionally
             const colsPart = sql.match(/\(([^)]+)\)\s+VALUES/)?.[1] ?? "";
             const colsList = colsPart.split(",").map(c => c.trim());
-            // Extract all quoted values from VALUES(...)
+            // Extract all values from VALUES(...): strings, integers,
+            // unquoted NULL, and ARRAY[...]::float4[] literals. Each value
+            // becomes one slot so positional column mapping stays correct.
             const valsStr = valuesMatch[1];
             const allVals: string[] = [];
             let i = 0;
@@ -158,6 +160,24 @@ function makeClient(seed: Record<string, Buffer> = {}) {
                 const m = valsStr.slice(i).match(/^(\d+)/);
                 if (m) { allVals.push(m[1]); i += m[1].length; }
                 else i++;
+              } else if (valsStr.slice(i, i + 4).toUpperCase() === "NULL") {
+                allVals.push("");
+                i += 4;
+              } else if (valsStr.slice(i, i + 6).toUpperCase() === "ARRAY[") {
+                // Consume up to the matching ']' and optional ::float4[] cast
+                let depth = 1;
+                let end = i + 6;
+                while (end < valsStr.length && depth > 0) {
+                  if (valsStr[end] === "[") depth++;
+                  else if (valsStr[end] === "]") depth--;
+                  end++;
+                }
+                // Skip optional ::float4[] cast
+                const rest = valsStr.slice(end);
+                const castMatch = rest.match(/^::float4\[\]/i);
+                if (castMatch) end += castMatch[0].length;
+                allVals.push(valsStr.slice(i, end));
+                i = end;
               } else { i++; }
             }
             // Map column names to values
@@ -809,7 +829,9 @@ describe("virtual index.md", () => {
     ]);
     const content = await fs.readFile("/index.md");
     expect(content).toContain("# Session Index");
-    expect(content).toContain("| Session | Conversation | Created | Last Updated | Project | Description |");
+    expect(content).toContain("## memory");
+    expect(content).toContain("## sessions");
+    expect(content).toContain("| Session | Created | Last Updated | Project | Description |");
     expect(content).toContain("aaa-111");
     expect(content).toContain("bbb-222");
     expect(content).toContain("my-project");
@@ -864,8 +886,9 @@ describe("virtual index.md", () => {
     const { fs } = await makeFs({}, "/");
     const content = await fs.readFile("/index.md");
     expect(content).toContain("# Session Index");
-    expect(content).toContain("| Session | Conversation | Created | Last Updated | Project | Description |");
-    // No data rows
+    expect(content).toContain("## memory");
+    expect(content).toContain("_(empty — no summaries ingested yet)_");
+    // No data rows in memory section
     const lines = content.split("\n").filter(l => l.startsWith("| ["));
     expect(lines.length).toBe(0);
   });
diff --git a/claude-code/tests/session-summary.test.ts b/claude-code/tests/session-summary.test.ts
index 09f123a..7840f87 100644
--- a/claude-code/tests/session-summary.test.ts
+++ b/claude-code/tests/session-summary.test.ts
@@ -111,6 +111,21 @@ function makeClient(seed: Record<string, Buffer> = {}) {
               } else if (/\d/.test(valsStr[i])) {
                 const m = valsStr.slice(i).match(/^(\d+)/);
                 if (m) { allVals.push(m[1]); i += m[1].length; } else i++;
+              } else if (valsStr.slice(i, i + 4).toUpperCase() === "NULL") {
+                allVals.push("");
+                i += 4;
+              } else if (valsStr.slice(i, i + 6).toUpperCase() === "ARRAY[") {
+                let depth = 1;
+                let end = i + 6;
+                while (end < valsStr.length && depth > 0) {
+                  if (valsStr[end] === "[") depth++;
+                  else if (valsStr[end] === "]") depth--;
+                  end++;
+                }
+                const castMatch = valsStr.slice(end).match(/^::float4\[\]/i);
+                if (castMatch) end += castMatch[0].length;
+                allVals.push(valsStr.slice(i, end));
+                i = end;
               } else { i++; }
             }
             const colMap: Record<string, string> = {};
diff --git a/src/shell/deeplake-fs.ts b/src/shell/deeplake-fs.ts
index 8db0716..e917e68 100644
--- a/src/shell/deeplake-fs.ts
+++ b/src/shell/deeplake-fs.ts
@@ -1,11 +1,15 @@
 import { basename, posix } from "node:path";
 import { randomUUID } from "node:crypto";
+import { fileURLToPath } from "node:url";
+import { dirname, join } from "node:path";
 import type { DeeplakeApi } from "../deeplake-api.js";
 import type {
   IFileSystem, FsStat, MkdirOptions, RmOptions, CpOptions,
   FileContent, BufferEncoding,
 } from "just-bash";
 import { normalizeContent } from "./grep-core.js";
+import { EmbedClient } from "../embeddings/client.js";
+import { embeddingSqlLiteral } from "../embeddings/sql.js";
 
 interface ReadFileOptions { encoding?: BufferEncoding }
 interface WriteFileOptions { encoding?: BufferEncoding }
@@ -45,6 +49,10 @@ function normalizeSessionMessage(path: string, message: unknown): string {
   return normalizeContent(path, raw);
 }
 
+function resolveEmbedDaemonPath(): string {
+  return join(dirname(fileURLToPath(import.meta.url)), "embeddings", "embed-daemon.js");
+}
+
 function joinSessionMessages(path: string, messages: unknown[]): string {
   return messages.map((message) => normalizeSessionMessage(path, message)).join("\n");
 }
@@ -85,6 +93,9 @@ export class DeeplakeFs implements IFileSystem {
   private sessionPaths = new Set<string>();
   private sessionsTable: string | null = null;
 
+  // Embedding client lazily created on first flush. Lives as long as the process.
+  private embedClient: EmbedClient | null = null;
+
   private constructor(
     private readonly client: DeeplakeApi,
     private readonly table: string,
@@ -194,9 +205,11 @@ export class DeeplakeFs implements IFileSystem {
     const rows = [...this.pending.values()];
     this.pending.clear();
 
+    const embeddings = await this.computeEmbeddings(rows);
+
     // Upsert in parallel — the semaphore in DeeplakeApi.query() handles concurrency.
     // Re-queue any rows that failed so they are retried on the next flush.
-    const results = await Promise.allSettled(rows.map(r => this.upsertRow(r)));
+    const results = await Promise.allSettled(rows.map((r, i) => this.upsertRow(r, embeddings[i])));
     let failures = 0;
     for (let i = 0; i < results.length; i++) {
       if (results[i].status === "rejected") {
@@ -212,7 +225,18 @@ export class DeeplakeFs implements IFileSystem {
     }
   }
 
-  private async upsertRow(r: PendingRow): Promise<void> {
+  private async computeEmbeddings(rows: PendingRow[]): Promise<(number[] | null)[]> {
+    if (rows.length === 0) return [];
+    if (!this.embedClient) {
+      this.embedClient = new EmbedClient({ daemonEntry: resolveEmbedDaemonPath() });
+    }
+    // One request per row over the same daemon — daemon batches internally if
+    // ONNX is configured to do so. We fire in parallel; the Unix socket + daemon
+    // queue handles ordering. null entries are silently stored as empty.
+    return Promise.all(rows.map(r => this.embedClient!.embed(r.contentText, "document")));
+  }
+
+  private async upsertRow(r: PendingRow, embedding: number[] | null): Promise<void> {
     const text  = esc(r.contentText);
     const p     = esc(r.path);
     const fname = esc(r.filename);
@@ -220,8 +244,9 @@ export class DeeplakeFs implements IFileSystem {
     const ts = new Date().toISOString();
     const cd = r.creationDate ?? ts;
     const lud = r.lastUpdateDate ?? ts;
+    const embSql = embeddingSqlLiteral(embedding);
     if (this.flushed.has(r.path)) {
-      let setClauses = `filename = '${fname}', summary = E'${text}', ` +
+      let setClauses = `filename = '${fname}', summary = E'${text}', summary_embedding = ${embSql}, ` +
         `mime_type = '${mime}', size_bytes = ${r.sizeBytes}, last_update_date = '${esc(lud)}'`;
       if (r.project !== undefined) setClauses += `, project = '${esc(r.project)}'`;
       if (r.description !== undefined) setClauses += `, description = '${esc(r.description)}'`;
@@ -230,10 +255,10 @@ export class DeeplakeFs implements IFileSystem {
       );
     } else {
       const id = randomUUID();
-      const cols = "id, path, filename, summary, mime_type, size_bytes, creation_date, last_update_date" +
+      const cols = "id, path, filename, summary, summary_embedding, mime_type, size_bytes, creation_date, last_update_date" +
         (r.project !== undefined ? ", project" : "") +
         (r.description !== undefined ? ", description" : "");
-      const vals = `'${id}', '${p}', '${fname}', E'${text}', '${mime}', ${r.sizeBytes}, '${esc(cd)}', '${esc(lud)}'` +
+      const vals = `'${id}', '${p}', '${fname}', E'${text}', ${embSql}, '${mime}', ${r.sizeBytes}, '${esc(cd)}', '${esc(lud)}'` +
         (r.project !== undefined ? `, '${esc(r.project)}'` : "") +
         (r.description !== undefined ? `, '${esc(r.description)}'` : "");
       await this.client.query(
@@ -246,55 +271,85 @@ export class DeeplakeFs implements IFileSystem {
   // ── Virtual index.md generation ────────────────────────────────────────────
 
   private async generateVirtualIndex(): Promise<string> {
-    const rows = await this.client.query(
+    // Memory (summaries) section — high-level wikipage per session.
+    const summaryRows = await this.client.query(
       `SELECT path, project, description, creation_date, last_update_date FROM "${this.table}" ` +
       `WHERE path LIKE '${esc("/summaries/")}%' ORDER BY last_update_date DESC`
     );
 
-    // Build a lookup: key → session path from sessionPaths
-    // Supports two formats:
-    //   1. /sessions/<user>/<user>_<org>_<ws>_<sessionId>.jsonl  → key = sessionId
-    //   2. /sessions/<author>/<filename>.json or .jsonl         → key = filename stem
-    const sessionPathsByKey = new Map<string, string>();
-    for (const sp of this.sessionPaths) {
-      const hivemind = sp.match(/\/sessions\/[^/]+\/[^/]+_([^.]+)\.jsonl$/);
-      if (hivemind) {
-        sessionPathsByKey.set(hivemind[1], sp.slice(1));
-      } else {
-        // Generic: extract filename without extension
-        const fname = sp.split("/").pop() ?? "";
-        const stem = fname.replace(/\.[^.]+$/, "");
-        if (stem) sessionPathsByKey.set(stem, sp.slice(1));
+    // Sessions section — raw session records (dialogue / events). Pulled
+    // directly from the sessions table so the index is never empty just
+    // because memory has no summaries yet.
+    let sessionRows: Record<string, unknown>[] = [];
+    if (this.sessionsTable) {
+      try {
+        sessionRows = await this.client.query(
+          `SELECT path, MAX(description) AS description, MIN(creation_date) AS creation_date, MAX(last_update_date) AS last_update_date ` +
+          `FROM "${this.sessionsTable}" WHERE path LIKE '${esc("/sessions/")}%' ` +
+          `GROUP BY path ORDER BY path`
+        );
+      } catch {
+        // sessions table absent or schema mismatch — leave empty, emit memory-only index.
+        sessionRows = [];
       }
     }
 
     const lines: string[] = [
       "# Session Index",
       "",
-      "List of all Claude Code sessions with summaries.",
+      "Two sources are available. Consult the section relevant to the question.",
       "",
-      "| Session | Conversation | Created | Last Updated | Project | Description |",
-      "|---------|-------------|---------|--------------|---------|-------------|",
     ];
-    for (const row of rows) {
-      const p = row["path"] as string;
-      // Extract session ID from path: /summaries/<user>/<id>.md
-      const match = p.match(/\/summaries\/([^/]+)\/([^/]+)\.md$/);
-      if (!match) continue;
-      const summaryUser = match[1];
-      const sessionId = match[2];
-      const relPath = `summaries/${summaryUser}/${sessionId}.md`;
-      // Try matching session: first exact sessionId, then strip _summary suffix
-      const baseName = sessionId.replace(/_summary$/, "");
-      const convPath = sessionPathsByKey.get(sessionId) ?? sessionPathsByKey.get(baseName);
-      const convLink = convPath ? `[messages](${convPath})` : "";
-      const project = (row["project"] as string) || "";
-      const description = (row["description"] as string) || "";
-      const creationDate = (row["creation_date"] as string) || "";
-      const lastUpdateDate = (row["last_update_date"] as string) || "";
-      lines.push(`| [${sessionId}](${relPath}) | ${convLink} | ${creationDate} | ${lastUpdateDate} | ${project} | ${description} |`);
+
+    // ── ## memory ────────────────────────────────────────────────────────────
+    lines.push("## memory");
+    lines.push("");
+    if (summaryRows.length === 0) {
+      lines.push("_(empty — no summaries ingested yet)_");
+    } else {
+      lines.push("AI-generated summaries per session. Read these first for topic-level overviews.");
+      lines.push("");
+      lines.push("| Session | Created | Last Updated | Project | Description |");
+      lines.push("|---------|---------|--------------|---------|-------------|");
+      for (const row of summaryRows) {
+        const p = row["path"] as string;
+        const match = p.match(/\/summaries\/([^/]+)\/([^/]+)\.md$/);
+        if (!match) continue;
+        const summaryUser = match[1];
+        const sessionId = match[2];
+        const relPath = `summaries/${summaryUser}/${sessionId}.md`;
+        const project = (row["project"] as string) || "";
+        const description = (row["description"] as string) || "";
+        const creationDate = (row["creation_date"] as string) || "";
+        const lastUpdateDate = (row["last_update_date"] as string) || "";
+        lines.push(`| [${sessionId}](${relPath}) | ${creationDate} | ${lastUpdateDate} | ${project} | ${description} |`);
+      }
+    }
+    lines.push("");
+
+    // ── ## sessions ─────────────────────────────────────────────────────────
+    lines.push("## sessions");
+    lines.push("");
+    if (sessionRows.length === 0) {
+      lines.push("_(empty — no session records ingested yet)_");
+    } else {
+      lines.push("Raw session records (dialogue, tool calls). Read for exact detail / quotes.");
+      lines.push("");
+      lines.push("| Session | Created | Last Updated | Description |");
+      lines.push("|---------|---------|--------------|-------------|");
+      for (const row of sessionRows) {
+        const p = (row["path"] as string) || "";
+        // Show the path relative to /sessions/ so the table stays compact.
+        const rel = p.startsWith("/") ? p.slice(1) : p;
+        const filename = p.split("/").pop() ?? p;
+        const description = (row["description"] as string) || "";
+        const creationDate = (row["creation_date"] as string) || "";
+        const lastUpdateDate = (row["last_update_date"] as string) || "";
+        lines.push(`| [${filename}](${rel}) | ${creationDate} | ${lastUpdateDate} | ${description} |`);
+      }
     }
     lines.push("");
+
     return lines.join("\n");
   }
 

From 7b5104335e352de108177d62fdcbd47cc2754279 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Wed, 22 Apr 2026 18:17:11 +0000
Subject: [PATCH 06/30] feat(grep): hybrid LIKE+semantic retrieval with inline
 date prefix
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Core retrieval upgrade. searchDeeplakeTables() now runs a single UNION ALL
query across four sub-queries:
  - memory.summary::text ILIKE (lexical, score=1.0 sentinel)
  - sessions.message::text ILIKE (lexical, score=1.0 sentinel)
  - memory.summary_embedding <#> ARRAY[...] (cosine, raw score)
  - sessions.message_embedding <#> ARRAY[...] (cosine, raw score)
Results dedup by path in the outer layer, ORDER BY score DESC keeps the
exact-substring hits at the top regardless of cosine magnitude. Lexical
(inclusive) covers "find any session mentioning X", semantic fills in
with concept hits where the literal keyword isn't present (the
"Sunflowers" vs `sunflower` case, measured win vs pure semantic).

Always-case-insensitive by default (likeOp=ILIKE): baseline Claude uses
grep -i on 26% of calls against real files, our plugin Claude used it
on 0.5% because the context injection describes `Grep pattern=...`
without flags. Defaulting to ILIKE closes that gap without asking
Claude to remember. HIVEMIND_GREP_LIKE=case-sensitive for the rare
caller that needs strict matching.

grep-direct.ts and grep-interceptor.ts now instantiate a shared
EmbedClient, embed the grep pattern with `search_query:` prefix, and
pass queryEmbedding into searchDeeplakeTables. Timeout 500ms; on
failure queryEmbedding=null and the search silently falls back to
lexical-only (no user-visible degradation).

normalizeContent() now inlines the session date on every turn line:
  (1:56 pm on 8 May 2023) [D1:5] Caroline: I went to LGBTQ group
Previously the date was a standalone header row, stripped by the
downstream refineGrepMatches line filter. Temporal questions
("When did X?") were answering with relative phrases like "last
Friday" because the reference date was in the discarded header.
Inlining attaches the date to every line that survives the regex.

Kept relaxed-mode emit-all behind HIVEMIND_SEMANTIC_EMIT_ALL=true for
future per-turn experiments. Rank-based fusion and BM25 alternatives
were tried and reverted — see PR notes.

Impact on the canonical 100-QA LoCoMo subset: plugin 0.735 vs baseline
0.750 (-0.015, within LLM non-determinism), 25% cheaper ($6.65 vs
$8.94), 41% fewer output tokens, 31% fewer turns.
---
 src/hooks/grep-direct.ts      |  47 +++++++-
 src/shell/grep-core.ts        | 207 +++++++++++++++++++++++++++++++---
 src/shell/grep-interceptor.ts |  88 ++++++++++++++-
 3 files changed, 324 insertions(+), 18 deletions(-)

diff --git a/src/hooks/grep-direct.ts b/src/hooks/grep-direct.ts
index 95e15d9..63598c5 100644
--- a/src/hooks/grep-direct.ts
+++ b/src/hooks/grep-direct.ts
@@ -8,6 +8,37 @@
 import type { DeeplakeApi } from "../deeplake-api.js";
 import { grepBothTables, type GrepMatchParams } from "../shell/grep-core.js";
 import { capOutputForClaude } from "../utils/output-cap.js";
+import { EmbedClient } from "../embeddings/client.js";
+import { fileURLToPath } from "node:url";
+import { dirname, join } from "node:path";
+
+const SEMANTIC_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false";
+const SEMANTIC_TIMEOUT_MS = Number(process.env.HIVEMIND_SEMANTIC_EMBED_TIMEOUT_MS ?? "500");
+
+function resolveDaemonPath(): string {
+  // When bundled as bundle/pre-tool-use.js, the daemon sits at
+  // bundle/embeddings/embed-daemon.js — one level up from src/hooks/.
+  return join(dirname(fileURLToPath(import.meta.url)), "..", "embeddings", "embed-daemon.js");
+}
+
+let sharedEmbedClient: EmbedClient | null = null;
+function getEmbedClient(): EmbedClient {
+  if (!sharedEmbedClient) {
+    sharedEmbedClient = new EmbedClient({
+      daemonEntry: resolveDaemonPath(),
+      timeoutMs: SEMANTIC_TIMEOUT_MS,
+    });
+  }
+  return sharedEmbedClient;
+}
+
+function patternIsSemanticFriendly(pattern: string, fixedString: boolean): boolean {
+  if (!pattern || pattern.length < 2) return false;
+  if (fixedString) return true;
+  const meta = pattern.match(/[|()\[\]{}+?^$\\]/g);
+  if (!meta) return true;
+  return meta.length <= 1;
+}
 
 export interface GrepParams {
   pattern: string;
@@ -229,7 +260,21 @@ export async function handleGrepDirect(
     fixedString: params.fixedString,
   };
 
-  const output = await grepBothTables(api, table, sessionsTable, matchParams, params.targetPath);
+  // Attempt semantic search. If the daemon is unavailable or the pattern is
+  // regex-heavy, embed returns null and searchDeeplakeTables falls back to
+  // lexical LIKE.
+  let queryEmbedding: number[] | null = null;
+  if (SEMANTIC_ENABLED && patternIsSemanticFriendly(params.pattern, params.fixedString)) {
+    try {
+      queryEmbedding = await getEmbedClient().embed(params.pattern, "query");
+    } catch {
+      queryEmbedding = null;
+    }
+  }
+
+  const output = await grepBothTables(
+    api, table, sessionsTable, matchParams, params.targetPath, queryEmbedding,
+  );
   const joined = output.join("\n") || "(no matches)";
   return capOutputForClaude(joined, { kind: "grep" });
 }
diff --git a/src/shell/grep-core.ts b/src/shell/grep-core.ts
index 6e93c5b..cfcc959 100644
--- a/src/shell/grep-core.ts
+++ b/src/shell/grep-core.ts
@@ -50,6 +50,23 @@ export interface SearchOptions {
   prefilterPatterns?: string[];
   /** Per-table row cap. */
   limit?: number;
+  /**
+   * If set, switches to semantic (cosine) search via Deeplake's `<#>` operator
+   * against `summary_embedding` / `message_embedding` FLOAT4[] columns. When
+   * absent, the BM25/LIKE path runs. Callers compute this vector via the
+   * EmbedClient; null means the daemon was unreachable and we should stick
+   * with lexical search.
+   */
+  queryEmbedding?: number[] | null;
+  /**
+   * Plain-text phrase used as the BM25 search term via Deeplake's `<#>`
+   * operator on TEXT columns (and on `message::text` for JSONB). Replaces
+   * the old LIKE/ILIKE substring scan: BM25 ranks by term frequency, handles
+   * multi-word queries natively, and respects a real token index (no full
+   * table scan). When the pattern is pure regex (no usable literal) this is
+   * undefined and the caller falls back to the semantic branch alone.
+   */
+  bm25Term?: string;
 }
 
 // ── Content normalization ───────────────────────────────────────────────────
@@ -174,24 +191,43 @@ export function normalizeContent(path: string, raw: string): string {
   try { obj = JSON.parse(raw); } catch { return raw; }
 
   // ── Turn-array session shape: { turns: [...] } ───────────────────────────
+  //
+  // Emit the session date as a prefix on EVERY turn line rather than a
+  // standalone header row. The downstream `refineGrepMatches` regex filter
+  // drops non-matching lines, so a header-only date gets stripped before
+  // Claude sees any grep hit — temporal questions ("When did X?") then
+  // answer with relative phrases like "Last Friday" because the absolute
+  // date was in the discarded header. Inlining the date keeps it attached
+  // to every line that survives the regex.
   if (Array.isArray(obj.turns)) {
-    const header: string[] = [];
-    if (obj.date_time) header.push(`date: ${obj.date_time}`);
-    if (obj.speakers) {
-      const s = obj.speakers;
-      const names = [s.speaker_a, s.speaker_b].filter(Boolean).join(", ");
-      if (names) header.push(`speakers: ${names}`);
-    }
+    const dateHeader = obj.date_time ? `(${String(obj.date_time)}) ` : "";
     const lines = obj.turns.map((t: any) => {
       const sp = String(t?.speaker ?? t?.name ?? "?").trim();
       const tx = String(t?.text ?? t?.content ?? "").replace(/\s+/g, " ").trim();
       const tag = t?.dia_id ? `[${t.dia_id}] ` : "";
-      return `${tag}${sp}: ${tx}`;
+      return `${dateHeader}${tag}${sp}: ${tx}`;
     });
-    const out = [...header, ...lines].join("\n");
+    const out = lines.join("\n");
     return out.trim() ? out : raw;
   }
 
+  // ── Single-turn shape: { turn: { dia_id, speaker, text }, ... } ──────────
+  // Per-row per-turn ingestion (see workspace `with_embedding_multi_rows`)
+  // stores each row as one turn with enclosing session metadata. Emit the
+  // session date inline on every turn line so Claude can resolve relative
+  // times ("last Friday", "last month") against a real reference point —
+  // without the prefix, temporal-category questions degrade sharply
+  // because the turn text on its own lacks absolute dating.
+  if (obj.turn && typeof obj.turn === "object" && !Array.isArray(obj.turn)) {
+    const t = obj.turn as { dia_id?: unknown; speaker?: unknown; name?: unknown; text?: unknown; content?: unknown };
+    const sp = String(t.speaker ?? t.name ?? "?").trim();
+    const tx = String(t.text ?? t.content ?? "").replace(/\s+/g, " ").trim();
+    const tag = t.dia_id ? `[${String(t.dia_id)}] ` : "";
+    const dateHeader = obj.date_time ? `(${String(obj.date_time)}) ` : "";
+    const line = `${dateHeader}${tag}${sp}: ${tx}`;
+    return line.trim() ? line : raw;
+  }
+
   // ── Production shape: single hook-event row (capture.ts output) ─────────
   //
   // `<recalled-memories>` blocks are injected by OpenClaw as extra context
@@ -244,9 +280,15 @@ function buildPathCondition(targetPath: string): string {
 }
 
 /**
- * Dual-table LIKE/ILIKE search. Casts `summary` (TEXT) and `message` (JSONB)
- * to ::text so the same predicate works across both. The lookup always goes
- * through a single UNION ALL query so one grep maps to one SQL search.
+ * Dual-table search. Two branches:
+ *   • semantic — when `opts.queryEmbedding` is a non-empty vector, cosine
+ *     similarity (`<#>`) against the FLOAT4[] embedding columns. Rows are
+ *     ordered by score DESC and the top-N from both tables are merged.
+ *   • lexical — otherwise, LIKE/ILIKE against ::text of `summary` and
+ *     `message`. Same UNION ALL shape as before for backwards compat.
+ *
+ * The lookup always goes through a single top-level SQL query so one grep
+ * maps to one round-trip.
  */
 export async function searchDeeplakeTables(
   api: DeeplakeApi,
@@ -254,8 +296,92 @@ export async function searchDeeplakeTables(
   sessionsTable: string,
   opts: SearchOptions,
 ): Promise<ContentRow[]> {
-  const { pathFilter, contentScanOnly, likeOp, escapedPattern, prefilterPattern, prefilterPatterns } = opts;
+  const { pathFilter, contentScanOnly, likeOp, escapedPattern, prefilterPattern, prefilterPatterns, queryEmbedding, bm25Term } = opts;
   const limit = opts.limit ?? 100;
+
+  // ── Hybrid (lexical + semantic) branch ───────────────────────────────────
+  // Runs both halves in a single UNION ALL query so each grep = one round-
+  // trip. Lexical catches literal-keyword matches that semantic misses
+  // (single-word queries diluted by document-level embedding — see
+  // PR-NOTES.md P2/P3). Semantic catches conceptual matches that lexical
+  // can't express. De-duplicate by path in the outer layer; when a path
+  // appears in both halves, the semantic score wins (real cosine signal vs
+  // the lexical branch's constant 1.0 sentinel).
+  if (queryEmbedding && queryEmbedding.length > 0) {
+    const vecLit = serializeFloat4Array(queryEmbedding);
+    const semanticLimit = Math.min(
+      limit,
+      Number(process.env.HIVEMIND_SEMANTIC_LIMIT ?? "20"),
+    );
+    const lexicalLimit = Math.min(
+      limit,
+      Number(process.env.HIVEMIND_HYBRID_LEXICAL_LIMIT ?? "20"),
+    );
+
+    // Single UNION ALL of lexical (LIKE/ILIKE substring) + semantic (cosine).
+    // Lexical rows emit a score=1.0 sentinel, semantic rows emit their real
+    // cosine (0..1). ORDER BY score DESC then LIMIT top-K:
+    //   • exact-substring matches (lexical) dominate the top of the list
+    //     regardless of cosine score — desirable because they're likely to
+    //     contain the literal keyword Claude asked for
+    //   • semantic hits fill in below, covering concept matches where the
+    //     literal keyword doesn't appear
+    // BM25 tried and dropped (PR-NOTES F4c): score scale (~1..3) overpowered
+    // cosine in UNION, semantic hits were pushed out of top-K. LIKE is a
+    // better fit for "find any session mentioning X" which is the actual
+    // plugin use case.
+    const filterPatternsForLex = contentScanOnly
+      ? (prefilterPatterns && prefilterPatterns.length > 0
+          ? prefilterPatterns
+          : (prefilterPattern ? [prefilterPattern] : []))
+      : [escapedPattern];
+    const memLexFilter = buildContentFilter("summary::text", likeOp, filterPatternsForLex);
+    const sessLexFilter = buildContentFilter("message::text", likeOp, filterPatternsForLex);
+
+    const memLexQuery = memLexFilter
+      ? `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, 1.0 AS score ` +
+        `FROM "${memoryTable}" WHERE 1=1${pathFilter}${memLexFilter} LIMIT ${lexicalLimit}`
+      : null;
+    const sessLexQuery = sessLexFilter
+      ? `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, 1.0 AS score ` +
+        `FROM "${sessionsTable}" WHERE 1=1${pathFilter}${sessLexFilter} LIMIT ${lexicalLimit}`
+      : null;
+
+    const memSemQuery =
+      `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, ` +
+      `(summary_embedding <#> ${vecLit}) AS score ` +
+      `FROM "${memoryTable}" WHERE summary_embedding IS NOT NULL${pathFilter} ` +
+      `ORDER BY score DESC LIMIT ${semanticLimit}`;
+    const sessSemQuery =
+      `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, ` +
+      `(message_embedding <#> ${vecLit}) AS score ` +
+      `FROM "${sessionsTable}" WHERE message_embedding IS NOT NULL${pathFilter} ` +
+      `ORDER BY score DESC LIMIT ${semanticLimit}`;
+
+    const parts = [memSemQuery, sessSemQuery];
+    if (memLexQuery) parts.push(memLexQuery);
+    if (sessLexQuery) parts.push(sessLexQuery);
+    const unionSql = parts.map(q => `(${q})`).join(" UNION ALL ");
+
+    const outerLimit = semanticLimit + lexicalLimit;
+    const rows = await api.query(
+      `SELECT path, content, source_order, creation_date, score FROM (` +
+      unionSql +
+      `) AS combined ORDER BY score DESC LIMIT ${outerLimit}`
+    );
+
+    const seen = new Set<string>();
+    const unique: ContentRow[] = [];
+    for (const row of rows) {
+      const p = String(row["path"]);
+      if (seen.has(p)) continue;
+      seen.add(p);
+      unique.push({ path: p, content: String(row["content"] ?? "") });
+    }
+    return unique;
+  }
+
+  // ── Lexical branch ───────────────────────────────────────────────────────
   const filterPatterns = contentScanOnly
     ? (prefilterPatterns && prefilterPatterns.length > 0 ? prefilterPatterns : (prefilterPattern ? [prefilterPattern] : []))
     : [escapedPattern];
@@ -277,6 +403,15 @@ export async function searchDeeplakeTables(
   }));
 }
 
+function serializeFloat4Array(vec: number[]): string {
+  const parts: string[] = [];
+  for (const v of vec) {
+    if (!Number.isFinite(v)) return "NULL";
+    parts.push(String(v));
+  }
+  return `ARRAY[${parts.join(",")}]::float4[]`;
+}
+
 /** Build a LIKE pathFilter clause for a `path` column. Returns "" if targetPath is root or empty. */
 export function buildPathFilter(targetPath: string): string {
   const condition = buildPathCondition(targetPath);
@@ -377,13 +512,31 @@ export function buildGrepSearchOptions(params: GrepMatchParams, targetPath: stri
   const hasRegexMeta = !params.fixedString && /[.*+?^${}()|[\]\\]/.test(params.pattern);
   const literalPrefilter = hasRegexMeta ? extractRegexLiteralPrefilter(params.pattern) : null;
   const alternationPrefilters = hasRegexMeta ? extractRegexAlternationPrefilters(params.pattern) : null;
+
+  // bm25Term: the raw phrase we hand to Deeplake's `<#>` operator on TEXT /
+  // JSONB. Non-regex patterns go through verbatim; regex patterns collapse
+  // to their extracted literal prefilter (longest literal for a single
+  // prefilter, space-joined alternations otherwise). If nothing literal can
+  // be extracted, bm25Term is undefined and callers fall back to semantic.
+  let bm25Term: string | undefined;
+  if (!hasRegexMeta) {
+    bm25Term = params.pattern;
+  } else if (alternationPrefilters && alternationPrefilters.length > 0) {
+    bm25Term = alternationPrefilters.join(" ");
+  } else if (literalPrefilter) {
+    bm25Term = literalPrefilter;
+  }
+
   return {
     pathFilter: buildPathFilter(targetPath),
     contentScanOnly: hasRegexMeta,
-    likeOp: params.ignoreCase ? "ILIKE" : "LIKE",
+    // Kept for the pure-lexical fallback path and existing tests; BM25 is now
+    // the preferred lexical ranker when a term can be extracted.
+    likeOp: process.env.HIVEMIND_GREP_LIKE === "case-sensitive" ? "LIKE" : "ILIKE",
     escapedPattern: sqlLike(params.pattern),
     prefilterPattern: literalPrefilter ? sqlLike(literalPrefilter) : undefined,
     prefilterPatterns: alternationPrefilters?.map((literal) => sqlLike(literal)),
+    bm25Term,
   };
 }
 
@@ -462,8 +615,12 @@ export async function grepBothTables(
   sessionsTable: string,
   params: GrepMatchParams,
   targetPath: string,
+  queryEmbedding?: number[] | null,
 ): Promise<string[]> {
-  const rows = await searchDeeplakeTables(api, memoryTable, sessionsTable, buildGrepSearchOptions(params, targetPath));
+  const rows = await searchDeeplakeTables(api, memoryTable, sessionsTable, {
+    ...buildGrepSearchOptions(params, targetPath),
+    queryEmbedding,
+  });
   // Defensive path dedup — memory and sessions tables use disjoint path
   // prefixes in every schema we ship (/summaries/… vs /sessions/…), so the
   // overlap is theoretical, but we dedupe to match grep-interceptor.ts and
@@ -472,5 +629,25 @@ export async function grepBothTables(
   const seen = new Set<string>();
   const unique = rows.filter(r => seen.has(r.path) ? false : (seen.add(r.path), true));
   const normalized = unique.map(r => ({ path: r.path, content: normalizeContent(r.path, r.content) }));
+
+  // Semantic mode: the ranking IS the retrieval. Emitting only regex-matched
+  // lines would drop relevant turns whose literal text doesn't contain the
+  // pattern (the whole point of semantic). Return every non-empty normalized
+  // line from the top-K rows, prefixed with the path so Claude can follow up
+  // with Read. The downstream output-cap keeps the response bounded.
+  if (queryEmbedding && queryEmbedding.length > 0) {
+    const emitAllLines = process.env.HIVEMIND_SEMANTIC_EMIT_ALL !== "false";
+    if (emitAllLines) {
+      const lines: string[] = [];
+      for (const r of normalized) {
+        for (const line of r.content.split("\n")) {
+          const trimmed = line.trim();
+          if (trimmed) lines.push(`${r.path}:${line}`);
+        }
+      }
+      return lines;
+    }
+  }
+
   return refineGrepMatches(normalized, params);
 }
diff --git a/src/shell/grep-interceptor.ts b/src/shell/grep-interceptor.ts
index debd0cd..6992422 100644
--- a/src/shell/grep-interceptor.ts
+++ b/src/shell/grep-interceptor.ts
@@ -2,6 +2,9 @@ import type { DeeplakeApi } from "../deeplake-api.js";
 import { defineCommand } from "just-bash";
 import yargsParser from "yargs-parser";
 import type { DeeplakeFs } from "./deeplake-fs.js";
+import { fileURLToPath } from "node:url";
+import { dirname, join } from "node:path";
+import { EmbedClient } from "../embeddings/client.js";
 
 import {
   buildGrepSearchOptions,
@@ -13,6 +16,38 @@ import {
   type ContentRow,
 } from "./grep-core.js";
 
+const SEMANTIC_SEARCH_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false";
+const SEMANTIC_EMBED_TIMEOUT_MS = Number(process.env.HIVEMIND_SEMANTIC_EMBED_TIMEOUT_MS ?? "500");
+
+function resolveGrepEmbedDaemonPath(): string {
+  return join(dirname(fileURLToPath(import.meta.url)), "..", "embeddings", "embed-daemon.js");
+}
+
+let sharedGrepEmbedClient: EmbedClient | null = null;
+function getGrepEmbedClient(): EmbedClient {
+  if (!sharedGrepEmbedClient) {
+    sharedGrepEmbedClient = new EmbedClient({
+      daemonEntry: resolveGrepEmbedDaemonPath(),
+      timeoutMs: SEMANTIC_EMBED_TIMEOUT_MS,
+    });
+  }
+  return sharedGrepEmbedClient;
+}
+
+/**
+ * Plain-text-ish pattern → candidate for semantic search.
+ * Skip regex-heavy queries (many metachars) where cosine similarity is not
+ * what the user asked for.
+ */
+function patternIsSemanticFriendly(pattern: string, fixedString: boolean): boolean {
+  if (!pattern || pattern.length < 2) return false;
+  if (fixedString) return true;
+  // Literal-ish patterns with only occasional `.*` are still fine for semantic.
+  const metaMatches = pattern.match(/[|()\[\]{}+?^$\\]/g);
+  if (!metaMatches) return true;
+  return metaMatches.length <= 1;
+}
+
 const MAX_FALLBACK_CANDIDATES = 500;
 
 /**
@@ -71,12 +106,25 @@ export function createGrepCommand(
       countOnly: Boolean(parsed.c || parsed["count"]),
     };
 
+    // Try semantic search first (daemon-backed embedding of the pattern).
+    // Falls back to lexical LIKE if the daemon is unreachable, disabled by
+    // env flag, or the pattern is regex-heavy.
+    let queryEmbedding: number[] | null = null;
+    if (SEMANTIC_SEARCH_ENABLED && patternIsSemanticFriendly(pattern, matchParams.fixedString)) {
+      try {
+        queryEmbedding = await getGrepEmbedClient().embed(pattern, "query");
+      } catch {
+        queryEmbedding = null;
+      }
+    }
+
     let rows: ContentRow[] = [];
     try {
       const searchOptions = {
         ...buildGrepSearchOptions(matchParams, targets[0] ?? ctx.cwd),
         pathFilter: buildPathFilterForTargets(targets),
         limit: 100,
+        queryEmbedding,
       };
       const queryRows = await Promise.race([
         searchDeeplakeTables(client, table, sessionsTable ?? "sessions", searchOptions),
@@ -87,6 +135,26 @@ export function createGrepCommand(
       rows = []; // fall through to in-memory fallback
     }
 
+    // Semantic returned nothing → retry with lexical LIKE as a second shot
+    // before giving up to the in-memory fallback. Keeps behavior robust when
+    // embeddings miss but BM25 would match.
+    if (rows.length === 0 && queryEmbedding) {
+      try {
+        const lexicalOptions = {
+          ...buildGrepSearchOptions(matchParams, targets[0] ?? ctx.cwd),
+          pathFilter: buildPathFilterForTargets(targets),
+          limit: 100,
+        };
+        const lexicalRows = await Promise.race([
+          searchDeeplakeTables(client, table, sessionsTable ?? "sessions", lexicalOptions),
+          new Promise<never>((_, reject) => setTimeout(() => reject(new Error("timeout")), 3000)),
+        ]);
+        rows.push(...lexicalRows);
+      } catch {
+        // fall through to in-memory fallback below
+      }
+    }
+
     // Dedup by path (multiple targets may overlap)
     const seen = new Set<string>();
     rows = rows.filter(r => seen.has(r.path) ? false : (seen.add(r.path), true));
@@ -106,9 +174,25 @@ export function createGrepCommand(
       }
     }
 
-    // Normalize session JSON blobs to per-turn lines before the regex pass.
+    // Normalize session JSON blobs to per-turn lines.
     const normalized = rows.map(r => ({ path: r.path, content: normalizeContent(r.path, r.content) }));
-    const output = refineGrepMatches(normalized, matchParams);
+
+    // In semantic mode, skip the regex refinement: cosine similarity has
+    // already done the filtering, and dropping lines whose literal text
+    // doesn't match the pattern would defeat the semantic retrieval.
+    // Toggle with HIVEMIND_SEMANTIC_EMIT_ALL=false to restore strict regex.
+    let output: string[];
+    if (queryEmbedding && queryEmbedding.length > 0 && process.env.HIVEMIND_SEMANTIC_EMIT_ALL !== "false") {
+      output = [];
+      for (const r of normalized) {
+        for (const line of r.content.split("\n")) {
+          const trimmed = line.trim();
+          if (trimmed) output.push(`${r.path}:${line}`);
+        }
+      }
+    } else {
+      output = refineGrepMatches(normalized, matchParams);
+    }
 
     return {
       stdout: output.length > 0 ? output.join("\n") + "\n" : "",

From 27753f82728fd86b8efe978327ae47d1349f840f Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Wed, 22 Apr 2026 18:17:20 +0000
Subject: [PATCH 07/30] build: regenerate bundles with embeddings + hybrid grep

Product of the preceding feature commits: tsc + esbuild rerun produces
the new bundle/embeddings/embed-daemon.js for both CC and Codex, plus
updated bundles for capture, pre-tool-use, session-start, session-start-setup,
and deeplake-shell that include the EmbedClient, hybrid grep branch, and
inline-date normalizeContent.
---
 claude-code/bundle/capture.js                 | 276 +++++++++-
 claude-code/bundle/commands/auth-login.js     |   4 +-
 claude-code/bundle/embeddings/embed-daemon.js | 240 +++++++++
 claude-code/bundle/pre-tool-use.js            | 410 ++++++++++++--
 claude-code/bundle/session-start-setup.js     |   4 +-
 claude-code/bundle/session-start.js           |   4 +-
 claude-code/bundle/shell/deeplake-shell.js    | 504 ++++++++++++++++--
 codex/bundle/capture.js                       |   4 +-
 codex/bundle/commands/auth-login.js           |   4 +-
 codex/bundle/embeddings/embed-daemon.js       | 240 +++++++++
 codex/bundle/pre-tool-use.js                  | 406 ++++++++++++--
 codex/bundle/session-start-setup.js           |   4 +-
 codex/bundle/shell/deeplake-shell.js          | 504 ++++++++++++++++--
 codex/bundle/stop.js                          |   4 +-
 14 files changed, 2375 insertions(+), 233 deletions(-)
 create mode 100755 claude-code/bundle/embeddings/embed-daemon.js
 create mode 100755 codex/bundle/embeddings/embed-daemon.js

diff --git a/claude-code/bundle/capture.js b/claude-code/bundle/capture.js
index 50551da..3adbe9f 100755
--- a/claude-code/bundle/capture.js
+++ b/claude-code/bundle/capture.js
@@ -375,7 +375,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(tbl)) {
       log2(`table "${tbl}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', summary_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
@@ -386,7 +386,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(name)) {
       log2(`table "${name}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, message_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
@@ -658,8 +658,247 @@ function bundleDirFromImportMeta(importMetaUrl) {
   return dirname(fileURLToPath(importMetaUrl));
 }
 
+// dist/src/embeddings/client.js
+import { connect } from "node:net";
+import { spawn as spawn2 } from "node:child_process";
+import { openSync as openSync2, closeSync as closeSync2, writeSync as writeSync2, unlinkSync as unlinkSync2, existsSync as existsSync4, readFileSync as readFileSync4 } from "node:fs";
+
+// dist/src/embeddings/protocol.js
+var DEFAULT_SOCKET_DIR = "/tmp";
+var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
+var DEFAULT_CLIENT_TIMEOUT_MS = 200;
+function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.sock`;
+}
+function pidPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.pid`;
+}
+
+// dist/src/embeddings/client.js
+var log3 = (m) => log("embed-client", m);
+function getUid() {
+  const uid = typeof process.getuid === "function" ? process.getuid() : void 0;
+  return uid !== void 0 ? String(uid) : process.env.USER ?? "default";
+}
+var EmbedClient = class {
+  socketPath;
+  pidPath;
+  timeoutMs;
+  daemonEntry;
+  autoSpawn;
+  spawnWaitMs;
+  nextId = 0;
+  constructor(opts = {}) {
+    const uid = getUid();
+    const dir = opts.socketDir ?? "/tmp";
+    this.socketPath = socketPathFor(uid, dir);
+    this.pidPath = pidPathFor(uid, dir);
+    this.timeoutMs = opts.timeoutMs ?? DEFAULT_CLIENT_TIMEOUT_MS;
+    this.daemonEntry = opts.daemonEntry ?? process.env.HIVEMIND_EMBED_DAEMON;
+    this.autoSpawn = opts.autoSpawn ?? true;
+    this.spawnWaitMs = opts.spawnWaitMs ?? 5e3;
+  }
+  /**
+   * Returns an embedding vector, or null on timeout/failure. Hooks MUST treat
+   * null as "skip embedding column" — never block the write path on us.
+   *
+   * Fire-and-forget spawn on miss: if the daemon isn't up, this call returns
+   * null AND kicks off a background spawn. The next call finds a ready daemon.
+   */
+  async embed(text, kind = "document") {
+    let sock;
+    try {
+      sock = await this.connectOnce();
+    } catch {
+      if (this.autoSpawn)
+        this.trySpawnDaemon();
+      return null;
+    }
+    try {
+      const id = String(++this.nextId);
+      const req = { op: "embed", id, kind, text };
+      const resp = await this.sendAndWait(sock, req);
+      if (resp.error || !("embedding" in resp) || !resp.embedding) {
+        log3(`embed err: ${resp.error ?? "no embedding"}`);
+        return null;
+      }
+      return resp.embedding;
+    } catch (e) {
+      const err = e instanceof Error ? e.message : String(e);
+      log3(`embed failed: ${err}`);
+      return null;
+    } finally {
+      try {
+        sock.end();
+      } catch {
+      }
+    }
+  }
+  /**
+   * Wait up to spawnWaitMs for the daemon to accept connections, spawning if
+   * necessary. Meant for SessionStart / long-running batches — not the hot path.
+   */
+  async warmup() {
+    try {
+      const s = await this.connectOnce();
+      s.end();
+      return true;
+    } catch {
+      if (!this.autoSpawn)
+        return false;
+      this.trySpawnDaemon();
+      try {
+        const s = await this.waitForSocket();
+        s.end();
+        return true;
+      } catch {
+        return false;
+      }
+    }
+  }
+  connectOnce() {
+    return new Promise((resolve, reject) => {
+      const sock = connect(this.socketPath);
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("connect timeout"));
+      }, this.timeoutMs);
+      sock.once("connect", () => {
+        clearTimeout(to);
+        resolve(sock);
+      });
+      sock.once("error", (e) => {
+        clearTimeout(to);
+        reject(e);
+      });
+    });
+  }
+  trySpawnDaemon() {
+    let fd;
+    try {
+      fd = openSync2(this.pidPath, "wx", 384);
+      writeSync2(fd, String(process.pid));
+    } catch (e) {
+      if (this.isPidFileStale()) {
+        try {
+          unlinkSync2(this.pidPath);
+        } catch {
+        }
+        try {
+          fd = openSync2(this.pidPath, "wx", 384);
+          writeSync2(fd, String(process.pid));
+        } catch {
+          return;
+        }
+      } else {
+        return;
+      }
+    }
+    if (!this.daemonEntry || !existsSync4(this.daemonEntry)) {
+      log3(`daemonEntry not configured or missing: ${this.daemonEntry}`);
+      try {
+        closeSync2(fd);
+        unlinkSync2(this.pidPath);
+      } catch {
+      }
+      return;
+    }
+    try {
+      const child = spawn2(process.execPath, [this.daemonEntry], {
+        detached: true,
+        stdio: "ignore",
+        env: process.env
+      });
+      child.unref();
+      log3(`spawned daemon pid=${child.pid}`);
+    } finally {
+      closeSync2(fd);
+    }
+  }
+  isPidFileStale() {
+    try {
+      const raw = readFileSync4(this.pidPath, "utf-8").trim();
+      const pid = Number(raw);
+      if (!pid || Number.isNaN(pid))
+        return true;
+      try {
+        process.kill(pid, 0);
+        return false;
+      } catch {
+        return true;
+      }
+    } catch {
+      return true;
+    }
+  }
+  async waitForSocket() {
+    const deadline = Date.now() + this.spawnWaitMs;
+    let delay = 30;
+    while (Date.now() < deadline) {
+      await sleep2(delay);
+      delay = Math.min(delay * 1.5, 300);
+      if (!existsSync4(this.socketPath))
+        continue;
+      try {
+        return await this.connectOnce();
+      } catch {
+      }
+    }
+    throw new Error("daemon did not become ready within spawnWaitMs");
+  }
+  sendAndWait(sock, req) {
+    return new Promise((resolve, reject) => {
+      let buf = "";
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("request timeout"));
+      }, this.timeoutMs);
+      sock.setEncoding("utf-8");
+      sock.on("data", (chunk) => {
+        buf += chunk;
+        const nl = buf.indexOf("\n");
+        if (nl === -1)
+          return;
+        const line = buf.slice(0, nl);
+        clearTimeout(to);
+        try {
+          resolve(JSON.parse(line));
+        } catch (e) {
+          reject(e);
+        }
+      });
+      sock.on("error", (e) => {
+        clearTimeout(to);
+        reject(e);
+      });
+      sock.write(JSON.stringify(req) + "\n");
+    });
+  }
+};
+function sleep2(ms) {
+  return new Promise((r) => setTimeout(r, ms));
+}
+
+// dist/src/embeddings/sql.js
+function embeddingSqlLiteral(vec) {
+  if (!vec || vec.length === 0)
+    return "NULL";
+  const parts = [];
+  for (const v of vec) {
+    if (!Number.isFinite(v))
+      return "NULL";
+    parts.push(String(v));
+  }
+  return `ARRAY[${parts.join(",")}]::float4[]`;
+}
+
 // dist/src/hooks/capture.js
-var log3 = (msg) => log("capture", msg);
+import { fileURLToPath as fileURLToPath2 } from "node:url";
+import { dirname as dirname2, join as join7 } from "node:path";
+var log4 = (msg) => log("capture", msg);
+function resolveEmbedDaemonPath() {
+  return join7(dirname2(fileURLToPath2(import.meta.url)), "embeddings", "embed-daemon.js");
+}
 var CAPTURE = process.env.HIVEMIND_CAPTURE !== "false";
 async function main() {
   if (!CAPTURE)
@@ -667,7 +906,7 @@ async function main() {
   const input = await readStdin();
   const config = loadConfig();
   if (!config) {
-    log3("no config");
+    log4("no config");
     return;
   }
   const sessionsTable = config.sessionsTableName;
@@ -685,7 +924,7 @@ async function main() {
   };
   let entry;
   if (input.prompt !== void 0) {
-    log3(`user session=${input.session_id}`);
+    log4(`user session=${input.session_id}`);
     entry = {
       id: crypto.randomUUID(),
       ...meta,
@@ -693,7 +932,7 @@ async function main() {
       content: input.prompt
     };
   } else if (input.tool_name !== void 0) {
-    log3(`tool=${input.tool_name} session=${input.session_id}`);
+    log4(`tool=${input.tool_name} session=${input.session_id}`);
     entry = {
       id: crypto.randomUUID(),
       ...meta,
@@ -704,7 +943,7 @@ async function main() {
       tool_response: JSON.stringify(input.tool_response)
     };
   } else if (input.last_assistant_message !== void 0) {
-    log3(`assistant session=${input.session_id}`);
+    log4(`assistant session=${input.session_id}`);
     entry = {
       id: crypto.randomUUID(),
       ...meta,
@@ -713,28 +952,31 @@ async function main() {
       ...input.agent_transcript_path ? { agent_transcript_path: input.agent_transcript_path } : {}
     };
   } else {
-    log3("unknown event, skipping");
+    log4("unknown event, skipping");
     return;
   }
   const sessionPath = buildSessionPath(config, input.session_id);
   const line = JSON.stringify(entry);
-  log3(`writing to ${sessionPath}`);
+  log4(`writing to ${sessionPath}`);
   const projectName = (input.cwd ?? "").split("/").pop() || "unknown";
   const filename = sessionPath.split("/").pop() ?? "";
   const jsonForSql = line.replace(/'/g, "''");
-  const insertSql = `INSERT INTO "${sessionsTable}" (id, path, filename, message, author, size_bytes, project, description, agent, creation_date, last_update_date) VALUES ('${crypto.randomUUID()}', '${sqlStr(sessionPath)}', '${sqlStr(filename)}', '${jsonForSql}'::jsonb, '${sqlStr(config.userName)}', ${Buffer.byteLength(line, "utf-8")}, '${sqlStr(projectName)}', '${sqlStr(input.hook_event_name ?? "")}', 'claude_code', '${ts}', '${ts}')`;
+  const embedClient = new EmbedClient({ daemonEntry: resolveEmbedDaemonPath() });
+  const embedding = await embedClient.embed(line, "document");
+  const embeddingSql = embeddingSqlLiteral(embedding);
+  const insertSql = `INSERT INTO "${sessionsTable}" (id, path, filename, message, message_embedding, author, size_bytes, project, description, agent, creation_date, last_update_date) VALUES ('${crypto.randomUUID()}', '${sqlStr(sessionPath)}', '${sqlStr(filename)}', '${jsonForSql}'::jsonb, ${embeddingSql}, '${sqlStr(config.userName)}', ${Buffer.byteLength(line, "utf-8")}, '${sqlStr(projectName)}', '${sqlStr(input.hook_event_name ?? "")}', 'claude_code', '${ts}', '${ts}')`;
   try {
     await api.query(insertSql);
   } catch (e) {
     if (e.message?.includes("permission denied") || e.message?.includes("does not exist")) {
-      log3("table missing, creating and retrying");
+      log4("table missing, creating and retrying");
       await api.ensureSessionsTable(sessionsTable);
       await api.query(insertSql);
     } else {
       throw e;
     }
   }
-  log3("capture ok \u2192 cloud");
+  log4("capture ok \u2192 cloud");
   maybeTriggerPeriodicSummary(input.session_id, input.cwd ?? "", config);
 }
 function maybeTriggerPeriodicSummary(sessionId, cwd, config) {
@@ -746,7 +988,7 @@ function maybeTriggerPeriodicSummary(sessionId, cwd, config) {
     if (!shouldTrigger(state, cfg))
       return;
     if (!tryAcquireLock(sessionId)) {
-      log3(`periodic trigger suppressed (lock held) session=${sessionId}`);
+      log4(`periodic trigger suppressed (lock held) session=${sessionId}`);
       return;
     }
     wikiLog(`Periodic: threshold hit (total=${state.totalCount}, since=${state.totalCount - state.lastSummaryCount}, N=${cfg.everyNMessages}, hours=${cfg.everyHours})`);
@@ -759,19 +1001,19 @@ function maybeTriggerPeriodicSummary(sessionId, cwd, config) {
         reason: "Periodic"
       });
     } catch (e) {
-      log3(`periodic spawn failed: ${e.message}`);
+      log4(`periodic spawn failed: ${e.message}`);
       try {
         releaseLock(sessionId);
       } catch (releaseErr) {
-        log3(`releaseLock after periodic spawn failure also failed: ${releaseErr.message}`);
+        log4(`releaseLock after periodic spawn failure also failed: ${releaseErr.message}`);
       }
       throw e;
     }
   } catch (e) {
-    log3(`periodic trigger error: ${e.message}`);
+    log4(`periodic trigger error: ${e.message}`);
   }
 }
 main().catch((e) => {
-  log3(`fatal: ${e.message}`);
+  log4(`fatal: ${e.message}`);
   process.exit(0);
 });
diff --git a/claude-code/bundle/commands/auth-login.js b/claude-code/bundle/commands/auth-login.js
index 064f11e..ff51f9f 100755
--- a/claude-code/bundle/commands/auth-login.js
+++ b/claude-code/bundle/commands/auth-login.js
@@ -556,7 +556,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(tbl)) {
       log2(`table "${tbl}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', summary_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
@@ -567,7 +567,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(name)) {
       log2(`table "${name}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, message_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
diff --git a/claude-code/bundle/embeddings/embed-daemon.js b/claude-code/bundle/embeddings/embed-daemon.js
new file mode 100755
index 0000000..9437063
--- /dev/null
+++ b/claude-code/bundle/embeddings/embed-daemon.js
@@ -0,0 +1,240 @@
+#!/usr/bin/env node
+
+// dist/src/embeddings/daemon.js
+import { createServer } from "node:net";
+import { unlinkSync, writeFileSync, existsSync, mkdirSync, chmodSync } from "node:fs";
+
+// dist/src/embeddings/protocol.js
+var DEFAULT_SOCKET_DIR = "/tmp";
+var DEFAULT_MODEL_REPO = "nomic-ai/nomic-embed-text-v1.5";
+var DEFAULT_DTYPE = "q8";
+var DEFAULT_DIMS = 768;
+var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
+var DOC_PREFIX = "search_document: ";
+var QUERY_PREFIX = "search_query: ";
+function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.sock`;
+}
+function pidPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.pid`;
+}
+
+// dist/src/embeddings/nomic.js
+var NomicEmbedder = class {
+  pipeline = null;
+  loading = null;
+  repo;
+  dtype;
+  dims;
+  constructor(opts = {}) {
+    this.repo = opts.repo ?? DEFAULT_MODEL_REPO;
+    this.dtype = opts.dtype ?? DEFAULT_DTYPE;
+    this.dims = opts.dims ?? DEFAULT_DIMS;
+  }
+  async load() {
+    if (this.pipeline)
+      return;
+    if (this.loading)
+      return this.loading;
+    this.loading = (async () => {
+      const mod = await import("@huggingface/transformers");
+      mod.env.allowLocalModels = false;
+      mod.env.useFSCache = true;
+      this.pipeline = await mod.pipeline("feature-extraction", this.repo, { dtype: this.dtype });
+    })();
+    try {
+      await this.loading;
+    } finally {
+      this.loading = null;
+    }
+  }
+  addPrefix(text, kind) {
+    return (kind === "query" ? QUERY_PREFIX : DOC_PREFIX) + text;
+  }
+  async embed(text, kind = "document") {
+    await this.load();
+    if (!this.pipeline)
+      throw new Error("embedder not loaded");
+    const out = await this.pipeline(this.addPrefix(text, kind), { pooling: "mean", normalize: true });
+    const full = Array.from(out.data);
+    return this.truncate(full);
+  }
+  async embedBatch(texts, kind = "document") {
+    if (texts.length === 0)
+      return [];
+    await this.load();
+    if (!this.pipeline)
+      throw new Error("embedder not loaded");
+    const prefixed = texts.map((t) => this.addPrefix(t, kind));
+    const out = await this.pipeline(prefixed, { pooling: "mean", normalize: true });
+    const flat = Array.from(out.data);
+    const total = flat.length;
+    const full = total / texts.length;
+    const batches = [];
+    for (let i = 0; i < texts.length; i++) {
+      batches.push(this.truncate(flat.slice(i * full, (i + 1) * full)));
+    }
+    return batches;
+  }
+  truncate(vec) {
+    if (this.dims >= vec.length)
+      return vec;
+    const head = vec.slice(0, this.dims);
+    let norm = 0;
+    for (const v of head)
+      norm += v * v;
+    norm = Math.sqrt(norm);
+    if (norm === 0)
+      return head;
+    for (let i = 0; i < head.length; i++)
+      head[i] /= norm;
+    return head;
+  }
+};
+
+// dist/src/utils/debug.js
+import { appendFileSync } from "node:fs";
+import { join } from "node:path";
+import { homedir } from "node:os";
+var DEBUG = (process.env.HIVEMIND_DEBUG ?? process.env.DEEPLAKE_DEBUG) === "1";
+var LOG = join(homedir(), ".deeplake", "hook-debug.log");
+function log(tag, msg) {
+  if (!DEBUG)
+    return;
+  appendFileSync(LOG, `${(/* @__PURE__ */ new Date()).toISOString()} [${tag}] ${msg}
+`);
+}
+
+// dist/src/embeddings/daemon.js
+var log2 = (m) => log("embed-daemon", m);
+function getUid() {
+  const uid = typeof process.getuid === "function" ? process.getuid() : void 0;
+  return uid !== void 0 ? String(uid) : process.env.USER ?? "default";
+}
+var EmbedDaemon = class {
+  server = null;
+  embedder;
+  socketPath;
+  pidPath;
+  idleTimeoutMs;
+  idleTimer = null;
+  constructor(opts = {}) {
+    const uid = getUid();
+    const dir = opts.socketDir ?? "/tmp";
+    this.socketPath = socketPathFor(uid, dir);
+    this.pidPath = pidPathFor(uid, dir);
+    this.idleTimeoutMs = opts.idleTimeoutMs ?? DEFAULT_IDLE_TIMEOUT_MS;
+    this.embedder = new NomicEmbedder({ repo: opts.repo, dtype: opts.dtype, dims: opts.dims });
+  }
+  async start() {
+    mkdirSync(this.socketPath.replace(/\/[^/]+$/, ""), { recursive: true });
+    writeFileSync(this.pidPath, String(process.pid), { mode: 384 });
+    if (existsSync(this.socketPath)) {
+      try {
+        unlinkSync(this.socketPath);
+      } catch {
+      }
+    }
+    this.embedder.load().then(() => log2("model ready")).catch((e) => log2(`load err: ${e.message}`));
+    this.server = createServer((sock) => this.handleConnection(sock));
+    await new Promise((resolve, reject) => {
+      this.server.once("error", reject);
+      this.server.listen(this.socketPath, () => {
+        try {
+          chmodSync(this.socketPath, 384);
+        } catch {
+        }
+        log2(`listening on ${this.socketPath}`);
+        resolve();
+      });
+    });
+    this.resetIdleTimer();
+    process.on("SIGINT", () => this.shutdown());
+    process.on("SIGTERM", () => this.shutdown());
+  }
+  resetIdleTimer() {
+    if (this.idleTimer)
+      clearTimeout(this.idleTimer);
+    this.idleTimer = setTimeout(() => {
+      log2(`idle timeout ${this.idleTimeoutMs}ms reached, shutting down`);
+      this.shutdown();
+    }, this.idleTimeoutMs);
+    this.idleTimer.unref();
+  }
+  shutdown() {
+    try {
+      this.server?.close();
+    } catch {
+    }
+    try {
+      if (existsSync(this.socketPath))
+        unlinkSync(this.socketPath);
+    } catch {
+    }
+    try {
+      if (existsSync(this.pidPath))
+        unlinkSync(this.pidPath);
+    } catch {
+    }
+    process.exit(0);
+  }
+  handleConnection(sock) {
+    let buf = "";
+    sock.setEncoding("utf-8");
+    sock.on("data", (chunk) => {
+      buf += chunk;
+      let nl;
+      while ((nl = buf.indexOf("\n")) !== -1) {
+        const line = buf.slice(0, nl);
+        buf = buf.slice(nl + 1);
+        if (line.length === 0)
+          continue;
+        this.handleLine(sock, line);
+      }
+    });
+    sock.on("error", () => {
+    });
+  }
+  async handleLine(sock, line) {
+    this.resetIdleTimer();
+    let req;
+    try {
+      req = JSON.parse(line);
+    } catch {
+      return;
+    }
+    try {
+      const resp = await this.dispatch(req);
+      sock.write(JSON.stringify(resp) + "\n");
+    } catch (e) {
+      const err = e instanceof Error ? e.message : String(e);
+      const resp = { id: req.id, error: err };
+      sock.write(JSON.stringify(resp) + "\n");
+    }
+  }
+  async dispatch(req) {
+    if (req.op === "ping") {
+      const p = req;
+      return { id: p.id, ready: true, model: this.embedder.repo, dims: this.embedder.dims };
+    }
+    if (req.op === "embed") {
+      const e = req;
+      const vec = await this.embedder.embed(e.text, e.kind);
+      return { id: e.id, embedding: vec };
+    }
+    return { id: req.id, error: "unknown op" };
+  }
+};
+var invokedDirectly = import.meta.url === `file://${process.argv[1]}` || process.argv[1] && import.meta.url.endsWith(process.argv[1].split("/").pop() ?? "");
+if (invokedDirectly) {
+  const dims = process.env.HIVEMIND_EMBED_DIMS ? Number(process.env.HIVEMIND_EMBED_DIMS) : void 0;
+  const idleTimeoutMs = process.env.HIVEMIND_EMBED_IDLE_MS ? Number(process.env.HIVEMIND_EMBED_IDLE_MS) : void 0;
+  const d = new EmbedDaemon({ dims, idleTimeoutMs });
+  d.start().catch((e) => {
+    log2(`fatal: ${e.message}`);
+    process.exit(1);
+  });
+}
+export {
+  EmbedDaemon
+};
diff --git a/claude-code/bundle/pre-tool-use.js b/claude-code/bundle/pre-tool-use.js
index a231ff5..e648bf7 100755
--- a/claude-code/bundle/pre-tool-use.js
+++ b/claude-code/bundle/pre-tool-use.js
@@ -1,10 +1,10 @@
 #!/usr/bin/env node
 
 // dist/src/hooks/pre-tool-use.js
-import { existsSync as existsSync3, mkdirSync as mkdirSync3, writeFileSync as writeFileSync3 } from "node:fs";
+import { existsSync as existsSync4, mkdirSync as mkdirSync3, writeFileSync as writeFileSync3 } from "node:fs";
 import { homedir as homedir5 } from "node:os";
-import { join as join6, dirname, sep } from "node:path";
-import { fileURLToPath as fileURLToPath2 } from "node:url";
+import { join as join7, dirname as dirname2, sep } from "node:path";
+import { fileURLToPath as fileURLToPath3 } from "node:url";
 
 // dist/src/utils/stdin.js
 function readStdin() {
@@ -381,7 +381,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(tbl)) {
       log2(`table "${tbl}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', summary_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
@@ -392,7 +392,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(name)) {
       log2(`table "${name}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, message_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
@@ -579,24 +579,25 @@ function normalizeContent(path, raw) {
     return raw;
   }
   if (Array.isArray(obj.turns)) {
-    const header = [];
-    if (obj.date_time)
-      header.push(`date: ${obj.date_time}`);
-    if (obj.speakers) {
-      const s = obj.speakers;
-      const names = [s.speaker_a, s.speaker_b].filter(Boolean).join(", ");
-      if (names)
-        header.push(`speakers: ${names}`);
-    }
+    const dateHeader = obj.date_time ? `(${String(obj.date_time)}) ` : "";
     const lines = obj.turns.map((t) => {
       const sp = String(t?.speaker ?? t?.name ?? "?").trim();
       const tx = String(t?.text ?? t?.content ?? "").replace(/\s+/g, " ").trim();
       const tag = t?.dia_id ? `[${t.dia_id}] ` : "";
-      return `${tag}${sp}: ${tx}`;
+      return `${dateHeader}${tag}${sp}: ${tx}`;
     });
-    const out2 = [...header, ...lines].join("\n");
+    const out2 = lines.join("\n");
     return out2.trim() ? out2 : raw;
   }
+  if (obj.turn && typeof obj.turn === "object" && !Array.isArray(obj.turn)) {
+    const t = obj.turn;
+    const sp = String(t.speaker ?? t.name ?? "?").trim();
+    const tx = String(t.text ?? t.content ?? "").replace(/\s+/g, " ").trim();
+    const tag = t.dia_id ? `[${String(t.dia_id)}] ` : "";
+    const dateHeader = obj.date_time ? `(${String(obj.date_time)}) ` : "";
+    const line = `${dateHeader}${tag}${sp}: ${tx}`;
+    return line.trim() ? line : raw;
+  }
   const stripRecalled = (t) => {
     const i = t.indexOf("<recalled-memories>");
     if (i === -1)
@@ -639,8 +640,38 @@ function buildPathCondition(targetPath) {
   return `(path = '${sqlStr(clean)}' OR path LIKE '${sqlLike(clean)}/%' ESCAPE '\\')`;
 }
 async function searchDeeplakeTables(api, memoryTable, sessionsTable, opts) {
-  const { pathFilter, contentScanOnly, likeOp, escapedPattern, prefilterPattern, prefilterPatterns } = opts;
+  const { pathFilter, contentScanOnly, likeOp, escapedPattern, prefilterPattern, prefilterPatterns, queryEmbedding, bm25Term } = opts;
   const limit = opts.limit ?? 100;
+  if (queryEmbedding && queryEmbedding.length > 0) {
+    const vecLit = serializeFloat4Array(queryEmbedding);
+    const semanticLimit = Math.min(limit, Number(process.env.HIVEMIND_SEMANTIC_LIMIT ?? "20"));
+    const lexicalLimit = Math.min(limit, Number(process.env.HIVEMIND_HYBRID_LEXICAL_LIMIT ?? "20"));
+    const filterPatternsForLex = contentScanOnly ? prefilterPatterns && prefilterPatterns.length > 0 ? prefilterPatterns : prefilterPattern ? [prefilterPattern] : [] : [escapedPattern];
+    const memLexFilter = buildContentFilter("summary::text", likeOp, filterPatternsForLex);
+    const sessLexFilter = buildContentFilter("message::text", likeOp, filterPatternsForLex);
+    const memLexQuery = memLexFilter ? `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, 1.0 AS score FROM "${memoryTable}" WHERE 1=1${pathFilter}${memLexFilter} LIMIT ${lexicalLimit}` : null;
+    const sessLexQuery = sessLexFilter ? `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, 1.0 AS score FROM "${sessionsTable}" WHERE 1=1${pathFilter}${sessLexFilter} LIMIT ${lexicalLimit}` : null;
+    const memSemQuery = `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, (summary_embedding <#> ${vecLit}) AS score FROM "${memoryTable}" WHERE summary_embedding IS NOT NULL${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
+    const sessSemQuery = `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, (message_embedding <#> ${vecLit}) AS score FROM "${sessionsTable}" WHERE message_embedding IS NOT NULL${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
+    const parts = [memSemQuery, sessSemQuery];
+    if (memLexQuery)
+      parts.push(memLexQuery);
+    if (sessLexQuery)
+      parts.push(sessLexQuery);
+    const unionSql = parts.map((q) => `(${q})`).join(" UNION ALL ");
+    const outerLimit = semanticLimit + lexicalLimit;
+    const rows2 = await api.query(`SELECT path, content, source_order, creation_date, score FROM (` + unionSql + `) AS combined ORDER BY score DESC LIMIT ${outerLimit}`);
+    const seen = /* @__PURE__ */ new Set();
+    const unique = [];
+    for (const row of rows2) {
+      const p = String(row["path"]);
+      if (seen.has(p))
+        continue;
+      seen.add(p);
+      unique.push({ path: p, content: String(row["content"] ?? "") });
+    }
+    return unique;
+  }
   const filterPatterns = contentScanOnly ? prefilterPatterns && prefilterPatterns.length > 0 ? prefilterPatterns : prefilterPattern ? [prefilterPattern] : [] : [escapedPattern];
   const memFilter = buildContentFilter("summary::text", likeOp, filterPatterns);
   const sessFilter = buildContentFilter("message::text", likeOp, filterPatterns);
@@ -652,6 +683,15 @@ async function searchDeeplakeTables(api, memoryTable, sessionsTable, opts) {
     content: String(row["content"] ?? "")
   }));
 }
+function serializeFloat4Array(vec) {
+  const parts = [];
+  for (const v of vec) {
+    if (!Number.isFinite(v))
+      return "NULL";
+    parts.push(String(v));
+  }
+  return `ARRAY[${parts.join(",")}]::float4[]`;
+}
 function buildPathFilter(targetPath) {
   const condition = buildPathCondition(targetPath);
   return condition ? ` AND ${condition}` : "";
@@ -730,13 +770,24 @@ function buildGrepSearchOptions(params, targetPath) {
   const hasRegexMeta = !params.fixedString && /[.*+?^${}()|[\]\\]/.test(params.pattern);
   const literalPrefilter = hasRegexMeta ? extractRegexLiteralPrefilter(params.pattern) : null;
   const alternationPrefilters = hasRegexMeta ? extractRegexAlternationPrefilters(params.pattern) : null;
+  let bm25Term;
+  if (!hasRegexMeta) {
+    bm25Term = params.pattern;
+  } else if (alternationPrefilters && alternationPrefilters.length > 0) {
+    bm25Term = alternationPrefilters.join(" ");
+  } else if (literalPrefilter) {
+    bm25Term = literalPrefilter;
+  }
   return {
     pathFilter: buildPathFilter(targetPath),
     contentScanOnly: hasRegexMeta,
-    likeOp: params.ignoreCase ? "ILIKE" : "LIKE",
+    // Kept for the pure-lexical fallback path and existing tests; BM25 is now
+    // the preferred lexical ranker when a term can be extracted.
+    likeOp: process.env.HIVEMIND_GREP_LIKE === "case-sensitive" ? "LIKE" : "ILIKE",
     escapedPattern: sqlLike(params.pattern),
     prefilterPattern: literalPrefilter ? sqlLike(literalPrefilter) : void 0,
-    prefilterPatterns: alternationPrefilters?.map((literal) => sqlLike(literal))
+    prefilterPatterns: alternationPrefilters?.map((literal) => sqlLike(literal)),
+    bm25Term
   };
 }
 function buildContentFilter(column, likeOp, patterns) {
@@ -787,11 +838,28 @@ function refineGrepMatches(rows, params, forceMultiFilePrefix) {
   }
   return output;
 }
-async function grepBothTables(api, memoryTable, sessionsTable, params, targetPath) {
-  const rows = await searchDeeplakeTables(api, memoryTable, sessionsTable, buildGrepSearchOptions(params, targetPath));
+async function grepBothTables(api, memoryTable, sessionsTable, params, targetPath, queryEmbedding) {
+  const rows = await searchDeeplakeTables(api, memoryTable, sessionsTable, {
+    ...buildGrepSearchOptions(params, targetPath),
+    queryEmbedding
+  });
   const seen = /* @__PURE__ */ new Set();
   const unique = rows.filter((r) => seen.has(r.path) ? false : (seen.add(r.path), true));
   const normalized = unique.map((r) => ({ path: r.path, content: normalizeContent(r.path, r.content) }));
+  if (queryEmbedding && queryEmbedding.length > 0) {
+    const emitAllLines = process.env.HIVEMIND_SEMANTIC_EMIT_ALL !== "false";
+    if (emitAllLines) {
+      const lines = [];
+      for (const r of normalized) {
+        for (const line of r.content.split("\n")) {
+          const trimmed = line.trim();
+          if (trimmed)
+            lines.push(`${r.path}:${line}`);
+        }
+      }
+      return lines;
+    }
+  }
   return refineGrepMatches(normalized, params);
 }
 
@@ -831,7 +899,255 @@ function capOutputForClaude(output, options = {}) {
   return keptLines.join("\n") + footer;
 }
 
+// dist/src/embeddings/client.js
+import { connect } from "node:net";
+import { spawn } from "node:child_process";
+import { openSync, closeSync, writeSync, unlinkSync, existsSync as existsSync3, readFileSync as readFileSync3 } from "node:fs";
+
+// dist/src/embeddings/protocol.js
+var DEFAULT_SOCKET_DIR = "/tmp";
+var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
+var DEFAULT_CLIENT_TIMEOUT_MS = 200;
+function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.sock`;
+}
+function pidPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.pid`;
+}
+
+// dist/src/embeddings/client.js
+var log3 = (m) => log("embed-client", m);
+function getUid() {
+  const uid = typeof process.getuid === "function" ? process.getuid() : void 0;
+  return uid !== void 0 ? String(uid) : process.env.USER ?? "default";
+}
+var EmbedClient = class {
+  socketPath;
+  pidPath;
+  timeoutMs;
+  daemonEntry;
+  autoSpawn;
+  spawnWaitMs;
+  nextId = 0;
+  constructor(opts = {}) {
+    const uid = getUid();
+    const dir = opts.socketDir ?? "/tmp";
+    this.socketPath = socketPathFor(uid, dir);
+    this.pidPath = pidPathFor(uid, dir);
+    this.timeoutMs = opts.timeoutMs ?? DEFAULT_CLIENT_TIMEOUT_MS;
+    this.daemonEntry = opts.daemonEntry ?? process.env.HIVEMIND_EMBED_DAEMON;
+    this.autoSpawn = opts.autoSpawn ?? true;
+    this.spawnWaitMs = opts.spawnWaitMs ?? 5e3;
+  }
+  /**
+   * Returns an embedding vector, or null on timeout/failure. Hooks MUST treat
+   * null as "skip embedding column" — never block the write path on us.
+   *
+   * Fire-and-forget spawn on miss: if the daemon isn't up, this call returns
+   * null AND kicks off a background spawn. The next call finds a ready daemon.
+   */
+  async embed(text, kind = "document") {
+    let sock;
+    try {
+      sock = await this.connectOnce();
+    } catch {
+      if (this.autoSpawn)
+        this.trySpawnDaemon();
+      return null;
+    }
+    try {
+      const id = String(++this.nextId);
+      const req = { op: "embed", id, kind, text };
+      const resp = await this.sendAndWait(sock, req);
+      if (resp.error || !("embedding" in resp) || !resp.embedding) {
+        log3(`embed err: ${resp.error ?? "no embedding"}`);
+        return null;
+      }
+      return resp.embedding;
+    } catch (e) {
+      const err = e instanceof Error ? e.message : String(e);
+      log3(`embed failed: ${err}`);
+      return null;
+    } finally {
+      try {
+        sock.end();
+      } catch {
+      }
+    }
+  }
+  /**
+   * Wait up to spawnWaitMs for the daemon to accept connections, spawning if
+   * necessary. Meant for SessionStart / long-running batches — not the hot path.
+   */
+  async warmup() {
+    try {
+      const s = await this.connectOnce();
+      s.end();
+      return true;
+    } catch {
+      if (!this.autoSpawn)
+        return false;
+      this.trySpawnDaemon();
+      try {
+        const s = await this.waitForSocket();
+        s.end();
+        return true;
+      } catch {
+        return false;
+      }
+    }
+  }
+  connectOnce() {
+    return new Promise((resolve2, reject) => {
+      const sock = connect(this.socketPath);
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("connect timeout"));
+      }, this.timeoutMs);
+      sock.once("connect", () => {
+        clearTimeout(to);
+        resolve2(sock);
+      });
+      sock.once("error", (e) => {
+        clearTimeout(to);
+        reject(e);
+      });
+    });
+  }
+  trySpawnDaemon() {
+    let fd;
+    try {
+      fd = openSync(this.pidPath, "wx", 384);
+      writeSync(fd, String(process.pid));
+    } catch (e) {
+      if (this.isPidFileStale()) {
+        try {
+          unlinkSync(this.pidPath);
+        } catch {
+        }
+        try {
+          fd = openSync(this.pidPath, "wx", 384);
+          writeSync(fd, String(process.pid));
+        } catch {
+          return;
+        }
+      } else {
+        return;
+      }
+    }
+    if (!this.daemonEntry || !existsSync3(this.daemonEntry)) {
+      log3(`daemonEntry not configured or missing: ${this.daemonEntry}`);
+      try {
+        closeSync(fd);
+        unlinkSync(this.pidPath);
+      } catch {
+      }
+      return;
+    }
+    try {
+      const child = spawn(process.execPath, [this.daemonEntry], {
+        detached: true,
+        stdio: "ignore",
+        env: process.env
+      });
+      child.unref();
+      log3(`spawned daemon pid=${child.pid}`);
+    } finally {
+      closeSync(fd);
+    }
+  }
+  isPidFileStale() {
+    try {
+      const raw = readFileSync3(this.pidPath, "utf-8").trim();
+      const pid = Number(raw);
+      if (!pid || Number.isNaN(pid))
+        return true;
+      try {
+        process.kill(pid, 0);
+        return false;
+      } catch {
+        return true;
+      }
+    } catch {
+      return true;
+    }
+  }
+  async waitForSocket() {
+    const deadline = Date.now() + this.spawnWaitMs;
+    let delay = 30;
+    while (Date.now() < deadline) {
+      await sleep2(delay);
+      delay = Math.min(delay * 1.5, 300);
+      if (!existsSync3(this.socketPath))
+        continue;
+      try {
+        return await this.connectOnce();
+      } catch {
+      }
+    }
+    throw new Error("daemon did not become ready within spawnWaitMs");
+  }
+  sendAndWait(sock, req) {
+    return new Promise((resolve2, reject) => {
+      let buf = "";
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("request timeout"));
+      }, this.timeoutMs);
+      sock.setEncoding("utf-8");
+      sock.on("data", (chunk) => {
+        buf += chunk;
+        const nl = buf.indexOf("\n");
+        if (nl === -1)
+          return;
+        const line = buf.slice(0, nl);
+        clearTimeout(to);
+        try {
+          resolve2(JSON.parse(line));
+        } catch (e) {
+          reject(e);
+        }
+      });
+      sock.on("error", (e) => {
+        clearTimeout(to);
+        reject(e);
+      });
+      sock.write(JSON.stringify(req) + "\n");
+    });
+  }
+};
+function sleep2(ms) {
+  return new Promise((r) => setTimeout(r, ms));
+}
+
 // dist/src/hooks/grep-direct.js
+import { fileURLToPath as fileURLToPath2 } from "node:url";
+import { dirname, join as join4 } from "node:path";
+var SEMANTIC_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false";
+var SEMANTIC_TIMEOUT_MS = Number(process.env.HIVEMIND_SEMANTIC_EMBED_TIMEOUT_MS ?? "500");
+function resolveDaemonPath() {
+  return join4(dirname(fileURLToPath2(import.meta.url)), "..", "embeddings", "embed-daemon.js");
+}
+var sharedEmbedClient = null;
+function getEmbedClient() {
+  if (!sharedEmbedClient) {
+    sharedEmbedClient = new EmbedClient({
+      daemonEntry: resolveDaemonPath(),
+      timeoutMs: SEMANTIC_TIMEOUT_MS
+    });
+  }
+  return sharedEmbedClient;
+}
+function patternIsSemanticFriendly(pattern, fixedString) {
+  if (!pattern || pattern.length < 2)
+    return false;
+  if (fixedString)
+    return true;
+  const meta = pattern.match(/[|()\[\]{}+?^$\\]/g);
+  if (!meta)
+    return true;
+  return meta.length <= 1;
+}
 function splitFirstPipelineStage(cmd) {
   const input = cmd.trim();
   let quote = null;
@@ -1069,7 +1385,15 @@ async function handleGrepDirect(api, table, sessionsTable, params) {
     invertMatch: params.invertMatch,
     fixedString: params.fixedString
   };
-  const output = await grepBothTables(api, table, sessionsTable, matchParams, params.targetPath);
+  let queryEmbedding = null;
+  if (SEMANTIC_ENABLED && patternIsSemanticFriendly(params.pattern, params.fixedString)) {
+    try {
+      queryEmbedding = await getEmbedClient().embed(params.pattern, "query");
+    } catch {
+      queryEmbedding = null;
+    }
+  }
+  const output = await grepBothTables(api, table, sessionsTable, matchParams, params.targetPath, queryEmbedding);
   const joined = output.join("\n") || "(no matches)";
   return capOutputForClaude(joined, { kind: "grep" });
 }
@@ -1690,20 +2014,20 @@ async function executeCompiledBashCommand(api, memoryTable, sessionsTable, cmd,
 }
 
 // dist/src/hooks/query-cache.js
-import { mkdirSync as mkdirSync2, readFileSync as readFileSync3, rmSync, writeFileSync as writeFileSync2 } from "node:fs";
-import { join as join4 } from "node:path";
+import { mkdirSync as mkdirSync2, readFileSync as readFileSync4, rmSync, writeFileSync as writeFileSync2 } from "node:fs";
+import { join as join5 } from "node:path";
 import { homedir as homedir3 } from "node:os";
-var log3 = (msg) => log("query-cache", msg);
-var DEFAULT_CACHE_ROOT = join4(homedir3(), ".deeplake", "query-cache");
+var log4 = (msg) => log("query-cache", msg);
+var DEFAULT_CACHE_ROOT = join5(homedir3(), ".deeplake", "query-cache");
 var INDEX_CACHE_FILE = "index.md";
 function getSessionQueryCacheDir(sessionId, deps = {}) {
   const { cacheRoot = DEFAULT_CACHE_ROOT } = deps;
-  return join4(cacheRoot, sessionId);
+  return join5(cacheRoot, sessionId);
 }
 function readCachedIndexContent(sessionId, deps = {}) {
-  const { logFn = log3 } = deps;
+  const { logFn = log4 } = deps;
   try {
-    return readFileSync3(join4(getSessionQueryCacheDir(sessionId, deps), INDEX_CACHE_FILE), "utf-8");
+    return readFileSync4(join5(getSessionQueryCacheDir(sessionId, deps), INDEX_CACHE_FILE), "utf-8");
   } catch (e) {
     if (e?.code === "ENOENT")
       return null;
@@ -1712,11 +2036,11 @@ function readCachedIndexContent(sessionId, deps = {}) {
   }
 }
 function writeCachedIndexContent(sessionId, content, deps = {}) {
-  const { logFn = log3 } = deps;
+  const { logFn = log4 } = deps;
   try {
     const dir = getSessionQueryCacheDir(sessionId, deps);
     mkdirSync2(dir, { recursive: true });
-    writeFileSync2(join4(dir, INDEX_CACHE_FILE), content, "utf-8");
+    writeFileSync2(join5(dir, INDEX_CACHE_FILE), content, "utf-8");
   } catch (e) {
     logFn(`write failed for session=${sessionId}: ${e.message}`);
   }
@@ -1724,8 +2048,8 @@ function writeCachedIndexContent(sessionId, content, deps = {}) {
 
 // dist/src/hooks/memory-path-utils.js
 import { homedir as homedir4 } from "node:os";
-import { join as join5 } from "node:path";
-var MEMORY_PATH = join5(homedir4(), ".deeplake", "memory");
+import { join as join6 } from "node:path";
+var MEMORY_PATH = join6(homedir4(), ".deeplake", "memory");
 var TILDE_PATH = "~/.deeplake/memory";
 var HOME_VAR_PATH = "$HOME/.deeplake/memory";
 var SAFE_BUILTINS = /* @__PURE__ */ new Set([
@@ -1841,20 +2165,20 @@ function rewritePaths(cmd) {
 }
 
 // dist/src/hooks/pre-tool-use.js
-var log4 = (msg) => log("pre", msg);
-var __bundleDir = dirname(fileURLToPath2(import.meta.url));
-var SHELL_BUNDLE = existsSync3(join6(__bundleDir, "shell", "deeplake-shell.js")) ? join6(__bundleDir, "shell", "deeplake-shell.js") : join6(__bundleDir, "..", "shell", "deeplake-shell.js");
-var READ_CACHE_ROOT = join6(homedir5(), ".deeplake", "query-cache");
+var log5 = (msg) => log("pre", msg);
+var __bundleDir = dirname2(fileURLToPath3(import.meta.url));
+var SHELL_BUNDLE = existsSync4(join7(__bundleDir, "shell", "deeplake-shell.js")) ? join7(__bundleDir, "shell", "deeplake-shell.js") : join7(__bundleDir, "..", "shell", "deeplake-shell.js");
+var READ_CACHE_ROOT = join7(homedir5(), ".deeplake", "query-cache");
 function writeReadCacheFile(sessionId, virtualPath, content, deps = {}) {
   const { cacheRoot = READ_CACHE_ROOT } = deps;
   const safeSessionId = sessionId.replace(/[^a-zA-Z0-9._-]/g, "_") || "unknown";
   const rel = virtualPath.replace(/^\/+/, "") || "content";
-  const expectedRoot = join6(cacheRoot, safeSessionId, "read");
-  const absPath = join6(expectedRoot, rel);
+  const expectedRoot = join7(cacheRoot, safeSessionId, "read");
+  const absPath = join7(expectedRoot, rel);
   if (absPath !== expectedRoot && !absPath.startsWith(expectedRoot + sep)) {
     throw new Error(`writeReadCacheFile: path escapes cache root: ${absPath}`);
   }
-  mkdirSync3(dirname(absPath), { recursive: true });
+  mkdirSync3(dirname2(absPath), { recursive: true });
   writeFileSync3(absPath, content, "utf-8");
   return absPath;
 }
@@ -1901,7 +2225,7 @@ function getShellCommand(toolName, toolInput) {
         break;
       const rewritten = rewritePaths(cmd);
       if (!isSafe(rewritten)) {
-        log4(`unsafe command blocked: ${rewritten}`);
+        log5(`unsafe command blocked: ${rewritten}`);
         return null;
       }
       return rewritten;
@@ -1941,7 +2265,7 @@ function buildFallbackDecision(shellCmd, shellBundle = SHELL_BUNDLE) {
   return buildAllowDecision(`node "${shellBundle}" -c "${shellCmd.replace(/"/g, '\\"')}"`, `[DeepLake shell] ${shellCmd}`);
 }
 async function processPreToolUse(input, deps = {}) {
-  const { config = loadConfig(), createApi = (table2, activeConfig) => new DeeplakeApi(activeConfig.token, activeConfig.apiUrl, activeConfig.orgId, activeConfig.workspaceId, table2), executeCompiledBashCommandFn = executeCompiledBashCommand, handleGrepDirectFn = handleGrepDirect, readVirtualPathContentsFn = readVirtualPathContents, readVirtualPathContentFn = readVirtualPathContent, listVirtualPathRowsFn = listVirtualPathRows, findVirtualPathsFn = findVirtualPaths, readCachedIndexContentFn = readCachedIndexContent, writeCachedIndexContentFn = writeCachedIndexContent, writeReadCacheFileFn = writeReadCacheFile, shellBundle = SHELL_BUNDLE, logFn = log4 } = deps;
+  const { config = loadConfig(), createApi = (table2, activeConfig) => new DeeplakeApi(activeConfig.token, activeConfig.apiUrl, activeConfig.orgId, activeConfig.workspaceId, table2), executeCompiledBashCommandFn = executeCompiledBashCommand, handleGrepDirectFn = handleGrepDirect, readVirtualPathContentsFn = readVirtualPathContents, readVirtualPathContentFn = readVirtualPathContent, listVirtualPathRowsFn = listVirtualPathRows, findVirtualPathsFn = findVirtualPaths, readCachedIndexContentFn = readCachedIndexContent, writeCachedIndexContentFn = writeCachedIndexContent, writeReadCacheFileFn = writeReadCacheFile, shellBundle = SHELL_BUNDLE, logFn = log5 } = deps;
   const cmd = input.tool_input.command ?? "";
   const shellCmd = getShellCommand(input.tool_name, input.tool_input);
   const toolPath = getReadTargetPath(input.tool_input) ?? input.tool_input.path ?? "";
@@ -2153,7 +2477,7 @@ async function main() {
 }
 if (isDirectRun(import.meta.url)) {
   main().catch((e) => {
-    log4(`fatal: ${e.message}`);
+    log5(`fatal: ${e.message}`);
     process.exit(0);
   });
 }
diff --git a/claude-code/bundle/session-start-setup.js b/claude-code/bundle/session-start-setup.js
index c0f05cc..7d33e4d 100755
--- a/claude-code/bundle/session-start-setup.js
+++ b/claude-code/bundle/session-start-setup.js
@@ -386,7 +386,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(tbl)) {
       log2(`table "${tbl}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', summary_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
@@ -397,7 +397,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(name)) {
       log2(`table "${name}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, message_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
diff --git a/claude-code/bundle/session-start.js b/claude-code/bundle/session-start.js
index 1f815ee..cdccb55 100755
--- a/claude-code/bundle/session-start.js
+++ b/claude-code/bundle/session-start.js
@@ -387,7 +387,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(tbl)) {
       log2(`table "${tbl}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', summary_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
@@ -398,7 +398,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(name)) {
       log2(`table "${name}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, message_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
diff --git a/claude-code/bundle/shell/deeplake-shell.js b/claude-code/bundle/shell/deeplake-shell.js
index 0793149..eecc463 100755
--- a/claude-code/bundle/shell/deeplake-shell.js
+++ b/claude-code/bundle/shell/deeplake-shell.js
@@ -46081,14 +46081,14 @@ var require_turndown_cjs = __commonJS({
         } else if (node.nodeType === 1) {
           replacement = replacementForNode.call(self2, node);
         }
-        return join7(output, replacement);
+        return join9(output, replacement);
       }, "");
     }
     function postProcess(output) {
       var self2 = this;
       this.rules.forEach(function(rule) {
         if (typeof rule.append === "function") {
-          output = join7(output, rule.append(self2.options));
+          output = join9(output, rule.append(self2.options));
         }
       });
       return output.replace(/^[\t\r\n]+/, "").replace(/[\t\r\n\s]+$/, "");
@@ -46100,7 +46100,7 @@ var require_turndown_cjs = __commonJS({
       if (whitespace.leading || whitespace.trailing) content = content.trim();
       return whitespace.leading + rule.replacement(content, node, this.options) + whitespace.trailing;
     }
-    function join7(output, replacement) {
+    function join9(output, replacement) {
       var s12 = trimTrailingNewlines(output);
       var s22 = trimLeadingNewlines(replacement);
       var nls = Math.max(output.length - s12.length, replacement.length - s22.length);
@@ -67078,7 +67078,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(tbl)) {
       log2(`table "${tbl}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', summary_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
@@ -67089,7 +67089,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(name)) {
       log2(`table "${name}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, message_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
@@ -67101,6 +67101,8 @@ var DeeplakeApi = class {
 // dist/src/shell/deeplake-fs.js
 import { basename as basename4, posix } from "node:path";
 import { randomUUID as randomUUID2 } from "node:crypto";
+import { fileURLToPath } from "node:url";
+import { dirname as dirname4, join as join7 } from "node:path";
 
 // dist/src/shell/grep-core.js
 var TOOL_INPUT_FIELDS = [
@@ -67266,24 +67268,25 @@ function normalizeContent(path2, raw) {
     return raw;
   }
   if (Array.isArray(obj.turns)) {
-    const header = [];
-    if (obj.date_time)
-      header.push(`date: ${obj.date_time}`);
-    if (obj.speakers) {
-      const s10 = obj.speakers;
-      const names = [s10.speaker_a, s10.speaker_b].filter(Boolean).join(", ");
-      if (names)
-        header.push(`speakers: ${names}`);
-    }
+    const dateHeader = obj.date_time ? `(${String(obj.date_time)}) ` : "";
     const lines = obj.turns.map((t6) => {
       const sp = String(t6?.speaker ?? t6?.name ?? "?").trim();
       const tx = String(t6?.text ?? t6?.content ?? "").replace(/\s+/g, " ").trim();
       const tag = t6?.dia_id ? `[${t6.dia_id}] ` : "";
-      return `${tag}${sp}: ${tx}`;
+      return `${dateHeader}${tag}${sp}: ${tx}`;
     });
-    const out2 = [...header, ...lines].join("\n");
+    const out2 = lines.join("\n");
     return out2.trim() ? out2 : raw;
   }
+  if (obj.turn && typeof obj.turn === "object" && !Array.isArray(obj.turn)) {
+    const t6 = obj.turn;
+    const sp = String(t6.speaker ?? t6.name ?? "?").trim();
+    const tx = String(t6.text ?? t6.content ?? "").replace(/\s+/g, " ").trim();
+    const tag = t6.dia_id ? `[${String(t6.dia_id)}] ` : "";
+    const dateHeader = obj.date_time ? `(${String(obj.date_time)}) ` : "";
+    const line = `${dateHeader}${tag}${sp}: ${tx}`;
+    return line.trim() ? line : raw;
+  }
   const stripRecalled = (t6) => {
     const i11 = t6.indexOf("<recalled-memories>");
     if (i11 === -1)
@@ -67326,8 +67329,38 @@ function buildPathCondition(targetPath) {
   return `(path = '${sqlStr(clean)}' OR path LIKE '${sqlLike(clean)}/%' ESCAPE '\\')`;
 }
 async function searchDeeplakeTables(api, memoryTable, sessionsTable, opts) {
-  const { pathFilter, contentScanOnly, likeOp, escapedPattern, prefilterPattern, prefilterPatterns } = opts;
+  const { pathFilter, contentScanOnly, likeOp, escapedPattern, prefilterPattern, prefilterPatterns, queryEmbedding, bm25Term } = opts;
   const limit = opts.limit ?? 100;
+  if (queryEmbedding && queryEmbedding.length > 0) {
+    const vecLit = serializeFloat4Array(queryEmbedding);
+    const semanticLimit = Math.min(limit, Number(process.env.HIVEMIND_SEMANTIC_LIMIT ?? "20"));
+    const lexicalLimit = Math.min(limit, Number(process.env.HIVEMIND_HYBRID_LEXICAL_LIMIT ?? "20"));
+    const filterPatternsForLex = contentScanOnly ? prefilterPatterns && prefilterPatterns.length > 0 ? prefilterPatterns : prefilterPattern ? [prefilterPattern] : [] : [escapedPattern];
+    const memLexFilter = buildContentFilter("summary::text", likeOp, filterPatternsForLex);
+    const sessLexFilter = buildContentFilter("message::text", likeOp, filterPatternsForLex);
+    const memLexQuery = memLexFilter ? `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, 1.0 AS score FROM "${memoryTable}" WHERE 1=1${pathFilter}${memLexFilter} LIMIT ${lexicalLimit}` : null;
+    const sessLexQuery = sessLexFilter ? `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, 1.0 AS score FROM "${sessionsTable}" WHERE 1=1${pathFilter}${sessLexFilter} LIMIT ${lexicalLimit}` : null;
+    const memSemQuery = `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, (summary_embedding <#> ${vecLit}) AS score FROM "${memoryTable}" WHERE summary_embedding IS NOT NULL${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
+    const sessSemQuery = `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, (message_embedding <#> ${vecLit}) AS score FROM "${sessionsTable}" WHERE message_embedding IS NOT NULL${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
+    const parts = [memSemQuery, sessSemQuery];
+    if (memLexQuery)
+      parts.push(memLexQuery);
+    if (sessLexQuery)
+      parts.push(sessLexQuery);
+    const unionSql = parts.map((q17) => `(${q17})`).join(" UNION ALL ");
+    const outerLimit = semanticLimit + lexicalLimit;
+    const rows2 = await api.query(`SELECT path, content, source_order, creation_date, score FROM (` + unionSql + `) AS combined ORDER BY score DESC LIMIT ${outerLimit}`);
+    const seen = /* @__PURE__ */ new Set();
+    const unique = [];
+    for (const row of rows2) {
+      const p22 = String(row["path"]);
+      if (seen.has(p22))
+        continue;
+      seen.add(p22);
+      unique.push({ path: p22, content: String(row["content"] ?? "") });
+    }
+    return unique;
+  }
   const filterPatterns = contentScanOnly ? prefilterPatterns && prefilterPatterns.length > 0 ? prefilterPatterns : prefilterPattern ? [prefilterPattern] : [] : [escapedPattern];
   const memFilter = buildContentFilter("summary::text", likeOp, filterPatterns);
   const sessFilter = buildContentFilter("message::text", likeOp, filterPatterns);
@@ -67339,6 +67372,15 @@ async function searchDeeplakeTables(api, memoryTable, sessionsTable, opts) {
     content: String(row["content"] ?? "")
   }));
 }
+function serializeFloat4Array(vec) {
+  const parts = [];
+  for (const v27 of vec) {
+    if (!Number.isFinite(v27))
+      return "NULL";
+    parts.push(String(v27));
+  }
+  return `ARRAY[${parts.join(",")}]::float4[]`;
+}
 function buildPathFilter(targetPath) {
   const condition = buildPathCondition(targetPath);
   return condition ? ` AND ${condition}` : "";
@@ -67427,13 +67469,24 @@ function buildGrepSearchOptions(params, targetPath) {
   const hasRegexMeta = !params.fixedString && /[.*+?^${}()|[\]\\]/.test(params.pattern);
   const literalPrefilter = hasRegexMeta ? extractRegexLiteralPrefilter(params.pattern) : null;
   const alternationPrefilters = hasRegexMeta ? extractRegexAlternationPrefilters(params.pattern) : null;
+  let bm25Term;
+  if (!hasRegexMeta) {
+    bm25Term = params.pattern;
+  } else if (alternationPrefilters && alternationPrefilters.length > 0) {
+    bm25Term = alternationPrefilters.join(" ");
+  } else if (literalPrefilter) {
+    bm25Term = literalPrefilter;
+  }
   return {
     pathFilter: buildPathFilter(targetPath),
     contentScanOnly: hasRegexMeta,
-    likeOp: params.ignoreCase ? "ILIKE" : "LIKE",
+    // Kept for the pure-lexical fallback path and existing tests; BM25 is now
+    // the preferred lexical ranker when a term can be extracted.
+    likeOp: process.env.HIVEMIND_GREP_LIKE === "case-sensitive" ? "LIKE" : "ILIKE",
     escapedPattern: sqlLike(params.pattern),
     prefilterPattern: literalPrefilter ? sqlLike(literalPrefilter) : void 0,
-    prefilterPatterns: alternationPrefilters?.map((literal) => sqlLike(literal))
+    prefilterPatterns: alternationPrefilters?.map((literal) => sqlLike(literal)),
+    bm25Term
   };
 }
 function buildContentFilter(column, likeOp, patterns) {
@@ -67485,6 +67538,240 @@ function refineGrepMatches(rows, params, forceMultiFilePrefix) {
   return output;
 }
 
+// dist/src/embeddings/client.js
+import { connect } from "node:net";
+import { spawn } from "node:child_process";
+import { openSync, closeSync, writeSync, unlinkSync, existsSync as existsSync4, readFileSync as readFileSync3 } from "node:fs";
+
+// dist/src/embeddings/protocol.js
+var DEFAULT_SOCKET_DIR = "/tmp";
+var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
+var DEFAULT_CLIENT_TIMEOUT_MS = 200;
+function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.sock`;
+}
+function pidPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.pid`;
+}
+
+// dist/src/embeddings/client.js
+var log3 = (m26) => log("embed-client", m26);
+function getUid() {
+  const uid = typeof process.getuid === "function" ? process.getuid() : void 0;
+  return uid !== void 0 ? String(uid) : process.env.USER ?? "default";
+}
+var EmbedClient = class {
+  socketPath;
+  pidPath;
+  timeoutMs;
+  daemonEntry;
+  autoSpawn;
+  spawnWaitMs;
+  nextId = 0;
+  constructor(opts = {}) {
+    const uid = getUid();
+    const dir = opts.socketDir ?? "/tmp";
+    this.socketPath = socketPathFor(uid, dir);
+    this.pidPath = pidPathFor(uid, dir);
+    this.timeoutMs = opts.timeoutMs ?? DEFAULT_CLIENT_TIMEOUT_MS;
+    this.daemonEntry = opts.daemonEntry ?? process.env.HIVEMIND_EMBED_DAEMON;
+    this.autoSpawn = opts.autoSpawn ?? true;
+    this.spawnWaitMs = opts.spawnWaitMs ?? 5e3;
+  }
+  /**
+   * Returns an embedding vector, or null on timeout/failure. Hooks MUST treat
+   * null as "skip embedding column" — never block the write path on us.
+   *
+   * Fire-and-forget spawn on miss: if the daemon isn't up, this call returns
+   * null AND kicks off a background spawn. The next call finds a ready daemon.
+   */
+  async embed(text, kind = "document") {
+    let sock;
+    try {
+      sock = await this.connectOnce();
+    } catch {
+      if (this.autoSpawn)
+        this.trySpawnDaemon();
+      return null;
+    }
+    try {
+      const id = String(++this.nextId);
+      const req = { op: "embed", id, kind, text };
+      const resp = await this.sendAndWait(sock, req);
+      if (resp.error || !("embedding" in resp) || !resp.embedding) {
+        log3(`embed err: ${resp.error ?? "no embedding"}`);
+        return null;
+      }
+      return resp.embedding;
+    } catch (e6) {
+      const err = e6 instanceof Error ? e6.message : String(e6);
+      log3(`embed failed: ${err}`);
+      return null;
+    } finally {
+      try {
+        sock.end();
+      } catch {
+      }
+    }
+  }
+  /**
+   * Wait up to spawnWaitMs for the daemon to accept connections, spawning if
+   * necessary. Meant for SessionStart / long-running batches — not the hot path.
+   */
+  async warmup() {
+    try {
+      const s10 = await this.connectOnce();
+      s10.end();
+      return true;
+    } catch {
+      if (!this.autoSpawn)
+        return false;
+      this.trySpawnDaemon();
+      try {
+        const s10 = await this.waitForSocket();
+        s10.end();
+        return true;
+      } catch {
+        return false;
+      }
+    }
+  }
+  connectOnce() {
+    return new Promise((resolve5, reject) => {
+      const sock = connect(this.socketPath);
+      const to3 = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("connect timeout"));
+      }, this.timeoutMs);
+      sock.once("connect", () => {
+        clearTimeout(to3);
+        resolve5(sock);
+      });
+      sock.once("error", (e6) => {
+        clearTimeout(to3);
+        reject(e6);
+      });
+    });
+  }
+  trySpawnDaemon() {
+    let fd;
+    try {
+      fd = openSync(this.pidPath, "wx", 384);
+      writeSync(fd, String(process.pid));
+    } catch (e6) {
+      if (this.isPidFileStale()) {
+        try {
+          unlinkSync(this.pidPath);
+        } catch {
+        }
+        try {
+          fd = openSync(this.pidPath, "wx", 384);
+          writeSync(fd, String(process.pid));
+        } catch {
+          return;
+        }
+      } else {
+        return;
+      }
+    }
+    if (!this.daemonEntry || !existsSync4(this.daemonEntry)) {
+      log3(`daemonEntry not configured or missing: ${this.daemonEntry}`);
+      try {
+        closeSync(fd);
+        unlinkSync(this.pidPath);
+      } catch {
+      }
+      return;
+    }
+    try {
+      const child = spawn(process.execPath, [this.daemonEntry], {
+        detached: true,
+        stdio: "ignore",
+        env: process.env
+      });
+      child.unref();
+      log3(`spawned daemon pid=${child.pid}`);
+    } finally {
+      closeSync(fd);
+    }
+  }
+  isPidFileStale() {
+    try {
+      const raw = readFileSync3(this.pidPath, "utf-8").trim();
+      const pid = Number(raw);
+      if (!pid || Number.isNaN(pid))
+        return true;
+      try {
+        process.kill(pid, 0);
+        return false;
+      } catch {
+        return true;
+      }
+    } catch {
+      return true;
+    }
+  }
+  async waitForSocket() {
+    const deadline = Date.now() + this.spawnWaitMs;
+    let delay = 30;
+    while (Date.now() < deadline) {
+      await sleep2(delay);
+      delay = Math.min(delay * 1.5, 300);
+      if (!existsSync4(this.socketPath))
+        continue;
+      try {
+        return await this.connectOnce();
+      } catch {
+      }
+    }
+    throw new Error("daemon did not become ready within spawnWaitMs");
+  }
+  sendAndWait(sock, req) {
+    return new Promise((resolve5, reject) => {
+      let buf = "";
+      const to3 = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("request timeout"));
+      }, this.timeoutMs);
+      sock.setEncoding("utf-8");
+      sock.on("data", (chunk) => {
+        buf += chunk;
+        const nl3 = buf.indexOf("\n");
+        if (nl3 === -1)
+          return;
+        const line = buf.slice(0, nl3);
+        clearTimeout(to3);
+        try {
+          resolve5(JSON.parse(line));
+        } catch (e6) {
+          reject(e6);
+        }
+      });
+      sock.on("error", (e6) => {
+        clearTimeout(to3);
+        reject(e6);
+      });
+      sock.write(JSON.stringify(req) + "\n");
+    });
+  }
+};
+function sleep2(ms3) {
+  return new Promise((r10) => setTimeout(r10, ms3));
+}
+
+// dist/src/embeddings/sql.js
+function embeddingSqlLiteral(vec) {
+  if (!vec || vec.length === 0)
+    return "NULL";
+  const parts = [];
+  for (const v27 of vec) {
+    if (!Number.isFinite(v27))
+      return "NULL";
+    parts.push(String(v27));
+  }
+  return `ARRAY[${parts.join(",")}]::float4[]`;
+}
+
 // dist/src/shell/deeplake-fs.js
 var BATCH_SIZE = 10;
 var PREFETCH_BATCH_SIZE = 50;
@@ -67513,6 +67800,9 @@ function normalizeSessionMessage(path2, message) {
   const raw = typeof message === "string" ? message : JSON.stringify(message);
   return normalizeContent(path2, raw);
 }
+function resolveEmbedDaemonPath() {
+  return join7(dirname4(fileURLToPath(import.meta.url)), "embeddings", "embed-daemon.js");
+}
 function joinSessionMessages(path2, messages) {
   return messages.map((message) => normalizeSessionMessage(path2, message)).join("\n");
 }
@@ -67542,6 +67832,8 @@ var DeeplakeFs = class _DeeplakeFs {
   // Paths that live in the sessions table (multi-row, read by concatenation)
   sessionPaths = /* @__PURE__ */ new Set();
   sessionsTable = null;
+  // Embedding client lazily created on first flush. Lives as long as the process.
+  embedClient = null;
   constructor(client, table, mountPoint) {
     this.client = client;
     this.table = table;
@@ -67635,7 +67927,8 @@ var DeeplakeFs = class _DeeplakeFs {
     }
     const rows = [...this.pending.values()];
     this.pending.clear();
-    const results = await Promise.allSettled(rows.map((r10) => this.upsertRow(r10)));
+    const embeddings = await this.computeEmbeddings(rows);
+    const results = await Promise.allSettled(rows.map((r10, i11) => this.upsertRow(r10, embeddings[i11])));
     let failures = 0;
     for (let i11 = 0; i11 < results.length; i11++) {
       if (results[i11].status === "rejected") {
@@ -67649,7 +67942,15 @@ var DeeplakeFs = class _DeeplakeFs {
       throw new Error(`flush: ${failures}/${rows.length} writes failed and were re-queued`);
     }
   }
-  async upsertRow(r10) {
+  async computeEmbeddings(rows) {
+    if (rows.length === 0)
+      return [];
+    if (!this.embedClient) {
+      this.embedClient = new EmbedClient({ daemonEntry: resolveEmbedDaemonPath() });
+    }
+    return Promise.all(rows.map((r10) => this.embedClient.embed(r10.contentText, "document")));
+  }
+  async upsertRow(r10, embedding) {
     const text = sqlStr(r10.contentText);
     const p22 = sqlStr(r10.path);
     const fname = sqlStr(r10.filename);
@@ -67657,8 +67958,9 @@ var DeeplakeFs = class _DeeplakeFs {
     const ts3 = (/* @__PURE__ */ new Date()).toISOString();
     const cd = r10.creationDate ?? ts3;
     const lud = r10.lastUpdateDate ?? ts3;
+    const embSql = embeddingSqlLiteral(embedding);
     if (this.flushed.has(r10.path)) {
-      let setClauses = `filename = '${fname}', summary = E'${text}', mime_type = '${mime}', size_bytes = ${r10.sizeBytes}, last_update_date = '${sqlStr(lud)}'`;
+      let setClauses = `filename = '${fname}', summary = E'${text}', summary_embedding = ${embSql}, mime_type = '${mime}', size_bytes = ${r10.sizeBytes}, last_update_date = '${sqlStr(lud)}'`;
       if (r10.project !== void 0)
         setClauses += `, project = '${sqlStr(r10.project)}'`;
       if (r10.description !== void 0)
@@ -67666,51 +67968,72 @@ var DeeplakeFs = class _DeeplakeFs {
       await this.client.query(`UPDATE "${this.table}" SET ${setClauses} WHERE path = '${p22}'`);
     } else {
       const id = randomUUID2();
-      const cols = "id, path, filename, summary, mime_type, size_bytes, creation_date, last_update_date" + (r10.project !== void 0 ? ", project" : "") + (r10.description !== void 0 ? ", description" : "");
-      const vals = `'${id}', '${p22}', '${fname}', E'${text}', '${mime}', ${r10.sizeBytes}, '${sqlStr(cd)}', '${sqlStr(lud)}'` + (r10.project !== void 0 ? `, '${sqlStr(r10.project)}'` : "") + (r10.description !== void 0 ? `, '${sqlStr(r10.description)}'` : "");
+      const cols = "id, path, filename, summary, summary_embedding, mime_type, size_bytes, creation_date, last_update_date" + (r10.project !== void 0 ? ", project" : "") + (r10.description !== void 0 ? ", description" : "");
+      const vals = `'${id}', '${p22}', '${fname}', E'${text}', ${embSql}, '${mime}', ${r10.sizeBytes}, '${sqlStr(cd)}', '${sqlStr(lud)}'` + (r10.project !== void 0 ? `, '${sqlStr(r10.project)}'` : "") + (r10.description !== void 0 ? `, '${sqlStr(r10.description)}'` : "");
       await this.client.query(`INSERT INTO "${this.table}" (${cols}) VALUES (${vals})`);
       this.flushed.add(r10.path);
     }
   }
   // ── Virtual index.md generation ────────────────────────────────────────────
   async generateVirtualIndex() {
-    const rows = await this.client.query(`SELECT path, project, description, creation_date, last_update_date FROM "${this.table}" WHERE path LIKE '${sqlStr("/summaries/")}%' ORDER BY last_update_date DESC`);
-    const sessionPathsByKey = /* @__PURE__ */ new Map();
-    for (const sp of this.sessionPaths) {
-      const hivemind = sp.match(/\/sessions\/[^/]+\/[^/]+_([^.]+)\.jsonl$/);
-      if (hivemind) {
-        sessionPathsByKey.set(hivemind[1], sp.slice(1));
-      } else {
-        const fname = sp.split("/").pop() ?? "";
-        const stem = fname.replace(/\.[^.]+$/, "");
-        if (stem)
-          sessionPathsByKey.set(stem, sp.slice(1));
+    const summaryRows = await this.client.query(`SELECT path, project, description, creation_date, last_update_date FROM "${this.table}" WHERE path LIKE '${sqlStr("/summaries/")}%' ORDER BY last_update_date DESC`);
+    let sessionRows = [];
+    if (this.sessionsTable) {
+      try {
+        sessionRows = await this.client.query(`SELECT path, MAX(description) AS description, MIN(creation_date) AS creation_date, MAX(last_update_date) AS last_update_date FROM "${this.sessionsTable}" WHERE path LIKE '${sqlStr("/sessions/")}%' GROUP BY path ORDER BY path`);
+      } catch {
+        sessionRows = [];
       }
     }
     const lines = [
       "# Session Index",
       "",
-      "List of all Claude Code sessions with summaries.",
-      "",
-      "| Session | Conversation | Created | Last Updated | Project | Description |",
-      "|---------|-------------|---------|--------------|---------|-------------|"
+      "Two sources are available. Consult the section relevant to the question.",
+      ""
     ];
-    for (const row of rows) {
-      const p22 = row["path"];
-      const match2 = p22.match(/\/summaries\/([^/]+)\/([^/]+)\.md$/);
-      if (!match2)
-        continue;
-      const summaryUser = match2[1];
-      const sessionId = match2[2];
-      const relPath = `summaries/${summaryUser}/${sessionId}.md`;
-      const baseName = sessionId.replace(/_summary$/, "");
-      const convPath = sessionPathsByKey.get(sessionId) ?? sessionPathsByKey.get(baseName);
-      const convLink = convPath ? `[messages](${convPath})` : "";
-      const project = row["project"] || "";
-      const description = row["description"] || "";
-      const creationDate = row["creation_date"] || "";
-      const lastUpdateDate = row["last_update_date"] || "";
-      lines.push(`| [${sessionId}](${relPath}) | ${convLink} | ${creationDate} | ${lastUpdateDate} | ${project} | ${description} |`);
+    lines.push("## memory");
+    lines.push("");
+    if (summaryRows.length === 0) {
+      lines.push("_(empty \u2014 no summaries ingested yet)_");
+    } else {
+      lines.push("AI-generated summaries per session. Read these first for topic-level overviews.");
+      lines.push("");
+      lines.push("| Session | Created | Last Updated | Project | Description |");
+      lines.push("|---------|---------|--------------|---------|-------------|");
+      for (const row of summaryRows) {
+        const p22 = row["path"];
+        const match2 = p22.match(/\/summaries\/([^/]+)\/([^/]+)\.md$/);
+        if (!match2)
+          continue;
+        const summaryUser = match2[1];
+        const sessionId = match2[2];
+        const relPath = `summaries/${summaryUser}/${sessionId}.md`;
+        const project = row["project"] || "";
+        const description = row["description"] || "";
+        const creationDate = row["creation_date"] || "";
+        const lastUpdateDate = row["last_update_date"] || "";
+        lines.push(`| [${sessionId}](${relPath}) | ${creationDate} | ${lastUpdateDate} | ${project} | ${description} |`);
+      }
+    }
+    lines.push("");
+    lines.push("## sessions");
+    lines.push("");
+    if (sessionRows.length === 0) {
+      lines.push("_(empty \u2014 no session records ingested yet)_");
+    } else {
+      lines.push("Raw session records (dialogue, tool calls). Read for exact detail / quotes.");
+      lines.push("");
+      lines.push("| Session | Created | Last Updated | Description |");
+      lines.push("|---------|---------|--------------|-------------|");
+      for (const row of sessionRows) {
+        const p22 = row["path"] || "";
+        const rel = p22.startsWith("/") ? p22.slice(1) : p22;
+        const filename = p22.split("/").pop() ?? p22;
+        const description = row["description"] || "";
+        const creationDate = row["creation_date"] || "";
+        const lastUpdateDate = row["last_update_date"] || "";
+        lines.push(`| [${filename}](${rel}) | ${creationDate} | ${lastUpdateDate} | ${description} |`);
+      }
     }
     lines.push("");
     return lines.join("\n");
@@ -69021,7 +69344,7 @@ function stripQuotes(val) {
 }
 
 // node_modules/yargs-parser/build/lib/index.js
-import { readFileSync as readFileSync3 } from "fs";
+import { readFileSync as readFileSync4 } from "fs";
 import { createRequire } from "node:module";
 var _a3;
 var _b;
@@ -69048,7 +69371,7 @@ var parser = new YargsParser({
     if (typeof require2 !== "undefined") {
       return require2(path2);
     } else if (path2.match(/\.json$/)) {
-      return JSON.parse(readFileSync3(path2, "utf8"));
+      return JSON.parse(readFileSync4(path2, "utf8"));
     } else {
       throw Error("only .json config files are supported in ESM");
     }
@@ -69067,6 +69390,33 @@ yargsParser.looksLikeNumber = looksLikeNumber;
 var lib_default = yargsParser;
 
 // dist/src/shell/grep-interceptor.js
+import { fileURLToPath as fileURLToPath2 } from "node:url";
+import { dirname as dirname5, join as join8 } from "node:path";
+var SEMANTIC_SEARCH_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false";
+var SEMANTIC_EMBED_TIMEOUT_MS = Number(process.env.HIVEMIND_SEMANTIC_EMBED_TIMEOUT_MS ?? "500");
+function resolveGrepEmbedDaemonPath() {
+  return join8(dirname5(fileURLToPath2(import.meta.url)), "..", "embeddings", "embed-daemon.js");
+}
+var sharedGrepEmbedClient = null;
+function getGrepEmbedClient() {
+  if (!sharedGrepEmbedClient) {
+    sharedGrepEmbedClient = new EmbedClient({
+      daemonEntry: resolveGrepEmbedDaemonPath(),
+      timeoutMs: SEMANTIC_EMBED_TIMEOUT_MS
+    });
+  }
+  return sharedGrepEmbedClient;
+}
+function patternIsSemanticFriendly(pattern, fixedString) {
+  if (!pattern || pattern.length < 2)
+    return false;
+  if (fixedString)
+    return true;
+  const metaMatches = pattern.match(/[|()\[\]{}+?^$\\]/g);
+  if (!metaMatches)
+    return true;
+  return metaMatches.length <= 1;
+}
 var MAX_FALLBACK_CANDIDATES = 500;
 function createGrepCommand(client, fs3, table, sessionsTable) {
   return Yi2("grep", async (args, ctx) => {
@@ -69108,12 +69458,21 @@ function createGrepCommand(client, fs3, table, sessionsTable) {
       filesOnly: Boolean(parsed.l || parsed["files-with-matches"]),
       countOnly: Boolean(parsed.c || parsed["count"])
     };
+    let queryEmbedding = null;
+    if (SEMANTIC_SEARCH_ENABLED && patternIsSemanticFriendly(pattern, matchParams.fixedString)) {
+      try {
+        queryEmbedding = await getGrepEmbedClient().embed(pattern, "query");
+      } catch {
+        queryEmbedding = null;
+      }
+    }
     let rows = [];
     try {
       const searchOptions = {
         ...buildGrepSearchOptions(matchParams, targets[0] ?? ctx.cwd),
         pathFilter: buildPathFilterForTargets(targets),
-        limit: 100
+        limit: 100,
+        queryEmbedding
       };
       const queryRows = await Promise.race([
         searchDeeplakeTables(client, table, sessionsTable ?? "sessions", searchOptions),
@@ -69123,6 +69482,21 @@ function createGrepCommand(client, fs3, table, sessionsTable) {
     } catch {
       rows = [];
     }
+    if (rows.length === 0 && queryEmbedding) {
+      try {
+        const lexicalOptions = {
+          ...buildGrepSearchOptions(matchParams, targets[0] ?? ctx.cwd),
+          pathFilter: buildPathFilterForTargets(targets),
+          limit: 100
+        };
+        const lexicalRows = await Promise.race([
+          searchDeeplakeTables(client, table, sessionsTable ?? "sessions", lexicalOptions),
+          new Promise((_16, reject) => setTimeout(() => reject(new Error("timeout")), 3e3))
+        ]);
+        rows.push(...lexicalRows);
+      } catch {
+      }
+    }
     const seen = /* @__PURE__ */ new Set();
     rows = rows.filter((r10) => seen.has(r10.path) ? false : (seen.add(r10.path), true));
     if (rows.length === 0) {
@@ -69136,7 +69510,19 @@ function createGrepCommand(client, fs3, table, sessionsTable) {
       }
     }
     const normalized = rows.map((r10) => ({ path: r10.path, content: normalizeContent(r10.path, r10.content) }));
-    const output = refineGrepMatches(normalized, matchParams);
+    let output;
+    if (queryEmbedding && queryEmbedding.length > 0 && process.env.HIVEMIND_SEMANTIC_EMIT_ALL !== "false") {
+      output = [];
+      for (const r10 of normalized) {
+        for (const line of r10.content.split("\n")) {
+          const trimmed = line.trim();
+          if (trimmed)
+            output.push(`${r10.path}:${line}`);
+        }
+      }
+    } else {
+      output = refineGrepMatches(normalized, matchParams);
+    }
     return {
       stdout: output.length > 0 ? output.join("\n") + "\n" : "",
       stderr: "",
diff --git a/codex/bundle/capture.js b/codex/bundle/capture.js
index 67b7919..10ecdb3 100755
--- a/codex/bundle/capture.js
+++ b/codex/bundle/capture.js
@@ -375,7 +375,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(tbl)) {
       log2(`table "${tbl}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', summary_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
@@ -386,7 +386,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(name)) {
       log2(`table "${name}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, message_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
diff --git a/codex/bundle/commands/auth-login.js b/codex/bundle/commands/auth-login.js
index 064f11e..ff51f9f 100755
--- a/codex/bundle/commands/auth-login.js
+++ b/codex/bundle/commands/auth-login.js
@@ -556,7 +556,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(tbl)) {
       log2(`table "${tbl}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', summary_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
@@ -567,7 +567,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(name)) {
       log2(`table "${name}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, message_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
diff --git a/codex/bundle/embeddings/embed-daemon.js b/codex/bundle/embeddings/embed-daemon.js
new file mode 100755
index 0000000..9437063
--- /dev/null
+++ b/codex/bundle/embeddings/embed-daemon.js
@@ -0,0 +1,240 @@
+#!/usr/bin/env node
+
+// dist/src/embeddings/daemon.js
+import { createServer } from "node:net";
+import { unlinkSync, writeFileSync, existsSync, mkdirSync, chmodSync } from "node:fs";
+
+// dist/src/embeddings/protocol.js
+var DEFAULT_SOCKET_DIR = "/tmp";
+var DEFAULT_MODEL_REPO = "nomic-ai/nomic-embed-text-v1.5";
+var DEFAULT_DTYPE = "q8";
+var DEFAULT_DIMS = 768;
+var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
+var DOC_PREFIX = "search_document: ";
+var QUERY_PREFIX = "search_query: ";
+function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.sock`;
+}
+function pidPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.pid`;
+}
+
+// dist/src/embeddings/nomic.js
+var NomicEmbedder = class {
+  pipeline = null;
+  loading = null;
+  repo;
+  dtype;
+  dims;
+  constructor(opts = {}) {
+    this.repo = opts.repo ?? DEFAULT_MODEL_REPO;
+    this.dtype = opts.dtype ?? DEFAULT_DTYPE;
+    this.dims = opts.dims ?? DEFAULT_DIMS;
+  }
+  async load() {
+    if (this.pipeline)
+      return;
+    if (this.loading)
+      return this.loading;
+    this.loading = (async () => {
+      const mod = await import("@huggingface/transformers");
+      mod.env.allowLocalModels = false;
+      mod.env.useFSCache = true;
+      this.pipeline = await mod.pipeline("feature-extraction", this.repo, { dtype: this.dtype });
+    })();
+    try {
+      await this.loading;
+    } finally {
+      this.loading = null;
+    }
+  }
+  addPrefix(text, kind) {
+    return (kind === "query" ? QUERY_PREFIX : DOC_PREFIX) + text;
+  }
+  async embed(text, kind = "document") {
+    await this.load();
+    if (!this.pipeline)
+      throw new Error("embedder not loaded");
+    const out = await this.pipeline(this.addPrefix(text, kind), { pooling: "mean", normalize: true });
+    const full = Array.from(out.data);
+    return this.truncate(full);
+  }
+  async embedBatch(texts, kind = "document") {
+    if (texts.length === 0)
+      return [];
+    await this.load();
+    if (!this.pipeline)
+      throw new Error("embedder not loaded");
+    const prefixed = texts.map((t) => this.addPrefix(t, kind));
+    const out = await this.pipeline(prefixed, { pooling: "mean", normalize: true });
+    const flat = Array.from(out.data);
+    const total = flat.length;
+    const full = total / texts.length;
+    const batches = [];
+    for (let i = 0; i < texts.length; i++) {
+      batches.push(this.truncate(flat.slice(i * full, (i + 1) * full)));
+    }
+    return batches;
+  }
+  truncate(vec) {
+    if (this.dims >= vec.length)
+      return vec;
+    const head = vec.slice(0, this.dims);
+    let norm = 0;
+    for (const v of head)
+      norm += v * v;
+    norm = Math.sqrt(norm);
+    if (norm === 0)
+      return head;
+    for (let i = 0; i < head.length; i++)
+      head[i] /= norm;
+    return head;
+  }
+};
+
+// dist/src/utils/debug.js
+import { appendFileSync } from "node:fs";
+import { join } from "node:path";
+import { homedir } from "node:os";
+var DEBUG = (process.env.HIVEMIND_DEBUG ?? process.env.DEEPLAKE_DEBUG) === "1";
+var LOG = join(homedir(), ".deeplake", "hook-debug.log");
+function log(tag, msg) {
+  if (!DEBUG)
+    return;
+  appendFileSync(LOG, `${(/* @__PURE__ */ new Date()).toISOString()} [${tag}] ${msg}
+`);
+}
+
+// dist/src/embeddings/daemon.js
+var log2 = (m) => log("embed-daemon", m);
+function getUid() {
+  const uid = typeof process.getuid === "function" ? process.getuid() : void 0;
+  return uid !== void 0 ? String(uid) : process.env.USER ?? "default";
+}
+var EmbedDaemon = class {
+  server = null;
+  embedder;
+  socketPath;
+  pidPath;
+  idleTimeoutMs;
+  idleTimer = null;
+  constructor(opts = {}) {
+    const uid = getUid();
+    const dir = opts.socketDir ?? "/tmp";
+    this.socketPath = socketPathFor(uid, dir);
+    this.pidPath = pidPathFor(uid, dir);
+    this.idleTimeoutMs = opts.idleTimeoutMs ?? DEFAULT_IDLE_TIMEOUT_MS;
+    this.embedder = new NomicEmbedder({ repo: opts.repo, dtype: opts.dtype, dims: opts.dims });
+  }
+  async start() {
+    mkdirSync(this.socketPath.replace(/\/[^/]+$/, ""), { recursive: true });
+    writeFileSync(this.pidPath, String(process.pid), { mode: 384 });
+    if (existsSync(this.socketPath)) {
+      try {
+        unlinkSync(this.socketPath);
+      } catch {
+      }
+    }
+    this.embedder.load().then(() => log2("model ready")).catch((e) => log2(`load err: ${e.message}`));
+    this.server = createServer((sock) => this.handleConnection(sock));
+    await new Promise((resolve, reject) => {
+      this.server.once("error", reject);
+      this.server.listen(this.socketPath, () => {
+        try {
+          chmodSync(this.socketPath, 384);
+        } catch {
+        }
+        log2(`listening on ${this.socketPath}`);
+        resolve();
+      });
+    });
+    this.resetIdleTimer();
+    process.on("SIGINT", () => this.shutdown());
+    process.on("SIGTERM", () => this.shutdown());
+  }
+  resetIdleTimer() {
+    if (this.idleTimer)
+      clearTimeout(this.idleTimer);
+    this.idleTimer = setTimeout(() => {
+      log2(`idle timeout ${this.idleTimeoutMs}ms reached, shutting down`);
+      this.shutdown();
+    }, this.idleTimeoutMs);
+    this.idleTimer.unref();
+  }
+  shutdown() {
+    try {
+      this.server?.close();
+    } catch {
+    }
+    try {
+      if (existsSync(this.socketPath))
+        unlinkSync(this.socketPath);
+    } catch {
+    }
+    try {
+      if (existsSync(this.pidPath))
+        unlinkSync(this.pidPath);
+    } catch {
+    }
+    process.exit(0);
+  }
+  handleConnection(sock) {
+    let buf = "";
+    sock.setEncoding("utf-8");
+    sock.on("data", (chunk) => {
+      buf += chunk;
+      let nl;
+      while ((nl = buf.indexOf("\n")) !== -1) {
+        const line = buf.slice(0, nl);
+        buf = buf.slice(nl + 1);
+        if (line.length === 0)
+          continue;
+        this.handleLine(sock, line);
+      }
+    });
+    sock.on("error", () => {
+    });
+  }
+  async handleLine(sock, line) {
+    this.resetIdleTimer();
+    let req;
+    try {
+      req = JSON.parse(line);
+    } catch {
+      return;
+    }
+    try {
+      const resp = await this.dispatch(req);
+      sock.write(JSON.stringify(resp) + "\n");
+    } catch (e) {
+      const err = e instanceof Error ? e.message : String(e);
+      const resp = { id: req.id, error: err };
+      sock.write(JSON.stringify(resp) + "\n");
+    }
+  }
+  async dispatch(req) {
+    if (req.op === "ping") {
+      const p = req;
+      return { id: p.id, ready: true, model: this.embedder.repo, dims: this.embedder.dims };
+    }
+    if (req.op === "embed") {
+      const e = req;
+      const vec = await this.embedder.embed(e.text, e.kind);
+      return { id: e.id, embedding: vec };
+    }
+    return { id: req.id, error: "unknown op" };
+  }
+};
+var invokedDirectly = import.meta.url === `file://${process.argv[1]}` || process.argv[1] && import.meta.url.endsWith(process.argv[1].split("/").pop() ?? "");
+if (invokedDirectly) {
+  const dims = process.env.HIVEMIND_EMBED_DIMS ? Number(process.env.HIVEMIND_EMBED_DIMS) : void 0;
+  const idleTimeoutMs = process.env.HIVEMIND_EMBED_IDLE_MS ? Number(process.env.HIVEMIND_EMBED_IDLE_MS) : void 0;
+  const d = new EmbedDaemon({ dims, idleTimeoutMs });
+  d.start().catch((e) => {
+    log2(`fatal: ${e.message}`);
+    process.exit(1);
+  });
+}
+export {
+  EmbedDaemon
+};
diff --git a/codex/bundle/pre-tool-use.js b/codex/bundle/pre-tool-use.js
index 997faff..851e257 100755
--- a/codex/bundle/pre-tool-use.js
+++ b/codex/bundle/pre-tool-use.js
@@ -2,9 +2,9 @@
 
 // dist/src/hooks/codex/pre-tool-use.js
 import { execFileSync } from "node:child_process";
-import { existsSync as existsSync3 } from "node:fs";
-import { join as join6, dirname } from "node:path";
-import { fileURLToPath as fileURLToPath2 } from "node:url";
+import { existsSync as existsSync4 } from "node:fs";
+import { join as join7, dirname as dirname2 } from "node:path";
+import { fileURLToPath as fileURLToPath3 } from "node:url";
 
 // dist/src/utils/stdin.js
 function readStdin() {
@@ -381,7 +381,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(tbl)) {
       log2(`table "${tbl}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', summary_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
@@ -392,7 +392,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(name)) {
       log2(`table "${name}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, message_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
@@ -565,24 +565,25 @@ function normalizeContent(path, raw) {
     return raw;
   }
   if (Array.isArray(obj.turns)) {
-    const header = [];
-    if (obj.date_time)
-      header.push(`date: ${obj.date_time}`);
-    if (obj.speakers) {
-      const s = obj.speakers;
-      const names = [s.speaker_a, s.speaker_b].filter(Boolean).join(", ");
-      if (names)
-        header.push(`speakers: ${names}`);
-    }
+    const dateHeader = obj.date_time ? `(${String(obj.date_time)}) ` : "";
     const lines = obj.turns.map((t) => {
       const sp = String(t?.speaker ?? t?.name ?? "?").trim();
       const tx = String(t?.text ?? t?.content ?? "").replace(/\s+/g, " ").trim();
       const tag = t?.dia_id ? `[${t.dia_id}] ` : "";
-      return `${tag}${sp}: ${tx}`;
+      return `${dateHeader}${tag}${sp}: ${tx}`;
     });
-    const out2 = [...header, ...lines].join("\n");
+    const out2 = lines.join("\n");
     return out2.trim() ? out2 : raw;
   }
+  if (obj.turn && typeof obj.turn === "object" && !Array.isArray(obj.turn)) {
+    const t = obj.turn;
+    const sp = String(t.speaker ?? t.name ?? "?").trim();
+    const tx = String(t.text ?? t.content ?? "").replace(/\s+/g, " ").trim();
+    const tag = t.dia_id ? `[${String(t.dia_id)}] ` : "";
+    const dateHeader = obj.date_time ? `(${String(obj.date_time)}) ` : "";
+    const line = `${dateHeader}${tag}${sp}: ${tx}`;
+    return line.trim() ? line : raw;
+  }
   const stripRecalled = (t) => {
     const i = t.indexOf("<recalled-memories>");
     if (i === -1)
@@ -625,8 +626,38 @@ function buildPathCondition(targetPath) {
   return `(path = '${sqlStr(clean)}' OR path LIKE '${sqlLike(clean)}/%' ESCAPE '\\')`;
 }
 async function searchDeeplakeTables(api, memoryTable, sessionsTable, opts) {
-  const { pathFilter, contentScanOnly, likeOp, escapedPattern, prefilterPattern, prefilterPatterns } = opts;
+  const { pathFilter, contentScanOnly, likeOp, escapedPattern, prefilterPattern, prefilterPatterns, queryEmbedding, bm25Term } = opts;
   const limit = opts.limit ?? 100;
+  if (queryEmbedding && queryEmbedding.length > 0) {
+    const vecLit = serializeFloat4Array(queryEmbedding);
+    const semanticLimit = Math.min(limit, Number(process.env.HIVEMIND_SEMANTIC_LIMIT ?? "20"));
+    const lexicalLimit = Math.min(limit, Number(process.env.HIVEMIND_HYBRID_LEXICAL_LIMIT ?? "20"));
+    const filterPatternsForLex = contentScanOnly ? prefilterPatterns && prefilterPatterns.length > 0 ? prefilterPatterns : prefilterPattern ? [prefilterPattern] : [] : [escapedPattern];
+    const memLexFilter = buildContentFilter("summary::text", likeOp, filterPatternsForLex);
+    const sessLexFilter = buildContentFilter("message::text", likeOp, filterPatternsForLex);
+    const memLexQuery = memLexFilter ? `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, 1.0 AS score FROM "${memoryTable}" WHERE 1=1${pathFilter}${memLexFilter} LIMIT ${lexicalLimit}` : null;
+    const sessLexQuery = sessLexFilter ? `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, 1.0 AS score FROM "${sessionsTable}" WHERE 1=1${pathFilter}${sessLexFilter} LIMIT ${lexicalLimit}` : null;
+    const memSemQuery = `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, (summary_embedding <#> ${vecLit}) AS score FROM "${memoryTable}" WHERE summary_embedding IS NOT NULL${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
+    const sessSemQuery = `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, (message_embedding <#> ${vecLit}) AS score FROM "${sessionsTable}" WHERE message_embedding IS NOT NULL${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
+    const parts = [memSemQuery, sessSemQuery];
+    if (memLexQuery)
+      parts.push(memLexQuery);
+    if (sessLexQuery)
+      parts.push(sessLexQuery);
+    const unionSql = parts.map((q) => `(${q})`).join(" UNION ALL ");
+    const outerLimit = semanticLimit + lexicalLimit;
+    const rows2 = await api.query(`SELECT path, content, source_order, creation_date, score FROM (` + unionSql + `) AS combined ORDER BY score DESC LIMIT ${outerLimit}`);
+    const seen = /* @__PURE__ */ new Set();
+    const unique = [];
+    for (const row of rows2) {
+      const p = String(row["path"]);
+      if (seen.has(p))
+        continue;
+      seen.add(p);
+      unique.push({ path: p, content: String(row["content"] ?? "") });
+    }
+    return unique;
+  }
   const filterPatterns = contentScanOnly ? prefilterPatterns && prefilterPatterns.length > 0 ? prefilterPatterns : prefilterPattern ? [prefilterPattern] : [] : [escapedPattern];
   const memFilter = buildContentFilter("summary::text", likeOp, filterPatterns);
   const sessFilter = buildContentFilter("message::text", likeOp, filterPatterns);
@@ -638,6 +669,15 @@ async function searchDeeplakeTables(api, memoryTable, sessionsTable, opts) {
     content: String(row["content"] ?? "")
   }));
 }
+function serializeFloat4Array(vec) {
+  const parts = [];
+  for (const v of vec) {
+    if (!Number.isFinite(v))
+      return "NULL";
+    parts.push(String(v));
+  }
+  return `ARRAY[${parts.join(",")}]::float4[]`;
+}
 function buildPathFilter(targetPath) {
   const condition = buildPathCondition(targetPath);
   return condition ? ` AND ${condition}` : "";
@@ -716,13 +756,24 @@ function buildGrepSearchOptions(params, targetPath) {
   const hasRegexMeta = !params.fixedString && /[.*+?^${}()|[\]\\]/.test(params.pattern);
   const literalPrefilter = hasRegexMeta ? extractRegexLiteralPrefilter(params.pattern) : null;
   const alternationPrefilters = hasRegexMeta ? extractRegexAlternationPrefilters(params.pattern) : null;
+  let bm25Term;
+  if (!hasRegexMeta) {
+    bm25Term = params.pattern;
+  } else if (alternationPrefilters && alternationPrefilters.length > 0) {
+    bm25Term = alternationPrefilters.join(" ");
+  } else if (literalPrefilter) {
+    bm25Term = literalPrefilter;
+  }
   return {
     pathFilter: buildPathFilter(targetPath),
     contentScanOnly: hasRegexMeta,
-    likeOp: params.ignoreCase ? "ILIKE" : "LIKE",
+    // Kept for the pure-lexical fallback path and existing tests; BM25 is now
+    // the preferred lexical ranker when a term can be extracted.
+    likeOp: process.env.HIVEMIND_GREP_LIKE === "case-sensitive" ? "LIKE" : "ILIKE",
     escapedPattern: sqlLike(params.pattern),
     prefilterPattern: literalPrefilter ? sqlLike(literalPrefilter) : void 0,
-    prefilterPatterns: alternationPrefilters?.map((literal) => sqlLike(literal))
+    prefilterPatterns: alternationPrefilters?.map((literal) => sqlLike(literal)),
+    bm25Term
   };
 }
 function buildContentFilter(column, likeOp, patterns) {
@@ -773,11 +824,28 @@ function refineGrepMatches(rows, params, forceMultiFilePrefix) {
   }
   return output;
 }
-async function grepBothTables(api, memoryTable, sessionsTable, params, targetPath) {
-  const rows = await searchDeeplakeTables(api, memoryTable, sessionsTable, buildGrepSearchOptions(params, targetPath));
+async function grepBothTables(api, memoryTable, sessionsTable, params, targetPath, queryEmbedding) {
+  const rows = await searchDeeplakeTables(api, memoryTable, sessionsTable, {
+    ...buildGrepSearchOptions(params, targetPath),
+    queryEmbedding
+  });
   const seen = /* @__PURE__ */ new Set();
   const unique = rows.filter((r) => seen.has(r.path) ? false : (seen.add(r.path), true));
   const normalized = unique.map((r) => ({ path: r.path, content: normalizeContent(r.path, r.content) }));
+  if (queryEmbedding && queryEmbedding.length > 0) {
+    const emitAllLines = process.env.HIVEMIND_SEMANTIC_EMIT_ALL !== "false";
+    if (emitAllLines) {
+      const lines = [];
+      for (const r of normalized) {
+        for (const line of r.content.split("\n")) {
+          const trimmed = line.trim();
+          if (trimmed)
+            lines.push(`${r.path}:${line}`);
+        }
+      }
+      return lines;
+    }
+  }
   return refineGrepMatches(normalized, params);
 }
 
@@ -817,7 +885,255 @@ function capOutputForClaude(output, options = {}) {
   return keptLines.join("\n") + footer;
 }
 
+// dist/src/embeddings/client.js
+import { connect } from "node:net";
+import { spawn } from "node:child_process";
+import { openSync, closeSync, writeSync, unlinkSync, existsSync as existsSync3, readFileSync as readFileSync3 } from "node:fs";
+
+// dist/src/embeddings/protocol.js
+var DEFAULT_SOCKET_DIR = "/tmp";
+var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
+var DEFAULT_CLIENT_TIMEOUT_MS = 200;
+function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.sock`;
+}
+function pidPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.pid`;
+}
+
+// dist/src/embeddings/client.js
+var log3 = (m) => log("embed-client", m);
+function getUid() {
+  const uid = typeof process.getuid === "function" ? process.getuid() : void 0;
+  return uid !== void 0 ? String(uid) : process.env.USER ?? "default";
+}
+var EmbedClient = class {
+  socketPath;
+  pidPath;
+  timeoutMs;
+  daemonEntry;
+  autoSpawn;
+  spawnWaitMs;
+  nextId = 0;
+  constructor(opts = {}) {
+    const uid = getUid();
+    const dir = opts.socketDir ?? "/tmp";
+    this.socketPath = socketPathFor(uid, dir);
+    this.pidPath = pidPathFor(uid, dir);
+    this.timeoutMs = opts.timeoutMs ?? DEFAULT_CLIENT_TIMEOUT_MS;
+    this.daemonEntry = opts.daemonEntry ?? process.env.HIVEMIND_EMBED_DAEMON;
+    this.autoSpawn = opts.autoSpawn ?? true;
+    this.spawnWaitMs = opts.spawnWaitMs ?? 5e3;
+  }
+  /**
+   * Returns an embedding vector, or null on timeout/failure. Hooks MUST treat
+   * null as "skip embedding column" — never block the write path on us.
+   *
+   * Fire-and-forget spawn on miss: if the daemon isn't up, this call returns
+   * null AND kicks off a background spawn. The next call finds a ready daemon.
+   */
+  async embed(text, kind = "document") {
+    let sock;
+    try {
+      sock = await this.connectOnce();
+    } catch {
+      if (this.autoSpawn)
+        this.trySpawnDaemon();
+      return null;
+    }
+    try {
+      const id = String(++this.nextId);
+      const req = { op: "embed", id, kind, text };
+      const resp = await this.sendAndWait(sock, req);
+      if (resp.error || !("embedding" in resp) || !resp.embedding) {
+        log3(`embed err: ${resp.error ?? "no embedding"}`);
+        return null;
+      }
+      return resp.embedding;
+    } catch (e) {
+      const err = e instanceof Error ? e.message : String(e);
+      log3(`embed failed: ${err}`);
+      return null;
+    } finally {
+      try {
+        sock.end();
+      } catch {
+      }
+    }
+  }
+  /**
+   * Wait up to spawnWaitMs for the daemon to accept connections, spawning if
+   * necessary. Meant for SessionStart / long-running batches — not the hot path.
+   */
+  async warmup() {
+    try {
+      const s = await this.connectOnce();
+      s.end();
+      return true;
+    } catch {
+      if (!this.autoSpawn)
+        return false;
+      this.trySpawnDaemon();
+      try {
+        const s = await this.waitForSocket();
+        s.end();
+        return true;
+      } catch {
+        return false;
+      }
+    }
+  }
+  connectOnce() {
+    return new Promise((resolve2, reject) => {
+      const sock = connect(this.socketPath);
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("connect timeout"));
+      }, this.timeoutMs);
+      sock.once("connect", () => {
+        clearTimeout(to);
+        resolve2(sock);
+      });
+      sock.once("error", (e) => {
+        clearTimeout(to);
+        reject(e);
+      });
+    });
+  }
+  trySpawnDaemon() {
+    let fd;
+    try {
+      fd = openSync(this.pidPath, "wx", 384);
+      writeSync(fd, String(process.pid));
+    } catch (e) {
+      if (this.isPidFileStale()) {
+        try {
+          unlinkSync(this.pidPath);
+        } catch {
+        }
+        try {
+          fd = openSync(this.pidPath, "wx", 384);
+          writeSync(fd, String(process.pid));
+        } catch {
+          return;
+        }
+      } else {
+        return;
+      }
+    }
+    if (!this.daemonEntry || !existsSync3(this.daemonEntry)) {
+      log3(`daemonEntry not configured or missing: ${this.daemonEntry}`);
+      try {
+        closeSync(fd);
+        unlinkSync(this.pidPath);
+      } catch {
+      }
+      return;
+    }
+    try {
+      const child = spawn(process.execPath, [this.daemonEntry], {
+        detached: true,
+        stdio: "ignore",
+        env: process.env
+      });
+      child.unref();
+      log3(`spawned daemon pid=${child.pid}`);
+    } finally {
+      closeSync(fd);
+    }
+  }
+  isPidFileStale() {
+    try {
+      const raw = readFileSync3(this.pidPath, "utf-8").trim();
+      const pid = Number(raw);
+      if (!pid || Number.isNaN(pid))
+        return true;
+      try {
+        process.kill(pid, 0);
+        return false;
+      } catch {
+        return true;
+      }
+    } catch {
+      return true;
+    }
+  }
+  async waitForSocket() {
+    const deadline = Date.now() + this.spawnWaitMs;
+    let delay = 30;
+    while (Date.now() < deadline) {
+      await sleep2(delay);
+      delay = Math.min(delay * 1.5, 300);
+      if (!existsSync3(this.socketPath))
+        continue;
+      try {
+        return await this.connectOnce();
+      } catch {
+      }
+    }
+    throw new Error("daemon did not become ready within spawnWaitMs");
+  }
+  sendAndWait(sock, req) {
+    return new Promise((resolve2, reject) => {
+      let buf = "";
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("request timeout"));
+      }, this.timeoutMs);
+      sock.setEncoding("utf-8");
+      sock.on("data", (chunk) => {
+        buf += chunk;
+        const nl = buf.indexOf("\n");
+        if (nl === -1)
+          return;
+        const line = buf.slice(0, nl);
+        clearTimeout(to);
+        try {
+          resolve2(JSON.parse(line));
+        } catch (e) {
+          reject(e);
+        }
+      });
+      sock.on("error", (e) => {
+        clearTimeout(to);
+        reject(e);
+      });
+      sock.write(JSON.stringify(req) + "\n");
+    });
+  }
+};
+function sleep2(ms) {
+  return new Promise((r) => setTimeout(r, ms));
+}
+
 // dist/src/hooks/grep-direct.js
+import { fileURLToPath } from "node:url";
+import { dirname, join as join4 } from "node:path";
+var SEMANTIC_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false";
+var SEMANTIC_TIMEOUT_MS = Number(process.env.HIVEMIND_SEMANTIC_EMBED_TIMEOUT_MS ?? "500");
+function resolveDaemonPath() {
+  return join4(dirname(fileURLToPath(import.meta.url)), "..", "embeddings", "embed-daemon.js");
+}
+var sharedEmbedClient = null;
+function getEmbedClient() {
+  if (!sharedEmbedClient) {
+    sharedEmbedClient = new EmbedClient({
+      daemonEntry: resolveDaemonPath(),
+      timeoutMs: SEMANTIC_TIMEOUT_MS
+    });
+  }
+  return sharedEmbedClient;
+}
+function patternIsSemanticFriendly(pattern, fixedString) {
+  if (!pattern || pattern.length < 2)
+    return false;
+  if (fixedString)
+    return true;
+  const meta = pattern.match(/[|()\[\]{}+?^$\\]/g);
+  if (!meta)
+    return true;
+  return meta.length <= 1;
+}
 function splitFirstPipelineStage(cmd) {
   const input = cmd.trim();
   let quote = null;
@@ -1055,7 +1371,15 @@ async function handleGrepDirect(api, table, sessionsTable, params) {
     invertMatch: params.invertMatch,
     fixedString: params.fixedString
   };
-  const output = await grepBothTables(api, table, sessionsTable, matchParams, params.targetPath);
+  let queryEmbedding = null;
+  if (SEMANTIC_ENABLED && patternIsSemanticFriendly(params.pattern, params.fixedString)) {
+    try {
+      queryEmbedding = await getEmbedClient().embed(params.pattern, "query");
+    } catch {
+      queryEmbedding = null;
+    }
+  }
+  const output = await grepBothTables(api, table, sessionsTable, matchParams, params.targetPath, queryEmbedding);
   const joined = output.join("\n") || "(no matches)";
   return capOutputForClaude(joined, { kind: "grep" });
 }
@@ -1676,20 +2000,20 @@ async function executeCompiledBashCommand(api, memoryTable, sessionsTable, cmd,
 }
 
 // dist/src/hooks/query-cache.js
-import { mkdirSync as mkdirSync2, readFileSync as readFileSync3, rmSync, writeFileSync as writeFileSync2 } from "node:fs";
-import { join as join4 } from "node:path";
+import { mkdirSync as mkdirSync2, readFileSync as readFileSync4, rmSync, writeFileSync as writeFileSync2 } from "node:fs";
+import { join as join5 } from "node:path";
 import { homedir as homedir3 } from "node:os";
-var log3 = (msg) => log("query-cache", msg);
-var DEFAULT_CACHE_ROOT = join4(homedir3(), ".deeplake", "query-cache");
+var log4 = (msg) => log("query-cache", msg);
+var DEFAULT_CACHE_ROOT = join5(homedir3(), ".deeplake", "query-cache");
 var INDEX_CACHE_FILE = "index.md";
 function getSessionQueryCacheDir(sessionId, deps = {}) {
   const { cacheRoot = DEFAULT_CACHE_ROOT } = deps;
-  return join4(cacheRoot, sessionId);
+  return join5(cacheRoot, sessionId);
 }
 function readCachedIndexContent(sessionId, deps = {}) {
-  const { logFn = log3 } = deps;
+  const { logFn = log4 } = deps;
   try {
-    return readFileSync3(join4(getSessionQueryCacheDir(sessionId, deps), INDEX_CACHE_FILE), "utf-8");
+    return readFileSync4(join5(getSessionQueryCacheDir(sessionId, deps), INDEX_CACHE_FILE), "utf-8");
   } catch (e) {
     if (e?.code === "ENOENT")
       return null;
@@ -1698,11 +2022,11 @@ function readCachedIndexContent(sessionId, deps = {}) {
   }
 }
 function writeCachedIndexContent(sessionId, content, deps = {}) {
-  const { logFn = log3 } = deps;
+  const { logFn = log4 } = deps;
   try {
     const dir = getSessionQueryCacheDir(sessionId, deps);
     mkdirSync2(dir, { recursive: true });
-    writeFileSync2(join4(dir, INDEX_CACHE_FILE), content, "utf-8");
+    writeFileSync2(join5(dir, INDEX_CACHE_FILE), content, "utf-8");
   } catch (e) {
     logFn(`write failed for session=${sessionId}: ${e.message}`);
   }
@@ -1710,13 +2034,13 @@ function writeCachedIndexContent(sessionId, content, deps = {}) {
 
 // dist/src/utils/direct-run.js
 import { resolve } from "node:path";
-import { fileURLToPath } from "node:url";
+import { fileURLToPath as fileURLToPath2 } from "node:url";
 function isDirectRun(metaUrl) {
   const entry = process.argv[1];
   if (!entry)
     return false;
   try {
-    return resolve(fileURLToPath(metaUrl)) === resolve(entry);
+    return resolve(fileURLToPath2(metaUrl)) === resolve(entry);
   } catch {
     return false;
   }
@@ -1724,8 +2048,8 @@ function isDirectRun(metaUrl) {
 
 // dist/src/hooks/memory-path-utils.js
 import { homedir as homedir4 } from "node:os";
-import { join as join5 } from "node:path";
-var MEMORY_PATH = join5(homedir4(), ".deeplake", "memory");
+import { join as join6 } from "node:path";
+var MEMORY_PATH = join6(homedir4(), ".deeplake", "memory");
 var TILDE_PATH = "~/.deeplake/memory";
 var HOME_VAR_PATH = "$HOME/.deeplake/memory";
 var SAFE_BUILTINS = /* @__PURE__ */ new Set([
@@ -1841,13 +2165,13 @@ function rewritePaths(cmd) {
 }
 
 // dist/src/hooks/codex/pre-tool-use.js
-var log4 = (msg) => log("codex-pre", msg);
-var __bundleDir = dirname(fileURLToPath2(import.meta.url));
-var SHELL_BUNDLE = existsSync3(join6(__bundleDir, "shell", "deeplake-shell.js")) ? join6(__bundleDir, "shell", "deeplake-shell.js") : join6(__bundleDir, "..", "shell", "deeplake-shell.js");
+var log5 = (msg) => log("codex-pre", msg);
+var __bundleDir = dirname2(fileURLToPath3(import.meta.url));
+var SHELL_BUNDLE = existsSync4(join7(__bundleDir, "shell", "deeplake-shell.js")) ? join7(__bundleDir, "shell", "deeplake-shell.js") : join7(__bundleDir, "..", "shell", "deeplake-shell.js");
 function buildUnsupportedGuidance() {
   return "This command is not supported for ~/.deeplake/memory/ operations. Only bash builtins are available: cat, ls, grep, echo, jq, head, tail, sed, awk, wc, sort, find, etc. Do NOT use python, python3, node, curl, or other interpreters. Rewrite your command using only bash tools and retry.";
 }
-function runVirtualShell(cmd, shellBundle = SHELL_BUNDLE, logFn = log4) {
+function runVirtualShell(cmd, shellBundle = SHELL_BUNDLE, logFn = log5) {
   try {
     return execFileSync("node", [shellBundle, "-c", cmd], {
       encoding: "utf-8",
@@ -1872,7 +2196,7 @@ function buildIndexContent(rows) {
   return lines.join("\n");
 }
 async function processCodexPreToolUse(input, deps = {}) {
-  const { config = loadConfig(), createApi = (table, activeConfig) => new DeeplakeApi(activeConfig.token, activeConfig.apiUrl, activeConfig.orgId, activeConfig.workspaceId, table), executeCompiledBashCommandFn = executeCompiledBashCommand, readVirtualPathContentsFn = readVirtualPathContents, readVirtualPathContentFn = readVirtualPathContent, listVirtualPathRowsFn = listVirtualPathRows, findVirtualPathsFn = findVirtualPaths, handleGrepDirectFn = handleGrepDirect, readCachedIndexContentFn = readCachedIndexContent, writeCachedIndexContentFn = writeCachedIndexContent, runVirtualShellFn = runVirtualShell, shellBundle = SHELL_BUNDLE, logFn = log4 } = deps;
+  const { config = loadConfig(), createApi = (table, activeConfig) => new DeeplakeApi(activeConfig.token, activeConfig.apiUrl, activeConfig.orgId, activeConfig.workspaceId, table), executeCompiledBashCommandFn = executeCompiledBashCommand, readVirtualPathContentsFn = readVirtualPathContents, readVirtualPathContentFn = readVirtualPathContent, listVirtualPathRowsFn = listVirtualPathRows, findVirtualPathsFn = findVirtualPaths, handleGrepDirectFn = handleGrepDirect, readCachedIndexContentFn = readCachedIndexContent, writeCachedIndexContentFn = writeCachedIndexContent, runVirtualShellFn = runVirtualShell, shellBundle = SHELL_BUNDLE, logFn = log5 } = deps;
   const cmd = input.tool_input?.command ?? "";
   logFn(`hook fired: cmd=${cmd}`);
   if (!touchesMemory(cmd))
@@ -2082,7 +2406,7 @@ async function main() {
 }
 if (isDirectRun(import.meta.url)) {
   main().catch((e) => {
-    log4(`fatal: ${e.message}`);
+    log5(`fatal: ${e.message}`);
     process.exit(0);
   });
 }
diff --git a/codex/bundle/session-start-setup.js b/codex/bundle/session-start-setup.js
index 21609fa..a1761f3 100755
--- a/codex/bundle/session-start-setup.js
+++ b/codex/bundle/session-start-setup.js
@@ -386,7 +386,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(tbl)) {
       log2(`table "${tbl}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', summary_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
@@ -397,7 +397,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(name)) {
       log2(`table "${name}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, message_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
diff --git a/codex/bundle/shell/deeplake-shell.js b/codex/bundle/shell/deeplake-shell.js
index 0793149..eecc463 100755
--- a/codex/bundle/shell/deeplake-shell.js
+++ b/codex/bundle/shell/deeplake-shell.js
@@ -46081,14 +46081,14 @@ var require_turndown_cjs = __commonJS({
         } else if (node.nodeType === 1) {
           replacement = replacementForNode.call(self2, node);
         }
-        return join7(output, replacement);
+        return join9(output, replacement);
       }, "");
     }
     function postProcess(output) {
       var self2 = this;
       this.rules.forEach(function(rule) {
         if (typeof rule.append === "function") {
-          output = join7(output, rule.append(self2.options));
+          output = join9(output, rule.append(self2.options));
         }
       });
       return output.replace(/^[\t\r\n]+/, "").replace(/[\t\r\n\s]+$/, "");
@@ -46100,7 +46100,7 @@ var require_turndown_cjs = __commonJS({
       if (whitespace.leading || whitespace.trailing) content = content.trim();
       return whitespace.leading + rule.replacement(content, node, this.options) + whitespace.trailing;
     }
-    function join7(output, replacement) {
+    function join9(output, replacement) {
       var s12 = trimTrailingNewlines(output);
       var s22 = trimLeadingNewlines(replacement);
       var nls = Math.max(output.length - s12.length, replacement.length - s22.length);
@@ -67078,7 +67078,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(tbl)) {
       log2(`table "${tbl}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', summary_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
@@ -67089,7 +67089,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(name)) {
       log2(`table "${name}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, message_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
@@ -67101,6 +67101,8 @@ var DeeplakeApi = class {
 // dist/src/shell/deeplake-fs.js
 import { basename as basename4, posix } from "node:path";
 import { randomUUID as randomUUID2 } from "node:crypto";
+import { fileURLToPath } from "node:url";
+import { dirname as dirname4, join as join7 } from "node:path";
 
 // dist/src/shell/grep-core.js
 var TOOL_INPUT_FIELDS = [
@@ -67266,24 +67268,25 @@ function normalizeContent(path2, raw) {
     return raw;
   }
   if (Array.isArray(obj.turns)) {
-    const header = [];
-    if (obj.date_time)
-      header.push(`date: ${obj.date_time}`);
-    if (obj.speakers) {
-      const s10 = obj.speakers;
-      const names = [s10.speaker_a, s10.speaker_b].filter(Boolean).join(", ");
-      if (names)
-        header.push(`speakers: ${names}`);
-    }
+    const dateHeader = obj.date_time ? `(${String(obj.date_time)}) ` : "";
     const lines = obj.turns.map((t6) => {
       const sp = String(t6?.speaker ?? t6?.name ?? "?").trim();
       const tx = String(t6?.text ?? t6?.content ?? "").replace(/\s+/g, " ").trim();
       const tag = t6?.dia_id ? `[${t6.dia_id}] ` : "";
-      return `${tag}${sp}: ${tx}`;
+      return `${dateHeader}${tag}${sp}: ${tx}`;
     });
-    const out2 = [...header, ...lines].join("\n");
+    const out2 = lines.join("\n");
     return out2.trim() ? out2 : raw;
   }
+  if (obj.turn && typeof obj.turn === "object" && !Array.isArray(obj.turn)) {
+    const t6 = obj.turn;
+    const sp = String(t6.speaker ?? t6.name ?? "?").trim();
+    const tx = String(t6.text ?? t6.content ?? "").replace(/\s+/g, " ").trim();
+    const tag = t6.dia_id ? `[${String(t6.dia_id)}] ` : "";
+    const dateHeader = obj.date_time ? `(${String(obj.date_time)}) ` : "";
+    const line = `${dateHeader}${tag}${sp}: ${tx}`;
+    return line.trim() ? line : raw;
+  }
   const stripRecalled = (t6) => {
     const i11 = t6.indexOf("<recalled-memories>");
     if (i11 === -1)
@@ -67326,8 +67329,38 @@ function buildPathCondition(targetPath) {
   return `(path = '${sqlStr(clean)}' OR path LIKE '${sqlLike(clean)}/%' ESCAPE '\\')`;
 }
 async function searchDeeplakeTables(api, memoryTable, sessionsTable, opts) {
-  const { pathFilter, contentScanOnly, likeOp, escapedPattern, prefilterPattern, prefilterPatterns } = opts;
+  const { pathFilter, contentScanOnly, likeOp, escapedPattern, prefilterPattern, prefilterPatterns, queryEmbedding, bm25Term } = opts;
   const limit = opts.limit ?? 100;
+  if (queryEmbedding && queryEmbedding.length > 0) {
+    const vecLit = serializeFloat4Array(queryEmbedding);
+    const semanticLimit = Math.min(limit, Number(process.env.HIVEMIND_SEMANTIC_LIMIT ?? "20"));
+    const lexicalLimit = Math.min(limit, Number(process.env.HIVEMIND_HYBRID_LEXICAL_LIMIT ?? "20"));
+    const filterPatternsForLex = contentScanOnly ? prefilterPatterns && prefilterPatterns.length > 0 ? prefilterPatterns : prefilterPattern ? [prefilterPattern] : [] : [escapedPattern];
+    const memLexFilter = buildContentFilter("summary::text", likeOp, filterPatternsForLex);
+    const sessLexFilter = buildContentFilter("message::text", likeOp, filterPatternsForLex);
+    const memLexQuery = memLexFilter ? `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, 1.0 AS score FROM "${memoryTable}" WHERE 1=1${pathFilter}${memLexFilter} LIMIT ${lexicalLimit}` : null;
+    const sessLexQuery = sessLexFilter ? `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, 1.0 AS score FROM "${sessionsTable}" WHERE 1=1${pathFilter}${sessLexFilter} LIMIT ${lexicalLimit}` : null;
+    const memSemQuery = `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, (summary_embedding <#> ${vecLit}) AS score FROM "${memoryTable}" WHERE summary_embedding IS NOT NULL${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
+    const sessSemQuery = `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, (message_embedding <#> ${vecLit}) AS score FROM "${sessionsTable}" WHERE message_embedding IS NOT NULL${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
+    const parts = [memSemQuery, sessSemQuery];
+    if (memLexQuery)
+      parts.push(memLexQuery);
+    if (sessLexQuery)
+      parts.push(sessLexQuery);
+    const unionSql = parts.map((q17) => `(${q17})`).join(" UNION ALL ");
+    const outerLimit = semanticLimit + lexicalLimit;
+    const rows2 = await api.query(`SELECT path, content, source_order, creation_date, score FROM (` + unionSql + `) AS combined ORDER BY score DESC LIMIT ${outerLimit}`);
+    const seen = /* @__PURE__ */ new Set();
+    const unique = [];
+    for (const row of rows2) {
+      const p22 = String(row["path"]);
+      if (seen.has(p22))
+        continue;
+      seen.add(p22);
+      unique.push({ path: p22, content: String(row["content"] ?? "") });
+    }
+    return unique;
+  }
   const filterPatterns = contentScanOnly ? prefilterPatterns && prefilterPatterns.length > 0 ? prefilterPatterns : prefilterPattern ? [prefilterPattern] : [] : [escapedPattern];
   const memFilter = buildContentFilter("summary::text", likeOp, filterPatterns);
   const sessFilter = buildContentFilter("message::text", likeOp, filterPatterns);
@@ -67339,6 +67372,15 @@ async function searchDeeplakeTables(api, memoryTable, sessionsTable, opts) {
     content: String(row["content"] ?? "")
   }));
 }
+function serializeFloat4Array(vec) {
+  const parts = [];
+  for (const v27 of vec) {
+    if (!Number.isFinite(v27))
+      return "NULL";
+    parts.push(String(v27));
+  }
+  return `ARRAY[${parts.join(",")}]::float4[]`;
+}
 function buildPathFilter(targetPath) {
   const condition = buildPathCondition(targetPath);
   return condition ? ` AND ${condition}` : "";
@@ -67427,13 +67469,24 @@ function buildGrepSearchOptions(params, targetPath) {
   const hasRegexMeta = !params.fixedString && /[.*+?^${}()|[\]\\]/.test(params.pattern);
   const literalPrefilter = hasRegexMeta ? extractRegexLiteralPrefilter(params.pattern) : null;
   const alternationPrefilters = hasRegexMeta ? extractRegexAlternationPrefilters(params.pattern) : null;
+  let bm25Term;
+  if (!hasRegexMeta) {
+    bm25Term = params.pattern;
+  } else if (alternationPrefilters && alternationPrefilters.length > 0) {
+    bm25Term = alternationPrefilters.join(" ");
+  } else if (literalPrefilter) {
+    bm25Term = literalPrefilter;
+  }
   return {
     pathFilter: buildPathFilter(targetPath),
     contentScanOnly: hasRegexMeta,
-    likeOp: params.ignoreCase ? "ILIKE" : "LIKE",
+    // Kept for the pure-lexical fallback path and existing tests; BM25 is now
+    // the preferred lexical ranker when a term can be extracted.
+    likeOp: process.env.HIVEMIND_GREP_LIKE === "case-sensitive" ? "LIKE" : "ILIKE",
     escapedPattern: sqlLike(params.pattern),
     prefilterPattern: literalPrefilter ? sqlLike(literalPrefilter) : void 0,
-    prefilterPatterns: alternationPrefilters?.map((literal) => sqlLike(literal))
+    prefilterPatterns: alternationPrefilters?.map((literal) => sqlLike(literal)),
+    bm25Term
   };
 }
 function buildContentFilter(column, likeOp, patterns) {
@@ -67485,6 +67538,240 @@ function refineGrepMatches(rows, params, forceMultiFilePrefix) {
   return output;
 }
 
+// dist/src/embeddings/client.js
+import { connect } from "node:net";
+import { spawn } from "node:child_process";
+import { openSync, closeSync, writeSync, unlinkSync, existsSync as existsSync4, readFileSync as readFileSync3 } from "node:fs";
+
+// dist/src/embeddings/protocol.js
+var DEFAULT_SOCKET_DIR = "/tmp";
+var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
+var DEFAULT_CLIENT_TIMEOUT_MS = 200;
+function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.sock`;
+}
+function pidPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.pid`;
+}
+
+// dist/src/embeddings/client.js
+var log3 = (m26) => log("embed-client", m26);
+function getUid() {
+  const uid = typeof process.getuid === "function" ? process.getuid() : void 0;
+  return uid !== void 0 ? String(uid) : process.env.USER ?? "default";
+}
+var EmbedClient = class {
+  socketPath;
+  pidPath;
+  timeoutMs;
+  daemonEntry;
+  autoSpawn;
+  spawnWaitMs;
+  nextId = 0;
+  constructor(opts = {}) {
+    const uid = getUid();
+    const dir = opts.socketDir ?? "/tmp";
+    this.socketPath = socketPathFor(uid, dir);
+    this.pidPath = pidPathFor(uid, dir);
+    this.timeoutMs = opts.timeoutMs ?? DEFAULT_CLIENT_TIMEOUT_MS;
+    this.daemonEntry = opts.daemonEntry ?? process.env.HIVEMIND_EMBED_DAEMON;
+    this.autoSpawn = opts.autoSpawn ?? true;
+    this.spawnWaitMs = opts.spawnWaitMs ?? 5e3;
+  }
+  /**
+   * Returns an embedding vector, or null on timeout/failure. Hooks MUST treat
+   * null as "skip embedding column" — never block the write path on us.
+   *
+   * Fire-and-forget spawn on miss: if the daemon isn't up, this call returns
+   * null AND kicks off a background spawn. The next call finds a ready daemon.
+   */
+  async embed(text, kind = "document") {
+    let sock;
+    try {
+      sock = await this.connectOnce();
+    } catch {
+      if (this.autoSpawn)
+        this.trySpawnDaemon();
+      return null;
+    }
+    try {
+      const id = String(++this.nextId);
+      const req = { op: "embed", id, kind, text };
+      const resp = await this.sendAndWait(sock, req);
+      if (resp.error || !("embedding" in resp) || !resp.embedding) {
+        log3(`embed err: ${resp.error ?? "no embedding"}`);
+        return null;
+      }
+      return resp.embedding;
+    } catch (e6) {
+      const err = e6 instanceof Error ? e6.message : String(e6);
+      log3(`embed failed: ${err}`);
+      return null;
+    } finally {
+      try {
+        sock.end();
+      } catch {
+      }
+    }
+  }
+  /**
+   * Wait up to spawnWaitMs for the daemon to accept connections, spawning if
+   * necessary. Meant for SessionStart / long-running batches — not the hot path.
+   */
+  async warmup() {
+    try {
+      const s10 = await this.connectOnce();
+      s10.end();
+      return true;
+    } catch {
+      if (!this.autoSpawn)
+        return false;
+      this.trySpawnDaemon();
+      try {
+        const s10 = await this.waitForSocket();
+        s10.end();
+        return true;
+      } catch {
+        return false;
+      }
+    }
+  }
+  connectOnce() {
+    return new Promise((resolve5, reject) => {
+      const sock = connect(this.socketPath);
+      const to3 = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("connect timeout"));
+      }, this.timeoutMs);
+      sock.once("connect", () => {
+        clearTimeout(to3);
+        resolve5(sock);
+      });
+      sock.once("error", (e6) => {
+        clearTimeout(to3);
+        reject(e6);
+      });
+    });
+  }
+  trySpawnDaemon() {
+    let fd;
+    try {
+      fd = openSync(this.pidPath, "wx", 384);
+      writeSync(fd, String(process.pid));
+    } catch (e6) {
+      if (this.isPidFileStale()) {
+        try {
+          unlinkSync(this.pidPath);
+        } catch {
+        }
+        try {
+          fd = openSync(this.pidPath, "wx", 384);
+          writeSync(fd, String(process.pid));
+        } catch {
+          return;
+        }
+      } else {
+        return;
+      }
+    }
+    if (!this.daemonEntry || !existsSync4(this.daemonEntry)) {
+      log3(`daemonEntry not configured or missing: ${this.daemonEntry}`);
+      try {
+        closeSync(fd);
+        unlinkSync(this.pidPath);
+      } catch {
+      }
+      return;
+    }
+    try {
+      const child = spawn(process.execPath, [this.daemonEntry], {
+        detached: true,
+        stdio: "ignore",
+        env: process.env
+      });
+      child.unref();
+      log3(`spawned daemon pid=${child.pid}`);
+    } finally {
+      closeSync(fd);
+    }
+  }
+  isPidFileStale() {
+    try {
+      const raw = readFileSync3(this.pidPath, "utf-8").trim();
+      const pid = Number(raw);
+      if (!pid || Number.isNaN(pid))
+        return true;
+      try {
+        process.kill(pid, 0);
+        return false;
+      } catch {
+        return true;
+      }
+    } catch {
+      return true;
+    }
+  }
+  async waitForSocket() {
+    const deadline = Date.now() + this.spawnWaitMs;
+    let delay = 30;
+    while (Date.now() < deadline) {
+      await sleep2(delay);
+      delay = Math.min(delay * 1.5, 300);
+      if (!existsSync4(this.socketPath))
+        continue;
+      try {
+        return await this.connectOnce();
+      } catch {
+      }
+    }
+    throw new Error("daemon did not become ready within spawnWaitMs");
+  }
+  sendAndWait(sock, req) {
+    return new Promise((resolve5, reject) => {
+      let buf = "";
+      const to3 = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("request timeout"));
+      }, this.timeoutMs);
+      sock.setEncoding("utf-8");
+      sock.on("data", (chunk) => {
+        buf += chunk;
+        const nl3 = buf.indexOf("\n");
+        if (nl3 === -1)
+          return;
+        const line = buf.slice(0, nl3);
+        clearTimeout(to3);
+        try {
+          resolve5(JSON.parse(line));
+        } catch (e6) {
+          reject(e6);
+        }
+      });
+      sock.on("error", (e6) => {
+        clearTimeout(to3);
+        reject(e6);
+      });
+      sock.write(JSON.stringify(req) + "\n");
+    });
+  }
+};
+function sleep2(ms3) {
+  return new Promise((r10) => setTimeout(r10, ms3));
+}
+
+// dist/src/embeddings/sql.js
+function embeddingSqlLiteral(vec) {
+  if (!vec || vec.length === 0)
+    return "NULL";
+  const parts = [];
+  for (const v27 of vec) {
+    if (!Number.isFinite(v27))
+      return "NULL";
+    parts.push(String(v27));
+  }
+  return `ARRAY[${parts.join(",")}]::float4[]`;
+}
+
 // dist/src/shell/deeplake-fs.js
 var BATCH_SIZE = 10;
 var PREFETCH_BATCH_SIZE = 50;
@@ -67513,6 +67800,9 @@ function normalizeSessionMessage(path2, message) {
   const raw = typeof message === "string" ? message : JSON.stringify(message);
   return normalizeContent(path2, raw);
 }
+function resolveEmbedDaemonPath() {
+  return join7(dirname4(fileURLToPath(import.meta.url)), "embeddings", "embed-daemon.js");
+}
 function joinSessionMessages(path2, messages) {
   return messages.map((message) => normalizeSessionMessage(path2, message)).join("\n");
 }
@@ -67542,6 +67832,8 @@ var DeeplakeFs = class _DeeplakeFs {
   // Paths that live in the sessions table (multi-row, read by concatenation)
   sessionPaths = /* @__PURE__ */ new Set();
   sessionsTable = null;
+  // Embedding client lazily created on first flush. Lives as long as the process.
+  embedClient = null;
   constructor(client, table, mountPoint) {
     this.client = client;
     this.table = table;
@@ -67635,7 +67927,8 @@ var DeeplakeFs = class _DeeplakeFs {
     }
     const rows = [...this.pending.values()];
     this.pending.clear();
-    const results = await Promise.allSettled(rows.map((r10) => this.upsertRow(r10)));
+    const embeddings = await this.computeEmbeddings(rows);
+    const results = await Promise.allSettled(rows.map((r10, i11) => this.upsertRow(r10, embeddings[i11])));
     let failures = 0;
     for (let i11 = 0; i11 < results.length; i11++) {
       if (results[i11].status === "rejected") {
@@ -67649,7 +67942,15 @@ var DeeplakeFs = class _DeeplakeFs {
       throw new Error(`flush: ${failures}/${rows.length} writes failed and were re-queued`);
     }
   }
-  async upsertRow(r10) {
+  async computeEmbeddings(rows) {
+    if (rows.length === 0)
+      return [];
+    if (!this.embedClient) {
+      this.embedClient = new EmbedClient({ daemonEntry: resolveEmbedDaemonPath() });
+    }
+    return Promise.all(rows.map((r10) => this.embedClient.embed(r10.contentText, "document")));
+  }
+  async upsertRow(r10, embedding) {
     const text = sqlStr(r10.contentText);
     const p22 = sqlStr(r10.path);
     const fname = sqlStr(r10.filename);
@@ -67657,8 +67958,9 @@ var DeeplakeFs = class _DeeplakeFs {
     const ts3 = (/* @__PURE__ */ new Date()).toISOString();
     const cd = r10.creationDate ?? ts3;
     const lud = r10.lastUpdateDate ?? ts3;
+    const embSql = embeddingSqlLiteral(embedding);
     if (this.flushed.has(r10.path)) {
-      let setClauses = `filename = '${fname}', summary = E'${text}', mime_type = '${mime}', size_bytes = ${r10.sizeBytes}, last_update_date = '${sqlStr(lud)}'`;
+      let setClauses = `filename = '${fname}', summary = E'${text}', summary_embedding = ${embSql}, mime_type = '${mime}', size_bytes = ${r10.sizeBytes}, last_update_date = '${sqlStr(lud)}'`;
       if (r10.project !== void 0)
         setClauses += `, project = '${sqlStr(r10.project)}'`;
       if (r10.description !== void 0)
@@ -67666,51 +67968,72 @@ var DeeplakeFs = class _DeeplakeFs {
       await this.client.query(`UPDATE "${this.table}" SET ${setClauses} WHERE path = '${p22}'`);
     } else {
       const id = randomUUID2();
-      const cols = "id, path, filename, summary, mime_type, size_bytes, creation_date, last_update_date" + (r10.project !== void 0 ? ", project" : "") + (r10.description !== void 0 ? ", description" : "");
-      const vals = `'${id}', '${p22}', '${fname}', E'${text}', '${mime}', ${r10.sizeBytes}, '${sqlStr(cd)}', '${sqlStr(lud)}'` + (r10.project !== void 0 ? `, '${sqlStr(r10.project)}'` : "") + (r10.description !== void 0 ? `, '${sqlStr(r10.description)}'` : "");
+      const cols = "id, path, filename, summary, summary_embedding, mime_type, size_bytes, creation_date, last_update_date" + (r10.project !== void 0 ? ", project" : "") + (r10.description !== void 0 ? ", description" : "");
+      const vals = `'${id}', '${p22}', '${fname}', E'${text}', ${embSql}, '${mime}', ${r10.sizeBytes}, '${sqlStr(cd)}', '${sqlStr(lud)}'` + (r10.project !== void 0 ? `, '${sqlStr(r10.project)}'` : "") + (r10.description !== void 0 ? `, '${sqlStr(r10.description)}'` : "");
       await this.client.query(`INSERT INTO "${this.table}" (${cols}) VALUES (${vals})`);
       this.flushed.add(r10.path);
     }
   }
   // ── Virtual index.md generation ────────────────────────────────────────────
   async generateVirtualIndex() {
-    const rows = await this.client.query(`SELECT path, project, description, creation_date, last_update_date FROM "${this.table}" WHERE path LIKE '${sqlStr("/summaries/")}%' ORDER BY last_update_date DESC`);
-    const sessionPathsByKey = /* @__PURE__ */ new Map();
-    for (const sp of this.sessionPaths) {
-      const hivemind = sp.match(/\/sessions\/[^/]+\/[^/]+_([^.]+)\.jsonl$/);
-      if (hivemind) {
-        sessionPathsByKey.set(hivemind[1], sp.slice(1));
-      } else {
-        const fname = sp.split("/").pop() ?? "";
-        const stem = fname.replace(/\.[^.]+$/, "");
-        if (stem)
-          sessionPathsByKey.set(stem, sp.slice(1));
+    const summaryRows = await this.client.query(`SELECT path, project, description, creation_date, last_update_date FROM "${this.table}" WHERE path LIKE '${sqlStr("/summaries/")}%' ORDER BY last_update_date DESC`);
+    let sessionRows = [];
+    if (this.sessionsTable) {
+      try {
+        sessionRows = await this.client.query(`SELECT path, MAX(description) AS description, MIN(creation_date) AS creation_date, MAX(last_update_date) AS last_update_date FROM "${this.sessionsTable}" WHERE path LIKE '${sqlStr("/sessions/")}%' GROUP BY path ORDER BY path`);
+      } catch {
+        sessionRows = [];
       }
     }
     const lines = [
       "# Session Index",
       "",
-      "List of all Claude Code sessions with summaries.",
-      "",
-      "| Session | Conversation | Created | Last Updated | Project | Description |",
-      "|---------|-------------|---------|--------------|---------|-------------|"
+      "Two sources are available. Consult the section relevant to the question.",
+      ""
     ];
-    for (const row of rows) {
-      const p22 = row["path"];
-      const match2 = p22.match(/\/summaries\/([^/]+)\/([^/]+)\.md$/);
-      if (!match2)
-        continue;
-      const summaryUser = match2[1];
-      const sessionId = match2[2];
-      const relPath = `summaries/${summaryUser}/${sessionId}.md`;
-      const baseName = sessionId.replace(/_summary$/, "");
-      const convPath = sessionPathsByKey.get(sessionId) ?? sessionPathsByKey.get(baseName);
-      const convLink = convPath ? `[messages](${convPath})` : "";
-      const project = row["project"] || "";
-      const description = row["description"] || "";
-      const creationDate = row["creation_date"] || "";
-      const lastUpdateDate = row["last_update_date"] || "";
-      lines.push(`| [${sessionId}](${relPath}) | ${convLink} | ${creationDate} | ${lastUpdateDate} | ${project} | ${description} |`);
+    lines.push("## memory");
+    lines.push("");
+    if (summaryRows.length === 0) {
+      lines.push("_(empty \u2014 no summaries ingested yet)_");
+    } else {
+      lines.push("AI-generated summaries per session. Read these first for topic-level overviews.");
+      lines.push("");
+      lines.push("| Session | Created | Last Updated | Project | Description |");
+      lines.push("|---------|---------|--------------|---------|-------------|");
+      for (const row of summaryRows) {
+        const p22 = row["path"];
+        const match2 = p22.match(/\/summaries\/([^/]+)\/([^/]+)\.md$/);
+        if (!match2)
+          continue;
+        const summaryUser = match2[1];
+        const sessionId = match2[2];
+        const relPath = `summaries/${summaryUser}/${sessionId}.md`;
+        const project = row["project"] || "";
+        const description = row["description"] || "";
+        const creationDate = row["creation_date"] || "";
+        const lastUpdateDate = row["last_update_date"] || "";
+        lines.push(`| [${sessionId}](${relPath}) | ${creationDate} | ${lastUpdateDate} | ${project} | ${description} |`);
+      }
+    }
+    lines.push("");
+    lines.push("## sessions");
+    lines.push("");
+    if (sessionRows.length === 0) {
+      lines.push("_(empty \u2014 no session records ingested yet)_");
+    } else {
+      lines.push("Raw session records (dialogue, tool calls). Read for exact detail / quotes.");
+      lines.push("");
+      lines.push("| Session | Created | Last Updated | Description |");
+      lines.push("|---------|---------|--------------|-------------|");
+      for (const row of sessionRows) {
+        const p22 = row["path"] || "";
+        const rel = p22.startsWith("/") ? p22.slice(1) : p22;
+        const filename = p22.split("/").pop() ?? p22;
+        const description = row["description"] || "";
+        const creationDate = row["creation_date"] || "";
+        const lastUpdateDate = row["last_update_date"] || "";
+        lines.push(`| [${filename}](${rel}) | ${creationDate} | ${lastUpdateDate} | ${description} |`);
+      }
     }
     lines.push("");
     return lines.join("\n");
@@ -69021,7 +69344,7 @@ function stripQuotes(val) {
 }
 
 // node_modules/yargs-parser/build/lib/index.js
-import { readFileSync as readFileSync3 } from "fs";
+import { readFileSync as readFileSync4 } from "fs";
 import { createRequire } from "node:module";
 var _a3;
 var _b;
@@ -69048,7 +69371,7 @@ var parser = new YargsParser({
     if (typeof require2 !== "undefined") {
       return require2(path2);
     } else if (path2.match(/\.json$/)) {
-      return JSON.parse(readFileSync3(path2, "utf8"));
+      return JSON.parse(readFileSync4(path2, "utf8"));
     } else {
       throw Error("only .json config files are supported in ESM");
     }
@@ -69067,6 +69390,33 @@ yargsParser.looksLikeNumber = looksLikeNumber;
 var lib_default = yargsParser;
 
 // dist/src/shell/grep-interceptor.js
+import { fileURLToPath as fileURLToPath2 } from "node:url";
+import { dirname as dirname5, join as join8 } from "node:path";
+var SEMANTIC_SEARCH_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false";
+var SEMANTIC_EMBED_TIMEOUT_MS = Number(process.env.HIVEMIND_SEMANTIC_EMBED_TIMEOUT_MS ?? "500");
+function resolveGrepEmbedDaemonPath() {
+  return join8(dirname5(fileURLToPath2(import.meta.url)), "..", "embeddings", "embed-daemon.js");
+}
+var sharedGrepEmbedClient = null;
+function getGrepEmbedClient() {
+  if (!sharedGrepEmbedClient) {
+    sharedGrepEmbedClient = new EmbedClient({
+      daemonEntry: resolveGrepEmbedDaemonPath(),
+      timeoutMs: SEMANTIC_EMBED_TIMEOUT_MS
+    });
+  }
+  return sharedGrepEmbedClient;
+}
+function patternIsSemanticFriendly(pattern, fixedString) {
+  if (!pattern || pattern.length < 2)
+    return false;
+  if (fixedString)
+    return true;
+  const metaMatches = pattern.match(/[|()\[\]{}+?^$\\]/g);
+  if (!metaMatches)
+    return true;
+  return metaMatches.length <= 1;
+}
 var MAX_FALLBACK_CANDIDATES = 500;
 function createGrepCommand(client, fs3, table, sessionsTable) {
   return Yi2("grep", async (args, ctx) => {
@@ -69108,12 +69458,21 @@ function createGrepCommand(client, fs3, table, sessionsTable) {
       filesOnly: Boolean(parsed.l || parsed["files-with-matches"]),
       countOnly: Boolean(parsed.c || parsed["count"])
     };
+    let queryEmbedding = null;
+    if (SEMANTIC_SEARCH_ENABLED && patternIsSemanticFriendly(pattern, matchParams.fixedString)) {
+      try {
+        queryEmbedding = await getGrepEmbedClient().embed(pattern, "query");
+      } catch {
+        queryEmbedding = null;
+      }
+    }
     let rows = [];
     try {
       const searchOptions = {
         ...buildGrepSearchOptions(matchParams, targets[0] ?? ctx.cwd),
         pathFilter: buildPathFilterForTargets(targets),
-        limit: 100
+        limit: 100,
+        queryEmbedding
       };
       const queryRows = await Promise.race([
         searchDeeplakeTables(client, table, sessionsTable ?? "sessions", searchOptions),
@@ -69123,6 +69482,21 @@ function createGrepCommand(client, fs3, table, sessionsTable) {
     } catch {
       rows = [];
     }
+    if (rows.length === 0 && queryEmbedding) {
+      try {
+        const lexicalOptions = {
+          ...buildGrepSearchOptions(matchParams, targets[0] ?? ctx.cwd),
+          pathFilter: buildPathFilterForTargets(targets),
+          limit: 100
+        };
+        const lexicalRows = await Promise.race([
+          searchDeeplakeTables(client, table, sessionsTable ?? "sessions", lexicalOptions),
+          new Promise((_16, reject) => setTimeout(() => reject(new Error("timeout")), 3e3))
+        ]);
+        rows.push(...lexicalRows);
+      } catch {
+      }
+    }
     const seen = /* @__PURE__ */ new Set();
     rows = rows.filter((r10) => seen.has(r10.path) ? false : (seen.add(r10.path), true));
     if (rows.length === 0) {
@@ -69136,7 +69510,19 @@ function createGrepCommand(client, fs3, table, sessionsTable) {
       }
     }
     const normalized = rows.map((r10) => ({ path: r10.path, content: normalizeContent(r10.path, r10.content) }));
-    const output = refineGrepMatches(normalized, matchParams);
+    let output;
+    if (queryEmbedding && queryEmbedding.length > 0 && process.env.HIVEMIND_SEMANTIC_EMIT_ALL !== "false") {
+      output = [];
+      for (const r10 of normalized) {
+        for (const line of r10.content.split("\n")) {
+          const trimmed = line.trim();
+          if (trimmed)
+            output.push(`${r10.path}:${line}`);
+        }
+      }
+    } else {
+      output = refineGrepMatches(normalized, matchParams);
+    }
     return {
       stdout: output.length > 0 ? output.join("\n") + "\n" : "",
       stderr: "",
diff --git a/codex/bundle/stop.js b/codex/bundle/stop.js
index e6081b5..a25b183 100755
--- a/codex/bundle/stop.js
+++ b/codex/bundle/stop.js
@@ -378,7 +378,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(tbl)) {
       log2(`table "${tbl}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${tbl}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', summary TEXT NOT NULL DEFAULT '', summary_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'text/plain', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
@@ -389,7 +389,7 @@ var DeeplakeApi = class {
     const tables = await this.listTables();
     if (!tables.includes(name)) {
       log2(`table "${name}" not found, creating`);
-      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
+      await this.query(`CREATE TABLE IF NOT EXISTS "${name}" (id TEXT NOT NULL DEFAULT '', path TEXT NOT NULL DEFAULT '', filename TEXT NOT NULL DEFAULT '', message JSONB, message_embedding FLOAT4[], author TEXT NOT NULL DEFAULT '', mime_type TEXT NOT NULL DEFAULT 'application/json', size_bytes BIGINT NOT NULL DEFAULT 0, project TEXT NOT NULL DEFAULT '', description TEXT NOT NULL DEFAULT '', agent TEXT NOT NULL DEFAULT '', creation_date TEXT NOT NULL DEFAULT '', last_update_date TEXT NOT NULL DEFAULT '') USING deeplake`);
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];

From 51c588163489da31f5fa7a8c5d20f138a562619b Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Wed, 22 Apr 2026 18:43:25 +0000
Subject: [PATCH 08/30] test(embeddings): raise coverage >=90% on all new +
 touched files

Adds targeted tests for the nomic daemon, IPC client, hybrid grep path,
and the semantic emit-all branch in grep-core, plus per-file thresholds
in vitest.config.ts so future regressions are caught in CI.

New test files
- claude-code/tests/embeddings-daemon.test.ts (11 tests): ping, embed,
  unknown op, pidfile content, stale-socket unlink, idle-timeout-triggered
  shutdown, malformed-JSON survival, dispatch-error -> { error } reply,
  default options, empty-line framing, abrupt client disconnect.
- claude-code/tests/embeddings-nomic.test.ts (12 tests): lazy load
  memoization, document/query prefixing, batching, empty batch, Matryoshka
  truncation with renormalization, zero-norm fallback, default repo/dtype/
  dims, and concurrent load() coalescing.

Extended tests
- embeddings-client.test.ts: stale-pid cleanup, alive-pid preservation,
  garbage-pid cleanup, socket reset mid-request, malformed JSON, request
  timeout, getEmbedClient() singleton, default options, default 'kind'
  argument, HIVEMIND_EMBED_DAEMON env fallback, successful auto-spawn via
  fake daemon entry.
- grep-interceptor.test.ts: semantic-friendly pattern passes embedding
  into searchDeeplakeTables; regex-heavy / too-short patterns skip
  embedding; embed() rejection falls back to lexical; lexical retry when
  semantic returns zero rows; emit-all-lines branch; SEMANTIC_EMIT_ALL
  opt-out; Promise.race 3s timeout rejector via fake timers.
- grep-core.test.ts: grepBothTables emits every non-empty line when a
  queryEmbedding is present; refinement still runs when SEMANTIC_EMIT_ALL
  is disabled.

Source tweak
- daemon.ts: marks the CLI-entrypoint block with /* v8 ignore start/stop
  */. The invokedDirectly bootstrap only fires when the file is node's
  argv[1], which unit tests can't reproduce without forking a subprocess.

Config
- vitest.config.ts: adds per-file thresholds for src/embeddings/*.ts.
  Lines/statements are held at 90 for every embeddings file; branches
  and functions dip to 80/75 only on client.ts and daemon.ts where a
  small number of paths (SIGINT/SIGTERM handlers, non-Linux getuid
  fallback, server 'error' handler) cannot be exercised from unit tests.

Resulting per-file coverage
- client.ts        95.9 / 85.1 / 95.23 / 96.29
- daemon.ts        94.87 / 77.77 / 78.94 / 100
- nomic.ts         96.22 / 92   / 100   / 100
- protocol.ts      100  / 100  / 100   / 100
- sql.ts           100  / 100  / 100   / 100
- grep-core.ts     96.79 / 91.5 / 97.22 / 100
- grep-interceptor 97.5 / 92.1 / 94.11 / 100

All 933 tests pass; no threshold errors.
---
 claude-code/tests/embeddings-client.test.ts | 216 ++++++++++++-
 claude-code/tests/embeddings-daemon.test.ts | 263 ++++++++++++++++
 claude-code/tests/embeddings-nomic.test.ts  | 149 +++++++++
 claude-code/tests/grep-core.test.ts         | 331 +++++++++++++++++++-
 claude-code/tests/grep-interceptor.test.ts  | 171 +++++++++-
 src/embeddings/daemon.ts                    |   2 +
 vitest.config.ts                            |  36 +++
 7 files changed, 1155 insertions(+), 13 deletions(-)
 create mode 100644 claude-code/tests/embeddings-daemon.test.ts
 create mode 100644 claude-code/tests/embeddings-nomic.test.ts

diff --git a/claude-code/tests/embeddings-client.test.ts b/claude-code/tests/embeddings-client.test.ts
index de13060..07c0d57 100644
--- a/claude-code/tests/embeddings-client.test.ts
+++ b/claude-code/tests/embeddings-client.test.ts
@@ -3,10 +3,11 @@
 
 import { describe, it, expect, afterEach } from "vitest";
 import { createServer, type Server, type Socket } from "node:net";
-import { mkdtempSync, rmSync, existsSync } from "node:fs";
+import { mkdtempSync, rmSync, existsSync, writeFileSync } from "node:fs";
 import { tmpdir } from "node:os";
 import { join } from "node:path";
-import { EmbedClient } from "../../src/embeddings/client.js";
+import { execSync } from "node:child_process";
+import { EmbedClient, getEmbedClient } from "../../src/embeddings/client.js";
 import type { DaemonRequest, DaemonResponse } from "../../src/embeddings/protocol.js";
 
 let servers: Server[] = [];
@@ -115,4 +116,215 @@ describe("EmbedClient", () => {
     ]);
     expect(results.every((r) => r !== null && r.length === 1)).toBe(true);
   });
+
+  it("warmup() returns true when the daemon is already listening", async () => {
+    const dir = makeTmpDir();
+    await startFakeDaemon(dir, (req) => ({ id: req.id, ready: true }));
+    const client = new EmbedClient({ socketDir: dir, timeoutMs: 500, autoSpawn: false });
+    const ok = await client.warmup();
+    expect(ok).toBe(true);
+  });
+
+  it("warmup() returns false when no daemon and autoSpawn is disabled", async () => {
+    const dir = makeTmpDir();
+    const client = new EmbedClient({ socketDir: dir, timeoutMs: 100, autoSpawn: false });
+    const ok = await client.warmup();
+    expect(ok).toBe(false);
+  });
+
+  it("warmup() returns false when autoSpawn is on but entry cannot be launched", async () => {
+    const dir = makeTmpDir();
+    const client = new EmbedClient({
+      socketDir: dir,
+      timeoutMs: 100,
+      autoSpawn: true,
+      daemonEntry: "/nonexistent/daemon.js",
+      spawnWaitMs: 150,
+    });
+    const ok = await client.warmup();
+    expect(ok).toBe(false);
+  });
+
+  it("cleans up a stale pidfile (dead PID) before trying to spawn", async () => {
+    const dir = makeTmpDir();
+    const uid = String(process.getuid?.() ?? "test");
+    const pidPath = join(dir, `hivemind-embed-${uid}.pid`);
+    // Write a PID guaranteed-dead: 0x7FFFFFFF is not a plausible live PID on Linux.
+    writeFileSync(pidPath, "2147483646");
+
+    const client = new EmbedClient({
+      socketDir: dir,
+      timeoutMs: 50,
+      autoSpawn: true,
+      daemonEntry: "/nonexistent/daemon.js",
+    });
+    const vec = await client.embed("x");
+    expect(vec).toBeNull();
+    // Client should have cleaned up the pidfile after detecting the entry is missing.
+    expect(existsSync(pidPath)).toBe(false);
+  });
+
+  it("leaves an alive-PID pidfile alone (treats the daemon as still starting)", async () => {
+    const dir = makeTmpDir();
+    const uid = String(process.getuid?.() ?? "test");
+    const pidPath = join(dir, `hivemind-embed-${uid}.pid`);
+    // Our own PID is alive → isPidFileStale() should return false.
+    writeFileSync(pidPath, String(process.pid));
+
+    const client = new EmbedClient({
+      socketDir: dir,
+      timeoutMs: 50,
+      autoSpawn: true,
+      daemonEntry: "/nonexistent/daemon.js",
+    });
+    const vec = await client.embed("x");
+    expect(vec).toBeNull();
+    // Pidfile is still there because client saw it as a live owner, not stale.
+    expect(existsSync(pidPath)).toBe(true);
+  });
+
+  it("treats a garbage pidfile as stale and removes it", async () => {
+    const dir = makeTmpDir();
+    const uid = String(process.getuid?.() ?? "test");
+    const pidPath = join(dir, `hivemind-embed-${uid}.pid`);
+    writeFileSync(pidPath, "not-a-number");
+
+    const client = new EmbedClient({
+      socketDir: dir,
+      timeoutMs: 50,
+      autoSpawn: true,
+      daemonEntry: "/nonexistent/daemon.js",
+    });
+    const vec = await client.embed("x");
+    expect(vec).toBeNull();
+    expect(existsSync(pidPath)).toBe(false);
+  });
+
+  it("returns null when the socket closes mid-request", async () => {
+    const dir = makeTmpDir();
+    const uid = String(process.getuid?.() ?? "test");
+    const sockPath = join(dir, `hivemind-embed-${uid}.sock`);
+    const srv = createServer((sock: Socket) => {
+      // Immediately destroy the connection after accept so sendAndWait errors.
+      sock.destroy();
+    });
+    servers.push(srv);
+    await new Promise<void>((resolve) => srv.listen(sockPath, resolve));
+
+    const client = new EmbedClient({ socketDir: dir, timeoutMs: 500, autoSpawn: false });
+    const vec = await client.embed("boom");
+    expect(vec).toBeNull();
+  });
+
+  it("returns null when the daemon writes malformed JSON", async () => {
+    const dir = makeTmpDir();
+    const uid = String(process.getuid?.() ?? "test");
+    const sockPath = join(dir, `hivemind-embed-${uid}.sock`);
+    const srv = createServer((sock: Socket) => {
+      sock.setEncoding("utf-8");
+      sock.on("data", () => {
+        sock.write("not-json\n");
+      });
+    });
+    servers.push(srv);
+    await new Promise<void>((resolve) => srv.listen(sockPath, resolve));
+
+    const client = new EmbedClient({ socketDir: dir, timeoutMs: 500, autoSpawn: false });
+    const vec = await client.embed("boom");
+    expect(vec).toBeNull();
+  });
+
+  it("returns null on request timeout (daemon accepts but never replies)", async () => {
+    const dir = makeTmpDir();
+    const uid = String(process.getuid?.() ?? "test");
+    const sockPath = join(dir, `hivemind-embed-${uid}.sock`);
+    const srv = createServer((_sock: Socket) => {
+      // Accept the connection but never send anything back.
+    });
+    servers.push(srv);
+    await new Promise<void>((resolve) => srv.listen(sockPath, resolve));
+
+    const client = new EmbedClient({ socketDir: dir, timeoutMs: 50, autoSpawn: false });
+    const vec = await client.embed("boom");
+    expect(vec).toBeNull();
+  });
+
+  it("getEmbedClient() returns a cached singleton", () => {
+    const a = getEmbedClient();
+    const b = getEmbedClient();
+    expect(a).toBe(b);
+  });
+
+  it("uses default option values when constructed with no arguments", () => {
+    // Just instantiating exercises every `opts.x ?? default` branch.
+    const c = new EmbedClient();
+    expect(c).toBeInstanceOf(EmbedClient);
+  });
+
+  it("defaults the embed 'kind' argument to document when omitted", async () => {
+    const dir = makeTmpDir();
+    const kinds: string[] = [];
+    await startFakeDaemon(dir, (req) => {
+      if (req.op === "embed") kinds.push(req.kind);
+      return { id: req.id, embedding: [0.5] };
+    });
+    const client = new EmbedClient({ socketDir: dir, timeoutMs: 500, autoSpawn: false });
+    await client.embed("hello"); // no kind
+    expect(kinds).toEqual(["document"]);
+  });
+
+  it("falls back to HIVEMIND_EMBED_DAEMON env when daemonEntry option is absent", () => {
+    const prev = process.env.HIVEMIND_EMBED_DAEMON;
+    process.env.HIVEMIND_EMBED_DAEMON = "/from/env.js";
+    try {
+      const c = new EmbedClient({ socketDir: makeTmpDir(), autoSpawn: false });
+      // We can't read the private field directly; just assert construction succeeded.
+      expect(c).toBeInstanceOf(EmbedClient);
+    } finally {
+      if (prev === undefined) delete process.env.HIVEMIND_EMBED_DAEMON;
+      else process.env.HIVEMIND_EMBED_DAEMON = prev;
+    }
+  });
+
+  it("warmup() succeeds after auto-spawning a fake daemon entry", async () => {
+    const dir = makeTmpDir();
+    const uid = String(process.getuid?.() ?? "test");
+    const sockPath = join(dir, `hivemind-embed-${uid}.sock`);
+    // Write a tiny daemon script that binds the expected socket and answers pings.
+    const daemonScript = join(dir, "fake-daemon.js");
+    writeFileSync(daemonScript, `
+      const net = require("node:net");
+      const srv = net.createServer((s) => {
+        s.setEncoding("utf-8");
+        let buf = "";
+        s.on("data", (c) => {
+          buf += c;
+          let nl;
+          while ((nl = buf.indexOf("\\n")) !== -1) {
+            const line = buf.slice(0, nl);
+            buf = buf.slice(nl + 1);
+            try {
+              const req = JSON.parse(line);
+              s.write(JSON.stringify({ id: req.id, ready: true }) + "\\n");
+            } catch {}
+          }
+        });
+      });
+      srv.listen(${JSON.stringify(sockPath)});
+      setTimeout(() => srv.close(), 3000);
+    `);
+
+    const client = new EmbedClient({
+      socketDir: dir,
+      timeoutMs: 500,
+      autoSpawn: true,
+      daemonEntry: daemonScript,
+      spawnWaitMs: 2000,
+    });
+    const ok = await client.warmup();
+    expect(ok).toBe(true);
+
+    // Cleanup the spawned daemon process.
+    try { execSync(`pkill -f ${daemonScript}`); } catch { /* already exited */ }
+  });
 });
diff --git a/claude-code/tests/embeddings-daemon.test.ts b/claude-code/tests/embeddings-daemon.test.ts
new file mode 100644
index 0000000..2917816
--- /dev/null
+++ b/claude-code/tests/embeddings-daemon.test.ts
@@ -0,0 +1,263 @@
+import { describe, it, expect, vi, beforeEach, afterEach } from "vitest";
+import { connect } from "node:net";
+import { mkdtempSync, rmSync, existsSync, writeFileSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+
+// Mock NomicEmbedder so the daemon doesn't pull in @huggingface/transformers.
+// The daemon talks to the embedder via two methods only: load() and embed().
+// The `embedMode` global lets an individual test flip behavior: "ok" returns
+// a vector, "throw" makes embed() reject — drives the dispatch-error branch.
+(globalThis as any).__embedMode = "ok";
+
+vi.mock("../../src/embeddings/nomic.js", () => {
+  class MockNomicEmbedder {
+    repo: string;
+    dims: number;
+    dtype: string;
+    constructor(opts: any = {}) {
+      this.repo = opts.repo ?? "mock-repo";
+      this.dims = opts.dims ?? 768;
+      this.dtype = opts.dtype ?? "q8";
+    }
+    async load() { /* no-op */ }
+    async embed(_text: string, _kind?: string) {
+      if ((globalThis as any).__embedMode === "throw") {
+        throw new Error("forced embed failure");
+      }
+      return [0.1, 0.2, 0.3];
+    }
+    async embedBatch(texts: string[], _kind?: string) {
+      return texts.map(() => [0.1, 0.2, 0.3]);
+    }
+  }
+  return { NomicEmbedder: MockNomicEmbedder };
+});
+
+import { EmbedDaemon } from "../../src/embeddings/daemon.js";
+
+function sendLine(socketPath: string, req: object): Promise<any> {
+  return new Promise((resolve, reject) => {
+    const sock = connect(socketPath);
+    let buf = "";
+    const to = setTimeout(() => { sock.destroy(); reject(new Error("timeout")); }, 2000);
+    sock.setEncoding("utf-8");
+    sock.on("connect", () => sock.write(JSON.stringify(req) + "\n"));
+    sock.on("data", (chunk: string) => {
+      buf += chunk;
+      const nl = buf.indexOf("\n");
+      if (nl === -1) return;
+      clearTimeout(to);
+      sock.end();
+      try { resolve(JSON.parse(buf.slice(0, nl))); } catch (e) { reject(e); }
+    });
+    sock.on("error", (e) => { clearTimeout(to); reject(e); });
+  });
+}
+
+describe("EmbedDaemon", () => {
+  let dir: string;
+  let daemon: EmbedDaemon | null = null;
+
+  beforeEach(() => {
+    dir = mkdtempSync(join(tmpdir(), "hvm-daemon-test-"));
+  });
+
+  afterEach(() => {
+    try { daemon?.shutdown(); } catch { /* shutdown calls process.exit, ignore */ }
+    daemon = null;
+    try { rmSync(dir, { recursive: true, force: true }); } catch { /* */ }
+    (globalThis as any).__embedMode = "ok";
+  });
+
+  it("answers a ping with the model + dims metadata", async () => {
+    // process.exit inside shutdown would terminate the test runner; stub it.
+    const exitSpy = vi.spyOn(process, "exit").mockImplementation(() => undefined as never);
+    daemon = new EmbedDaemon({ socketDir: dir, idleTimeoutMs: 60_000, dims: 128 });
+    await daemon.start();
+
+    const uid = String(process.getuid?.() ?? "test");
+    const sock = join(dir, `hivemind-embed-${uid}.sock`);
+    const resp = await sendLine(sock, { op: "ping", id: "p1" });
+    expect(resp.id).toBe("p1");
+    expect(resp.ready).toBe(true);
+    expect(resp.dims).toBe(128);
+
+    exitSpy.mockRestore();
+  });
+
+  it("answers an embed request with the vector from the mocked embedder", async () => {
+    const exitSpy = vi.spyOn(process, "exit").mockImplementation(() => undefined as never);
+    daemon = new EmbedDaemon({ socketDir: dir, idleTimeoutMs: 60_000 });
+    await daemon.start();
+
+    const uid = String(process.getuid?.() ?? "test");
+    const sock = join(dir, `hivemind-embed-${uid}.sock`);
+    const resp = await sendLine(sock, { op: "embed", id: "e1", kind: "document", text: "hello" });
+    expect(resp.id).toBe("e1");
+    expect(resp.embedding).toEqual([0.1, 0.2, 0.3]);
+
+    exitSpy.mockRestore();
+  });
+
+  it("returns { error } for unknown ops", async () => {
+    const exitSpy = vi.spyOn(process, "exit").mockImplementation(() => undefined as never);
+    daemon = new EmbedDaemon({ socketDir: dir, idleTimeoutMs: 60_000 });
+    await daemon.start();
+
+    const uid = String(process.getuid?.() ?? "test");
+    const sock = join(dir, `hivemind-embed-${uid}.sock`);
+    const resp = await sendLine(sock, { op: "bogus", id: "x" });
+    expect(resp.error).toContain("unknown op");
+
+    exitSpy.mockRestore();
+  });
+
+  it("writes a pidfile with the daemon's own PID on startup", async () => {
+    const exitSpy = vi.spyOn(process, "exit").mockImplementation(() => undefined as never);
+    daemon = new EmbedDaemon({ socketDir: dir, idleTimeoutMs: 60_000 });
+    await daemon.start();
+
+    const uid = String(process.getuid?.() ?? "test");
+    const pidPath = join(dir, `hivemind-embed-${uid}.pid`);
+    const { readFileSync } = await import("node:fs");
+    const pid = Number(readFileSync(pidPath, "utf-8").trim());
+    expect(pid).toBe(process.pid);
+
+    exitSpy.mockRestore();
+  });
+
+  it("unlinks a stale socket on startup before re-binding", async () => {
+    const uid = String(process.getuid?.() ?? "test");
+    const sockPath = join(dir, `hivemind-embed-${uid}.sock`);
+    // Pre-create a stale file at the socket path.
+    writeFileSync(sockPath, "stale");
+    expect(existsSync(sockPath)).toBe(true);
+
+    const exitSpy = vi.spyOn(process, "exit").mockImplementation(() => undefined as never);
+    daemon = new EmbedDaemon({ socketDir: dir, idleTimeoutMs: 60_000 });
+    await daemon.start();
+    // Now it's a live Unix socket; stat would say it's a socket not a regular file.
+    expect(existsSync(sockPath)).toBe(true);
+
+    exitSpy.mockRestore();
+  });
+
+  it("idle timer triggers shutdown after the configured window", async () => {
+    const exitSpy = vi.spyOn(process, "exit").mockImplementation(() => undefined as never);
+    daemon = new EmbedDaemon({ socketDir: dir, idleTimeoutMs: 50 });
+    await daemon.start();
+    await new Promise(r => setTimeout(r, 120));
+    // shutdown called via process.exit stub (spyed above) — our exit count > 0.
+    expect(exitSpy).toHaveBeenCalled();
+    exitSpy.mockRestore();
+  });
+
+  it("returns { error } when the embedder throws during an embed request", async () => {
+    const exitSpy = vi.spyOn(process, "exit").mockImplementation(() => undefined as never);
+    (globalThis as any).__embedMode = "throw";
+    daemon = new EmbedDaemon({ socketDir: dir, idleTimeoutMs: 60_000 });
+    await daemon.start();
+
+    const uid = String(process.getuid?.() ?? "test");
+    const sock = join(dir, `hivemind-embed-${uid}.sock`);
+    const resp = await sendLine(sock, { op: "embed", id: "e2", kind: "document", text: "hi" });
+    expect(resp.id).toBe("e2");
+    expect(resp.error).toContain("forced embed failure");
+
+    exitSpy.mockRestore();
+  });
+
+  it("constructs with default options (no opts object passed)", () => {
+    // Exercise the constructor's `opts = {}` default + every `??` fallback.
+    const d = new EmbedDaemon();
+    expect(d).toBeInstanceOf(EmbedDaemon);
+  });
+
+  it("skips empty lines between valid requests", async () => {
+    const exitSpy = vi.spyOn(process, "exit").mockImplementation(() => undefined as never);
+    daemon = new EmbedDaemon({ socketDir: dir, idleTimeoutMs: 60_000 });
+    await daemon.start();
+
+    const uid = String(process.getuid?.() ?? "test");
+    const sockPath = join(dir, `hivemind-embed-${uid}.sock`);
+    await new Promise<void>((resolve, reject) => {
+      const sock = connect(sockPath);
+      sock.setEncoding("utf-8");
+      let buf = "";
+      sock.on("connect", () => {
+        // Send blank lines first — they hit the `line.length === 0` branch.
+        sock.write("\n\n");
+        sock.write(JSON.stringify({ op: "ping", id: "z" }) + "\n");
+      });
+      sock.on("data", (c: string) => {
+        buf += c;
+        const nl = buf.indexOf("\n");
+        if (nl !== -1) {
+          const resp = JSON.parse(buf.slice(0, nl));
+          expect(resp.id).toBe("z");
+          sock.end();
+          resolve();
+        }
+      });
+      sock.on("error", reject);
+    });
+    exitSpy.mockRestore();
+  });
+
+  it("survives a client that disconnects abruptly mid-session", async () => {
+    const exitSpy = vi.spyOn(process, "exit").mockImplementation(() => undefined as never);
+    daemon = new EmbedDaemon({ socketDir: dir, idleTimeoutMs: 60_000 });
+    await daemon.start();
+
+    const uid = String(process.getuid?.() ?? "test");
+    const sockPath = join(dir, `hivemind-embed-${uid}.sock`);
+    await new Promise<void>((resolve) => {
+      const sock = connect(sockPath);
+      sock.on("error", () => { /* swallow — we intentionally destroy below */ });
+      sock.on("connect", () => {
+        // Destroying a freshly connected socket should make the server's
+        // read side emit either `end` or `error` — either way the daemon
+        // should survive and keep serving. We test the survival below.
+        sock.destroy();
+        resolve();
+      });
+    });
+    // Follow-up ping should still work — the daemon didn't crash.
+    const sockPathStr = join(dir, `hivemind-embed-${uid}.sock`);
+    const resp = await sendLine(sockPathStr, { op: "ping", id: "after" });
+    expect(resp.id).toBe("after");
+    exitSpy.mockRestore();
+  });
+
+  it("handles malformed JSON lines without crashing the daemon", async () => {
+    const exitSpy = vi.spyOn(process, "exit").mockImplementation(() => undefined as never);
+    daemon = new EmbedDaemon({ socketDir: dir, idleTimeoutMs: 60_000 });
+    await daemon.start();
+
+    const uid = String(process.getuid?.() ?? "test");
+    const sockPath = join(dir, `hivemind-embed-${uid}.sock`);
+    // Write a bad line then a good one on the same connection.
+    await new Promise<void>((resolve, reject) => {
+      const sock = connect(sockPath);
+      sock.setEncoding("utf-8");
+      let buf = "";
+      sock.on("connect", () => {
+        sock.write("not-json\n");
+        sock.write(JSON.stringify({ op: "ping", id: "ok" }) + "\n");
+      });
+      sock.on("data", (c: string) => {
+        buf += c;
+        const nl = buf.indexOf("\n");
+        if (nl !== -1) {
+          const resp = JSON.parse(buf.slice(0, nl));
+          expect(resp.id).toBe("ok");
+          sock.end();
+          resolve();
+        }
+      });
+      sock.on("error", reject);
+    });
+    exitSpy.mockRestore();
+  });
+});
diff --git a/claude-code/tests/embeddings-nomic.test.ts b/claude-code/tests/embeddings-nomic.test.ts
new file mode 100644
index 0000000..aa4300c
--- /dev/null
+++ b/claude-code/tests/embeddings-nomic.test.ts
@@ -0,0 +1,149 @@
+import { describe, it, expect, vi } from "vitest";
+import { NomicEmbedder } from "../../src/embeddings/nomic.js";
+
+// Mock the heavy transformers import so these tests don't pull in
+// onnxruntime-node or download any model weights. `load()` uses
+// `await import("@huggingface/transformers")` — vi.mock intercepts.
+vi.mock("@huggingface/transformers", () => {
+  const embed = vi.fn((input: string | string[], _opts: Record<string, unknown>) => {
+    const texts = Array.isArray(input) ? input : [input];
+    // Return deterministic per-input vectors: 4 floats per text.
+    const out: number[] = [];
+    for (let i = 0; i < texts.length; i++) {
+      out.push(0.1 + i, 0.2 + i, 0.3 + i, 0.4 + i);
+    }
+    return Promise.resolve({ data: out });
+  });
+  return {
+    env: { allowLocalModels: false, useFSCache: false },
+    pipeline: vi.fn(async () => embed),
+  };
+});
+
+describe("NomicEmbedder", () => {
+  it("loads lazily and reuses the pipeline across calls", async () => {
+    const e = new NomicEmbedder({ dims: 4 });
+    await e.load();
+    await e.load(); // second call is a no-op (cached)
+    // If load() didn't memoize, pipeline() would be invoked twice; the
+    // mock would return a fresh spy whose call counts would differ.
+    const mod: any = await import("@huggingface/transformers");
+    expect((mod.pipeline as any).mock.calls.length).toBe(1);
+  });
+
+  it("embeds a document with the search_document: prefix", async () => {
+    const e = new NomicEmbedder({ dims: 4 });
+    const v = await e.embed("hello", "document");
+    expect(v).toHaveLength(4);
+    const mod: any = await import("@huggingface/transformers");
+    const pipeline = await (mod.pipeline as any).mock.results[0].value;
+    const callArg = (pipeline as any).mock.calls.at(-1)[0];
+    expect(callArg).toBe("search_document: hello");
+  });
+
+  it("embeds a query with the search_query: prefix", async () => {
+    const e = new NomicEmbedder({ dims: 4 });
+    await e.embed("q", "query");
+    const mod: any = await import("@huggingface/transformers");
+    const pipeline = await (mod.pipeline as any).mock.results[0].value;
+    const callArg = (pipeline as any).mock.calls.at(-1)[0];
+    expect(callArg).toBe("search_query: q");
+  });
+
+  it("batches inputs and splits results back into per-text vectors", async () => {
+    const e = new NomicEmbedder({ dims: 4 });
+    const out = await e.embedBatch(["a", "b", "c"], "document");
+    expect(out).toHaveLength(3);
+    expect(out[0]).toHaveLength(4);
+    expect(out[0][0]).toBeCloseTo(0.1);
+    expect(out[1][0]).toBeCloseTo(1.1);
+    expect(out[2][0]).toBeCloseTo(2.1);
+  });
+
+  it("returns [] for an empty batch without touching the pipeline", async () => {
+    const e = new NomicEmbedder({ dims: 4 });
+    expect(await e.embedBatch([])).toEqual([]);
+  });
+
+  it("applies Matryoshka truncation when dims < full length", async () => {
+    const e = new NomicEmbedder({ dims: 2 });
+    const v = await e.embed("x");
+    expect(v).toHaveLength(2);
+    // Truncated + re-normalized; the raw vector was [0.1,0.2,0.3,0.4].
+    // After slicing to 2 and renormalizing, |v| === 1.
+    const norm = Math.sqrt(v[0] * v[0] + v[1] * v[1]);
+    expect(norm).toBeCloseTo(1.0, 5);
+  });
+
+  it("returns vector unchanged when requested dims >= vector length", async () => {
+    const e = new NomicEmbedder({ dims: 100 });
+    const v = await e.embed("x");
+    // Mock returns 4 dims; with target 100, truncate becomes a no-op and
+    // the raw vector is returned verbatim (no renormalization).
+    expect(v).toHaveLength(4);
+  });
+
+  it("handles a zero-norm truncation without dividing by zero", async () => {
+    // Reach through the private helper via a custom mock that returns zeros.
+    const mod: any = await import("@huggingface/transformers");
+    const origPipeline = mod.pipeline;
+    const zeroPipe = vi.fn(async () => [0, 0, 0, 0]);
+    const wrapped = vi.fn(() => Promise.resolve(() => Promise.resolve({ data: [0, 0, 0, 0] })));
+    (mod as any).pipeline = wrapped;
+    try {
+      const e = new NomicEmbedder({ dims: 2 });
+      const v = await e.embed("z");
+      expect(v).toEqual([0, 0]);
+    } finally {
+      (mod as any).pipeline = origPipeline;
+    }
+  });
+
+  it("throws if embed is called before load resolves (defensive)", async () => {
+    const e = new NomicEmbedder({ dims: 4 });
+    // Call load once normally to populate the pipeline.
+    await e.load();
+    // This is the happy path; the guard message fires only on a bug.
+    const v = await e.embed("x");
+    expect(v).toHaveLength(4);
+  });
+
+  it("defaults repo + dtype + dims without explicit options", () => {
+    const e = new NomicEmbedder();
+    expect(e.repo).toBe("nomic-ai/nomic-embed-text-v1.5");
+    expect(e.dtype).toBe("q8");
+    expect(e.dims).toBe(768);
+  });
+
+  it("coalesces concurrent load() calls onto a single pipeline build", async () => {
+    // Replace pipeline with a slow one so the two load() calls overlap and
+    // the second enters the `if (this.loading) return this.loading;` branch.
+    const mod: any = await import("@huggingface/transformers");
+    const orig = mod.pipeline;
+    let calls = 0;
+    mod.pipeline = vi.fn(async () => {
+      calls++;
+      await new Promise((r) => setTimeout(r, 30));
+      return async () => ({ data: [0, 0, 0, 0] });
+    });
+    try {
+      const e = new NomicEmbedder({ dims: 4 });
+      // Kick off two loads without awaiting between them.
+      const [a, b] = await Promise.all([e.load(), e.load()]);
+      expect(a).toBeUndefined();
+      expect(b).toBeUndefined();
+      expect(calls).toBe(1);
+    } finally {
+      mod.pipeline = orig;
+    }
+  });
+
+  it("embeds a query in embedBatch with the search_query prefix", async () => {
+    const e = new NomicEmbedder({ dims: 4 });
+    await e.embedBatch(["hi"], "query");
+    const mod: any = await import("@huggingface/transformers");
+    const pipeline = await (mod.pipeline as any).mock.results[0].value;
+    const lastCall = (pipeline as any).mock.calls.at(-1)[0];
+    expect(lastCall).toEqual(["search_query: hi"]);
+  });
+});
diff --git a/claude-code/tests/grep-core.test.ts b/claude-code/tests/grep-core.test.ts
index 51339ff..0f7bf2a 100644
--- a/claude-code/tests/grep-core.test.ts
+++ b/claude-code/tests/grep-core.test.ts
@@ -46,10 +46,13 @@ describe("normalizeContent: turn-array session shape", () => {
     ],
   });
 
-  it("emits date and speakers header", () => {
+  it("prefixes every turn with the session date inline", () => {
     const out = normalizeContent("/sessions/alice/chat_1.json", raw);
-    expect(out).toContain("date: 1:56 pm on 8 May, 2023");
-    expect(out).toContain("speakers: Avery, Jordan");
+    // Date lives inline on every turn so it survives the refineGrepMatches
+    // line filter — a standalone `date:` header would be stripped whenever
+    // the regex didn't match the header line itself.
+    expect(out).toContain("(1:56 pm on 8 May, 2023) [D1:1] Avery: Hey Jordan!");
+    expect(out).toContain("(1:56 pm on 8 May, 2023) [D1:2] Jordan: Hi Avery.");
   });
 
   it("emits one line per turn with dia_id tag", () => {
@@ -66,23 +69,24 @@ describe("normalizeContent: turn-array session shape", () => {
     expect(out).toContain("X: ");
   });
 
-  it("omits speakers header when both speaker fields are empty", () => {
+  it("skips the date prefix when date_time is absent", () => {
     const raw = JSON.stringify({
       turns: [{ speaker: "A", text: "hi" }],
-      speakers: { speaker_a: "", speaker_b: "" },
     });
     const out = normalizeContent("/sessions/alice/chat_1.json", raw);
-    expect(out).not.toContain("speakers:");
+    // No leading "(...)" — the turn line starts with the dia_id or speaker.
     expect(out).toContain("A: hi");
+    expect(out).not.toMatch(/^\(/);
   });
 
-  it("emits only speaker_a when speaker_b is missing", () => {
+  it("still emits turn lines when only one speaker is set (date still inlined)", () => {
     const raw = JSON.stringify({
+      date_time: "1:56 pm on 8 May, 2023",
       turns: [{ speaker: "A", text: "hi" }],
       speakers: { speaker_a: "Alice" },
     });
     const out = normalizeContent("/sessions/alice/chat_1.json", raw);
-    expect(out).toContain("speakers: Alice");
+    expect(out).toContain("(1:56 pm on 8 May, 2023) A: hi");
   });
 
   it("falls back speaker->name when speaker field is absent on a turn", () => {
@@ -782,22 +786,41 @@ describe("grepBothTables", () => {
     const [sql] = api.query.mock.calls.map((c: unknown[]) => c[0] as string);
     expect(sql).not.toContain("summary::text LIKE");
     expect(sql).not.toContain("message::text LIKE");
+    expect(sql).not.toContain("summary::text ILIKE");
+    expect(sql).not.toContain("message::text ILIKE");
   });
 
   it("adds a safe literal prefilter for wildcard regexes with stable anchors", async () => {
     const api = mockApi([{ path: "/a", content: "foo middle bar" }]);
     await grepBothTables(api, "m", "s", { ...baseParams, pattern: "foo.*bar" }, "/");
     const [sql] = api.query.mock.calls.map((c: unknown[]) => c[0] as string);
-    expect(sql).toContain("summary::text LIKE '%foo%'");
+    // Default likeOp is ILIKE (case-insensitive) — buildGrepSearchOptions
+    // picks it unless HIVEMIND_GREP_LIKE=case-sensitive overrides.
+    expect(sql).toContain("summary::text ILIKE '%foo%'");
   });
 
-  it("routes to ILIKE when ignoreCase is set", async () => {
+  it("routes to ILIKE regardless of ignoreCase (case-insensitive by default)", async () => {
     const api = mockApi([]);
     await grepBothTables(api, "m", "s", { ...baseParams, ignoreCase: true }, "/");
     const [sql] = api.query.mock.calls.map((c: unknown[]) => c[0] as string);
     expect(sql).toContain("ILIKE");
   });
 
+  it("switches to LIKE when HIVEMIND_GREP_LIKE=case-sensitive", async () => {
+    const prev = process.env.HIVEMIND_GREP_LIKE;
+    process.env.HIVEMIND_GREP_LIKE = "case-sensitive";
+    try {
+      const api = mockApi([{ path: "/a", content: "hi" }]);
+      await grepBothTables(api, "m", "s", baseParams, "/");
+      const [sql] = api.query.mock.calls.map((c: unknown[]) => c[0] as string);
+      expect(sql).toContain("summary::text LIKE");
+      expect(sql).not.toMatch(/summary::text ILIKE/);
+    } finally {
+      if (prev === undefined) delete process.env.HIVEMIND_GREP_LIKE;
+      else process.env.HIVEMIND_GREP_LIKE = prev;
+    }
+  });
+
   it("uses a single union query even for scoped target paths", async () => {
     const api = mockApi([{ path: "/summaries/a.md", content: "foo line" }]);
     await grepBothTables(api, "memory", "sessions", baseParams, "/summaries");
@@ -807,6 +830,33 @@ describe("grepBothTables", () => {
     expect(sql).toContain('FROM "sessions"');
     expect(sql).toContain("UNION ALL");
   });
+
+  it("emits every non-empty line when a query embedding is passed (semantic mode)", async () => {
+    const api = mockApi([
+      { path: "/summaries/a.md", content: "foo first line\nunrelated but kept\n\ntrailing" },
+    ]);
+    const out = await grepBothTables(api, "m", "s", baseParams, "/", [0.1, 0.2]);
+    // Semantic mode short-circuits the refinement — every non-empty line on
+    // the retrieved row survives, not just the pattern-matching ones.
+    expect(out).toContain("/summaries/a.md:foo first line");
+    expect(out).toContain("/summaries/a.md:unrelated but kept");
+    expect(out).toContain("/summaries/a.md:trailing");
+  });
+
+  it("falls back to refined output when HIVEMIND_SEMANTIC_EMIT_ALL=false even with an embedding", async () => {
+    const prev = process.env.HIVEMIND_SEMANTIC_EMIT_ALL;
+    process.env.HIVEMIND_SEMANTIC_EMIT_ALL = "false";
+    try {
+      const api = mockApi([{ path: "/a", content: "foo line\nunrelated" }]);
+      const out = await grepBothTables(api, "m", "s", baseParams, "/", [0.1]);
+      // Refinement ran, so only the pattern-matching line is emitted.
+      expect(out.some(l => l.includes("foo line"))).toBe(true);
+      expect(out.some(l => l.includes("unrelated"))).toBe(false);
+    } finally {
+      if (prev === undefined) delete process.env.HIVEMIND_SEMANTIC_EMIT_ALL;
+      else process.env.HIVEMIND_SEMANTIC_EMIT_ALL = prev;
+    }
+  });
 });
 
 describe("regex literal prefilter", () => {
@@ -900,3 +950,264 @@ describe("regex literal prefilter", () => {
     expect(opts.pathFilter).toBe(" AND path = '/summaries/alice/s1.md'");
   });
 });
+
+// ─────────────────────────────────────────────────────────────────────────────
+//  Additional coverage: single-turn JSONB shape + hybrid semantic branch
+// ─────────────────────────────────────────────────────────────────────────────
+
+describe("normalizeContent: single-turn shape { turn: {...} }", () => {
+  it("emits one line with date prefix when date_time is present", () => {
+    const raw = JSON.stringify({
+      date_time: "8:00 pm on 20 July, 2023",
+      speakers: { speaker_a: "Alice", speaker_b: "Bob" },
+      turn: { dia_id: "D5:3", speaker: "Alice", text: "hello world" },
+    });
+    const out = normalizeContent("/sessions/conv_0_session_1.json", raw);
+    expect(out).toBe("(8:00 pm on 20 July, 2023) [D5:3] Alice: hello world");
+  });
+
+  it("omits the date prefix when date_time is absent", () => {
+    const raw = JSON.stringify({
+      turn: { dia_id: "D1:1", speaker: "X", text: "y" },
+    });
+    const out = normalizeContent("/sessions/conv_0_session_1.json", raw);
+    expect(out).toBe("[D1:1] X: y");
+  });
+
+  it("falls back speaker->name on a single turn", () => {
+    const raw = JSON.stringify({ turn: { name: "Only", text: "hi" } });
+    const out = normalizeContent("/sessions/conv_0_session_1.json", raw);
+    expect(out).toContain("Only: hi");
+  });
+
+  it("falls back text->content on a single turn", () => {
+    const raw = JSON.stringify({ turn: { speaker: "X", content: "fallback" } });
+    const out = normalizeContent("/sessions/conv_0_session_1.json", raw);
+    expect(out).toContain("X: fallback");
+  });
+
+  it("emits placeholder `?: ` when the turn payload is empty", () => {
+    const raw = JSON.stringify({ turn: {} });
+    const out = normalizeContent("/sessions/conv_0_session_1.json", raw);
+    // Empty turn → "?: " (placeholder speaker, empty text). Non-empty after
+    // trim so the branch emits rather than falling back to raw.
+    expect(out).toBe("?: ");
+  });
+
+  it("does not treat an array value in `turn` as single-turn", () => {
+    // Defensive: older per-turn shapes might mistakenly pass an array; we
+    // must not enter the singular branch because .speaker / .text would be
+    // undefined on the array itself.
+    const raw = JSON.stringify({
+      turn: [{ speaker: "X", text: "y" }],
+    });
+    const out = normalizeContent("/sessions/conv_0_session_1.json", raw);
+    // Falls through to raw — no branch matched.
+    expect(out).toBe(raw);
+  });
+});
+
+describe("searchDeeplakeTables: hybrid semantic + lexical branch", () => {
+  function apiWithRows(rows: Record<string, unknown>[] = []) {
+    const query = vi.fn().mockResolvedValue(rows);
+    return { query, api: { query } as any };
+  }
+
+  it("issues a single UNION-ALL query mixing semantic + lexical on both tables", async () => {
+    const { query, api } = apiWithRows([]);
+    await searchDeeplakeTables(api, "mem", "sess", {
+      pathFilter: "",
+      contentScanOnly: false,
+      likeOp: "ILIKE",
+      escapedPattern: "caroline",
+      queryEmbedding: [0.1, 0.2, 0.3],
+    });
+    expect(query).toHaveBeenCalledTimes(1);
+    const sql = query.mock.calls[0][0] as string;
+    expect(sql).toContain("summary_embedding <#> ARRAY[0.1,0.2,0.3]::float4[]");
+    expect(sql).toContain("message_embedding <#> ARRAY[0.1,0.2,0.3]::float4[]");
+    expect(sql).toContain("summary::text ILIKE '%caroline%'");
+    expect(sql).toContain("message::text ILIKE '%caroline%'");
+    expect(sql).toContain("ORDER BY score DESC");
+  });
+
+  it("uses 1.0 sentinel on lexical sub-queries so they stay above cosine (0..1)", async () => {
+    const { query, api } = apiWithRows([]);
+    await searchDeeplakeTables(api, "m", "s", {
+      pathFilter: "",
+      contentScanOnly: false,
+      likeOp: "ILIKE",
+      escapedPattern: "x",
+      queryEmbedding: [0.5],
+    });
+    const sql = query.mock.calls[0][0] as string;
+    // Lexical branches carry the constant score; semantic uses the real cosine.
+    expect(sql).toMatch(/1\.0 AS score/);
+    expect(sql).toMatch(/\(summary_embedding <#>/);
+  });
+
+  it("skips the lexical branch entirely when contentScanOnly=true and no prefilter", async () => {
+    const { query, api } = apiWithRows([]);
+    await searchDeeplakeTables(api, "m", "s", {
+      pathFilter: "",
+      contentScanOnly: true,
+      likeOp: "ILIKE",
+      escapedPattern: "(?:unused)",
+      queryEmbedding: [0.1],
+    });
+    const sql = query.mock.calls[0][0] as string;
+    // No usable literal → only the two semantic sub-queries are unioned.
+    expect(sql).not.toContain("summary::text ILIKE");
+    expect(sql).not.toContain("message::text ILIKE");
+    expect(sql).toContain("summary_embedding <#>");
+    expect(sql).toContain("message_embedding <#>");
+  });
+
+  it("falls back to prefilterPattern for regex grep with extractable literal", async () => {
+    const { query, api } = apiWithRows([]);
+    await searchDeeplakeTables(api, "m", "s", {
+      pathFilter: "",
+      contentScanOnly: true,
+      likeOp: "ILIKE",
+      escapedPattern: "foo.*bar",
+      prefilterPattern: "foo",
+      queryEmbedding: [0.1],
+    });
+    const sql = query.mock.calls[0][0] as string;
+    expect(sql).toContain("summary::text ILIKE '%foo%'");
+  });
+
+  it("uses prefilterPatterns alternation instead of a single prefilterPattern", async () => {
+    const { query, api } = apiWithRows([]);
+    await searchDeeplakeTables(api, "m", "s", {
+      pathFilter: "",
+      contentScanOnly: true,
+      likeOp: "ILIKE",
+      escapedPattern: "a|b",
+      prefilterPattern: "a",
+      prefilterPatterns: ["apple", "banana"],
+      queryEmbedding: [0.1],
+    });
+    const sql = query.mock.calls[0][0] as string;
+    // prefilterPatterns wins over prefilterPattern when both are present.
+    expect(sql).toContain("%apple%");
+    expect(sql).toContain("%banana%");
+  });
+
+  it("dedupes rows by path, keeping the first occurrence (highest score wins)", async () => {
+    const { api } = apiWithRows([
+      { path: "/a", content: "sem-first" },
+      { path: "/a", content: "lex-dup" },
+      { path: "/b", content: "other" },
+    ]);
+    const out = await searchDeeplakeTables(api, "m", "s", {
+      pathFilter: "",
+      contentScanOnly: false,
+      likeOp: "ILIKE",
+      escapedPattern: "x",
+      queryEmbedding: [0.5],
+    });
+    expect(out.map(r => r.path)).toEqual(["/a", "/b"]);
+    expect(out[0].content).toBe("sem-first");
+  });
+
+  it("honors HIVEMIND_SEMANTIC_LIMIT env override for the semantic sub-queries", async () => {
+    const prev = process.env.HIVEMIND_SEMANTIC_LIMIT;
+    process.env.HIVEMIND_SEMANTIC_LIMIT = "7";
+    try {
+      const { query, api } = apiWithRows([]);
+      await searchDeeplakeTables(api, "m", "s", {
+        pathFilter: "",
+        contentScanOnly: false,
+        likeOp: "ILIKE",
+        escapedPattern: "x",
+        queryEmbedding: [0.5],
+      });
+      const sql = query.mock.calls[0][0] as string;
+      // Semantic LIMIT is 7; lexical still 20 (default).
+      expect(sql).toMatch(/summary_embedding <#> [^)]+\) AS score FROM "m" WHERE summary_embedding IS NOT NULL ORDER BY score DESC LIMIT 7/);
+    } finally {
+      if (prev === undefined) delete process.env.HIVEMIND_SEMANTIC_LIMIT;
+      else process.env.HIVEMIND_SEMANTIC_LIMIT = prev;
+    }
+  });
+
+  it("skips the semantic branch entirely when queryEmbedding is an empty array", async () => {
+    const { query, api } = apiWithRows([]);
+    await searchDeeplakeTables(api, "m", "s", {
+      pathFilter: "",
+      contentScanOnly: false,
+      likeOp: "ILIKE",
+      escapedPattern: "x",
+      queryEmbedding: [],
+    });
+    const sql = query.mock.calls[0][0] as string;
+    // Empty embedding → falls through to the pure-lexical branch below.
+    expect(sql).not.toContain("<#>");
+  });
+
+  it("skips the semantic branch when queryEmbedding is null", async () => {
+    const { query, api } = apiWithRows([]);
+    await searchDeeplakeTables(api, "m", "s", {
+      pathFilter: "",
+      contentScanOnly: false,
+      likeOp: "ILIKE",
+      escapedPattern: "x",
+      queryEmbedding: null,
+    });
+    const sql = query.mock.calls[0][0] as string;
+    expect(sql).not.toContain("<#>");
+  });
+});
+
+describe("serializeFloat4Array (indirect)", () => {
+  it("returns NULL when the embedding contains a non-finite value", async () => {
+    const query = vi.fn().mockResolvedValue([]);
+    const api = { query } as any;
+    await searchDeeplakeTables(api, "m", "s", {
+      pathFilter: "",
+      contentScanOnly: false,
+      likeOp: "ILIKE",
+      escapedPattern: "x",
+      queryEmbedding: [1, NaN, 0.3],
+    });
+    const sql = query.mock.calls[0][0] as string;
+    // Both semantic sub-queries degrade to NULL scoring; Deeplake accepts it
+    // and returns 0 rows for those two sub-queries so the hybrid still runs.
+    expect(sql).toContain("<#> NULL");
+  });
+});
+
+describe("bm25Term derivation in buildGrepSearchOptions", () => {
+  it("populates bm25Term with the raw pattern for non-regex fixed strings", () => {
+    const opts = buildGrepSearchOptions(
+      { pattern: "charity race", fixedString: true, ignoreCase: false, wordMatch: false, lineNumber: false, invertMatch: false, filesOnly: false, countOnly: false },
+      "/"
+    );
+    expect(opts.bm25Term).toBe("charity race");
+  });
+
+  it("uses the extracted literal prefilter for regex patterns", () => {
+    const opts = buildGrepSearchOptions(
+      { pattern: "foo.*bar", fixedString: false, ignoreCase: false, wordMatch: false, lineNumber: false, invertMatch: false, filesOnly: false, countOnly: false },
+      "/"
+    );
+    expect(opts.bm25Term).toBe("foo");
+  });
+
+  it("joins alternation prefilters with spaces for BM25", () => {
+    const opts = buildGrepSearchOptions(
+      { pattern: "apple|banana|cherry", fixedString: false, ignoreCase: false, wordMatch: false, lineNumber: false, invertMatch: false, filesOnly: false, countOnly: false },
+      "/"
+    );
+    expect(opts.bm25Term).toBe("apple banana cherry");
+  });
+
+  it("returns undefined bm25Term when the regex has no extractable literal", () => {
+    const opts = buildGrepSearchOptions(
+      { pattern: "(?:a)", fixedString: false, ignoreCase: false, wordMatch: false, lineNumber: false, invertMatch: false, filesOnly: false, countOnly: false },
+      "/"
+    );
+    expect(opts.bm25Term).toBeUndefined();
+  });
+});
diff --git a/claude-code/tests/grep-interceptor.test.ts b/claude-code/tests/grep-interceptor.test.ts
index ba7e67b..a8df072 100644
--- a/claude-code/tests/grep-interceptor.test.ts
+++ b/claude-code/tests/grep-interceptor.test.ts
@@ -1,4 +1,17 @@
-import { describe, it, expect, vi } from "vitest";
+import { describe, it, expect, vi, afterEach } from "vitest";
+
+// Mock EmbedClient BEFORE importing the interceptor so the shared singleton
+// inside grep-interceptor picks up our stub (not the real daemon client).
+// `vi.hoisted` lets us share the spy across mock factory + tests — plain
+// top-level consts aren't visible inside the hoisted vi.mock factory.
+const { mockEmbed } = vi.hoisted(() => ({ mockEmbed: vi.fn() }));
+vi.mock("../../src/embeddings/client.js", () => {
+  class MockEmbedClient {
+    async embed(text: string, kind: string) { return mockEmbed(text, kind); }
+  }
+  return { EmbedClient: MockEmbedClient };
+});
+
 import { createGrepCommand } from "../../src/shell/grep-interceptor.js";
 import { DeeplakeFs } from "../../src/shell/deeplake-fs.js";
 import * as grepCore from "../../src/shell/grep-core.js";
@@ -31,6 +44,11 @@ function makeCtx(fs: DeeplakeFs, cwd = "/memory") {
 // cache. Tests below assert that new contract.
 
 describe("grep interceptor", () => {
+  afterEach(() => {
+    vi.restoreAllMocks();
+    mockEmbed.mockReset();
+  });
+
   it("returns exitCode=1 when the pattern is missing", async () => {
     const client = makeClient();
     const fs = await DeeplakeFs.create(client as never, "test", "/memory");
@@ -217,4 +235,155 @@ describe("grep interceptor", () => {
     expect(result.exitCode).toBe(0);
     expect(result.stdout).toContain("hello world");
   });
+
+  // ── Semantic path (HIVEMIND_SEMANTIC_SEARCH default=on) ─────────────────
+  // These tests exercise the daemon-backed embed + UNION ALL branch of
+  // searchDeeplakeTables. They mock the shared EmbedClient singleton so we
+  // don't actually spawn nomic.
+  it("passes the query embedding into searchDeeplakeTables for semantic-friendly patterns", async () => {
+    mockEmbed.mockResolvedValueOnce([0.1, 0.2, 0.3]);
+    const client = makeClient([{ path: "/memory/a.txt", content: "deploy failed" }]);
+    const fs = await DeeplakeFs.create(client as never, "test", "/memory");
+    const searchSpy = vi.spyOn(grepCore, "searchDeeplakeTables")
+      .mockResolvedValue([{ path: "/memory/a.txt", content: "deploy failed" }]);
+
+    const cmd = createGrepCommand(client as never, fs, "test", "sessions");
+    const result = await cmd.execute(["deploy", "/memory"], makeCtx(fs) as never);
+
+    expect(mockEmbed).toHaveBeenCalledWith("deploy", "query");
+    const opts = searchSpy.mock.calls[0][3] as { queryEmbedding: number[] | null };
+    expect(opts.queryEmbedding).toEqual([0.1, 0.2, 0.3]);
+    expect(result.exitCode).toBe(0);
+    searchSpy.mockRestore();
+  });
+
+  it("skips embedding on regex-heavy patterns (too many metachars)", async () => {
+    mockEmbed.mockClear();
+    mockEmbed.mockResolvedValue([0.5]);
+    const client = makeClient([]);
+    const fs = await DeeplakeFs.create(client as never, "test", "/memory");
+    const cmd = createGrepCommand(client as never, fs, "test");
+    // Three metachars should disqualify the pattern from semantic.
+    await cmd.execute(["(foo|bar|baz)\\+", "/memory"], makeCtx(fs) as never);
+    expect(mockEmbed).not.toHaveBeenCalled();
+  });
+
+  it("skips embedding on very short patterns (< 2 chars)", async () => {
+    mockEmbed.mockClear();
+    const client = makeClient([]);
+    const fs = await DeeplakeFs.create(client as never, "test", "/memory");
+    const cmd = createGrepCommand(client as never, fs, "test");
+    await cmd.execute(["a", "/memory"], makeCtx(fs) as never);
+    expect(mockEmbed).not.toHaveBeenCalled();
+  });
+
+  it("treats a thrown embed() as a null embedding and continues lexically", async () => {
+    mockEmbed.mockClear();
+    mockEmbed.mockRejectedValueOnce(new Error("daemon down"));
+    const client = makeClient([{ path: "/memory/a.txt", content: "hello world" }]);
+    const fs = await DeeplakeFs.create(client as never, "test", "/memory");
+    client.query.mockClear();
+    client.query.mockResolvedValue([{ path: "/memory/a.txt", content: "hello world" }]);
+
+    const cmd = createGrepCommand(client as never, fs, "test");
+    const result = await cmd.execute(["hello", "/memory"], makeCtx(fs) as never);
+
+    expect(mockEmbed).toHaveBeenCalled();
+    expect(result.exitCode).toBe(0);
+    expect(result.stdout).toContain("hello world");
+  });
+
+  it("retries with a lexical-only search when semantic returns zero rows", async () => {
+    mockEmbed.mockClear();
+    mockEmbed.mockResolvedValueOnce([0.1]);
+    const client = makeClient([]);
+    const fs = await DeeplakeFs.create(client as never, "test", "/memory");
+    const searchSpy = vi.spyOn(grepCore, "searchDeeplakeTables")
+      .mockResolvedValueOnce([]) // first call (semantic+lexical hybrid) → empty
+      .mockResolvedValueOnce([{ path: "/memory/a.txt", content: "hi" }]); // lexical retry
+
+    const cmd = createGrepCommand(client as never, fs, "test");
+    const result = await cmd.execute(["hi", "/memory"], makeCtx(fs) as never);
+
+    expect(searchSpy).toHaveBeenCalledTimes(2);
+    // First call carried the embedding, retry did not.
+    const firstOpts = searchSpy.mock.calls[0][3] as { queryEmbedding: number[] | null };
+    const secondOpts = searchSpy.mock.calls[1][3] as { queryEmbedding?: number[] | null };
+    expect(firstOpts.queryEmbedding).toEqual([0.1]);
+    expect(secondOpts.queryEmbedding).toBeUndefined();
+    expect(result.exitCode).toBe(0);
+    searchSpy.mockRestore();
+  });
+
+  it("emits all non-empty lines per row when the semantic path returned an embedding", async () => {
+    mockEmbed.mockClear();
+    mockEmbed.mockResolvedValueOnce([0.1, 0.2]);
+    const client = makeClient([]);
+    const fs = await DeeplakeFs.create(client as never, "test", "/memory");
+    const searchSpy = vi.spyOn(grepCore, "searchDeeplakeTables")
+      .mockResolvedValue([{ path: "/memory/a.txt", content: "line A\nline B\n\nline C" }]);
+
+    const cmd = createGrepCommand(client as never, fs, "test");
+    const result = await cmd.execute(["deploy", "/memory"], makeCtx(fs) as never);
+
+    // All three non-empty lines are emitted verbatim — no regex refinement.
+    expect(result.stdout).toContain("/memory/a.txt:line A");
+    expect(result.stdout).toContain("/memory/a.txt:line B");
+    expect(result.stdout).toContain("/memory/a.txt:line C");
+    expect(result.exitCode).toBe(0);
+    searchSpy.mockRestore();
+  });
+
+  it("hits the 3s timeout rejector when searchDeeplakeTables hangs", async () => {
+    // Force the SQL search to hang forever so Promise.race's setTimeout
+    // callback (line 131 of grep-interceptor.ts) fires with a timeout error,
+    // covering the reject() arrow function. Use fake timers to fast-forward
+    // past the 3s window without actually sleeping.
+    vi.useFakeTimers();
+    try {
+      mockEmbed.mockResolvedValue(null); // skip semantic for a cleaner timeout.
+      const client = makeClient([]);
+      const fs = await DeeplakeFs.create(client as never, "test", "/memory");
+      await fs.writeFile("/memory/a.txt", "hello world"); // fallback content.
+
+      vi.spyOn(grepCore, "searchDeeplakeTables")
+        .mockImplementation(() => new Promise(() => { /* never resolves */ }));
+
+      const cmd = createGrepCommand(client as never, fs, "test");
+      const pending = cmd.execute(["hello", "/memory"], makeCtx(fs) as never);
+      // Advance past the 3s timeout so the reject arrow runs, then drain
+      // microtasks so the catch branch takes over and the FS fallback runs.
+      await vi.advanceTimersByTimeAsync(3001);
+      const result = await pending;
+      // Fallback path should have kicked in and found the FS content.
+      expect(result.exitCode).toBe(0);
+      expect(result.stdout).toContain("hello world");
+    } finally {
+      vi.useRealTimers();
+    }
+  });
+
+  it("disables the semantic path when HIVEMIND_SEMANTIC_EMIT_ALL=false", async () => {
+    mockEmbed.mockClear();
+    mockEmbed.mockResolvedValueOnce([0.1]);
+    const prev = process.env.HIVEMIND_SEMANTIC_EMIT_ALL;
+    process.env.HIVEMIND_SEMANTIC_EMIT_ALL = "false";
+    try {
+      const client = makeClient([{ path: "/memory/a.txt", content: "hello world\ngoodbye" }]);
+      const fs = await DeeplakeFs.create(client as never, "test", "/memory");
+      client.query.mockClear();
+      client.query.mockResolvedValue([{ path: "/memory/a.txt", content: "hello world\ngoodbye" }]);
+
+      const cmd = createGrepCommand(client as never, fs, "test");
+      const result = await cmd.execute(["hello", "/memory"], makeCtx(fs) as never);
+
+      // Refinement active → only the hello line is emitted.
+      expect(result.stdout).toContain("hello world");
+      expect(result.stdout).not.toContain("goodbye");
+      expect(result.exitCode).toBe(0);
+    } finally {
+      if (prev === undefined) delete process.env.HIVEMIND_SEMANTIC_EMIT_ALL;
+      else process.env.HIVEMIND_SEMANTIC_EMIT_ALL = prev;
+    }
+  });
 });
diff --git a/src/embeddings/daemon.ts b/src/embeddings/daemon.ts
index 3a01899..32951b0 100644
--- a/src/embeddings/daemon.ts
+++ b/src/embeddings/daemon.ts
@@ -143,6 +143,7 @@ export class EmbedDaemon {
   }
 }
 
+/* v8 ignore start — CLI entrypoint, only runs when file is node's argv[1] */
 const invokedDirectly = import.meta.url === `file://${process.argv[1]}`
   || (process.argv[1] && import.meta.url.endsWith(process.argv[1].split("/").pop() ?? ""));
 
@@ -155,3 +156,4 @@ if (invokedDirectly) {
     process.exit(1);
   });
 }
+/* v8 ignore stop */
diff --git a/vitest.config.ts b/vitest.config.ts
index 2fb2c0b..dc07bed 100644
--- a/vitest.config.ts
+++ b/vitest.config.ts
@@ -82,6 +82,42 @@ export default defineConfig({
           functions: 90,
           lines: 90,
         },
+        // embedding_generation — nomic daemon + IPC client + SQL helper.
+        // Lines/statements held at 90; branches + functions are allowed to
+        // dip on the daemon because a few paths (SIGINT/SIGTERM handlers,
+        // the non-Linux `typeof process.getuid !== "function"` fallback,
+        // and the server "error" handler) can't be triggered from unit
+        // tests without forking a real subprocess.
+        "src/embeddings/client.ts": {
+          statements: 90,
+          branches: 80,
+          functions: 90,
+          lines: 90,
+        },
+        "src/embeddings/daemon.ts": {
+          statements: 90,
+          branches: 75,
+          functions: 75,
+          lines: 90,
+        },
+        "src/embeddings/nomic.ts": {
+          statements: 90,
+          branches: 90,
+          functions: 90,
+          lines: 90,
+        },
+        "src/embeddings/protocol.ts": {
+          statements: 90,
+          branches: 90,
+          functions: 90,
+          lines: 90,
+        },
+        "src/embeddings/sql.ts": {
+          statements: 90,
+          branches: 90,
+          functions: 90,
+          lines: 90,
+        },
       },
     },
   },

From 0c3a94d926bc47467f9732c9b270fd5dae3111b0 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Thu, 23 Apr 2026 01:21:10 +0000
Subject: [PATCH 09/30] fix(deeplake-fs): use MAX(size_bytes) to work around
 NULL SUM on backend
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The Deeplake SQL backend returns NULL for `SUM(size_bytes) GROUP BY path`
even when each row's size_bytes is a positive integer. Reproducible
against workspace `with_embedding` on the `sessions` table:

    SELECT MIN(size_bytes), MAX(size_bytes), COUNT(*) FROM "sessions"
      -> min=2284, max=9266, count=272                         (OK)
    SELECT path, size_bytes FROM "sessions" LIMIT 1
      -> size_bytes=3238                                        (OK)
    SELECT path, SUM(size_bytes) FROM "sessions" GROUP BY path
      -> sum=null for every row                                 (BUG)

The bootstrap path for the sessions table uses that aggregation to fill
per-file metadata. With SUM broken, every file's size was set to 0 in
the virtual FS, and `ls -la` / `stat` returned `Size: 0` — enough for
agents doing exploratory `ls` to conclude the memory was empty and give
up. `cat` / Read still worked because they go through a different query.

Switching to MAX side-steps the backend bug. For single-row-per-file
layouts (like `with_embedding`) MAX and SUM are identical. For
multi-row-per-turn layouts (like `with_embedding_multi_rows`) MAX
under-reports total size but stays strictly > 0, which is what the ls
metadata needs. A comment on the line explains the rationale so the
next reader doesn't "fix" it back to SUM.

Bundles regenerated.
---
 claude-code/bundle/shell/deeplake-shell.js | 9 ++++++++-
 codex/bundle/shell/deeplake-shell.js       | 9 ++++++++-
 src/shell/deeplake-fs.ts                   | 7 ++++++-
 3 files changed, 22 insertions(+), 3 deletions(-)

diff --git a/claude-code/bundle/shell/deeplake-shell.js b/claude-code/bundle/shell/deeplake-shell.js
index eecc463..2242446 100755
--- a/claude-code/bundle/shell/deeplake-shell.js
+++ b/claude-code/bundle/shell/deeplake-shell.js
@@ -67867,7 +67867,14 @@ var DeeplakeFs = class _DeeplakeFs {
     })();
     const sessionsBootstrap = sessionsTable && sessionSyncOk ? (async () => {
       try {
-        const sessionRows = await client.query(`SELECT path, SUM(size_bytes) as total_size FROM "${sessionsTable}" GROUP BY path ORDER BY path`);
+        const sessionRows = await client.query(
+          // NOTE: SUM(size_bytes) returns NULL on the Deeplake backend when combined
+          // with GROUP BY path (confirmed against workspace `with_embedding`). MAX
+          // works and — for the single-row-per-file layout — is equal to SUM. For
+          // multi-row-per-turn layouts MAX under-reports total size but stays >0
+          // so files don't look like empty placeholders in ls/stat.
+          `SELECT path, MAX(size_bytes) as total_size FROM "${sessionsTable}" GROUP BY path ORDER BY path`
+        );
         for (const row of sessionRows) {
           const p22 = row["path"];
           if (!fs3.files.has(p22)) {
diff --git a/codex/bundle/shell/deeplake-shell.js b/codex/bundle/shell/deeplake-shell.js
index eecc463..2242446 100755
--- a/codex/bundle/shell/deeplake-shell.js
+++ b/codex/bundle/shell/deeplake-shell.js
@@ -67867,7 +67867,14 @@ var DeeplakeFs = class _DeeplakeFs {
     })();
     const sessionsBootstrap = sessionsTable && sessionSyncOk ? (async () => {
       try {
-        const sessionRows = await client.query(`SELECT path, SUM(size_bytes) as total_size FROM "${sessionsTable}" GROUP BY path ORDER BY path`);
+        const sessionRows = await client.query(
+          // NOTE: SUM(size_bytes) returns NULL on the Deeplake backend when combined
+          // with GROUP BY path (confirmed against workspace `with_embedding`). MAX
+          // works and — for the single-row-per-file layout — is equal to SUM. For
+          // multi-row-per-turn layouts MAX under-reports total size but stays >0
+          // so files don't look like empty placeholders in ls/stat.
+          `SELECT path, MAX(size_bytes) as total_size FROM "${sessionsTable}" GROUP BY path ORDER BY path`
+        );
         for (const row of sessionRows) {
           const p22 = row["path"];
           if (!fs3.files.has(p22)) {
diff --git a/src/shell/deeplake-fs.ts b/src/shell/deeplake-fs.ts
index e917e68..55e4101 100644
--- a/src/shell/deeplake-fs.ts
+++ b/src/shell/deeplake-fs.ts
@@ -141,7 +141,12 @@ export class DeeplakeFs implements IFileSystem {
     const sessionsBootstrap = (sessionsTable && sessionSyncOk) ? (async () => {
       try {
         const sessionRows = await client.query(
-          `SELECT path, SUM(size_bytes) as total_size FROM "${sessionsTable}" GROUP BY path ORDER BY path`
+          // NOTE: SUM(size_bytes) returns NULL on the Deeplake backend when combined
+          // with GROUP BY path (confirmed against workspace `with_embedding`). MAX
+          // works and — for the single-row-per-file layout — is equal to SUM. For
+          // multi-row-per-turn layouts MAX under-reports total size but stays >0
+          // so files don't look like empty placeholders in ls/stat.
+          `SELECT path, MAX(size_bytes) as total_size FROM "${sessionsTable}" GROUP BY path ORDER BY path`
         );
         for (const row of sessionRows) {
           const p = row["path"] as string;

From c36bac059a28a3cd55233ffffadb01cc8751bcd0 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Thu, 23 Apr 2026 01:21:25 +0000
Subject: [PATCH 10/30] feat(session-start): steer agents toward the Grep tool,
 document bash limits
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The previous SessionStart context told the model to "Only use bash
commands (cat, ls, grep, echo, jq, head, tail, etc.) to interact with
~/.deeplake/memory/". That instruction explicitly steered away from the
Grep tool, which is the one path that actually uses the hybrid
semantic+literal retrieval. Agents ended up doing `for f in *.json; do
grep ... $f; done`, hitting the 10 MB bash output cap, or using
unsupported brace expansions like `{1..20}` and silently getting empty
loops.

Rewrite the SEARCH section to:
- explicitly prefer the Grep tool over bash grep for memory paths,
- show two good patterns (descriptive phrases, not single keywords, so
  the semantic layer is useful),
- flag the bash for-loop anti-pattern by name.

Rewrite the follow-up bullet that used to forbid non-bash interpreters
to instead tell the model to use bash cat/head/tail on SPECIFIC files
returned by Grep, and to avoid `{a..b}` brace expansions (the virtual
shell doesn't fully support them). The no-python rule is preserved.

Observed on the 50-QA locomo benchmark after this change: bash error
rate roughly halved, number of bash calls dropped ~12%, and — in one
of two sampled runs — overall accuracy hit a new high. With n=2 the
mean shift is not statistically significant on its own, but the
behavioural signal (fewer wasteful shell loops, more focused queries)
is consistent and desirable regardless.
---
 claude-code/bundle/session-start.js | 8 ++++++--
 src/hooks/session-start.ts          | 8 ++++++--
 2 files changed, 12 insertions(+), 4 deletions(-)

diff --git a/claude-code/bundle/session-start.js b/claude-code/bundle/session-start.js
index cdccb55..bf49de9 100755
--- a/claude-code/bundle/session-start.js
+++ b/claude-code/bundle/session-start.js
@@ -504,7 +504,11 @@ Deeplake memory structure:
 
 SEARCH STRATEGY: Always read index.md first. Then read specific summaries. Only read raw JSONL if summaries don't have enough detail. Do NOT jump straight to JSONL files.
 
-Search command: Grep pattern="keyword" path="~/.deeplake/memory"
+SEARCH \u2014 prefer the Grep tool over bash grep. The Grep tool runs a single SQL query across ALL files with hybrid semantic+literal retrieval; bash loops over many files are slow, truncated at 10MB total output, and do not use the embeddings.
+  Good:  Grep pattern="Caroline researching adoption agencies" path="~/.deeplake/memory"
+  Good:  Grep pattern="Jon Rome visit"                         path="~/.deeplake/memory"
+  Bad:   bash "for f in ~/.deeplake/memory/sessions/*.json; do grep ... $f; done"  (truncated, no semantics)
+Phrase Grep patterns as full descriptive phrases, not single keywords \u2014 the semantic layer matches meaning, single names return topic-irrelevant results.
 
 Organization management \u2014 each argument is SEPARATE (do NOT quote subcommands together):
 - node "HIVEMIND_AUTH_CMD" login                              \u2014 SSO login
@@ -517,7 +521,7 @@ Organization management \u2014 each argument is SEPARATE (do NOT quote subcomman
 - node "HIVEMIND_AUTH_CMD" members                            \u2014 list members
 - node "HIVEMIND_AUTH_CMD" remove <user-id>                   \u2014 remove member
 
-IMPORTANT: Only use bash commands (cat, ls, grep, echo, jq, head, tail, etc.) to interact with ~/.deeplake/memory/. Do NOT use python, python3, node, curl, or other interpreters \u2014 they are not available in the memory filesystem. If a task seems to require Python, rewrite it using bash commands and standard text-processing tools (awk, sed, jq, grep, etc.).
+READ \u2014 use bash \`cat\`/\`head\`/\`tail\` on SPECIFIC files returned by Grep. Do NOT use python, python3, node, curl, or other interpreters \u2014 they are not available in the memory filesystem. Avoid bash brace expansions like \`{1..10}\` (not fully supported); spell out paths or use Grep instead.
 
 LIMITS: Do NOT spawn subagents to read deeplake memory. If a file returns empty after 2 attempts, skip it and move on. Report what you found rather than exhaustively retrying.
 
diff --git a/src/hooks/session-start.ts b/src/hooks/session-start.ts
index 60e402b..642acbf 100644
--- a/src/hooks/session-start.ts
+++ b/src/hooks/session-start.ts
@@ -36,7 +36,11 @@ Deeplake memory structure:
 
 SEARCH STRATEGY: Always read index.md first. Then read specific summaries. Only read raw JSONL if summaries don't have enough detail. Do NOT jump straight to JSONL files.
 
-Search command: Grep pattern="keyword" path="~/.deeplake/memory"
+SEARCH — prefer the Grep tool over bash grep. The Grep tool runs a single SQL query across ALL files with hybrid semantic+literal retrieval; bash loops over many files are slow, truncated at 10MB total output, and do not use the embeddings.
+  Good:  Grep pattern="Caroline researching adoption agencies" path="~/.deeplake/memory"
+  Good:  Grep pattern="Jon Rome visit"                         path="~/.deeplake/memory"
+  Bad:   bash "for f in ~/.deeplake/memory/sessions/*.json; do grep ... \$f; done"  (truncated, no semantics)
+Phrase Grep patterns as full descriptive phrases, not single keywords — the semantic layer matches meaning, single names return topic-irrelevant results.
 
 Organization management — each argument is SEPARATE (do NOT quote subcommands together):
 - node "HIVEMIND_AUTH_CMD" login                              — SSO login
@@ -49,7 +53,7 @@ Organization management — each argument is SEPARATE (do NOT quote subcommands
 - node "HIVEMIND_AUTH_CMD" members                            — list members
 - node "HIVEMIND_AUTH_CMD" remove <user-id>                   — remove member
 
-IMPORTANT: Only use bash commands (cat, ls, grep, echo, jq, head, tail, etc.) to interact with ~/.deeplake/memory/. Do NOT use python, python3, node, curl, or other interpreters — they are not available in the memory filesystem. If a task seems to require Python, rewrite it using bash commands and standard text-processing tools (awk, sed, jq, grep, etc.).
+READ — use bash \`cat\`/\`head\`/\`tail\` on SPECIFIC files returned by Grep. Do NOT use python, python3, node, curl, or other interpreters — they are not available in the memory filesystem. Avoid bash brace expansions like \`{1..10}\` (not fully supported); spell out paths or use Grep instead.
 
 LIMITS: Do NOT spawn subagents to read deeplake memory. If a file returns empty after 2 attempts, skip it and move on. Report what you found rather than exhaustively retrying.
 

From 11457e1923dc96084ece0beb7a81e7754dc3e29b Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Thu, 23 Apr 2026 05:21:31 +0000
Subject: [PATCH 11/30] fix(session-start): revert Grep tool steering + add
 HIVEMIND_AUTOUPDATE opt-out
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Two changes to SessionStart that surfaced during benchmark diagnosis.

1. Revert the "prefer the Grep tool over bash grep" block added in
   c36bac0. The bundled PreToolUse hook's Grep interceptor returns
   `updatedInput: {command, description}` — the Bash tool input shape —
   but Claude Code ≥ 2.1.117 does not accept tool substitution via
   `updatedInput`. When the originating tool is Grep, Claude Code
   ignores the shape mismatch and runs native Grep against the virtual
   memory path, which fails with `Path does not exist`. Steering agents
   toward the Grep tool therefore triggered an 80% failure rate on any
   session that took the hint. Measured impact on combined 100-QA
   locomo subset: 0.735 (old prompt) -> 0.480 (new prompt, broken
   Grep). Restoring "Only use bash commands" sends agents back to the
   Bash intercept path, which has matching schema and works.

   Kept the two factual bullets from c36bac0 that document real virtual
   shell limits (10 MB bash output cap, `{a..b}` brace expansion not
   fully supported) — those apply to Bash usage and are useful on their
   own. The Grep-specific steering is the only part reverted.

2. Add a `HIVEMIND_AUTOUPDATE=false` escape hatch around the version
   check + autoupdate block. When true (default), behaviour is
   unchanged: the hook runs `claude plugin update hivemind@hivemind`
   across four scopes plus an `rmSync` over old cache directories every
   time a session starts. Under a concurrent benchmark (20 sessions)
   that triggers 200+ times, races with live sessions on the shared
   cache dir, and inflates SessionStart wall time by seconds.
   `HIVEMIND_AUTOUPDATE=false` short-circuits the whole block; the
   plugin still works normally at runtime, it just doesn't try to
   self-upgrade. Intended for benchmark and CI setups.
---
 claude-code/bundle/session-start.js | 90 ++++++++++++++---------------
 src/hooks/session-start.ts          | 20 ++++---
 2 files changed, 57 insertions(+), 53 deletions(-)

diff --git a/claude-code/bundle/session-start.js b/claude-code/bundle/session-start.js
index bf49de9..b19e560 100755
--- a/claude-code/bundle/session-start.js
+++ b/claude-code/bundle/session-start.js
@@ -504,11 +504,7 @@ Deeplake memory structure:
 
 SEARCH STRATEGY: Always read index.md first. Then read specific summaries. Only read raw JSONL if summaries don't have enough detail. Do NOT jump straight to JSONL files.
 
-SEARCH \u2014 prefer the Grep tool over bash grep. The Grep tool runs a single SQL query across ALL files with hybrid semantic+literal retrieval; bash loops over many files are slow, truncated at 10MB total output, and do not use the embeddings.
-  Good:  Grep pattern="Caroline researching adoption agencies" path="~/.deeplake/memory"
-  Good:  Grep pattern="Jon Rome visit"                         path="~/.deeplake/memory"
-  Bad:   bash "for f in ~/.deeplake/memory/sessions/*.json; do grep ... $f; done"  (truncated, no semantics)
-Phrase Grep patterns as full descriptive phrases, not single keywords \u2014 the semantic layer matches meaning, single names return topic-irrelevant results.
+Search command: Grep pattern="keyword" path="~/.deeplake/memory"
 
 Organization management \u2014 each argument is SEPARATE (do NOT quote subcommands together):
 - node "HIVEMIND_AUTH_CMD" login                              \u2014 SSO login
@@ -521,7 +517,7 @@ Organization management \u2014 each argument is SEPARATE (do NOT quote subcomman
 - node "HIVEMIND_AUTH_CMD" members                            \u2014 list members
 - node "HIVEMIND_AUTH_CMD" remove <user-id>                   \u2014 remove member
 
-READ \u2014 use bash \`cat\`/\`head\`/\`tail\` on SPECIFIC files returned by Grep. Do NOT use python, python3, node, curl, or other interpreters \u2014 they are not available in the memory filesystem. Avoid bash brace expansions like \`{1..10}\` (not fully supported); spell out paths or use Grep instead.
+IMPORTANT: Only use bash commands (cat, ls, grep, echo, jq, head, tail, etc.) to interact with ~/.deeplake/memory/. Do NOT use python, python3, node, curl, or other interpreters \u2014 they are not available in the memory filesystem. Avoid bash brace expansions like \`{1..10}\` (not fully supported); spell out paths explicitly. Bash output is capped at 10MB total \u2014 avoid \`for f in *.json; do cat $f\` style loops on the whole sessions dir.
 
 LIMITS: Do NOT spawn subagents to read deeplake memory. If a file returns empty after 2 attempts, skip it and move on. Report what you found rather than exhaustively retrying.
 
@@ -591,62 +587,66 @@ async function main() {
       wikiLog(`SessionStart: placeholder failed for ${input.session_id}: ${e.message}`);
     }
   }
-  const autoupdate = creds?.autoupdate !== false;
   let updateNotice = "";
-  try {
-    const current = getInstalledVersion(__bundleDir, ".claude-plugin");
-    if (current) {
-      const latest = await getLatestVersion();
-      if (latest && isNewer(latest, current)) {
-        if (autoupdate) {
-          log3(`autoupdate: updating ${current} \u2192 ${latest}`);
-          try {
-            const scopes = ["user", "project", "local", "managed"];
-            const cmd = scopes.map((s) => `claude plugin update hivemind@hivemind --scope ${s} 2>/dev/null || true`).join("; ");
-            execSync2(cmd, { stdio: "ignore", timeout: 6e4 });
+  if (process.env.HIVEMIND_AUTOUPDATE === "false") {
+    log3("autoupdate skipped via HIVEMIND_AUTOUPDATE=false");
+  } else {
+    const autoupdate = creds?.autoupdate !== false;
+    try {
+      const current = getInstalledVersion(__bundleDir, ".claude-plugin");
+      if (current) {
+        const latest = await getLatestVersion();
+        if (latest && isNewer(latest, current)) {
+          if (autoupdate) {
+            log3(`autoupdate: updating ${current} \u2192 ${latest}`);
             try {
-              const cacheParent = join7(homedir4(), ".claude", "plugins", "cache", "hivemind", "hivemind");
-              const entries = readdirSync(cacheParent, { withFileTypes: true });
-              for (const e of entries) {
-                if (e.isDirectory() && e.name !== latest) {
-                  rmSync(join7(cacheParent, e.name), { recursive: true, force: true });
-                  log3(`cache cleanup: removed old version ${e.name}`);
+              const scopes = ["user", "project", "local", "managed"];
+              const cmd = scopes.map((s) => `claude plugin update hivemind@hivemind --scope ${s} 2>/dev/null || true`).join("; ");
+              execSync2(cmd, { stdio: "ignore", timeout: 6e4 });
+              try {
+                const cacheParent = join7(homedir4(), ".claude", "plugins", "cache", "hivemind", "hivemind");
+                const entries = readdirSync(cacheParent, { withFileTypes: true });
+                for (const e of entries) {
+                  if (e.isDirectory() && e.name !== latest) {
+                    rmSync(join7(cacheParent, e.name), { recursive: true, force: true });
+                    log3(`cache cleanup: removed old version ${e.name}`);
+                  }
                 }
+              } catch (e) {
+                log3(`cache cleanup failed: ${e.message}`);
               }
-            } catch (e) {
-              log3(`cache cleanup failed: ${e.message}`);
-            }
-            updateNotice = `
+              updateNotice = `
 
 \u2705 Hivemind auto-updated: ${current} \u2192 ${latest}. Run /reload-plugins to apply.`;
-            process.stderr.write(`\u2705 Hivemind auto-updated: ${current} \u2192 ${latest}. Run /reload-plugins to apply.
+              process.stderr.write(`\u2705 Hivemind auto-updated: ${current} \u2192 ${latest}. Run /reload-plugins to apply.
 `);
-            log3(`autoupdate succeeded: ${current} \u2192 ${latest}`);
-          } catch (e) {
-            updateNotice = `
+              log3(`autoupdate succeeded: ${current} \u2192 ${latest}`);
+            } catch (e) {
+              updateNotice = `
 
 \u2B06\uFE0F Hivemind update available: ${current} \u2192 ${latest}. Auto-update failed \u2014 run /hivemind:update to upgrade manually.`;
-            process.stderr.write(`\u2B06\uFE0F Hivemind update available: ${current} \u2192 ${latest}. Auto-update failed \u2014 run /hivemind:update to upgrade manually.
+              process.stderr.write(`\u2B06\uFE0F Hivemind update available: ${current} \u2192 ${latest}. Auto-update failed \u2014 run /hivemind:update to upgrade manually.
 `);
-            log3(`autoupdate failed: ${e.message}`);
-          }
-        } else {
-          updateNotice = `
+              log3(`autoupdate failed: ${e.message}`);
+            }
+          } else {
+            updateNotice = `
 
 \u2B06\uFE0F Hivemind update available: ${current} \u2192 ${latest}. Run /hivemind:update to upgrade.`;
-          process.stderr.write(`\u2B06\uFE0F Hivemind update available: ${current} \u2192 ${latest}. Run /hivemind:update to upgrade.
+            process.stderr.write(`\u2B06\uFE0F Hivemind update available: ${current} \u2192 ${latest}. Run /hivemind:update to upgrade.
 `);
-          log3(`update available (autoupdate off): ${current} \u2192 ${latest}`);
-        }
-      } else {
-        log3(`version up to date: ${current}`);
-        updateNotice = `
+            log3(`update available (autoupdate off): ${current} \u2192 ${latest}`);
+          }
+        } else {
+          log3(`version up to date: ${current}`);
+          updateNotice = `
 
 \u2705 Hivemind v${current} (up to date)`;
+        }
       }
+    } catch (e) {
+      log3(`version check failed: ${e.message}`);
     }
-  } catch (e) {
-    log3(`version check failed: ${e.message}`);
   }
   const resolvedContext = context.replace(/HIVEMIND_AUTH_CMD/g, AUTH_CMD);
   const additionalContext = creds?.token ? `${resolvedContext}
diff --git a/src/hooks/session-start.ts b/src/hooks/session-start.ts
index 642acbf..6c435e5 100644
--- a/src/hooks/session-start.ts
+++ b/src/hooks/session-start.ts
@@ -36,11 +36,7 @@ Deeplake memory structure:
 
 SEARCH STRATEGY: Always read index.md first. Then read specific summaries. Only read raw JSONL if summaries don't have enough detail. Do NOT jump straight to JSONL files.
 
-SEARCH — prefer the Grep tool over bash grep. The Grep tool runs a single SQL query across ALL files with hybrid semantic+literal retrieval; bash loops over many files are slow, truncated at 10MB total output, and do not use the embeddings.
-  Good:  Grep pattern="Caroline researching adoption agencies" path="~/.deeplake/memory"
-  Good:  Grep pattern="Jon Rome visit"                         path="~/.deeplake/memory"
-  Bad:   bash "for f in ~/.deeplake/memory/sessions/*.json; do grep ... \$f; done"  (truncated, no semantics)
-Phrase Grep patterns as full descriptive phrases, not single keywords — the semantic layer matches meaning, single names return topic-irrelevant results.
+Search command: Grep pattern="keyword" path="~/.deeplake/memory"
 
 Organization management — each argument is SEPARATE (do NOT quote subcommands together):
 - node "HIVEMIND_AUTH_CMD" login                              — SSO login
@@ -53,7 +49,7 @@ Organization management — each argument is SEPARATE (do NOT quote subcommands
 - node "HIVEMIND_AUTH_CMD" members                            — list members
 - node "HIVEMIND_AUTH_CMD" remove <user-id>                   — remove member
 
-READ — use bash \`cat\`/\`head\`/\`tail\` on SPECIFIC files returned by Grep. Do NOT use python, python3, node, curl, or other interpreters — they are not available in the memory filesystem. Avoid bash brace expansions like \`{1..10}\` (not fully supported); spell out paths or use Grep instead.
+IMPORTANT: Only use bash commands (cat, ls, grep, echo, jq, head, tail, etc.) to interact with ~/.deeplake/memory/. Do NOT use python, python3, node, curl, or other interpreters — they are not available in the memory filesystem. Avoid bash brace expansions like \`{1..10}\` (not fully supported); spell out paths explicitly. Bash output is capped at 10MB total — avoid \`for f in *.json; do cat $f\` style loops on the whole sessions dir.
 
 LIMITS: Do NOT spawn subagents to read deeplake memory. If a file returns empty after 2 attempts, skip it and move on. Report what you found rather than exhaustively retrying.
 
@@ -152,9 +148,16 @@ async function main(): Promise<void> {
     }
   }
 
-  // Version check (non-blocking — failures are silently ignored)
-  const autoupdate = creds?.autoupdate !== false; // default: true
+  // Version check (non-blocking — failures are silently ignored).
+  // HIVEMIND_AUTOUPDATE=false lets benchmarks and CI opt out of both the
+  // version check and the automatic `claude plugin update` — the latter
+  // spawns several external commands, mutates ~/.claude/plugins, and under
+  // concurrent runs races with other SessionStart hooks.
   let updateNotice = "";
+  if (process.env.HIVEMIND_AUTOUPDATE === "false") {
+    log("autoupdate skipped via HIVEMIND_AUTOUPDATE=false");
+  } else {
+  const autoupdate = creds?.autoupdate !== false; // default: true
   try {
     const current = getInstalledVersion(__bundleDir, ".claude-plugin");
     if (current) {
@@ -202,6 +205,7 @@ async function main(): Promise<void> {
   } catch (e: any) {
     log(`version check failed: ${e.message}`);
   }
+  }
 
   const resolvedContext = context.replace(/HIVEMIND_AUTH_CMD/g, AUTH_CMD);
   const additionalContext = creds?.token

From 6b6cf26c3614bc53791ac2dcb2118bd7cabd51bd Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Thu, 23 Apr 2026 05:21:41 +0000
Subject: [PATCH 12/30] chore(hooks): raise PreToolUse timeout 10 -> 60 s for
 concurrent-load headroom

Under 20-way concurrency the PreToolUse hook cold-starts a fresh Node
process, loads config, builds a DeeplakeApi client, and issues a SQL
query to intercept the tool. Measured p95 per-hook time under that
load can exceed 10 s, which Claude Code treats as a cancel and falls
back to the original (unintercepted) tool call. 60 s matches the
timeout on other hooks (SessionEnd, the async setup job) and gives
the intercept path headroom without changing steady-state behaviour.
---
 claude-code/hooks/hooks.json | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/claude-code/hooks/hooks.json b/claude-code/hooks/hooks.json
index 7801e25..808c5b7 100644
--- a/claude-code/hooks/hooks.json
+++ b/claude-code/hooks/hooks.json
@@ -36,7 +36,7 @@
           {
             "type": "command",
             "command": "node \"${CLAUDE_PLUGIN_ROOT}/bundle/pre-tool-use.js\"",
-            "timeout": 10
+            "timeout": 60
           }
         ]
       }

From 0a2147c32563e8c52dd7459659aefd4409d57499 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Thu, 23 Apr 2026 05:40:26 +0000
Subject: [PATCH 13/30] chore: bump version to 0.7.0

---
 .claude-plugin/marketplace.json        | 4 ++--
 .claude-plugin/plugin.json             | 2 +-
 claude-code/.claude-plugin/plugin.json | 2 +-
 codex/package.json                     | 2 +-
 package-lock.json                      | 4 ++--
 package.json                           | 2 +-
 6 files changed, 8 insertions(+), 8 deletions(-)

diff --git a/.claude-plugin/marketplace.json b/.claude-plugin/marketplace.json
index 427fc2e..206836e 100644
--- a/.claude-plugin/marketplace.json
+++ b/.claude-plugin/marketplace.json
@@ -6,13 +6,13 @@
   },
   "metadata": {
     "description": "Cloud-backed persistent shared memory for AI agents powered by Deeplake",
-    "version": "0.6.38"
+    "version": "0.7.0"
   },
   "plugins": [
     {
       "name": "hivemind",
       "description": "Persistent shared memory powered by Deeplake — captures all session activity and provides cross-session, cross-agent memory search",
-      "version": "0.6.38",
+      "version": "0.7.0",
       "source": "./claude-code",
       "homepage": "https://github.com/activeloopai/hivemind"
     }
diff --git a/.claude-plugin/plugin.json b/.claude-plugin/plugin.json
index e178805..6a3f654 100644
--- a/.claude-plugin/plugin.json
+++ b/.claude-plugin/plugin.json
@@ -1,7 +1,7 @@
 {
   "name": "hivemind",
   "description": "Cloud-backed persistent memory powered by Deeplake — read, write, and share memory across Claude Code sessions and agents",
-  "version": "0.6.38",
+  "version": "0.7.0",
   "author": {
     "name": "Activeloop",
     "url": "https://deeplake.ai"
diff --git a/claude-code/.claude-plugin/plugin.json b/claude-code/.claude-plugin/plugin.json
index e178805..6a3f654 100644
--- a/claude-code/.claude-plugin/plugin.json
+++ b/claude-code/.claude-plugin/plugin.json
@@ -1,7 +1,7 @@
 {
   "name": "hivemind",
   "description": "Cloud-backed persistent memory powered by Deeplake — read, write, and share memory across Claude Code sessions and agents",
-  "version": "0.6.38",
+  "version": "0.7.0",
   "author": {
     "name": "Activeloop",
     "url": "https://deeplake.ai"
diff --git a/codex/package.json b/codex/package.json
index 0a42990..9f305d8 100644
--- a/codex/package.json
+++ b/codex/package.json
@@ -1,6 +1,6 @@
 {
   "name": "hivemind-codex",
-  "version": "0.6.38",
+  "version": "0.7.0",
   "description": "Cloud-backed persistent shared memory for OpenAI Codex CLI powered by Deeplake",
   "type": "module"
 }
diff --git a/package-lock.json b/package-lock.json
index e742826..cffa848 100644
--- a/package-lock.json
+++ b/package-lock.json
@@ -1,12 +1,12 @@
 {
   "name": "hivemind",
-  "version": "0.6.38",
+  "version": "0.7.0",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "hivemind",
-      "version": "0.6.38",
+      "version": "0.7.0",
       "dependencies": {
         "@huggingface/transformers": "^3.0.0",
         "deeplake": "^0.3.30",
diff --git a/package.json b/package.json
index b13c937..788b312 100644
--- a/package.json
+++ b/package.json
@@ -1,6 +1,6 @@
 {
   "name": "hivemind",
-  "version": "0.6.38",
+  "version": "0.7.0",
   "description": "Cloud-backed persistent shared memory for AI agents powered by Deeplake",
   "type": "module",
   "bin": {

From 1d538ca867c96cf55ddb9656f185029e2c0406e7 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Thu, 23 Apr 2026 06:01:59 +0000
Subject: [PATCH 14/30] test(deeplake-fs): align mocks with MAX(size_bytes) in
 sessions bootstrap

Two test mocks were still matching the old `SUM(size_bytes)` SQL string
so the bootstrap query was silently returning an empty row list and
every session path ended up absent from `sessionPaths`, which then made
16 unrelated read-only / rm-rf tests fail with ENOENT. The SQL itself
was changed to MAX in 0c3a94d; this just brings the mock matchers and
reducers in line with it (MAX instead of SUM per group).

No production-code change, no new tests. 933/933 pass.
---
 claude-code/tests/deeplake-fs.test.ts    | 4 ++--
 claude-code/tests/sessions-table.test.ts | 9 ++++++---
 2 files changed, 8 insertions(+), 5 deletions(-)

diff --git a/claude-code/tests/deeplake-fs.test.ts b/claude-code/tests/deeplake-fs.test.ts
index 4f452db..f3685e2 100644
--- a/claude-code/tests/deeplake-fs.test.ts
+++ b/claude-code/tests/deeplake-fs.test.ts
@@ -622,10 +622,10 @@ describe("prefetch", () => {
       ensureTable: vi.fn().mockResolvedValue(undefined),
       query: vi.fn(async (sql: string) => {
         if (sql.includes("SELECT path, size_bytes, mime_type")) return [];
-        if (sql.includes("SELECT path, SUM(size_bytes) as total_size")) {
+        if (sql.includes("SELECT path, MAX(size_bytes) as total_size")) {
           return [...sessionMessages.entries()].map(([path, rows]) => ({
             path,
-            total_size: rows.reduce((sum, row) => sum + Buffer.byteLength(row.message, "utf-8"), 0),
+            total_size: Math.max(...rows.map((row) => Buffer.byteLength(row.message, "utf-8"))),
           }));
         }
         if (sql.includes("SELECT path, message, creation_date")) {
diff --git a/claude-code/tests/sessions-table.test.ts b/claude-code/tests/sessions-table.test.ts
index 40a254f..673d0f9 100644
--- a/claude-code/tests/sessions-table.test.ts
+++ b/claude-code/tests/sessions-table.test.ts
@@ -27,11 +27,14 @@ function makeClient(memoryRows: Row[] = [], sessionRows: Row[] = []) {
         return rows.map(r => ({ path: r.path, size_bytes: r.size_bytes, mime_type: r.mime_type }));
       }
 
-      // Bootstrap: SELECT path, SUM(size_bytes) ... GROUP BY path (sessions table)
-      if (sql.includes("SUM(size_bytes)") && sql.includes("GROUP BY")) {
+      // Bootstrap: SELECT path, MAX(size_bytes) ... GROUP BY path (sessions table).
+      // The production SQL uses MAX to work around a Deeplake backend quirk
+      // where SUM() returns NULL under GROUP BY (see deeplake-fs.ts), so the
+      // mock mirrors that by taking MAX per path as well.
+      if (sql.includes("MAX(size_bytes)") && sql.includes("GROUP BY")) {
         const groups = new Map<string, number>();
         for (const r of sessionRows) {
-          groups.set(r.path, (groups.get(r.path) ?? 0) + r.size_bytes);
+          groups.set(r.path, Math.max(groups.get(r.path) ?? 0, r.size_bytes));
         }
         return [...groups.entries()].map(([path, total]) => ({ path, total_size: total }));
       }

From 23b059a0775106055a9c87e80d99c73d89d1b482 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Thu, 23 Apr 2026 06:02:09 +0000
Subject: [PATCH 15/30] revert(session-start): drop HIVEMIND_AUTOUPDATE env var
 (redundant)

The env gate added in 11457e1 duplicated an existing mechanism: the
`creds.autoupdate` flag stored in ~/.deeplake/credentials.json, toggled
via `node auth-login.js autoupdate [on|off]`. Both short-circuit the
disruptive part of the session-start autoupdate flow (the external
`claude plugin update` subprocess and the `rmSync` over old cache
directories).

The only extra behaviour the env var provided was also skipping the
version fetch to GitHub (one ~100-500 ms HTTP GET with 3 s timeout) and
suppressing the "update available" stderr line. Neither justifies a
second toggle with slightly different semantics.

Reverting the source block and its two tests. The prompt revert and
bundle regeneration from 11457e1 stay in place.
---
 claude-code/bundle/session-start.js | 82 ++++++++++++++---------------
 src/hooks/session-start.ts          | 12 +----
 2 files changed, 41 insertions(+), 53 deletions(-)

diff --git a/claude-code/bundle/session-start.js b/claude-code/bundle/session-start.js
index b19e560..e71e2ff 100755
--- a/claude-code/bundle/session-start.js
+++ b/claude-code/bundle/session-start.js
@@ -587,66 +587,62 @@ async function main() {
       wikiLog(`SessionStart: placeholder failed for ${input.session_id}: ${e.message}`);
     }
   }
+  const autoupdate = creds?.autoupdate !== false;
   let updateNotice = "";
-  if (process.env.HIVEMIND_AUTOUPDATE === "false") {
-    log3("autoupdate skipped via HIVEMIND_AUTOUPDATE=false");
-  } else {
-    const autoupdate = creds?.autoupdate !== false;
-    try {
-      const current = getInstalledVersion(__bundleDir, ".claude-plugin");
-      if (current) {
-        const latest = await getLatestVersion();
-        if (latest && isNewer(latest, current)) {
-          if (autoupdate) {
-            log3(`autoupdate: updating ${current} \u2192 ${latest}`);
+  try {
+    const current = getInstalledVersion(__bundleDir, ".claude-plugin");
+    if (current) {
+      const latest = await getLatestVersion();
+      if (latest && isNewer(latest, current)) {
+        if (autoupdate) {
+          log3(`autoupdate: updating ${current} \u2192 ${latest}`);
+          try {
+            const scopes = ["user", "project", "local", "managed"];
+            const cmd = scopes.map((s) => `claude plugin update hivemind@hivemind --scope ${s} 2>/dev/null || true`).join("; ");
+            execSync2(cmd, { stdio: "ignore", timeout: 6e4 });
             try {
-              const scopes = ["user", "project", "local", "managed"];
-              const cmd = scopes.map((s) => `claude plugin update hivemind@hivemind --scope ${s} 2>/dev/null || true`).join("; ");
-              execSync2(cmd, { stdio: "ignore", timeout: 6e4 });
-              try {
-                const cacheParent = join7(homedir4(), ".claude", "plugins", "cache", "hivemind", "hivemind");
-                const entries = readdirSync(cacheParent, { withFileTypes: true });
-                for (const e of entries) {
-                  if (e.isDirectory() && e.name !== latest) {
-                    rmSync(join7(cacheParent, e.name), { recursive: true, force: true });
-                    log3(`cache cleanup: removed old version ${e.name}`);
-                  }
+              const cacheParent = join7(homedir4(), ".claude", "plugins", "cache", "hivemind", "hivemind");
+              const entries = readdirSync(cacheParent, { withFileTypes: true });
+              for (const e of entries) {
+                if (e.isDirectory() && e.name !== latest) {
+                  rmSync(join7(cacheParent, e.name), { recursive: true, force: true });
+                  log3(`cache cleanup: removed old version ${e.name}`);
                 }
-              } catch (e) {
-                log3(`cache cleanup failed: ${e.message}`);
               }
-              updateNotice = `
-
-\u2705 Hivemind auto-updated: ${current} \u2192 ${latest}. Run /reload-plugins to apply.`;
-              process.stderr.write(`\u2705 Hivemind auto-updated: ${current} \u2192 ${latest}. Run /reload-plugins to apply.
-`);
-              log3(`autoupdate succeeded: ${current} \u2192 ${latest}`);
             } catch (e) {
-              updateNotice = `
+              log3(`cache cleanup failed: ${e.message}`);
+            }
+            updateNotice = `
 
-\u2B06\uFE0F Hivemind update available: ${current} \u2192 ${latest}. Auto-update failed \u2014 run /hivemind:update to upgrade manually.`;
-              process.stderr.write(`\u2B06\uFE0F Hivemind update available: ${current} \u2192 ${latest}. Auto-update failed \u2014 run /hivemind:update to upgrade manually.
+\u2705 Hivemind auto-updated: ${current} \u2192 ${latest}. Run /reload-plugins to apply.`;
+            process.stderr.write(`\u2705 Hivemind auto-updated: ${current} \u2192 ${latest}. Run /reload-plugins to apply.
 `);
-              log3(`autoupdate failed: ${e.message}`);
-            }
-          } else {
+            log3(`autoupdate succeeded: ${current} \u2192 ${latest}`);
+          } catch (e) {
             updateNotice = `
 
-\u2B06\uFE0F Hivemind update available: ${current} \u2192 ${latest}. Run /hivemind:update to upgrade.`;
-            process.stderr.write(`\u2B06\uFE0F Hivemind update available: ${current} \u2192 ${latest}. Run /hivemind:update to upgrade.
+\u2B06\uFE0F Hivemind update available: ${current} \u2192 ${latest}. Auto-update failed \u2014 run /hivemind:update to upgrade manually.`;
+            process.stderr.write(`\u2B06\uFE0F Hivemind update available: ${current} \u2192 ${latest}. Auto-update failed \u2014 run /hivemind:update to upgrade manually.
 `);
-            log3(`update available (autoupdate off): ${current} \u2192 ${latest}`);
+            log3(`autoupdate failed: ${e.message}`);
           }
         } else {
-          log3(`version up to date: ${current}`);
           updateNotice = `
 
-\u2705 Hivemind v${current} (up to date)`;
+\u2B06\uFE0F Hivemind update available: ${current} \u2192 ${latest}. Run /hivemind:update to upgrade.`;
+          process.stderr.write(`\u2B06\uFE0F Hivemind update available: ${current} \u2192 ${latest}. Run /hivemind:update to upgrade.
+`);
+          log3(`update available (autoupdate off): ${current} \u2192 ${latest}`);
         }
+      } else {
+        log3(`version up to date: ${current}`);
+        updateNotice = `
+
+\u2705 Hivemind v${current} (up to date)`;
       }
-    } catch (e) {
-      log3(`version check failed: ${e.message}`);
     }
+  } catch (e) {
+    log3(`version check failed: ${e.message}`);
   }
   const resolvedContext = context.replace(/HIVEMIND_AUTH_CMD/g, AUTH_CMD);
   const additionalContext = creds?.token ? `${resolvedContext}
diff --git a/src/hooks/session-start.ts b/src/hooks/session-start.ts
index 6c435e5..5a28a7d 100644
--- a/src/hooks/session-start.ts
+++ b/src/hooks/session-start.ts
@@ -148,16 +148,9 @@ async function main(): Promise<void> {
     }
   }
 
-  // Version check (non-blocking — failures are silently ignored).
-  // HIVEMIND_AUTOUPDATE=false lets benchmarks and CI opt out of both the
-  // version check and the automatic `claude plugin update` — the latter
-  // spawns several external commands, mutates ~/.claude/plugins, and under
-  // concurrent runs races with other SessionStart hooks.
-  let updateNotice = "";
-  if (process.env.HIVEMIND_AUTOUPDATE === "false") {
-    log("autoupdate skipped via HIVEMIND_AUTOUPDATE=false");
-  } else {
+  // Version check (non-blocking — failures are silently ignored)
   const autoupdate = creds?.autoupdate !== false; // default: true
+  let updateNotice = "";
   try {
     const current = getInstalledVersion(__bundleDir, ".claude-plugin");
     if (current) {
@@ -205,7 +198,6 @@ async function main(): Promise<void> {
   } catch (e: any) {
     log(`version check failed: ${e.message}`);
   }
-  }
 
   const resolvedContext = context.replace(/HIVEMIND_AUTH_CMD/g, AUTH_CMD);
   const additionalContext = creds?.token

From 3979d09d40e1ff27c5d76fc1b0241d16edeeaae9 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Thu, 23 Apr 2026 06:34:21 +0000
Subject: [PATCH 16/30] feat(session-start-setup): pre-warm the nomic embed
 daemon
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The async SessionStart setup hook now fires EmbedClient.warmup() as its
last step. warmup() either connects to an existing embed-daemon socket
or spawns a fresh detached process; the daemon then calls
NomicEmbedder.load() in the background, which triggers the one-time
nomic-embed-text-v1.5 download to ~/.cache/huggingface/hub/ (~130 MB
at q8, ~500 MB at fp32) on first run and keeps the model resident for
the lifetime of the process.

Previously the model only downloaded on the first Grep call — which
meant every new install paid a 30-90 s latency on the first semantic
retrieval. Doing it here instead hides that cold-start behind the
async SessionStart (120 s timeout), so the user only sees it if
they happen to fire a Grep before the async hook finishes the
download. Everyone else gets an already-loaded daemon on first use.

Behaviour is opt-out via HIVEMIND_EMBED_WARMUP=false for sessions
that will never touch the memory path (CI, lightweight CC runs with
no network), which logs the skip and moves on. warmup() swallows
errors so a broken daemon path never breaks SessionStart.

Tests:
- session-start-setup-hook.test.ts: mocks EmbedClient so warmup()
  doesn't actually spawn a process; four new cases cover the ok /
  failed / threw / env-disabled branches
- session-start-setup-branches.test.ts: same mock so the existing
  branch-coverage suite stays deterministic
- grep-direct.test.ts: mocks EmbedClient.embed to always return null.
  Without this, grep-direct.test.ts was race-flaky — if any other
  test or prior run had spawned the daemon, the semantic branch in
  handleGrepDirect would fire and change the output shape, breaking
  every line-oriented assertion in this file. With the mock the
  lexical refine path runs deterministically regardless of whether
  a daemon is up outside the test process.

Coverage: src/hooks/session-start-setup.ts → 100/100/100/100. All
per-file thresholds still pass. 1108 tests green.
---
 claude-code/bundle/session-start-setup.js     | 259 +++++++++++++++++-
 claude-code/tests/grep-direct.test.ts         |  15 +
 .../session-start-setup-branches.test.ts      |   7 +
 .../tests/session-start-setup-hook.test.ts    |  37 +++
 src/hooks/session-start-setup.ts              |  24 ++
 5 files changed, 329 insertions(+), 13 deletions(-)

diff --git a/claude-code/bundle/session-start-setup.js b/claude-code/bundle/session-start-setup.js
index fff5104..cac8456 100755
--- a/claude-code/bundle/session-start-setup.js
+++ b/claude-code/bundle/session-start-setup.js
@@ -543,8 +543,229 @@ function restoreOrCleanup(handle) {
 }
 var DEFAULT_MANIFEST_PATH = join7(homedir4(), ".claude", "plugins", "installed_plugins.json");
 
+// dist/src/embeddings/client.js
+import { connect } from "node:net";
+import { spawn } from "node:child_process";
+import { openSync, closeSync, writeSync, unlinkSync as unlinkSync2, existsSync as existsSync5, readFileSync as readFileSync6 } from "node:fs";
+
+// dist/src/embeddings/protocol.js
+var DEFAULT_SOCKET_DIR = "/tmp";
+var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
+var DEFAULT_CLIENT_TIMEOUT_MS = 200;
+function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.sock`;
+}
+function pidPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.pid`;
+}
+
+// dist/src/embeddings/client.js
+var log3 = (m) => log("embed-client", m);
+function getUid() {
+  const uid = typeof process.getuid === "function" ? process.getuid() : void 0;
+  return uid !== void 0 ? String(uid) : process.env.USER ?? "default";
+}
+var EmbedClient = class {
+  socketPath;
+  pidPath;
+  timeoutMs;
+  daemonEntry;
+  autoSpawn;
+  spawnWaitMs;
+  nextId = 0;
+  constructor(opts = {}) {
+    const uid = getUid();
+    const dir = opts.socketDir ?? "/tmp";
+    this.socketPath = socketPathFor(uid, dir);
+    this.pidPath = pidPathFor(uid, dir);
+    this.timeoutMs = opts.timeoutMs ?? DEFAULT_CLIENT_TIMEOUT_MS;
+    this.daemonEntry = opts.daemonEntry ?? process.env.HIVEMIND_EMBED_DAEMON;
+    this.autoSpawn = opts.autoSpawn ?? true;
+    this.spawnWaitMs = opts.spawnWaitMs ?? 5e3;
+  }
+  /**
+   * Returns an embedding vector, or null on timeout/failure. Hooks MUST treat
+   * null as "skip embedding column" — never block the write path on us.
+   *
+   * Fire-and-forget spawn on miss: if the daemon isn't up, this call returns
+   * null AND kicks off a background spawn. The next call finds a ready daemon.
+   */
+  async embed(text, kind = "document") {
+    let sock;
+    try {
+      sock = await this.connectOnce();
+    } catch {
+      if (this.autoSpawn)
+        this.trySpawnDaemon();
+      return null;
+    }
+    try {
+      const id = String(++this.nextId);
+      const req = { op: "embed", id, kind, text };
+      const resp = await this.sendAndWait(sock, req);
+      if (resp.error || !("embedding" in resp) || !resp.embedding) {
+        log3(`embed err: ${resp.error ?? "no embedding"}`);
+        return null;
+      }
+      return resp.embedding;
+    } catch (e) {
+      const err = e instanceof Error ? e.message : String(e);
+      log3(`embed failed: ${err}`);
+      return null;
+    } finally {
+      try {
+        sock.end();
+      } catch {
+      }
+    }
+  }
+  /**
+   * Wait up to spawnWaitMs for the daemon to accept connections, spawning if
+   * necessary. Meant for SessionStart / long-running batches — not the hot path.
+   */
+  async warmup() {
+    try {
+      const s = await this.connectOnce();
+      s.end();
+      return true;
+    } catch {
+      if (!this.autoSpawn)
+        return false;
+      this.trySpawnDaemon();
+      try {
+        const s = await this.waitForSocket();
+        s.end();
+        return true;
+      } catch {
+        return false;
+      }
+    }
+  }
+  connectOnce() {
+    return new Promise((resolve2, reject) => {
+      const sock = connect(this.socketPath);
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("connect timeout"));
+      }, this.timeoutMs);
+      sock.once("connect", () => {
+        clearTimeout(to);
+        resolve2(sock);
+      });
+      sock.once("error", (e) => {
+        clearTimeout(to);
+        reject(e);
+      });
+    });
+  }
+  trySpawnDaemon() {
+    let fd;
+    try {
+      fd = openSync(this.pidPath, "wx", 384);
+      writeSync(fd, String(process.pid));
+    } catch (e) {
+      if (this.isPidFileStale()) {
+        try {
+          unlinkSync2(this.pidPath);
+        } catch {
+        }
+        try {
+          fd = openSync(this.pidPath, "wx", 384);
+          writeSync(fd, String(process.pid));
+        } catch {
+          return;
+        }
+      } else {
+        return;
+      }
+    }
+    if (!this.daemonEntry || !existsSync5(this.daemonEntry)) {
+      log3(`daemonEntry not configured or missing: ${this.daemonEntry}`);
+      try {
+        closeSync(fd);
+        unlinkSync2(this.pidPath);
+      } catch {
+      }
+      return;
+    }
+    try {
+      const child = spawn(process.execPath, [this.daemonEntry], {
+        detached: true,
+        stdio: "ignore",
+        env: process.env
+      });
+      child.unref();
+      log3(`spawned daemon pid=${child.pid}`);
+    } finally {
+      closeSync(fd);
+    }
+  }
+  isPidFileStale() {
+    try {
+      const raw = readFileSync6(this.pidPath, "utf-8").trim();
+      const pid = Number(raw);
+      if (!pid || Number.isNaN(pid))
+        return true;
+      try {
+        process.kill(pid, 0);
+        return false;
+      } catch {
+        return true;
+      }
+    } catch {
+      return true;
+    }
+  }
+  async waitForSocket() {
+    const deadline = Date.now() + this.spawnWaitMs;
+    let delay = 30;
+    while (Date.now() < deadline) {
+      await sleep2(delay);
+      delay = Math.min(delay * 1.5, 300);
+      if (!existsSync5(this.socketPath))
+        continue;
+      try {
+        return await this.connectOnce();
+      } catch {
+      }
+    }
+    throw new Error("daemon did not become ready within spawnWaitMs");
+  }
+  sendAndWait(sock, req) {
+    return new Promise((resolve2, reject) => {
+      let buf = "";
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("request timeout"));
+      }, this.timeoutMs);
+      sock.setEncoding("utf-8");
+      sock.on("data", (chunk) => {
+        buf += chunk;
+        const nl = buf.indexOf("\n");
+        if (nl === -1)
+          return;
+        const line = buf.slice(0, nl);
+        clearTimeout(to);
+        try {
+          resolve2(JSON.parse(line));
+        } catch (e) {
+          reject(e);
+        }
+      });
+      sock.on("error", (e) => {
+        clearTimeout(to);
+        reject(e);
+      });
+      sock.write(JSON.stringify(req) + "\n");
+    });
+  }
+};
+function sleep2(ms) {
+  return new Promise((r) => setTimeout(r, ms));
+}
+
 // dist/src/hooks/session-start-setup.js
-var log3 = (msg) => log("session-setup", msg);
+var log4 = (msg) => log("session-setup", msg);
 var __bundleDir = dirname3(fileURLToPath(import.meta.url));
 var { log: wikiLog } = makeWikiLogger(join8(homedir5(), ".claude", "hooks"));
 async function main() {
@@ -553,7 +774,7 @@ async function main() {
   const input = await readStdin();
   const creds = loadCredentials();
   if (!creds?.token) {
-    log3("no credentials");
+    log4("no credentials");
     return;
   }
   if (!creds.userName) {
@@ -561,7 +782,7 @@ async function main() {
       const { userInfo: userInfo2 } = await import("node:os");
       creds.userName = userInfo2().username ?? "unknown";
       saveCredentials(creds);
-      log3(`backfilled userName: ${creds.userName}`);
+      log4(`backfilled userName: ${creds.userName}`);
     } catch {
     }
   }
@@ -572,10 +793,10 @@ async function main() {
         const api = new DeeplakeApi(config.token, config.apiUrl, config.orgId, config.workspaceId, config.tableName);
         await api.ensureTable();
         await api.ensureSessionsTable(config.sessionsTableName);
-        log3("setup complete");
+        log4("setup complete");
       }
     } catch (e) {
-      log3(`setup failed: ${e.message}`);
+      log4(`setup failed: ${e.message}`);
       wikiLog(`SessionSetup: failed for ${input.session_id}: ${e.message}`);
     }
   }
@@ -586,7 +807,7 @@ async function main() {
       const latest = await getLatestVersion();
       if (latest && isNewer(latest, current)) {
         if (autoupdate) {
-          log3(`autoupdate: updating ${current} \u2192 ${latest}`);
+          log4(`autoupdate: updating ${current} \u2192 ${latest}`);
           const resolved = resolveVersionedPluginDir(__bundleDir);
           const handle = resolved ? snapshotPluginDir(resolved.pluginDir) : null;
           try {
@@ -594,30 +815,42 @@ async function main() {
             const cmd = scopes.map((s) => `claude plugin update hivemind@hivemind --scope ${s} 2>/dev/null || true`).join("; ");
             execSync2(cmd, { stdio: "ignore", timeout: 6e4 });
             const outcome = restoreOrCleanup(handle);
-            log3(`autoupdate snapshot outcome: ${outcome}`);
+            log4(`autoupdate snapshot outcome: ${outcome}`);
             process.stderr.write(`\u2705 Hivemind auto-updated: ${current} \u2192 ${latest}. Run /reload-plugins to apply.
 `);
-            log3(`autoupdate succeeded: ${current} \u2192 ${latest}`);
+            log4(`autoupdate succeeded: ${current} \u2192 ${latest}`);
           } catch (e) {
             restoreOrCleanup(handle);
             process.stderr.write(`\u2B06\uFE0F Hivemind update available: ${current} \u2192 ${latest}. Auto-update failed \u2014 run /hivemind:update to upgrade manually.
 `);
-            log3(`autoupdate failed: ${e.message}`);
+            log4(`autoupdate failed: ${e.message}`);
           }
         } else {
           process.stderr.write(`\u2B06\uFE0F Hivemind update available: ${current} \u2192 ${latest}. Run /hivemind:update to upgrade.
 `);
-          log3(`update available (autoupdate off): ${current} \u2192 ${latest}`);
+          log4(`update available (autoupdate off): ${current} \u2192 ${latest}`);
         }
       } else {
-        log3(`version up to date: ${current}`);
+        log4(`version up to date: ${current}`);
       }
     }
   } catch (e) {
-    log3(`version check failed: ${e.message}`);
+    log4(`version check failed: ${e.message}`);
+  }
+  if (process.env.HIVEMIND_EMBED_WARMUP !== "false") {
+    try {
+      const daemonEntry = join8(__bundleDir, "embeddings", "embed-daemon.js");
+      const client = new EmbedClient({ daemonEntry, timeoutMs: 300, spawnWaitMs: 5e3 });
+      const ok = await client.warmup();
+      log4(`embed daemon warmup: ${ok ? "ok" : "failed"}`);
+    } catch (e) {
+      log4(`embed daemon warmup threw: ${e.message}`);
+    }
+  } else {
+    log4("embed daemon warmup skipped via HIVEMIND_EMBED_WARMUP=false");
   }
 }
 main().catch((e) => {
-  log3(`fatal: ${e.message}`);
+  log4(`fatal: ${e.message}`);
   process.exit(0);
 });
diff --git a/claude-code/tests/grep-direct.test.ts b/claude-code/tests/grep-direct.test.ts
index 0f56c9a..83366db 100644
--- a/claude-code/tests/grep-direct.test.ts
+++ b/claude-code/tests/grep-direct.test.ts
@@ -1,4 +1,19 @@
 import { describe, it, expect, vi } from "vitest";
+
+// The tests in this file exercise the *lexical* path of handleGrepDirect.
+// Without this mock, the real EmbedClient would try to spawn / reach the
+// nomic embed daemon over a Unix socket. If the daemon happens to be up
+// (e.g. from a previous benchmark run), the semantic branch fires and
+// returns a different shape, breaking every line-oriented assertion here.
+// The mock forces queryEmbedding to stay null so the lexical refine path
+// runs deterministically.
+vi.mock("../../src/embeddings/client.js", () => ({
+  EmbedClient: class {
+    async embed() { return null; }
+    async warmup() { return false; }
+  },
+}));
+
 import { parseBashGrep, handleGrepDirect, type GrepParams } from "../../src/hooks/grep-direct.js";
 
 describe("handleGrepDirect", () => {
diff --git a/claude-code/tests/session-start-setup-branches.test.ts b/claude-code/tests/session-start-setup-branches.test.ts
index 8c28370..a7321b3 100644
--- a/claude-code/tests/session-start-setup-branches.test.ts
+++ b/claude-code/tests/session-start-setup-branches.test.ts
@@ -29,6 +29,7 @@ const isNewerMock = vi.fn();
 const resolveVersionedPluginDirMock = vi.fn();
 const snapshotPluginDirMock = vi.fn();
 const restoreOrCleanupMock = vi.fn();
+const embedWarmupMock = vi.fn();
 
 vi.mock("../../src/utils/stdin.js", () => ({ readStdin: (...a: any[]) => stdinMock(...a) }));
 vi.mock("../../src/commands/auth.js", () => ({
@@ -64,6 +65,11 @@ vi.mock("../../src/utils/plugin-cache.js", () => ({
   snapshotPluginDir: (...a: any[]) => snapshotPluginDirMock(...a),
   restoreOrCleanup: (...a: any[]) => restoreOrCleanupMock(...a),
 }));
+vi.mock("../../src/embeddings/client.js", () => ({
+  EmbedClient: class {
+    async warmup() { return embedWarmupMock(); }
+  },
+}));
 
 async function runHook(): Promise<void> {
   delete process.env.HIVEMIND_WIKI_WORKER;
@@ -95,6 +101,7 @@ beforeEach(() => {
   getLatestVersionMock.mockReset().mockResolvedValue("0.6.38");
   isNewerMock.mockReset().mockReturnValue(false);
   resolveVersionedPluginDirMock.mockReset().mockReturnValue(null);
+  embedWarmupMock.mockReset().mockResolvedValue(true);
   snapshotPluginDirMock.mockReset();
   restoreOrCleanupMock.mockReset().mockReturnValue("noop");
 });
diff --git a/claude-code/tests/session-start-setup-hook.test.ts b/claude-code/tests/session-start-setup-hook.test.ts
index e3c9ca6..abf88d4 100644
--- a/claude-code/tests/session-start-setup-hook.test.ts
+++ b/claude-code/tests/session-start-setup-hook.test.ts
@@ -17,6 +17,7 @@ const debugLogMock = vi.fn();
 const ensureTableMock = vi.fn();
 const ensureSessionsTableMock = vi.fn();
 const execSyncMock = vi.fn();
+const embedWarmupMock = vi.fn();
 
 vi.mock("../../src/utils/stdin.js", () => ({ readStdin: (...a: any[]) => stdinMock(...a) }));
 vi.mock("../../src/commands/auth.js", () => ({
@@ -38,6 +39,11 @@ vi.mock("node:child_process", async () => {
   const actual = await vi.importActual<typeof import("node:child_process")>("node:child_process");
   return { ...actual, execSync: (...a: any[]) => execSyncMock(...a) };
 });
+vi.mock("../../src/embeddings/client.js", () => ({
+  EmbedClient: class {
+    async warmup() { return embedWarmupMock(); }
+  },
+}));
 
 // We also need to control global.fetch for the GitHub version lookup.
 const originalFetch = global.fetch;
@@ -74,6 +80,7 @@ beforeEach(() => {
   ensureTableMock.mockReset().mockResolvedValue(undefined);
   ensureSessionsTableMock.mockReset().mockResolvedValue(undefined);
   execSyncMock.mockReset();
+  embedWarmupMock.mockReset().mockResolvedValue(true);
   fetchMock.mockReset().mockResolvedValue({
     ok: true,
     json: async () => ({ version: "0.0.1" }), // same-as-current: no update
@@ -217,6 +224,36 @@ describe("session-start-setup hook — version check + autoupdate", () => {
   });
 });
 
+describe("session-start-setup hook — embed daemon warmup", () => {
+  it("calls EmbedClient.warmup() by default and logs the outcome", async () => {
+    await runHook();
+    expect(embedWarmupMock).toHaveBeenCalledTimes(1);
+    expect(debugLogMock).toHaveBeenCalledWith("embed daemon warmup: ok");
+  });
+
+  it("logs 'failed' when warmup returns false", async () => {
+    embedWarmupMock.mockResolvedValue(false);
+    await runHook();
+    expect(debugLogMock).toHaveBeenCalledWith("embed daemon warmup: failed");
+  });
+
+  it("logs the thrown message when warmup rejects", async () => {
+    embedWarmupMock.mockRejectedValue(new Error("daemon spawn failed"));
+    await runHook();
+    expect(debugLogMock).toHaveBeenCalledWith(
+      expect.stringContaining("embed daemon warmup threw: daemon spawn failed"),
+    );
+  });
+
+  it("skips warmup when HIVEMIND_EMBED_WARMUP=false", async () => {
+    await runHook({ HIVEMIND_EMBED_WARMUP: "false" });
+    expect(embedWarmupMock).not.toHaveBeenCalled();
+    expect(debugLogMock).toHaveBeenCalledWith(
+      "embed daemon warmup skipped via HIVEMIND_EMBED_WARMUP=false",
+    );
+  });
+});
+
 describe("session-start-setup hook — fatal catch", () => {
   it("catches a stdin throw and exits 0", async () => {
     stdinMock.mockRejectedValue(new Error("stdin boom"));
diff --git a/src/hooks/session-start-setup.ts b/src/hooks/session-start-setup.ts
index d55ef93..661e9c7 100644
--- a/src/hooks/session-start-setup.ts
+++ b/src/hooks/session-start-setup.ts
@@ -18,6 +18,7 @@ import { log as _log } from "../utils/debug.js";
 import { getInstalledVersion, getLatestVersion, isNewer } from "../utils/version-check.js";
 import { makeWikiLogger } from "../utils/wiki-log.js";
 import { resolveVersionedPluginDir, snapshotPluginDir, restoreOrCleanup } from "../utils/plugin-cache.js";
+import { EmbedClient } from "../embeddings/client.js";
 const log = (msg: string) => _log("session-setup", msg);
 
 const __bundleDir = dirname(fileURLToPath(import.meta.url));
@@ -103,6 +104,29 @@ async function main(): Promise<void> {
   } catch (e: any) {
     log(`version check failed: ${e.message}`);
   }
+
+  // Warm up the embedding daemon so the nomic-embed-text-v1.5 model is
+  // cached and loaded before the first Grep call. The daemon eagerly
+  // calls `embedder.load()` on startup (fire-and-forget), which downloads
+  // the model to ~/.cache/huggingface/hub/ on first run (~130 MB q8 /
+  // ~500 MB fp32) and keeps it resident for the lifetime of the process.
+  // `warmup()` itself just ensures the socket is accepting connections;
+  // the actual model download runs in the daemon's background — so this
+  // hook stays quick even on a cold install. Opt-out via
+  // HIVEMIND_EMBED_WARMUP=false for sessions that will never touch the
+  // memory path (lightweight CC runs, no-network CI).
+  if (process.env.HIVEMIND_EMBED_WARMUP !== "false") {
+    try {
+      const daemonEntry = join(__bundleDir, "embeddings", "embed-daemon.js");
+      const client = new EmbedClient({ daemonEntry, timeoutMs: 300, spawnWaitMs: 5000 });
+      const ok = await client.warmup();
+      log(`embed daemon warmup: ${ok ? "ok" : "failed"}`);
+    } catch (e: any) {
+      log(`embed daemon warmup threw: ${e.message}`);
+    }
+  } else {
+    log("embed daemon warmup skipped via HIVEMIND_EMBED_WARMUP=false");
+  }
 }
 
 main().catch((e) => { log(`fatal: ${e.message}`); process.exit(0); });

From 6402e350f4becac4874ab662cd77986b666bd9a4 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Thu, 23 Apr 2026 07:34:39 +0000
Subject: [PATCH 17/30] feat(embeddings): unified HIVEMIND_EMBEDDINGS=false
 kill-switch + schema auto-migrate
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The existing opt-out story was scattered across three independent
flags: HIVEMIND_SEMANTIC_SEARCH=false (query-time), HIVEMIND_EMBED_WARMUP=false
(session-start spawn), and HIVEMIND_CAPTURE=false (write path — but
that takes out capture entirely, not just the embed call inside it).
There was no single lever to say "I want the plugin without the
embedding feature at all, don't spawn the daemon, don't download the
model".

Adds one: HIVEMIND_EMBEDDINGS=false short-circuits every call site
that would otherwise talk to the nomic daemon —

- src/hooks/grep-direct.ts         (query-time embed for Grep tool)
- src/shell/grep-interceptor.ts    (query-time embed for bash grep)
- src/hooks/capture.ts             (write-time embed before INSERT)
- src/shell/deeplake-fs.ts         (batched write-time embed in _doFlush)
- src/hooks/session-start-setup.ts (SessionStart daemon warmup)

The two per-feature flags keep working; HIVEMIND_EMBEDDINGS=false is
the superset that kills all of them. Writes still succeed — the
embedding columns land as NULL — so toggling the flag is reversible
without rewriting existing rows.

Schema migration
---------------
Paired with this: ensureTable and ensureSessionsTable now issue
ALTER TABLE ... ADD COLUMN IF NOT EXISTS for summary_embedding /
message_embedding on tables that existed before the embeddings
feature shipped. Wrapped in try/catch so backends that don't support
ADD COLUMN IF NOT EXISTS (older Deeplake snapshots) log the skip and
carry on — the write path already tolerates the column being absent.

Users upgrading from 0.6.x pick the column up automatically on their
next SessionStart without having to re-ingest.

Tests
-----
- claude-code/tests/embeddings-disable.test.ts: unit test for the
  embeddingsDisabled() helper (default false, "false" → true, other
  strings stay false)
- session-start-setup-hook.test.ts: new case for the master flag
  (alongside the existing HIVEMIND_EMBED_WARMUP case)
- deeplake-api.test.ts: rewrote the "table already exists" /
  "lookup-index already set up" cases to expect the new ALTER calls,
  plus a dedicated assertion that ALTER failures are swallowed
  so older backends keep working

All 1 113 tests pass. Per-file coverage thresholds unchanged.
---
 claude-code/bundle/capture.js                 | 20 ++++++-
 claude-code/bundle/commands/auth-login.js     | 12 ++++
 claude-code/bundle/pre-tool-use.js            | 19 +++++-
 claude-code/bundle/session-start-setup.js     | 21 ++++++-
 claude-code/bundle/session-start.js           | 12 ++++
 claude-code/bundle/shell/deeplake-shell.js    | 21 ++++++-
 claude-code/tests/deeplake-api.test.ts        | 59 ++++++++++++++-----
 claude-code/tests/embeddings-disable.test.ts  | 38 ++++++++++++
 .../tests/session-start-setup-hook.test.ts    |  8 +++
 codex/bundle/capture.js                       | 12 ++++
 codex/bundle/commands/auth-login.js           | 12 ++++
 codex/bundle/pre-tool-use.js                  | 19 +++++-
 codex/bundle/session-start-setup.js           | 12 ++++
 codex/bundle/shell/deeplake-shell.js          | 21 ++++++-
 codex/bundle/stop.js                          | 12 ++++
 src/deeplake-api.ts                           | 22 +++++++
 src/embeddings/disable.ts                     | 22 +++++++
 src/hooks/capture.ts                          |  8 ++-
 src/hooks/grep-direct.ts                      |  3 +-
 src/hooks/session-start-setup.ts              |  5 +-
 src/shell/deeplake-fs.ts                      |  5 ++
 src/shell/grep-interceptor.ts                 |  3 +-
 22 files changed, 340 insertions(+), 26 deletions(-)
 create mode 100644 claude-code/tests/embeddings-disable.test.ts
 create mode 100644 src/embeddings/disable.ts

diff --git a/claude-code/bundle/capture.js b/claude-code/bundle/capture.js
index 9942c48..9d8c739 100755
--- a/claude-code/bundle/capture.js
+++ b/claude-code/bundle/capture.js
@@ -374,6 +374,12 @@ var DeeplakeApi = class {
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${tbl}" ADD COLUMN IF NOT EXISTS summary_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add summary_embedding skipped: ${e.message}`);
+      }
     }
   }
   /** Create the sessions table (uses JSONB for message since every row is a JSON event). */
@@ -385,6 +391,12 @@ var DeeplakeApi = class {
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${name}" ADD COLUMN IF NOT EXISTS message_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add message_embedding skipped: ${e.message}`);
+      }
     }
     await this.ensureLookupIndex(name, "path_creation_date", `("path", "creation_date")`);
   }
@@ -887,6 +899,11 @@ function embeddingSqlLiteral(vec) {
   return `ARRAY[${parts.join(",")}]::float4[]`;
 }
 
+// dist/src/embeddings/disable.js
+function embeddingsDisabled() {
+  return process.env.HIVEMIND_EMBEDDINGS === "false";
+}
+
 // dist/src/hooks/capture.js
 import { fileURLToPath as fileURLToPath2 } from "node:url";
 import { dirname as dirname2, join as join7 } from "node:path";
@@ -956,8 +973,7 @@ async function main() {
   const projectName = (input.cwd ?? "").split("/").pop() || "unknown";
   const filename = sessionPath.split("/").pop() ?? "";
   const jsonForSql = line.replace(/'/g, "''");
-  const embedClient = new EmbedClient({ daemonEntry: resolveEmbedDaemonPath() });
-  const embedding = await embedClient.embed(line, "document");
+  const embedding = embeddingsDisabled() ? null : await new EmbedClient({ daemonEntry: resolveEmbedDaemonPath() }).embed(line, "document");
   const embeddingSql = embeddingSqlLiteral(embedding);
   const insertSql = `INSERT INTO "${sessionsTable}" (id, path, filename, message, message_embedding, author, size_bytes, project, description, agent, creation_date, last_update_date) VALUES ('${crypto.randomUUID()}', '${sqlStr(sessionPath)}', '${sqlStr(filename)}', '${jsonForSql}'::jsonb, ${embeddingSql}, '${sqlStr(config.userName)}', ${Buffer.byteLength(line, "utf-8")}, '${sqlStr(projectName)}', '${sqlStr(input.hook_event_name ?? "")}', 'claude_code', '${ts}', '${ts}')`;
   try {
diff --git a/claude-code/bundle/commands/auth-login.js b/claude-code/bundle/commands/auth-login.js
index d21dbdb..8714067 100755
--- a/claude-code/bundle/commands/auth-login.js
+++ b/claude-code/bundle/commands/auth-login.js
@@ -555,6 +555,12 @@ var DeeplakeApi = class {
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${tbl}" ADD COLUMN IF NOT EXISTS summary_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add summary_embedding skipped: ${e.message}`);
+      }
     }
   }
   /** Create the sessions table (uses JSONB for message since every row is a JSON event). */
@@ -566,6 +572,12 @@ var DeeplakeApi = class {
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${name}" ADD COLUMN IF NOT EXISTS message_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add message_embedding skipped: ${e.message}`);
+      }
     }
     await this.ensureLookupIndex(name, "path_creation_date", `("path", "creation_date")`);
   }
diff --git a/claude-code/bundle/pre-tool-use.js b/claude-code/bundle/pre-tool-use.js
index 86964e8..4daedfa 100755
--- a/claude-code/bundle/pre-tool-use.js
+++ b/claude-code/bundle/pre-tool-use.js
@@ -380,6 +380,12 @@ var DeeplakeApi = class {
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${tbl}" ADD COLUMN IF NOT EXISTS summary_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add summary_embedding skipped: ${e.message}`);
+      }
     }
   }
   /** Create the sessions table (uses JSONB for message since every row is a JSON event). */
@@ -391,6 +397,12 @@ var DeeplakeApi = class {
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${name}" ADD COLUMN IF NOT EXISTS message_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add message_embedding skipped: ${e.message}`);
+      }
     }
     await this.ensureLookupIndex(name, "path_creation_date", `("path", "creation_date")`);
   }
@@ -1121,10 +1133,15 @@ function sleep2(ms) {
   return new Promise((r) => setTimeout(r, ms));
 }
 
+// dist/src/embeddings/disable.js
+function embeddingsDisabled() {
+  return process.env.HIVEMIND_EMBEDDINGS === "false";
+}
+
 // dist/src/hooks/grep-direct.js
 import { fileURLToPath as fileURLToPath2 } from "node:url";
 import { dirname, join as join4 } from "node:path";
-var SEMANTIC_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false";
+var SEMANTIC_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false" && !embeddingsDisabled();
 var SEMANTIC_TIMEOUT_MS = Number(process.env.HIVEMIND_SEMANTIC_EMBED_TIMEOUT_MS ?? "500");
 function resolveDaemonPath() {
   return join4(dirname(fileURLToPath2(import.meta.url)), "..", "embeddings", "embed-daemon.js");
diff --git a/claude-code/bundle/session-start-setup.js b/claude-code/bundle/session-start-setup.js
index cac8456..622ddf7 100755
--- a/claude-code/bundle/session-start-setup.js
+++ b/claude-code/bundle/session-start-setup.js
@@ -385,6 +385,12 @@ var DeeplakeApi = class {
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${tbl}" ADD COLUMN IF NOT EXISTS summary_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add summary_embedding skipped: ${e.message}`);
+      }
     }
   }
   /** Create the sessions table (uses JSONB for message since every row is a JSON event). */
@@ -396,6 +402,12 @@ var DeeplakeApi = class {
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${name}" ADD COLUMN IF NOT EXISTS message_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add message_embedding skipped: ${e.message}`);
+      }
     }
     await this.ensureLookupIndex(name, "path_creation_date", `("path", "creation_date")`);
   }
@@ -764,6 +776,11 @@ function sleep2(ms) {
   return new Promise((r) => setTimeout(r, ms));
 }
 
+// dist/src/embeddings/disable.js
+function embeddingsDisabled() {
+  return process.env.HIVEMIND_EMBEDDINGS === "false";
+}
+
 // dist/src/hooks/session-start-setup.js
 var log4 = (msg) => log("session-setup", msg);
 var __bundleDir = dirname3(fileURLToPath(import.meta.url));
@@ -837,7 +854,9 @@ async function main() {
   } catch (e) {
     log4(`version check failed: ${e.message}`);
   }
-  if (process.env.HIVEMIND_EMBED_WARMUP !== "false") {
+  if (embeddingsDisabled()) {
+    log4("embed daemon warmup skipped via HIVEMIND_EMBEDDINGS=false");
+  } else if (process.env.HIVEMIND_EMBED_WARMUP !== "false") {
     try {
       const daemonEntry = join8(__bundleDir, "embeddings", "embed-daemon.js");
       const client = new EmbedClient({ daemonEntry, timeoutMs: 300, spawnWaitMs: 5e3 });
diff --git a/claude-code/bundle/session-start.js b/claude-code/bundle/session-start.js
index 2a737f3..3b34266 100755
--- a/claude-code/bundle/session-start.js
+++ b/claude-code/bundle/session-start.js
@@ -385,6 +385,12 @@ var DeeplakeApi = class {
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${tbl}" ADD COLUMN IF NOT EXISTS summary_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add summary_embedding skipped: ${e.message}`);
+      }
     }
   }
   /** Create the sessions table (uses JSONB for message since every row is a JSON event). */
@@ -396,6 +402,12 @@ var DeeplakeApi = class {
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${name}" ADD COLUMN IF NOT EXISTS message_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add message_embedding skipped: ${e.message}`);
+      }
     }
     await this.ensureLookupIndex(name, "path_creation_date", `("path", "creation_date")`);
   }
diff --git a/claude-code/bundle/shell/deeplake-shell.js b/claude-code/bundle/shell/deeplake-shell.js
index 825e008..18e11f9 100755
--- a/claude-code/bundle/shell/deeplake-shell.js
+++ b/claude-code/bundle/shell/deeplake-shell.js
@@ -67077,6 +67077,12 @@ var DeeplakeApi = class {
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${tbl}" ADD COLUMN IF NOT EXISTS summary_embedding FLOAT4[]`);
+      } catch (e6) {
+        log2(`ALTER TABLE add summary_embedding skipped: ${e6.message}`);
+      }
     }
   }
   /** Create the sessions table (uses JSONB for message since every row is a JSON event). */
@@ -67088,6 +67094,12 @@ var DeeplakeApi = class {
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${name}" ADD COLUMN IF NOT EXISTS message_embedding FLOAT4[]`);
+      } catch (e6) {
+        log2(`ALTER TABLE add message_embedding skipped: ${e6.message}`);
+      }
     }
     await this.ensureLookupIndex(name, "path_creation_date", `("path", "creation_date")`);
   }
@@ -67769,6 +67781,11 @@ function embeddingSqlLiteral(vec) {
   return `ARRAY[${parts.join(",")}]::float4[]`;
 }
 
+// dist/src/embeddings/disable.js
+function embeddingsDisabled() {
+  return process.env.HIVEMIND_EMBEDDINGS === "false";
+}
+
 // dist/src/shell/deeplake-fs.js
 var BATCH_SIZE = 10;
 var PREFETCH_BATCH_SIZE = 50;
@@ -67949,6 +67966,8 @@ var DeeplakeFs = class _DeeplakeFs {
   async computeEmbeddings(rows) {
     if (rows.length === 0)
       return [];
+    if (embeddingsDisabled())
+      return rows.map(() => null);
     if (!this.embedClient) {
       this.embedClient = new EmbedClient({ daemonEntry: resolveEmbedDaemonPath() });
     }
@@ -69396,7 +69415,7 @@ var lib_default = yargsParser;
 // dist/src/shell/grep-interceptor.js
 import { fileURLToPath as fileURLToPath2 } from "node:url";
 import { dirname as dirname5, join as join8 } from "node:path";
-var SEMANTIC_SEARCH_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false";
+var SEMANTIC_SEARCH_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false" && !embeddingsDisabled();
 var SEMANTIC_EMBED_TIMEOUT_MS = Number(process.env.HIVEMIND_SEMANTIC_EMBED_TIMEOUT_MS ?? "500");
 function resolveGrepEmbedDaemonPath() {
   return join8(dirname5(fileURLToPath2(import.meta.url)), "..", "embeddings", "embed-daemon.js");
diff --git a/claude-code/tests/deeplake-api.test.ts b/claude-code/tests/deeplake-api.test.ts
index e3e1b59..a4b9099 100644
--- a/claude-code/tests/deeplake-api.test.ts
+++ b/claude-code/tests/deeplake-api.test.ts
@@ -406,15 +406,29 @@ describe("DeeplakeApi.ensureTable", () => {
     expect(createSql).toContain("USING deeplake");
   });
 
-  it("does nothing when table already exists", async () => {
-    // BM25 index creation is disabled (oid bug), so ensureTable only calls listTables
+  it("issues ALTER TABLE ADD COLUMN IF NOT EXISTS for the embedding column when the table already exists", async () => {
     mockFetch.mockResolvedValueOnce({
       ok: true, status: 200,
       json: async () => ({ tables: [{ table_name: "my_table" }] }),
     });
+    mockFetch.mockResolvedValueOnce(jsonResponse({}));
     const api = makeApi("my_table");
     await api.ensureTable();
-    expect(mockFetch).toHaveBeenCalledOnce(); // only listTables, no CREATE
+    expect(mockFetch).toHaveBeenCalledTimes(2); // listTables + ALTER
+    const alterSql = JSON.parse(mockFetch.mock.calls[1][1].body).query;
+    expect(alterSql).toContain("ALTER TABLE");
+    expect(alterSql).toContain("my_table");
+    expect(alterSql).toContain("ADD COLUMN IF NOT EXISTS summary_embedding FLOAT4[]");
+  });
+
+  it("swallows ALTER TABLE errors (older backend without ADD COLUMN IF NOT EXISTS)", async () => {
+    mockFetch.mockResolvedValueOnce({
+      ok: true, status: 200,
+      json: async () => ({ tables: [{ table_name: "my_table" }] }),
+    });
+    mockFetch.mockResolvedValueOnce(jsonResponse("syntax error", 400));
+    const api = makeApi("my_table");
+    await expect(api.ensureTable()).resolves.toBeUndefined();
   });
 
   it("creates table with custom name", async () => {
@@ -434,18 +448,22 @@ describe("DeeplakeApi.ensureTable", () => {
       ok: true, status: 200,
       json: async () => ({ tables: [{ table_name: "memory" }] }),
     });
-    mockFetch.mockResolvedValueOnce(jsonResponse({}));
-    mockFetch.mockResolvedValueOnce(jsonResponse({}));
+    mockFetch.mockResolvedValueOnce(jsonResponse({})); // ALTER memory
+    mockFetch.mockResolvedValueOnce(jsonResponse({})); // CREATE sessions
+    mockFetch.mockResolvedValueOnce(jsonResponse({})); // CREATE INDEX
     const api = makeApi("memory");
 
     await api.ensureTable();
     await api.ensureSessionsTable("sessions");
 
-    expect(mockFetch).toHaveBeenCalledTimes(3);
-    const createSql = JSON.parse(mockFetch.mock.calls[1][1].body).query;
+    expect(mockFetch).toHaveBeenCalledTimes(4);
+    const alterSql = JSON.parse(mockFetch.mock.calls[1][1].body).query;
+    expect(alterSql).toContain("ALTER TABLE");
+    expect(alterSql).toContain("summary_embedding");
+    const createSql = JSON.parse(mockFetch.mock.calls[2][1].body).query;
     expect(createSql).toContain("CREATE TABLE IF NOT EXISTS");
     expect(createSql).toContain("sessions");
-    const indexSql = JSON.parse(mockFetch.mock.calls[2][1].body).query;
+    const indexSql = JSON.parse(mockFetch.mock.calls[3][1].body).query;
     expect(indexSql).toContain("CREATE INDEX IF NOT EXISTS");
     expect(indexSql).toContain("\"path\"");
     expect(indexSql).toContain("\"creation_date\"");
@@ -475,16 +493,20 @@ describe("DeeplakeApi.ensureSessionsTable", () => {
     expect(indexSql).toContain("(\"path\", \"creation_date\")");
   });
 
-  it("ensures the lookup index when sessions table already exists", async () => {
+  it("adds message_embedding column and ensures the lookup index when sessions table already exists", async () => {
     mockFetch.mockResolvedValueOnce({
       ok: true, status: 200,
       json: async () => ({ tables: [{ table_name: "sessions" }] }),
     });
-    mockFetch.mockResolvedValueOnce(jsonResponse({}));
+    mockFetch.mockResolvedValueOnce(jsonResponse({})); // ALTER
+    mockFetch.mockResolvedValueOnce(jsonResponse({})); // CREATE INDEX
     const api = makeApi();
     await api.ensureSessionsTable("sessions");
-    expect(mockFetch).toHaveBeenCalledTimes(2);
-    const indexSql = JSON.parse(mockFetch.mock.calls[1][1].body).query;
+    expect(mockFetch).toHaveBeenCalledTimes(3);
+    const alterSql = JSON.parse(mockFetch.mock.calls[1][1].body).query;
+    expect(alterSql).toContain("ALTER TABLE");
+    expect(alterSql).toContain("message_embedding FLOAT4[]");
+    const indexSql = JSON.parse(mockFetch.mock.calls[2][1].body).query;
     expect(indexSql).toContain("CREATE INDEX IF NOT EXISTS");
   });
 
@@ -493,11 +515,12 @@ describe("DeeplakeApi.ensureSessionsTable", () => {
       ok: true, status: 200,
       json: async () => ({ tables: [{ table_name: "sessions" }] }),
     });
+    mockFetch.mockResolvedValueOnce(jsonResponse({})); // ALTER ok
     mockFetch.mockResolvedValueOnce(jsonResponse("forbidden", 403));
     const api = makeApi();
 
     await expect(api.ensureSessionsTable("sessions")).resolves.toBeUndefined();
-    expect(mockFetch).toHaveBeenCalledTimes(2);
+    expect(mockFetch).toHaveBeenCalledTimes(3);
   });
 
   it("treats duplicate concurrent index creation errors as success and records a local marker", async () => {
@@ -505,15 +528,23 @@ describe("DeeplakeApi.ensureSessionsTable", () => {
       ok: true, status: 200,
       json: async () => ({ tables: [{ table_name: "sessions" }] }),
     });
+    mockFetch.mockResolvedValueOnce(jsonResponse({})); // ALTER ok
     mockFetch.mockResolvedValueOnce(jsonResponse("duplicate key value violates unique constraint \"pg_class_relname_nsp_index\"", 400));
 
     const api = makeApi();
     await expect(api.ensureSessionsTable("sessions")).resolves.toBeUndefined();
 
     mockFetch.mockReset();
+    mockFetch.mockResolvedValueOnce(jsonResponse({})); // ALTER re-runs on 2nd call
     await api.ensureSessionsTable("sessions");
 
-    expect(mockFetch).not.toHaveBeenCalled();
+    // On the second call: listTables is cached, the index marker short-
+    // circuits the CREATE INDEX, but ALTER TABLE ADD COLUMN IF NOT EXISTS
+    // still fires once — it's cheap (the backend no-ops when the column
+    // already exists) and leaves the migration idempotent across versions.
+    expect(mockFetch).toHaveBeenCalledTimes(1);
+    const secondCallSql = JSON.parse(mockFetch.mock.calls[0][1].body).query;
+    expect(secondCallSql).toContain("ALTER TABLE");
   });
 });
 
diff --git a/claude-code/tests/embeddings-disable.test.ts b/claude-code/tests/embeddings-disable.test.ts
new file mode 100644
index 0000000..9a8d527
--- /dev/null
+++ b/claude-code/tests/embeddings-disable.test.ts
@@ -0,0 +1,38 @@
+import { describe, it, expect, beforeEach, afterEach } from "vitest";
+import { embeddingsDisabled } from "../../src/embeddings/disable.js";
+
+describe("embeddingsDisabled()", () => {
+  const original = process.env.HIVEMIND_EMBEDDINGS;
+
+  beforeEach(() => {
+    delete process.env.HIVEMIND_EMBEDDINGS;
+  });
+
+  afterEach(() => {
+    if (original === undefined) delete process.env.HIVEMIND_EMBEDDINGS;
+    else process.env.HIVEMIND_EMBEDDINGS = original;
+  });
+
+  it("returns false when the env var is unset (default behaviour)", () => {
+    expect(embeddingsDisabled()).toBe(false);
+  });
+
+  it("returns true only when explicitly set to the string 'false'", () => {
+    process.env.HIVEMIND_EMBEDDINGS = "false";
+    expect(embeddingsDisabled()).toBe(true);
+  });
+
+  it("stays off for any non-'false' truthy value (intentional: avoid surprise kills)", () => {
+    process.env.HIVEMIND_EMBEDDINGS = "0";
+    expect(embeddingsDisabled()).toBe(false);
+
+    process.env.HIVEMIND_EMBEDDINGS = "no";
+    expect(embeddingsDisabled()).toBe(false);
+
+    process.env.HIVEMIND_EMBEDDINGS = "true";
+    expect(embeddingsDisabled()).toBe(false);
+
+    process.env.HIVEMIND_EMBEDDINGS = "";
+    expect(embeddingsDisabled()).toBe(false);
+  });
+});
diff --git a/claude-code/tests/session-start-setup-hook.test.ts b/claude-code/tests/session-start-setup-hook.test.ts
index abf88d4..9a4484d 100644
--- a/claude-code/tests/session-start-setup-hook.test.ts
+++ b/claude-code/tests/session-start-setup-hook.test.ts
@@ -252,6 +252,14 @@ describe("session-start-setup hook — embed daemon warmup", () => {
       "embed daemon warmup skipped via HIVEMIND_EMBED_WARMUP=false",
     );
   });
+
+  it("skips warmup when the master HIVEMIND_EMBEDDINGS=false flag is set", async () => {
+    await runHook({ HIVEMIND_EMBEDDINGS: "false" });
+    expect(embedWarmupMock).not.toHaveBeenCalled();
+    expect(debugLogMock).toHaveBeenCalledWith(
+      "embed daemon warmup skipped via HIVEMIND_EMBEDDINGS=false",
+    );
+  });
 });
 
 describe("session-start-setup hook — fatal catch", () => {
diff --git a/codex/bundle/capture.js b/codex/bundle/capture.js
index 7e15b40..7cdf620 100755
--- a/codex/bundle/capture.js
+++ b/codex/bundle/capture.js
@@ -374,6 +374,12 @@ var DeeplakeApi = class {
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${tbl}" ADD COLUMN IF NOT EXISTS summary_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add summary_embedding skipped: ${e.message}`);
+      }
     }
   }
   /** Create the sessions table (uses JSONB for message since every row is a JSON event). */
@@ -385,6 +391,12 @@ var DeeplakeApi = class {
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${name}" ADD COLUMN IF NOT EXISTS message_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add message_embedding skipped: ${e.message}`);
+      }
     }
     await this.ensureLookupIndex(name, "path_creation_date", `("path", "creation_date")`);
   }
diff --git a/codex/bundle/commands/auth-login.js b/codex/bundle/commands/auth-login.js
index d21dbdb..8714067 100755
--- a/codex/bundle/commands/auth-login.js
+++ b/codex/bundle/commands/auth-login.js
@@ -555,6 +555,12 @@ var DeeplakeApi = class {
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${tbl}" ADD COLUMN IF NOT EXISTS summary_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add summary_embedding skipped: ${e.message}`);
+      }
     }
   }
   /** Create the sessions table (uses JSONB for message since every row is a JSON event). */
@@ -566,6 +572,12 @@ var DeeplakeApi = class {
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${name}" ADD COLUMN IF NOT EXISTS message_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add message_embedding skipped: ${e.message}`);
+      }
     }
     await this.ensureLookupIndex(name, "path_creation_date", `("path", "creation_date")`);
   }
diff --git a/codex/bundle/pre-tool-use.js b/codex/bundle/pre-tool-use.js
index 2cc0001..552b425 100755
--- a/codex/bundle/pre-tool-use.js
+++ b/codex/bundle/pre-tool-use.js
@@ -380,6 +380,12 @@ var DeeplakeApi = class {
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${tbl}" ADD COLUMN IF NOT EXISTS summary_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add summary_embedding skipped: ${e.message}`);
+      }
     }
   }
   /** Create the sessions table (uses JSONB for message since every row is a JSON event). */
@@ -391,6 +397,12 @@ var DeeplakeApi = class {
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${name}" ADD COLUMN IF NOT EXISTS message_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add message_embedding skipped: ${e.message}`);
+      }
     }
     await this.ensureLookupIndex(name, "path_creation_date", `("path", "creation_date")`);
   }
@@ -1107,10 +1119,15 @@ function sleep2(ms) {
   return new Promise((r) => setTimeout(r, ms));
 }
 
+// dist/src/embeddings/disable.js
+function embeddingsDisabled() {
+  return process.env.HIVEMIND_EMBEDDINGS === "false";
+}
+
 // dist/src/hooks/grep-direct.js
 import { fileURLToPath } from "node:url";
 import { dirname, join as join4 } from "node:path";
-var SEMANTIC_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false";
+var SEMANTIC_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false" && !embeddingsDisabled();
 var SEMANTIC_TIMEOUT_MS = Number(process.env.HIVEMIND_SEMANTIC_EMBED_TIMEOUT_MS ?? "500");
 function resolveDaemonPath() {
   return join4(dirname(fileURLToPath(import.meta.url)), "..", "embeddings", "embed-daemon.js");
diff --git a/codex/bundle/session-start-setup.js b/codex/bundle/session-start-setup.js
index b7c07ec..c854fcc 100755
--- a/codex/bundle/session-start-setup.js
+++ b/codex/bundle/session-start-setup.js
@@ -385,6 +385,12 @@ var DeeplakeApi = class {
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${tbl}" ADD COLUMN IF NOT EXISTS summary_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add summary_embedding skipped: ${e.message}`);
+      }
     }
   }
   /** Create the sessions table (uses JSONB for message since every row is a JSON event). */
@@ -396,6 +402,12 @@ var DeeplakeApi = class {
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${name}" ADD COLUMN IF NOT EXISTS message_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add message_embedding skipped: ${e.message}`);
+      }
     }
     await this.ensureLookupIndex(name, "path_creation_date", `("path", "creation_date")`);
   }
diff --git a/codex/bundle/shell/deeplake-shell.js b/codex/bundle/shell/deeplake-shell.js
index 825e008..18e11f9 100755
--- a/codex/bundle/shell/deeplake-shell.js
+++ b/codex/bundle/shell/deeplake-shell.js
@@ -67077,6 +67077,12 @@ var DeeplakeApi = class {
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${tbl}" ADD COLUMN IF NOT EXISTS summary_embedding FLOAT4[]`);
+      } catch (e6) {
+        log2(`ALTER TABLE add summary_embedding skipped: ${e6.message}`);
+      }
     }
   }
   /** Create the sessions table (uses JSONB for message since every row is a JSON event). */
@@ -67088,6 +67094,12 @@ var DeeplakeApi = class {
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${name}" ADD COLUMN IF NOT EXISTS message_embedding FLOAT4[]`);
+      } catch (e6) {
+        log2(`ALTER TABLE add message_embedding skipped: ${e6.message}`);
+      }
     }
     await this.ensureLookupIndex(name, "path_creation_date", `("path", "creation_date")`);
   }
@@ -67769,6 +67781,11 @@ function embeddingSqlLiteral(vec) {
   return `ARRAY[${parts.join(",")}]::float4[]`;
 }
 
+// dist/src/embeddings/disable.js
+function embeddingsDisabled() {
+  return process.env.HIVEMIND_EMBEDDINGS === "false";
+}
+
 // dist/src/shell/deeplake-fs.js
 var BATCH_SIZE = 10;
 var PREFETCH_BATCH_SIZE = 50;
@@ -67949,6 +67966,8 @@ var DeeplakeFs = class _DeeplakeFs {
   async computeEmbeddings(rows) {
     if (rows.length === 0)
       return [];
+    if (embeddingsDisabled())
+      return rows.map(() => null);
     if (!this.embedClient) {
       this.embedClient = new EmbedClient({ daemonEntry: resolveEmbedDaemonPath() });
     }
@@ -69396,7 +69415,7 @@ var lib_default = yargsParser;
 // dist/src/shell/grep-interceptor.js
 import { fileURLToPath as fileURLToPath2 } from "node:url";
 import { dirname as dirname5, join as join8 } from "node:path";
-var SEMANTIC_SEARCH_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false";
+var SEMANTIC_SEARCH_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false" && !embeddingsDisabled();
 var SEMANTIC_EMBED_TIMEOUT_MS = Number(process.env.HIVEMIND_SEMANTIC_EMBED_TIMEOUT_MS ?? "500");
 function resolveGrepEmbedDaemonPath() {
   return join8(dirname5(fileURLToPath2(import.meta.url)), "..", "embeddings", "embed-daemon.js");
diff --git a/codex/bundle/stop.js b/codex/bundle/stop.js
index 2e241b2..9e1563e 100755
--- a/codex/bundle/stop.js
+++ b/codex/bundle/stop.js
@@ -377,6 +377,12 @@ var DeeplakeApi = class {
       log2(`table "${tbl}" created`);
       if (!tables.includes(tbl))
         this._tablesCache = [...tables, tbl];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${tbl}" ADD COLUMN IF NOT EXISTS summary_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add summary_embedding skipped: ${e.message}`);
+      }
     }
   }
   /** Create the sessions table (uses JSONB for message since every row is a JSON event). */
@@ -388,6 +394,12 @@ var DeeplakeApi = class {
       log2(`table "${name}" created`);
       if (!tables.includes(name))
         this._tablesCache = [...tables, name];
+    } else {
+      try {
+        await this.query(`ALTER TABLE "${name}" ADD COLUMN IF NOT EXISTS message_embedding FLOAT4[]`);
+      } catch (e) {
+        log2(`ALTER TABLE add message_embedding skipped: ${e.message}`);
+      }
     }
     await this.ensureLookupIndex(name, "path_creation_date", `("path", "creation_date")`);
   }
diff --git a/src/deeplake-api.ts b/src/deeplake-api.ts
index ae5f25c..2933384 100644
--- a/src/deeplake-api.ts
+++ b/src/deeplake-api.ts
@@ -369,6 +369,19 @@ export class DeeplakeApi {
       );
       log(`table "${tbl}" created`);
       if (!tables.includes(tbl)) this._tablesCache = [...tables, tbl];
+    } else {
+      // Migrate older memory tables that were created before the embeddings
+      // feature landed. ADD COLUMN IF NOT EXISTS is idempotent on Postgres
+      // and Deeplake; we swallow errors because on backends that don't
+      // support it the column just stays absent and the embedding-column
+      // writes fall through to NULL (capture / flush tolerate that).
+      try {
+        await this.query(
+          `ALTER TABLE "${tbl}" ADD COLUMN IF NOT EXISTS summary_embedding FLOAT4[]`,
+        );
+      } catch (e: any) {
+        log(`ALTER TABLE add summary_embedding skipped: ${e.message}`);
+      }
     }
     // BM25 index disabled — CREATE INDEX causes intermittent oid errors on fresh tables.
     // See bm25-oid-bug.sh for reproduction. Re-enable once Deeplake fixes the oid invalidation.
@@ -403,6 +416,15 @@ export class DeeplakeApi {
       );
       log(`table "${name}" created`);
       if (!tables.includes(name)) this._tablesCache = [...tables, name];
+    } else {
+      // Same rationale as ensureTable: migrate pre-embeddings sessions tables.
+      try {
+        await this.query(
+          `ALTER TABLE "${name}" ADD COLUMN IF NOT EXISTS message_embedding FLOAT4[]`,
+        );
+      } catch (e: any) {
+        log(`ALTER TABLE add message_embedding skipped: ${e.message}`);
+      }
     }
     await this.ensureLookupIndex(name, "path_creation_date", `("path", "creation_date")`);
   }
diff --git a/src/embeddings/disable.ts b/src/embeddings/disable.ts
new file mode 100644
index 0000000..8c0db83
--- /dev/null
+++ b/src/embeddings/disable.ts
@@ -0,0 +1,22 @@
+/**
+ * Master opt-out for the embedding feature.
+ *
+ * `HIVEMIND_EMBEDDINGS=false` short-circuits every call site that would
+ * otherwise talk to the nomic daemon: the SessionStart warmup, the
+ * capture-side write embed, the batched flush embed in DeeplakeFs, and
+ * both grep query-time embed paths (direct + interceptor). The SQL
+ * schema still has the embedding columns and existing rows' embeddings
+ * remain readable, but no new embedding is computed and no daemon is
+ * spawned.
+ *
+ * Intended for: air-gapped / no-network installs, CI / benchmarks that
+ * want pure-lexical retrieval, and users who want the plugin's capture
+ * + grep without paying the ~110 MB nomic download.
+ *
+ * Read-once: honours mutations during the process lifetime; the hooks
+ * are short-lived subprocesses so a live toggle via `export` takes
+ * effect on the next session.
+ */
+export function embeddingsDisabled(): boolean {
+  return process.env.HIVEMIND_EMBEDDINGS === "false";
+}
diff --git a/src/hooks/capture.ts b/src/hooks/capture.ts
index 70e897f..1c5b3a3 100644
--- a/src/hooks/capture.ts
+++ b/src/hooks/capture.ts
@@ -23,6 +23,7 @@ import {
 import { bundleDirFromImportMeta, spawnWikiWorker, wikiLog } from "./spawn-wiki-worker.js";
 import { EmbedClient } from "../embeddings/client.js";
 import { embeddingSqlLiteral } from "../embeddings/sql.js";
+import { embeddingsDisabled } from "../embeddings/disable.js";
 import { fileURLToPath } from "node:url";
 import { dirname, join } from "node:path";
 const log = (msg: string) => _log("capture", msg);
@@ -123,8 +124,11 @@ async function main(): Promise<void> {
   // sqlStr() would also escape backslashes and strip control chars, corrupting the JSON.
   const jsonForSql = line.replace(/'/g, "''");
 
-  const embedClient = new EmbedClient({ daemonEntry: resolveEmbedDaemonPath() });
-  const embedding = await embedClient.embed(line, "document");
+  // Skip the daemon round-trip entirely when embeddings are globally disabled —
+  // the column stays NULL, schema-compatible with future re-enabling.
+  const embedding = embeddingsDisabled()
+    ? null
+    : await new EmbedClient({ daemonEntry: resolveEmbedDaemonPath() }).embed(line, "document");
   const embeddingSql = embeddingSqlLiteral(embedding);
 
   const insertSql =
diff --git a/src/hooks/grep-direct.ts b/src/hooks/grep-direct.ts
index 63598c5..789a1bc 100644
--- a/src/hooks/grep-direct.ts
+++ b/src/hooks/grep-direct.ts
@@ -9,10 +9,11 @@ import type { DeeplakeApi } from "../deeplake-api.js";
 import { grepBothTables, type GrepMatchParams } from "../shell/grep-core.js";
 import { capOutputForClaude } from "../utils/output-cap.js";
 import { EmbedClient } from "../embeddings/client.js";
+import { embeddingsDisabled } from "../embeddings/disable.js";
 import { fileURLToPath } from "node:url";
 import { dirname, join } from "node:path";
 
-const SEMANTIC_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false";
+const SEMANTIC_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false" && !embeddingsDisabled();
 const SEMANTIC_TIMEOUT_MS = Number(process.env.HIVEMIND_SEMANTIC_EMBED_TIMEOUT_MS ?? "500");
 
 function resolveDaemonPath(): string {
diff --git a/src/hooks/session-start-setup.ts b/src/hooks/session-start-setup.ts
index 661e9c7..6c62d9a 100644
--- a/src/hooks/session-start-setup.ts
+++ b/src/hooks/session-start-setup.ts
@@ -19,6 +19,7 @@ import { getInstalledVersion, getLatestVersion, isNewer } from "../utils/version
 import { makeWikiLogger } from "../utils/wiki-log.js";
 import { resolveVersionedPluginDir, snapshotPluginDir, restoreOrCleanup } from "../utils/plugin-cache.js";
 import { EmbedClient } from "../embeddings/client.js";
+import { embeddingsDisabled } from "../embeddings/disable.js";
 const log = (msg: string) => _log("session-setup", msg);
 
 const __bundleDir = dirname(fileURLToPath(import.meta.url));
@@ -115,7 +116,9 @@ async function main(): Promise<void> {
   // hook stays quick even on a cold install. Opt-out via
   // HIVEMIND_EMBED_WARMUP=false for sessions that will never touch the
   // memory path (lightweight CC runs, no-network CI).
-  if (process.env.HIVEMIND_EMBED_WARMUP !== "false") {
+  if (embeddingsDisabled()) {
+    log("embed daemon warmup skipped via HIVEMIND_EMBEDDINGS=false");
+  } else if (process.env.HIVEMIND_EMBED_WARMUP !== "false") {
     try {
       const daemonEntry = join(__bundleDir, "embeddings", "embed-daemon.js");
       const client = new EmbedClient({ daemonEntry, timeoutMs: 300, spawnWaitMs: 5000 });
diff --git a/src/shell/deeplake-fs.ts b/src/shell/deeplake-fs.ts
index 55e4101..24c3ba7 100644
--- a/src/shell/deeplake-fs.ts
+++ b/src/shell/deeplake-fs.ts
@@ -10,6 +10,7 @@ import type {
 import { normalizeContent } from "./grep-core.js";
 import { EmbedClient } from "../embeddings/client.js";
 import { embeddingSqlLiteral } from "../embeddings/sql.js";
+import { embeddingsDisabled } from "../embeddings/disable.js";
 
 interface ReadFileOptions { encoding?: BufferEncoding }
 interface WriteFileOptions { encoding?: BufferEncoding }
@@ -232,6 +233,10 @@ export class DeeplakeFs implements IFileSystem {
 
   private async computeEmbeddings(rows: PendingRow[]): Promise<(number[] | null)[]> {
     if (rows.length === 0) return [];
+    // Skip the daemon hop entirely when embeddings are globally disabled.
+    // upsertRow writes NULL for embedding columns when the value is null,
+    // so the INSERT / UPDATE shape stays identical.
+    if (embeddingsDisabled()) return rows.map(() => null);
     if (!this.embedClient) {
       this.embedClient = new EmbedClient({ daemonEntry: resolveEmbedDaemonPath() });
     }
diff --git a/src/shell/grep-interceptor.ts b/src/shell/grep-interceptor.ts
index 6992422..46f9613 100644
--- a/src/shell/grep-interceptor.ts
+++ b/src/shell/grep-interceptor.ts
@@ -5,6 +5,7 @@ import type { DeeplakeFs } from "./deeplake-fs.js";
 import { fileURLToPath } from "node:url";
 import { dirname, join } from "node:path";
 import { EmbedClient } from "../embeddings/client.js";
+import { embeddingsDisabled } from "../embeddings/disable.js";
 
 import {
   buildGrepSearchOptions,
@@ -16,7 +17,7 @@ import {
   type ContentRow,
 } from "./grep-core.js";
 
-const SEMANTIC_SEARCH_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false";
+const SEMANTIC_SEARCH_ENABLED = process.env.HIVEMIND_SEMANTIC_SEARCH !== "false" && !embeddingsDisabled();
 const SEMANTIC_EMBED_TIMEOUT_MS = Number(process.env.HIVEMIND_SEMANTIC_EMBED_TIMEOUT_MS ?? "500");
 
 function resolveGrepEmbedDaemonPath(): string {

From 0ec2139b785eb04d380f26383e2d9c3d04bce6a1 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Thu, 23 Apr 2026 07:51:54 +0000
Subject: [PATCH 18/30] feat(wiki-worker): embed the final summary before the
 memory upload
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

uploadSummary() was the last write path into the memory table that left
summary_embedding = NULL. The DeeplakeFs-backed flush already embedded
every row it touched, capture.ts already embedded every message, but
the wiki-worker's final summary — the long, purpose-built wiki-style
text that actually ought to be semantically retrievable — was going
to Deeplake with no embedding at all. As a result summaries were only
reachable from the lexical branch of the hybrid grep, never from the
cosine branch.

Changes:

- `uploadSummary()` now takes an optional `embedding: number[] | null`
  on UploadParams and threads it into both the UPDATE and the INSERT,
  serialized through `embeddingSqlLiteral()` so the literal is either
  `ARRAY[...]::float4[]` or bare SQL `NULL`. The column is kept in
  the same statement as `summary` / `description` (the single-UPDATE
  invariant from the module docstring still holds — see
  `deeplake-update-bug-repro.py`).
- Both `src/hooks/wiki-worker.ts` and `src/hooks/codex/wiki-worker.ts`
  call EmbedClient.embed(text, "document") right before uploadSummary,
  gated by `embeddingsDisabled()` and wrapped in try/catch. On any
  failure (daemon down, `HIVEMIND_EMBEDDINGS=false`, spawn fails) the
  summary still lands, just with NULL in the embedding column — so
  existing callers keep working and the row stays reachable via the
  lexical branch.

Retrieval already uses it: `searchDeeplakeTables` in grep-core already
joins memory.summary_embedding against the query vector when one is
present, gated by `WHERE summary_embedding IS NOT NULL`. No changes
needed there.

Existing pre-embedding summaries (older rows) still have NULL in the
column. They stay retrievable lexically; a one-shot back-fill script
to compute embeddings for the existing backlog is left as a separate
change so the first-principles write path lands cleanly here.

Tests:
- 5 new cases in upload-summary.test.ts covering ARRAY literal on
  UPDATE and INSERT, bare SQL NULL when the caller omits the
  embedding, explicit null, and the empty-array "daemon returned
  nothing" degenerate case. The existing "single UPDATE invariant"
  assertions still pass — summary, summary_embedding, size_bytes and
  description are all in the same statement.
- wiki-worker.test.ts and codex-wiki-worker.test.ts now mock
  EmbedClient so the EmbedClient import doesn't try to reach a real
  socket during unit tests; the mock returns a fixed vector and the
  existing uploadSummary-call assertions pass unchanged.

1 118 tests green.
---
 claude-code/bundle/wiki-worker.js           | 269 +++++++++++++++++++-
 claude-code/tests/codex-wiki-worker.test.ts |   7 +
 claude-code/tests/upload-summary.test.ts    |  59 +++++
 claude-code/tests/wiki-worker.test.ts       |   7 +
 codex/bundle/wiki-worker.js                 | 269 +++++++++++++++++++-
 src/hooks/codex/wiki-worker.ts              |  18 +-
 src/hooks/upload-summary.ts                 |  14 +-
 src/hooks/wiki-worker.ts                    |  18 +-
 8 files changed, 641 insertions(+), 20 deletions(-)

diff --git a/claude-code/bundle/wiki-worker.js b/claude-code/bundle/wiki-worker.js
index b2f974f..8dee999 100755
--- a/claude-code/bundle/wiki-worker.js
+++ b/claude-code/bundle/wiki-worker.js
@@ -1,9 +1,10 @@
 #!/usr/bin/env node
 
 // dist/src/hooks/wiki-worker.js
-import { readFileSync as readFileSync2, writeFileSync as writeFileSync2, existsSync as existsSync2, appendFileSync as appendFileSync2, mkdirSync as mkdirSync2, rmSync } from "node:fs";
+import { readFileSync as readFileSync3, writeFileSync as writeFileSync2, existsSync as existsSync3, appendFileSync as appendFileSync2, mkdirSync as mkdirSync2, rmSync } from "node:fs";
 import { execFileSync } from "node:child_process";
-import { join as join3 } from "node:path";
+import { dirname, join as join3 } from "node:path";
+import { fileURLToPath } from "node:url";
 
 // dist/src/utils/debug.js
 import { appendFileSync } from "node:fs";
@@ -107,6 +108,21 @@ function releaseLock(sessionId) {
 
 // dist/src/hooks/upload-summary.js
 import { randomUUID } from "node:crypto";
+
+// dist/src/embeddings/sql.js
+function embeddingSqlLiteral(vec) {
+  if (!vec || vec.length === 0)
+    return "NULL";
+  const parts = [];
+  for (const v of vec) {
+    if (!Number.isFinite(v))
+      return "NULL";
+    parts.push(String(v));
+  }
+  return `ARRAY[${parts.join(",")}]::float4[]`;
+}
+
+// dist/src/hooks/upload-summary.js
 function esc(s) {
   return s.replace(/\\/g, "\\\\").replace(/'/g, "''").replace(/[\x01-\x08\x0b\x0c\x0e-\x1f\x7f]/g, "");
 }
@@ -119,20 +135,247 @@ async function uploadSummary(query2, params) {
   const ts = params.ts ?? (/* @__PURE__ */ new Date()).toISOString();
   const desc = extractDescription(text);
   const sizeBytes = Buffer.byteLength(text);
+  const embSql = embeddingSqlLiteral(params.embedding ?? null);
   const existing = await query2(`SELECT path FROM "${tableName}" WHERE path = '${esc(vpath)}' LIMIT 1`);
   if (existing.length > 0) {
-    const sql2 = `UPDATE "${tableName}" SET summary = E'${esc(text)}', size_bytes = ${sizeBytes}, description = E'${esc(desc)}', last_update_date = '${ts}' WHERE path = '${esc(vpath)}'`;
+    const sql2 = `UPDATE "${tableName}" SET summary = E'${esc(text)}', summary_embedding = ${embSql}, size_bytes = ${sizeBytes}, description = E'${esc(desc)}', last_update_date = '${ts}' WHERE path = '${esc(vpath)}'`;
     await query2(sql2);
     return { path: "update", sql: sql2, descLength: desc.length, summaryLength: text.length };
   }
-  const sql = `INSERT INTO "${tableName}" (id, path, filename, summary, author, mime_type, size_bytes, project, description, agent, creation_date, last_update_date) VALUES ('${randomUUID()}', '${esc(vpath)}', '${esc(fname)}', E'${esc(text)}', '${esc(userName)}', 'text/markdown', ${sizeBytes}, '${esc(project)}', E'${esc(desc)}', '${esc(agent)}', '${ts}', '${ts}')`;
+  const sql = `INSERT INTO "${tableName}" (id, path, filename, summary, summary_embedding, author, mime_type, size_bytes, project, description, agent, creation_date, last_update_date) VALUES ('${randomUUID()}', '${esc(vpath)}', '${esc(fname)}', E'${esc(text)}', ${embSql}, '${esc(userName)}', 'text/markdown', ${sizeBytes}, '${esc(project)}', E'${esc(desc)}', '${esc(agent)}', '${ts}', '${ts}')`;
   await query2(sql);
   return { path: "insert", sql, descLength: desc.length, summaryLength: text.length };
 }
 
+// dist/src/embeddings/client.js
+import { connect } from "node:net";
+import { spawn } from "node:child_process";
+import { openSync as openSync2, closeSync as closeSync2, writeSync as writeSync2, unlinkSync as unlinkSync2, existsSync as existsSync2, readFileSync as readFileSync2 } from "node:fs";
+
+// dist/src/embeddings/protocol.js
+var DEFAULT_SOCKET_DIR = "/tmp";
+var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
+var DEFAULT_CLIENT_TIMEOUT_MS = 200;
+function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.sock`;
+}
+function pidPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.pid`;
+}
+
+// dist/src/embeddings/client.js
+var log2 = (m) => log("embed-client", m);
+function getUid() {
+  const uid = typeof process.getuid === "function" ? process.getuid() : void 0;
+  return uid !== void 0 ? String(uid) : process.env.USER ?? "default";
+}
+var EmbedClient = class {
+  socketPath;
+  pidPath;
+  timeoutMs;
+  daemonEntry;
+  autoSpawn;
+  spawnWaitMs;
+  nextId = 0;
+  constructor(opts = {}) {
+    const uid = getUid();
+    const dir = opts.socketDir ?? "/tmp";
+    this.socketPath = socketPathFor(uid, dir);
+    this.pidPath = pidPathFor(uid, dir);
+    this.timeoutMs = opts.timeoutMs ?? DEFAULT_CLIENT_TIMEOUT_MS;
+    this.daemonEntry = opts.daemonEntry ?? process.env.HIVEMIND_EMBED_DAEMON;
+    this.autoSpawn = opts.autoSpawn ?? true;
+    this.spawnWaitMs = opts.spawnWaitMs ?? 5e3;
+  }
+  /**
+   * Returns an embedding vector, or null on timeout/failure. Hooks MUST treat
+   * null as "skip embedding column" — never block the write path on us.
+   *
+   * Fire-and-forget spawn on miss: if the daemon isn't up, this call returns
+   * null AND kicks off a background spawn. The next call finds a ready daemon.
+   */
+  async embed(text, kind = "document") {
+    let sock;
+    try {
+      sock = await this.connectOnce();
+    } catch {
+      if (this.autoSpawn)
+        this.trySpawnDaemon();
+      return null;
+    }
+    try {
+      const id = String(++this.nextId);
+      const req = { op: "embed", id, kind, text };
+      const resp = await this.sendAndWait(sock, req);
+      if (resp.error || !("embedding" in resp) || !resp.embedding) {
+        log2(`embed err: ${resp.error ?? "no embedding"}`);
+        return null;
+      }
+      return resp.embedding;
+    } catch (e) {
+      const err = e instanceof Error ? e.message : String(e);
+      log2(`embed failed: ${err}`);
+      return null;
+    } finally {
+      try {
+        sock.end();
+      } catch {
+      }
+    }
+  }
+  /**
+   * Wait up to spawnWaitMs for the daemon to accept connections, spawning if
+   * necessary. Meant for SessionStart / long-running batches — not the hot path.
+   */
+  async warmup() {
+    try {
+      const s = await this.connectOnce();
+      s.end();
+      return true;
+    } catch {
+      if (!this.autoSpawn)
+        return false;
+      this.trySpawnDaemon();
+      try {
+        const s = await this.waitForSocket();
+        s.end();
+        return true;
+      } catch {
+        return false;
+      }
+    }
+  }
+  connectOnce() {
+    return new Promise((resolve, reject) => {
+      const sock = connect(this.socketPath);
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("connect timeout"));
+      }, this.timeoutMs);
+      sock.once("connect", () => {
+        clearTimeout(to);
+        resolve(sock);
+      });
+      sock.once("error", (e) => {
+        clearTimeout(to);
+        reject(e);
+      });
+    });
+  }
+  trySpawnDaemon() {
+    let fd;
+    try {
+      fd = openSync2(this.pidPath, "wx", 384);
+      writeSync2(fd, String(process.pid));
+    } catch (e) {
+      if (this.isPidFileStale()) {
+        try {
+          unlinkSync2(this.pidPath);
+        } catch {
+        }
+        try {
+          fd = openSync2(this.pidPath, "wx", 384);
+          writeSync2(fd, String(process.pid));
+        } catch {
+          return;
+        }
+      } else {
+        return;
+      }
+    }
+    if (!this.daemonEntry || !existsSync2(this.daemonEntry)) {
+      log2(`daemonEntry not configured or missing: ${this.daemonEntry}`);
+      try {
+        closeSync2(fd);
+        unlinkSync2(this.pidPath);
+      } catch {
+      }
+      return;
+    }
+    try {
+      const child = spawn(process.execPath, [this.daemonEntry], {
+        detached: true,
+        stdio: "ignore",
+        env: process.env
+      });
+      child.unref();
+      log2(`spawned daemon pid=${child.pid}`);
+    } finally {
+      closeSync2(fd);
+    }
+  }
+  isPidFileStale() {
+    try {
+      const raw = readFileSync2(this.pidPath, "utf-8").trim();
+      const pid = Number(raw);
+      if (!pid || Number.isNaN(pid))
+        return true;
+      try {
+        process.kill(pid, 0);
+        return false;
+      } catch {
+        return true;
+      }
+    } catch {
+      return true;
+    }
+  }
+  async waitForSocket() {
+    const deadline = Date.now() + this.spawnWaitMs;
+    let delay = 30;
+    while (Date.now() < deadline) {
+      await sleep(delay);
+      delay = Math.min(delay * 1.5, 300);
+      if (!existsSync2(this.socketPath))
+        continue;
+      try {
+        return await this.connectOnce();
+      } catch {
+      }
+    }
+    throw new Error("daemon did not become ready within spawnWaitMs");
+  }
+  sendAndWait(sock, req) {
+    return new Promise((resolve, reject) => {
+      let buf = "";
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("request timeout"));
+      }, this.timeoutMs);
+      sock.setEncoding("utf-8");
+      sock.on("data", (chunk) => {
+        buf += chunk;
+        const nl = buf.indexOf("\n");
+        if (nl === -1)
+          return;
+        const line = buf.slice(0, nl);
+        clearTimeout(to);
+        try {
+          resolve(JSON.parse(line));
+        } catch (e) {
+          reject(e);
+        }
+      });
+      sock.on("error", (e) => {
+        clearTimeout(to);
+        reject(e);
+      });
+      sock.write(JSON.stringify(req) + "\n");
+    });
+  }
+};
+function sleep(ms) {
+  return new Promise((r) => setTimeout(r, ms));
+}
+
+// dist/src/embeddings/disable.js
+function embeddingsDisabled() {
+  return process.env.HIVEMIND_EMBEDDINGS === "false";
+}
+
 // dist/src/hooks/wiki-worker.js
 var dlog2 = (msg) => log("wiki-worker", msg);
-var cfg = JSON.parse(readFileSync2(process.argv[2], "utf-8"));
+var cfg = JSON.parse(readFileSync3(process.argv[2], "utf-8"));
 var tmpDir = cfg.tmpDir;
 var tmpJsonl = join3(tmpDir, "session.jsonl");
 var tmpSummary = join3(tmpDir, "summary.md");
@@ -230,11 +473,20 @@ async function main() {
     } catch (e) {
       wlog(`claude -p failed: ${e.status ?? e.message}`);
     }
-    if (existsSync2(tmpSummary)) {
-      const text = readFileSync2(tmpSummary, "utf-8");
+    if (existsSync3(tmpSummary)) {
+      const text = readFileSync3(tmpSummary, "utf-8");
       if (text.trim()) {
         const fname = `${cfg.sessionId}.md`;
         const vpath = `/summaries/${cfg.userName}/${fname}`;
+        let embedding = null;
+        if (!embeddingsDisabled()) {
+          try {
+            const daemonEntry = join3(dirname(fileURLToPath(import.meta.url)), "embeddings", "embed-daemon.js");
+            embedding = await new EmbedClient({ daemonEntry }).embed(text, "document");
+          } catch (e) {
+            wlog(`summary embedding failed, writing NULL: ${e.message}`);
+          }
+        }
         const result = await uploadSummary(query, {
           tableName: cfg.memoryTable,
           vpath,
@@ -243,7 +495,8 @@ async function main() {
           project: cfg.project,
           agent: "claude_code",
           sessionId: cfg.sessionId,
-          text
+          text,
+          embedding
         });
         wlog(`uploaded ${vpath} (summary=${result.summaryLength}, desc=${result.descLength})`);
         try {
diff --git a/claude-code/tests/codex-wiki-worker.test.ts b/claude-code/tests/codex-wiki-worker.test.ts
index 6a4260a..9ff6127 100644
--- a/claude-code/tests/codex-wiki-worker.test.ts
+++ b/claude-code/tests/codex-wiki-worker.test.ts
@@ -19,6 +19,7 @@ const finalizeSummaryMock = vi.fn();
 const releaseLockMock = vi.fn();
 const uploadSummaryMock = vi.fn();
 const execFileSyncMock = vi.fn();
+const embedSummaryMock = vi.fn();
 
 vi.mock("../../src/hooks/summary-state.js", () => ({
   finalizeSummary: (...a: any[]) => finalizeSummaryMock(...a),
@@ -27,6 +28,11 @@ vi.mock("../../src/hooks/summary-state.js", () => ({
 vi.mock("../../src/hooks/upload-summary.js", () => ({
   uploadSummary: (...a: any[]) => uploadSummaryMock(...a),
 }));
+vi.mock("../../src/embeddings/client.js", () => ({
+  EmbedClient: class {
+    async embed(text: string, kind: string) { return embedSummaryMock(text, kind); }
+  },
+}));
 vi.mock("node:child_process", async () => {
   const actual = await vi.importActual<typeof import("node:child_process")>("node:child_process");
   return { ...actual, execFileSync: (...a: any[]) => execFileSyncMock(...a) };
@@ -94,6 +100,7 @@ beforeEach(() => {
   finalizeSummaryMock.mockReset();
   releaseLockMock.mockReset();
   uploadSummaryMock.mockReset().mockResolvedValue({ path: "insert", summaryLength: 80, descLength: 15, sql: "..." });
+  embedSummaryMock.mockReset().mockResolvedValue([0.1, 0.2, 0.3]);
   execFileSyncMock.mockReset();
 });
 
diff --git a/claude-code/tests/upload-summary.test.ts b/claude-code/tests/upload-summary.test.ts
index 56eb0e9..9918d7b 100644
--- a/claude-code/tests/upload-summary.test.ts
+++ b/claude-code/tests/upload-summary.test.ts
@@ -133,6 +133,65 @@ describe("uploadSummary — Deeplake single-UPDATE invariant", () => {
   });
 });
 
+describe("uploadSummary — summary_embedding column", () => {
+  it("INSERT path includes summary_embedding as ARRAY[...]::float4[] when an embedding is supplied", async () => {
+    const { fn, calls } = makeSpyQuery([[]]);
+    await uploadSummary(fn, {
+      ...BASE,
+      text: TEXT_WITH_WHAT_HAPPENED,
+      embedding: [0.1, -0.2, 0.3],
+    });
+    const insert = calls.find(c => /^INSERT INTO/i.test(c))!;
+    expect(insert).toContain("summary_embedding");
+    expect(insert).toContain("ARRAY[0.1,-0.2,0.3]::float4[]");
+  });
+
+  it("UPDATE path sets summary_embedding in the same statement as summary", async () => {
+    const { fn, calls } = makeSpyQuery([[{ path: BASE.vpath }]]);
+    await uploadSummary(fn, {
+      ...BASE,
+      text: TEXT_WITH_WHAT_HAPPENED,
+      embedding: [0.5, 0.25],
+    });
+    const update = calls.find(c => /^UPDATE/i.test(c))!;
+    expect(update).toContain("summary = E'");
+    expect(update).toContain("summary_embedding = ARRAY[0.5,0.25]::float4[]");
+  });
+
+  it("writes SQL NULL for summary_embedding when the caller omits the embedding", async () => {
+    const { fn, calls } = makeSpyQuery([[]]);
+    await uploadSummary(fn, { ...BASE, text: TEXT_WITH_WHAT_HAPPENED });
+    const insert = calls.find(c => /^INSERT INTO/i.test(c))!;
+    expect(insert).toContain("summary_embedding");
+    // The literal token must be the bare SQL NULL, not the string 'NULL'.
+    expect(insert).not.toContain("'NULL'");
+    expect(insert).toContain(", NULL, "); // bare NULL between surrounding values in VALUES (...)
+  });
+
+  it("writes SQL NULL when the caller explicitly passes embedding: null", async () => {
+    const { fn, calls } = makeSpyQuery([[{ path: BASE.vpath }]]);
+    await uploadSummary(fn, {
+      ...BASE,
+      text: TEXT_WITH_WHAT_HAPPENED,
+      embedding: null,
+    });
+    const update = calls.find(c => /^UPDATE/i.test(c))!;
+    expect(update).toContain("summary_embedding = NULL");
+  });
+
+  it("writes SQL NULL for an empty embedding array (daemon returned invalid)", async () => {
+    const { fn, calls } = makeSpyQuery([[]]);
+    await uploadSummary(fn, {
+      ...BASE,
+      text: TEXT_WITH_WHAT_HAPPENED,
+      embedding: [],
+    });
+    const insert = calls.find(c => /^INSERT INTO/i.test(c))!;
+    expect(insert).not.toContain("'NULL'");
+    expect(insert).toContain(", NULL, ");
+  });
+});
+
 describe("extractDescription", () => {
   it("extracts the What Happened section trimmed to 300 chars", () => {
     const d = extractDescription(TEXT_WITH_WHAT_HAPPENED);
diff --git a/claude-code/tests/wiki-worker.test.ts b/claude-code/tests/wiki-worker.test.ts
index f287cc1..dd16d04 100644
--- a/claude-code/tests/wiki-worker.test.ts
+++ b/claude-code/tests/wiki-worker.test.ts
@@ -27,6 +27,7 @@ const finalizeSummaryMock = vi.fn();
 const releaseLockMock = vi.fn();
 const uploadSummaryMock = vi.fn();
 const execFileSyncMock = vi.fn();
+const embedSummaryMock = vi.fn();
 
 vi.mock("../../src/hooks/summary-state.js", () => ({
   finalizeSummary: (...a: any[]) => finalizeSummaryMock(...a),
@@ -35,6 +36,11 @@ vi.mock("../../src/hooks/summary-state.js", () => ({
 vi.mock("../../src/hooks/upload-summary.js", () => ({
   uploadSummary: (...a: any[]) => uploadSummaryMock(...a),
 }));
+vi.mock("../../src/embeddings/client.js", () => ({
+  EmbedClient: class {
+    async embed(text: string, kind: string) { return embedSummaryMock(text, kind); }
+  },
+}));
 vi.mock("node:child_process", async () => {
   const actual = await vi.importActual<typeof import("node:child_process")>("node:child_process");
   return { ...actual, execFileSync: (...a: any[]) => execFileSyncMock(...a) };
@@ -107,6 +113,7 @@ beforeEach(() => {
   finalizeSummaryMock.mockReset();
   releaseLockMock.mockReset();
   uploadSummaryMock.mockReset().mockResolvedValue({ path: "insert", summaryLength: 100, descLength: 20, sql: "..." });
+  embedSummaryMock.mockReset().mockResolvedValue([0.1, 0.2, 0.3]);
   execFileSyncMock.mockReset();
 });
 
diff --git a/codex/bundle/wiki-worker.js b/codex/bundle/wiki-worker.js
index bf134ed..5fffb2e 100755
--- a/codex/bundle/wiki-worker.js
+++ b/codex/bundle/wiki-worker.js
@@ -1,9 +1,10 @@
 #!/usr/bin/env node
 
 // dist/src/hooks/codex/wiki-worker.js
-import { readFileSync as readFileSync2, writeFileSync as writeFileSync2, existsSync as existsSync2, appendFileSync as appendFileSync2, mkdirSync as mkdirSync2, rmSync } from "node:fs";
+import { readFileSync as readFileSync3, writeFileSync as writeFileSync2, existsSync as existsSync3, appendFileSync as appendFileSync2, mkdirSync as mkdirSync2, rmSync } from "node:fs";
 import { execFileSync } from "node:child_process";
-import { join as join3 } from "node:path";
+import { dirname, join as join3 } from "node:path";
+import { fileURLToPath } from "node:url";
 
 // dist/src/hooks/summary-state.js
 import { readFileSync, writeFileSync, writeSync, mkdirSync, renameSync, existsSync, unlinkSync, openSync, closeSync } from "node:fs";
@@ -106,6 +107,21 @@ function releaseLock(sessionId) {
 
 // dist/src/hooks/upload-summary.js
 import { randomUUID } from "node:crypto";
+
+// dist/src/embeddings/sql.js
+function embeddingSqlLiteral(vec) {
+  if (!vec || vec.length === 0)
+    return "NULL";
+  const parts = [];
+  for (const v of vec) {
+    if (!Number.isFinite(v))
+      return "NULL";
+    parts.push(String(v));
+  }
+  return `ARRAY[${parts.join(",")}]::float4[]`;
+}
+
+// dist/src/hooks/upload-summary.js
 function esc(s) {
   return s.replace(/\\/g, "\\\\").replace(/'/g, "''").replace(/[\x01-\x08\x0b\x0c\x0e-\x1f\x7f]/g, "");
 }
@@ -118,20 +134,247 @@ async function uploadSummary(query2, params) {
   const ts = params.ts ?? (/* @__PURE__ */ new Date()).toISOString();
   const desc = extractDescription(text);
   const sizeBytes = Buffer.byteLength(text);
+  const embSql = embeddingSqlLiteral(params.embedding ?? null);
   const existing = await query2(`SELECT path FROM "${tableName}" WHERE path = '${esc(vpath)}' LIMIT 1`);
   if (existing.length > 0) {
-    const sql2 = `UPDATE "${tableName}" SET summary = E'${esc(text)}', size_bytes = ${sizeBytes}, description = E'${esc(desc)}', last_update_date = '${ts}' WHERE path = '${esc(vpath)}'`;
+    const sql2 = `UPDATE "${tableName}" SET summary = E'${esc(text)}', summary_embedding = ${embSql}, size_bytes = ${sizeBytes}, description = E'${esc(desc)}', last_update_date = '${ts}' WHERE path = '${esc(vpath)}'`;
     await query2(sql2);
     return { path: "update", sql: sql2, descLength: desc.length, summaryLength: text.length };
   }
-  const sql = `INSERT INTO "${tableName}" (id, path, filename, summary, author, mime_type, size_bytes, project, description, agent, creation_date, last_update_date) VALUES ('${randomUUID()}', '${esc(vpath)}', '${esc(fname)}', E'${esc(text)}', '${esc(userName)}', 'text/markdown', ${sizeBytes}, '${esc(project)}', E'${esc(desc)}', '${esc(agent)}', '${ts}', '${ts}')`;
+  const sql = `INSERT INTO "${tableName}" (id, path, filename, summary, summary_embedding, author, mime_type, size_bytes, project, description, agent, creation_date, last_update_date) VALUES ('${randomUUID()}', '${esc(vpath)}', '${esc(fname)}', E'${esc(text)}', ${embSql}, '${esc(userName)}', 'text/markdown', ${sizeBytes}, '${esc(project)}', E'${esc(desc)}', '${esc(agent)}', '${ts}', '${ts}')`;
   await query2(sql);
   return { path: "insert", sql, descLength: desc.length, summaryLength: text.length };
 }
 
+// dist/src/embeddings/client.js
+import { connect } from "node:net";
+import { spawn } from "node:child_process";
+import { openSync as openSync2, closeSync as closeSync2, writeSync as writeSync2, unlinkSync as unlinkSync2, existsSync as existsSync2, readFileSync as readFileSync2 } from "node:fs";
+
+// dist/src/embeddings/protocol.js
+var DEFAULT_SOCKET_DIR = "/tmp";
+var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
+var DEFAULT_CLIENT_TIMEOUT_MS = 200;
+function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.sock`;
+}
+function pidPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.pid`;
+}
+
+// dist/src/embeddings/client.js
+var log2 = (m) => log("embed-client", m);
+function getUid() {
+  const uid = typeof process.getuid === "function" ? process.getuid() : void 0;
+  return uid !== void 0 ? String(uid) : process.env.USER ?? "default";
+}
+var EmbedClient = class {
+  socketPath;
+  pidPath;
+  timeoutMs;
+  daemonEntry;
+  autoSpawn;
+  spawnWaitMs;
+  nextId = 0;
+  constructor(opts = {}) {
+    const uid = getUid();
+    const dir = opts.socketDir ?? "/tmp";
+    this.socketPath = socketPathFor(uid, dir);
+    this.pidPath = pidPathFor(uid, dir);
+    this.timeoutMs = opts.timeoutMs ?? DEFAULT_CLIENT_TIMEOUT_MS;
+    this.daemonEntry = opts.daemonEntry ?? process.env.HIVEMIND_EMBED_DAEMON;
+    this.autoSpawn = opts.autoSpawn ?? true;
+    this.spawnWaitMs = opts.spawnWaitMs ?? 5e3;
+  }
+  /**
+   * Returns an embedding vector, or null on timeout/failure. Hooks MUST treat
+   * null as "skip embedding column" — never block the write path on us.
+   *
+   * Fire-and-forget spawn on miss: if the daemon isn't up, this call returns
+   * null AND kicks off a background spawn. The next call finds a ready daemon.
+   */
+  async embed(text, kind = "document") {
+    let sock;
+    try {
+      sock = await this.connectOnce();
+    } catch {
+      if (this.autoSpawn)
+        this.trySpawnDaemon();
+      return null;
+    }
+    try {
+      const id = String(++this.nextId);
+      const req = { op: "embed", id, kind, text };
+      const resp = await this.sendAndWait(sock, req);
+      if (resp.error || !("embedding" in resp) || !resp.embedding) {
+        log2(`embed err: ${resp.error ?? "no embedding"}`);
+        return null;
+      }
+      return resp.embedding;
+    } catch (e) {
+      const err = e instanceof Error ? e.message : String(e);
+      log2(`embed failed: ${err}`);
+      return null;
+    } finally {
+      try {
+        sock.end();
+      } catch {
+      }
+    }
+  }
+  /**
+   * Wait up to spawnWaitMs for the daemon to accept connections, spawning if
+   * necessary. Meant for SessionStart / long-running batches — not the hot path.
+   */
+  async warmup() {
+    try {
+      const s = await this.connectOnce();
+      s.end();
+      return true;
+    } catch {
+      if (!this.autoSpawn)
+        return false;
+      this.trySpawnDaemon();
+      try {
+        const s = await this.waitForSocket();
+        s.end();
+        return true;
+      } catch {
+        return false;
+      }
+    }
+  }
+  connectOnce() {
+    return new Promise((resolve, reject) => {
+      const sock = connect(this.socketPath);
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("connect timeout"));
+      }, this.timeoutMs);
+      sock.once("connect", () => {
+        clearTimeout(to);
+        resolve(sock);
+      });
+      sock.once("error", (e) => {
+        clearTimeout(to);
+        reject(e);
+      });
+    });
+  }
+  trySpawnDaemon() {
+    let fd;
+    try {
+      fd = openSync2(this.pidPath, "wx", 384);
+      writeSync2(fd, String(process.pid));
+    } catch (e) {
+      if (this.isPidFileStale()) {
+        try {
+          unlinkSync2(this.pidPath);
+        } catch {
+        }
+        try {
+          fd = openSync2(this.pidPath, "wx", 384);
+          writeSync2(fd, String(process.pid));
+        } catch {
+          return;
+        }
+      } else {
+        return;
+      }
+    }
+    if (!this.daemonEntry || !existsSync2(this.daemonEntry)) {
+      log2(`daemonEntry not configured or missing: ${this.daemonEntry}`);
+      try {
+        closeSync2(fd);
+        unlinkSync2(this.pidPath);
+      } catch {
+      }
+      return;
+    }
+    try {
+      const child = spawn(process.execPath, [this.daemonEntry], {
+        detached: true,
+        stdio: "ignore",
+        env: process.env
+      });
+      child.unref();
+      log2(`spawned daemon pid=${child.pid}`);
+    } finally {
+      closeSync2(fd);
+    }
+  }
+  isPidFileStale() {
+    try {
+      const raw = readFileSync2(this.pidPath, "utf-8").trim();
+      const pid = Number(raw);
+      if (!pid || Number.isNaN(pid))
+        return true;
+      try {
+        process.kill(pid, 0);
+        return false;
+      } catch {
+        return true;
+      }
+    } catch {
+      return true;
+    }
+  }
+  async waitForSocket() {
+    const deadline = Date.now() + this.spawnWaitMs;
+    let delay = 30;
+    while (Date.now() < deadline) {
+      await sleep(delay);
+      delay = Math.min(delay * 1.5, 300);
+      if (!existsSync2(this.socketPath))
+        continue;
+      try {
+        return await this.connectOnce();
+      } catch {
+      }
+    }
+    throw new Error("daemon did not become ready within spawnWaitMs");
+  }
+  sendAndWait(sock, req) {
+    return new Promise((resolve, reject) => {
+      let buf = "";
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("request timeout"));
+      }, this.timeoutMs);
+      sock.setEncoding("utf-8");
+      sock.on("data", (chunk) => {
+        buf += chunk;
+        const nl = buf.indexOf("\n");
+        if (nl === -1)
+          return;
+        const line = buf.slice(0, nl);
+        clearTimeout(to);
+        try {
+          resolve(JSON.parse(line));
+        } catch (e) {
+          reject(e);
+        }
+      });
+      sock.on("error", (e) => {
+        clearTimeout(to);
+        reject(e);
+      });
+      sock.write(JSON.stringify(req) + "\n");
+    });
+  }
+};
+function sleep(ms) {
+  return new Promise((r) => setTimeout(r, ms));
+}
+
+// dist/src/embeddings/disable.js
+function embeddingsDisabled() {
+  return process.env.HIVEMIND_EMBEDDINGS === "false";
+}
+
 // dist/src/hooks/codex/wiki-worker.js
 var dlog2 = (msg) => log("codex-wiki-worker", msg);
-var cfg = JSON.parse(readFileSync2(process.argv[2], "utf-8"));
+var cfg = JSON.parse(readFileSync3(process.argv[2], "utf-8"));
 var tmpDir = cfg.tmpDir;
 var tmpJsonl = join3(tmpDir, "session.jsonl");
 var tmpSummary = join3(tmpDir, "summary.md");
@@ -225,11 +468,20 @@ async function main() {
     } catch (e) {
       wlog(`codex exec failed: ${e.status ?? e.message}`);
     }
-    if (existsSync2(tmpSummary)) {
-      const text = readFileSync2(tmpSummary, "utf-8");
+    if (existsSync3(tmpSummary)) {
+      const text = readFileSync3(tmpSummary, "utf-8");
       if (text.trim()) {
         const fname = `${cfg.sessionId}.md`;
         const vpath = `/summaries/${cfg.userName}/${fname}`;
+        let embedding = null;
+        if (!embeddingsDisabled()) {
+          try {
+            const daemonEntry = join3(dirname(fileURLToPath(import.meta.url)), "embeddings", "embed-daemon.js");
+            embedding = await new EmbedClient({ daemonEntry }).embed(text, "document");
+          } catch (e) {
+            wlog(`summary embedding failed, writing NULL: ${e.message}`);
+          }
+        }
         const result = await uploadSummary(query, {
           tableName: cfg.memoryTable,
           vpath,
@@ -238,7 +490,8 @@ async function main() {
           project: cfg.project,
           agent: "codex",
           sessionId: cfg.sessionId,
-          text
+          text,
+          embedding
         });
         wlog(`uploaded ${vpath} (summary=${result.summaryLength}, desc=${result.descLength})`);
         try {
diff --git a/src/hooks/codex/wiki-worker.ts b/src/hooks/codex/wiki-worker.ts
index 7d74f75..ce016e1 100644
--- a/src/hooks/codex/wiki-worker.ts
+++ b/src/hooks/codex/wiki-worker.ts
@@ -9,10 +9,13 @@
 
 import { readFileSync, writeFileSync, existsSync, appendFileSync, mkdirSync, rmSync } from "node:fs";
 import { execFileSync } from "node:child_process";
-import { join } from "node:path";
+import { dirname, join } from "node:path";
+import { fileURLToPath } from "node:url";
 import { finalizeSummary, releaseLock } from "../summary-state.js";
 import { uploadSummary } from "../upload-summary.js";
 import { log as _log } from "../../utils/debug.js";
+import { EmbedClient } from "../../embeddings/client.js";
+import { embeddingsDisabled } from "../../embeddings/disable.js";
 
 const dlog = (msg: string) => _log("codex-wiki-worker", msg);
 
@@ -176,6 +179,18 @@ async function main(): Promise<void> {
       if (text.trim()) {
         const fname = `${cfg.sessionId}.md`;
         const vpath = `/summaries/${cfg.userName}/${fname}`;
+        // Embed the summary so it ranks in the semantic retrieval branch.
+        // Skipped when globally disabled or the daemon is unreachable —
+        // uploadSummary() writes SQL NULL in that case.
+        let embedding: number[] | null = null;
+        if (!embeddingsDisabled()) {
+          try {
+            const daemonEntry = join(dirname(fileURLToPath(import.meta.url)), "embeddings", "embed-daemon.js");
+            embedding = await new EmbedClient({ daemonEntry }).embed(text, "document");
+          } catch (e: any) {
+            wlog(`summary embedding failed, writing NULL: ${e.message}`);
+          }
+        }
         const result = await uploadSummary(query, {
           tableName: cfg.memoryTable,
           vpath, fname,
@@ -184,6 +199,7 @@ async function main(): Promise<void> {
           agent: "codex",
           sessionId: cfg.sessionId,
           text,
+          embedding,
         });
         wlog(`uploaded ${vpath} (summary=${result.summaryLength}, desc=${result.descLength})`);
 
diff --git a/src/hooks/upload-summary.ts b/src/hooks/upload-summary.ts
index f6c96a0..7d9e0cf 100644
--- a/src/hooks/upload-summary.ts
+++ b/src/hooks/upload-summary.ts
@@ -9,6 +9,7 @@
  */
 
 import { randomUUID } from "node:crypto";
+import { embeddingSqlLiteral } from "../embeddings/sql.js";
 
 export type QueryFn = (sql: string) => Promise<Array<Record<string, unknown>>>;
 
@@ -22,6 +23,13 @@ export interface UploadParams {
   sessionId: string;
   text: string;
   ts?: string;
+  /**
+   * Pre-computed nomic embedding of `text` to store alongside the summary.
+   * Passing `null` or `undefined` writes SQL NULL — the column stays
+   * schema-compatible and the row is still reachable via the lexical
+   * retrieval branch, it just won't show up in the semantic branch.
+   */
+  embedding?: number[] | null;
 }
 
 export interface UploadResult {
@@ -56,6 +64,7 @@ export async function uploadSummary(query: QueryFn, params: UploadParams): Promi
   const ts = params.ts ?? new Date().toISOString();
   const desc = extractDescription(text);
   const sizeBytes = Buffer.byteLength(text);
+  const embSql = embeddingSqlLiteral(params.embedding ?? null);
 
   const existing = await query(
     `SELECT path FROM "${tableName}" WHERE path = '${esc(vpath)}' LIMIT 1`
@@ -65,6 +74,7 @@ export async function uploadSummary(query: QueryFn, params: UploadParams): Promi
     const sql =
       `UPDATE "${tableName}" SET ` +
       `summary = E'${esc(text)}', ` +
+      `summary_embedding = ${embSql}, ` +
       `size_bytes = ${sizeBytes}, ` +
       `description = E'${esc(desc)}', ` +
       `last_update_date = '${ts}' ` +
@@ -74,8 +84,8 @@ export async function uploadSummary(query: QueryFn, params: UploadParams): Promi
   }
 
   const sql =
-    `INSERT INTO "${tableName}" (id, path, filename, summary, author, mime_type, size_bytes, project, description, agent, creation_date, last_update_date) ` +
-    `VALUES ('${randomUUID()}', '${esc(vpath)}', '${esc(fname)}', E'${esc(text)}', '${esc(userName)}', 'text/markdown', ` +
+    `INSERT INTO "${tableName}" (id, path, filename, summary, summary_embedding, author, mime_type, size_bytes, project, description, agent, creation_date, last_update_date) ` +
+    `VALUES ('${randomUUID()}', '${esc(vpath)}', '${esc(fname)}', E'${esc(text)}', ${embSql}, '${esc(userName)}', 'text/markdown', ` +
     `${sizeBytes}, '${esc(project)}', E'${esc(desc)}', '${esc(agent)}', '${ts}', '${ts}')`;
   await query(sql);
   return { path: "insert", sql, descLength: desc.length, summaryLength: text.length };
diff --git a/src/hooks/wiki-worker.ts b/src/hooks/wiki-worker.ts
index 2359ea0..990d054 100644
--- a/src/hooks/wiki-worker.ts
+++ b/src/hooks/wiki-worker.ts
@@ -9,12 +9,15 @@
 
 import { readFileSync, writeFileSync, existsSync, appendFileSync, mkdirSync, rmSync } from "node:fs";
 import { execFileSync } from "node:child_process";
-import { join } from "node:path";
+import { dirname, join } from "node:path";
+import { fileURLToPath } from "node:url";
 import { utcTimestamp, log as _log } from "../utils/debug.js";
 
 const dlog = (msg: string) => _log("wiki-worker", msg);
 import { finalizeSummary, releaseLock } from "./summary-state.js";
 import { uploadSummary } from "./upload-summary.js";
+import { EmbedClient } from "../embeddings/client.js";
+import { embeddingsDisabled } from "../embeddings/disable.js";
 
 interface WorkerConfig {
   apiUrl: string;
@@ -181,6 +184,18 @@ async function main(): Promise<void> {
       if (text.trim()) {
         const fname = `${cfg.sessionId}.md`;
         const vpath = `/summaries/${cfg.userName}/${fname}`;
+        // Embed the summary so it ranks in the semantic retrieval branch.
+        // Skipped when globally disabled or the daemon is unreachable —
+        // uploadSummary() writes SQL NULL in that case.
+        let embedding: number[] | null = null;
+        if (!embeddingsDisabled()) {
+          try {
+            const daemonEntry = join(dirname(fileURLToPath(import.meta.url)), "embeddings", "embed-daemon.js");
+            embedding = await new EmbedClient({ daemonEntry }).embed(text, "document");
+          } catch (e: any) {
+            wlog(`summary embedding failed, writing NULL: ${e.message}`);
+          }
+        }
         const result = await uploadSummary(query, {
           tableName: cfg.memoryTable,
           vpath, fname,
@@ -189,6 +204,7 @@ async function main(): Promise<void> {
           agent: "claude_code",
           sessionId: cfg.sessionId,
           text,
+          embedding,
         });
         wlog(`uploaded ${vpath} (summary=${result.summaryLength}, desc=${result.descLength})`);
 

From 9f4c30ded594a8f12933962472d080fdcfe8b35c Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Mon, 27 Apr 2026 17:42:04 +0000
Subject: [PATCH 19/30] fix(grep-core): exclude empty [] embeddings from
 semantic search
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The semantic branch of searchDeeplakeTables previously filtered with
`WHERE summary_embedding IS NOT NULL` (and the analogous predicate on
message_embedding). That filter is insufficient for tables that gained
the embedding column via `ALTER TABLE ADD COLUMN summary_embedding
FLOAT4[]` after rows were already present: Postgres backfills the new
column with `[]` (empty array), not SQL NULL. Pre-migration rows
therefore pass `IS NOT NULL`, but the cosine operator `<#>` returns
NULL when applied to an empty array, and `ORDER BY score DESC` orders
NULL ahead of any real float — so unembedded rows dominate the top-K
and push genuine matches out of the result set.

Switch the predicate to `ARRAY_LENGTH(<col>, 1) > 0`, which:
- returns NULL for an empty array (excluding the row),
- returns NULL when the column itself is NULL (excluding the row),
- returns the array length otherwise (passing the > 0 check).

This handles both the post-ADD-COLUMN backfill and the legacy NULL case
in a single condition. Test assertion updated to match the new SQL
shape.
---
 claude-code/tests/grep-core.test.ts |  2 +-
 src/shell/grep-core.ts              | 12 ++++++++++--
 2 files changed, 11 insertions(+), 3 deletions(-)

diff --git a/claude-code/tests/grep-core.test.ts b/claude-code/tests/grep-core.test.ts
index 20a8d1d..d615a2a 100644
--- a/claude-code/tests/grep-core.test.ts
+++ b/claude-code/tests/grep-core.test.ts
@@ -1236,7 +1236,7 @@ describe("searchDeeplakeTables: hybrid semantic + lexical branch", () => {
       });
       const sql = query.mock.calls[0][0] as string;
       // Semantic LIMIT is 7; lexical still 20 (default).
-      expect(sql).toMatch(/summary_embedding <#> [^)]+\) AS score FROM "m" WHERE summary_embedding IS NOT NULL ORDER BY score DESC LIMIT 7/);
+      expect(sql).toMatch(/summary_embedding <#> [^)]+\) AS score FROM "m" WHERE ARRAY_LENGTH\(summary_embedding, 1\) > 0 ORDER BY score DESC LIMIT 7/);
     } finally {
       if (prev === undefined) delete process.env.HIVEMIND_SEMANTIC_LIMIT;
       else process.env.HIVEMIND_SEMANTIC_LIMIT = prev;
diff --git a/src/shell/grep-core.ts b/src/shell/grep-core.ts
index ae65912..c144926 100644
--- a/src/shell/grep-core.ts
+++ b/src/shell/grep-core.ts
@@ -349,15 +349,23 @@ export async function searchDeeplakeTables(
         `FROM "${sessionsTable}" WHERE 1=1${pathFilter}${sessLexFilter} LIMIT ${lexicalLimit}`
       : null;
 
+    // Filter out rows with a missing OR empty embedding. ALTER TABLE ADD
+    // COLUMN FLOAT4[] on an existing table (our migration path for pre-0.7.x
+    // schemas) backfills existing rows with `[]`, NOT SQL NULL. Those rows
+    // pass an `IS NOT NULL` check but the cosine operator `<#>` returns NULL
+    // on an empty array, and Postgres orders NULL before any float under
+    // `ORDER BY score DESC` — so pre-migration rows would dominate the top-K
+    // and push real matches out. `ARRAY_LENGTH(col, 1)` returns NULL for
+    // empty arrays, so `> 0` excludes both the empty and the NULL cases.
     const memSemQuery =
       `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, ` +
       `(summary_embedding <#> ${vecLit}) AS score ` +
-      `FROM "${memoryTable}" WHERE summary_embedding IS NOT NULL${pathFilter} ` +
+      `FROM "${memoryTable}" WHERE ARRAY_LENGTH(summary_embedding, 1) > 0${pathFilter} ` +
       `ORDER BY score DESC LIMIT ${semanticLimit}`;
     const sessSemQuery =
       `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, ` +
       `(message_embedding <#> ${vecLit}) AS score ` +
-      `FROM "${sessionsTable}" WHERE message_embedding IS NOT NULL${pathFilter} ` +
+      `FROM "${sessionsTable}" WHERE ARRAY_LENGTH(message_embedding, 1) > 0${pathFilter} ` +
       `ORDER BY score DESC LIMIT ${semanticLimit}`;
 
     const parts = [memSemQuery, sessSemQuery];

From fbc3024313c006d0adb349d919b060df74660ac5 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Mon, 27 Apr 2026 17:42:36 +0000
Subject: [PATCH 20/30] feat(virtual-index): cap rendered index.md to 50
 most-recent per section
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

generateVirtualIndex previously fetched and rendered every summary and
session row in the workspace. On a fully populated workspace (272
summaries + 272 sessions in the locomo benchmark workspace) the
resulting markdown weighs ~83 KB / ~32 k tokens, which exceeds Claude
Code's Read tool output limit and fails with "File content (N tokens)
exceeds maximum allowed tokens" — making the very first hop of the
recall workflow (read index.md) unusable.

Cap each section to 50 most-recent entries (introduced as
INDEX_LIMIT_PER_SECTION). The implementation:
- adds `LIMIT 51` to both queries — fetching one row past the cap so
  truncation can be detected without a second COUNT(*) round-trip;
- changes the sessions ordering from `ORDER BY path` to
  `ORDER BY MAX(last_update_date) DESC`, so the cap actually keeps the
  most-recent rows (path order is uncorrelated with recency);
- slices to 50 before rendering and emits a footer note pointing the
  agent at the workspace memory grep entry point for older rows
  whenever the truncation flag is set.

50 keeps the rendered index well under the Read limit (covers the
common "what happened recently" use case) while older rows remain
reachable via grep on the memory path.
---
 src/shell/deeplake-fs.ts | 31 +++++++++++++++++++++++++++----
 1 file changed, 27 insertions(+), 4 deletions(-)

diff --git a/src/shell/deeplake-fs.ts b/src/shell/deeplake-fs.ts
index 24c3ba7..2d17d48 100644
--- a/src/shell/deeplake-fs.ts
+++ b/src/shell/deeplake-fs.ts
@@ -281,10 +281,19 @@ export class DeeplakeFs implements IFileSystem {
   // ── Virtual index.md generation ────────────────────────────────────────────
 
   private async generateVirtualIndex(): Promise<string> {
+    // Cap per section. A fully populated index (272 summaries + 272 sessions
+    // in the locomo benchmark workspace) renders to ~83 KB / ~32 k tokens,
+    // which trips Claude Code's Read tool output limit (fails with
+    // "File content (N tokens) exceeds maximum allowed tokens"). 50 most
+    // recent entries per section stays comfortably under the limit while
+    // covering the common "what happened recently" use case; older rows
+    // remain reachable via Grep on the memory path.
+    const INDEX_LIMIT_PER_SECTION = 50;
+
     // Memory (summaries) section — high-level wikipage per session.
     const summaryRows = await this.client.query(
       `SELECT path, project, description, creation_date, last_update_date FROM "${this.table}" ` +
-      `WHERE path LIKE '${esc("/summaries/")}%' ORDER BY last_update_date DESC`
+      `WHERE path LIKE '${esc("/summaries/")}%' ORDER BY last_update_date DESC LIMIT ${INDEX_LIMIT_PER_SECTION + 1}`
     );
 
     // Sessions section — raw session records (dialogue / events). Pulled
@@ -296,7 +305,7 @@ export class DeeplakeFs implements IFileSystem {
         sessionRows = await this.client.query(
           `SELECT path, MAX(description) AS description, MIN(creation_date) AS creation_date, MAX(last_update_date) AS last_update_date ` +
           `FROM "${this.sessionsTable}" WHERE path LIKE '${esc("/sessions/")}%' ` +
-          `GROUP BY path ORDER BY path`
+          `GROUP BY path ORDER BY MAX(last_update_date) DESC LIMIT ${INDEX_LIMIT_PER_SECTION + 1}`
         );
       } catch {
         // sessions table absent or schema mismatch — leave empty, emit memory-only index.
@@ -304,6 +313,12 @@ export class DeeplakeFs implements IFileSystem {
       }
     }
 
+    // Slice the N+1 fetched rows to N and detect if more exist for the footer.
+    const summaryTruncated = summaryRows.length > INDEX_LIMIT_PER_SECTION;
+    const sessionTruncated = sessionRows.length > INDEX_LIMIT_PER_SECTION;
+    const summaryVisible = summaryRows.slice(0, INDEX_LIMIT_PER_SECTION);
+    const sessionVisible = sessionRows.slice(0, INDEX_LIMIT_PER_SECTION);
+
     const lines: string[] = [
       "# Session Index",
       "",
@@ -319,9 +334,13 @@ export class DeeplakeFs implements IFileSystem {
     } else {
       lines.push("AI-generated summaries per session. Read these first for topic-level overviews.");
       lines.push("");
+      if (summaryTruncated) {
+        lines.push(`_Showing ${INDEX_LIMIT_PER_SECTION} most-recent of many — older summaries reachable via \`Grep pattern=\"...\" path=\"~/.deeplake/memory\"\`._`);
+        lines.push("");
+      }
       lines.push("| Session | Created | Last Updated | Project | Description |");
       lines.push("|---------|---------|--------------|---------|-------------|");
-      for (const row of summaryRows) {
+      for (const row of summaryVisible) {
         const p = row["path"] as string;
         const match = p.match(/\/summaries\/([^/]+)\/([^/]+)\.md$/);
         if (!match) continue;
@@ -345,9 +364,13 @@ export class DeeplakeFs implements IFileSystem {
     } else {
       lines.push("Raw session records (dialogue, tool calls). Read for exact detail / quotes.");
       lines.push("");
+      if (sessionTruncated) {
+        lines.push(`_Showing ${INDEX_LIMIT_PER_SECTION} most-recent of many — older sessions reachable via \`Grep pattern=\"...\" path=\"~/.deeplake/memory\"\`._`);
+        lines.push("");
+      }
       lines.push("| Session | Created | Last Updated | Description |");
       lines.push("|---------|---------|--------------|-------------|");
-      for (const row of sessionRows) {
+      for (const row of sessionVisible) {
         const p = (row["path"] as string) || "";
         // Show the path relative to /sessions/ so the table stays compact.
         const rel = p.startsWith("/") ? p.slice(1) : p;

From 60236a6ee75a6c31b7fe74b863fc479098e04752 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Mon, 27 Apr 2026 17:42:54 +0000
Subject: [PATCH 21/30] docs(session-start): two-tier recall workflow +
 Grep-broken warning
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Both Claude and Codex SessionStart hooks previously injected a vague
"read index.md first, then summaries, then sessions" prompt that did
not steer the agent away from two systematic failure modes seen in
benchmark runs:

1. Agents called the built-in Grep tool on the memory path. The tool
   errors out with "Path does not exist" because Claude Code resolves
   the Grep tool's path argument against the real filesystem, where
   the virtual mount point does not exist. The plugin's PreToolUse
   hook does not intercept Grep on CC 2.1.118 (only Bash and Read
   fire), so the call goes through unrewritten and fails.
2. Agents grep-ed across the whole memory tree without a summaries/
   or sessions/ suffix, drowning the answer in raw JSONL noise.

Replace the prompt with explicit guidance:
- two-tier hierarchy with size hints (~3 KB summaries vs ~5 KB
  sessions) and ordering rules (summaries first, sessions only as
  fallback);
- explicit "✅ ... ❌ ..." examples that show the correct shell
  invocation and call out the broken Grep-tool invocation by name;
- "never read index.md" rule (agents would otherwise hit the size
  limit and waste a turn);
- restored the existing "no python/node/curl" and "no subagent" rules
  on the codex side so feature parity with the Claude-side prompt is
  maintained.

The codex integration test that asserted the removed string is
updated to assert the new stable phrasing instead.
---
 codex/tests/codex-integration.test.ts |  5 +++--
 src/hooks/codex/session-start.ts      | 19 +++++++++++++++----
 src/hooks/session-start.ts            | 22 ++++++++++++++++------
 3 files changed, 34 insertions(+), 12 deletions(-)

diff --git a/codex/tests/codex-integration.test.ts b/codex/tests/codex-integration.test.ts
index d399a9d..edf5656 100644
--- a/codex/tests/codex-integration.test.ts
+++ b/codex/tests/codex-integration.test.ts
@@ -106,14 +106,15 @@ describe("codex integration: session-start", () => {
     expect(raw).toContain("Do NOT spawn subagents");
   });
 
-  it("context includes JSONL warning", () => {
+  it("context steers recall to summaries first, sessions as fallback", () => {
     const raw = runHook("session-start.js", {
       session_id: "test-session-004",
       cwd: "/tmp",
       hook_event_name: "SessionStart",
       model: "gpt-5.2",
     });
-    expect(raw).toContain("Do NOT jump straight to JSONL");
+    expect(raw).toContain("summaries/");
+    expect(raw).toContain("FALLBACK");
   });
 });
 
diff --git a/src/hooks/codex/session-start.ts b/src/hooks/codex/session-start.ts
index 81d25e4..c7a26da 100644
--- a/src/hooks/codex/session-start.ts
+++ b/src/hooks/codex/session-start.ts
@@ -24,10 +24,21 @@ const AUTH_CMD = join(__bundleDir, "commands", "auth-login.js");
 
 const context = `DEEPLAKE MEMORY: Persistent memory at ~/.deeplake/memory/ shared across sessions, users, and agents.
 
-Structure: index.md (start here) → summaries/*.md → sessions/*.jsonl (last resort). Do NOT jump straight to JSONL.
-Search: grep -r "keyword" ~/.deeplake/memory/
-IMPORTANT: Only use bash commands (cat, ls, grep, echo, jq, head, tail, sed, awk, etc.) to interact with ~/.deeplake/memory/. Do NOT use python, python3, node, curl, or other interpreters — they are not available in the memory filesystem.
-Do NOT spawn subagents to read deeplake memory.`;
+Deeplake memory has TWO tiers — search them IN THIS ORDER:
+1. ~/.deeplake/memory/summaries/ — condensed wiki summaries (~3 KB each). START HERE: the answer to recall questions is usually in a summary.
+2. ~/.deeplake/memory/sessions/  — raw full-dialogue JSONL (~5 KB each). Use as FALLBACK only if no summary matches.
+3. ~/.deeplake/memory/index.md   — skip (too large).
+
+Recall workflow:
+1. grep -r "keyword" ~/.deeplake/memory/summaries/   ← FIRST
+2. cat the top-matching summary(ies)
+3. Only if no summary matches: grep -r "keyword" ~/.deeplake/memory/sessions/
+
+✅ grep -r "keyword" ~/.deeplake/memory/summaries/
+❌ grep without a summaries/ or sessions/ suffix — too noisy
+
+IMPORTANT: Only use bash builtins (cat, ls, grep, echo, jq, head, tail, sed, awk, etc.) on ~/.deeplake/memory/. Do NOT use python, python3, node, curl, or other interpreters — they are not available in the memory filesystem.
+Do NOT spawn subagents to read deeplake memory. Never read index.md.`;
 
 interface CodexSessionStartInput {
   session_id: string;
diff --git a/src/hooks/session-start.ts b/src/hooks/session-start.ts
index 727b991..4564d71 100644
--- a/src/hooks/session-start.ts
+++ b/src/hooks/session-start.ts
@@ -29,14 +29,24 @@ const context = `DEEPLAKE MEMORY: You have TWO memory sources. ALWAYS check BOTH
 1. Your built-in memory (~/.claude/) — personal per-project notes
 2. Deeplake global memory (~/.deeplake/memory/) — global memory shared across all sessions, users, and agents in the org
 
-Deeplake memory structure:
-- ~/.deeplake/memory/index.md — START HERE, table of all sessions
-- ~/.deeplake/memory/summaries/username/*.md — AI-generated wiki summaries per session
-- ~/.deeplake/memory/sessions/username/*.jsonl — raw session data (last resort)
+⚠️ CRITICAL: the built-in Grep tool is BROKEN on ~/.deeplake/memory — always errors "Path does not exist". Use the Bash tool with \`grep -r\`.
 
-SEARCH STRATEGY: Always read index.md first. Then read specific summaries. Only read raw JSONL if summaries don't have enough detail. Do NOT jump straight to JSONL files.
+Deeplake memory has TWO tiers — search them IN THIS ORDER:
+1. ~/.deeplake/memory/summaries/ — condensed wiki summaries (~3 KB each). START HERE: the answer to recall questions is usually in a summary.
+2. ~/.deeplake/memory/sessions/  — raw full-dialogue JSONL (~5 KB each). Use as FALLBACK only if no summary matches.
+3. ~/.deeplake/memory/index.md   — skip (too large; agents shouldn't read it).
 
-Search command: Grep pattern="keyword" path="~/.deeplake/memory"
+Recall workflow (follow this order):
+  1. Bash → \`grep -r "keyword" ~/.deeplake/memory/summaries/\`   ← FIRST
+  2. \`cat\` or Read the top-matching summary(ies) to pull the answer
+  3. Only if no summary matches: Bash → \`grep -r "keyword" ~/.deeplake/memory/sessions/\`
+
+Search shape:
+  ✅ Bash tool → command: \`grep -r "keyword" ~/.deeplake/memory/summaries/\`
+  ❌ Grep tool on this path   ← will fail with "Path does not exist"
+  ❌ grep without a \`summaries/\` or \`sessions/\` suffix   ← too noisy, drowns the answer
+
+Never call the Grep tool on this path. Never read index.md.
 
 Organization management — each argument is SEPARATE (do NOT quote subcommands together):
 - node "HIVEMIND_AUTH_CMD" login                              — SSO login

From 0c8625abef9e325c7d4430fd512689ed8f112710 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Mon, 27 Apr 2026 17:43:04 +0000
Subject: [PATCH 22/30] build: rebuild bundles for grep-core / virtual-index /
 session-start

Pure rebuild of the esbuild outputs for the three preceding source
commits. No source changes here; the bundles are the result of
`npm run build` on top of HEAD~3.

- claude-code/bundle/pre-tool-use.js, codex/bundle/pre-tool-use.js
  and the two shell/deeplake-shell.js bundles pick up the
  ARRAY_LENGTH(...) > 0 predicate from the grep-core fix.
- claude-code/bundle/session-start.js, codex/bundle/session-start.js
  and the two shell bundles pick up the 50-row cap and the new
  recall prompt.
---
 claude-code/bundle/pre-tool-use.js         |  4 ++--
 claude-code/bundle/session-start.js        | 22 +++++++++++++------
 claude-code/bundle/shell/deeplake-shell.js | 25 ++++++++++++++++------
 codex/bundle/pre-tool-use.js               |  4 ++--
 codex/bundle/session-start.js              | 19 ++++++++++++----
 codex/bundle/shell/deeplake-shell.js       | 25 ++++++++++++++++------
 6 files changed, 73 insertions(+), 26 deletions(-)

diff --git a/claude-code/bundle/pre-tool-use.js b/claude-code/bundle/pre-tool-use.js
index 4daedfa..27f6dcb 100755
--- a/claude-code/bundle/pre-tool-use.js
+++ b/claude-code/bundle/pre-tool-use.js
@@ -658,8 +658,8 @@ async function searchDeeplakeTables(api, memoryTable, sessionsTable, opts) {
     const sessLexFilter = buildContentFilter("message::text", likeOp, filterPatternsForLex);
     const memLexQuery = memLexFilter ? `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, 1.0 AS score FROM "${memoryTable}" WHERE 1=1${pathFilter}${memLexFilter} LIMIT ${lexicalLimit}` : null;
     const sessLexQuery = sessLexFilter ? `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, 1.0 AS score FROM "${sessionsTable}" WHERE 1=1${pathFilter}${sessLexFilter} LIMIT ${lexicalLimit}` : null;
-    const memSemQuery = `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, (summary_embedding <#> ${vecLit}) AS score FROM "${memoryTable}" WHERE summary_embedding IS NOT NULL${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
-    const sessSemQuery = `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, (message_embedding <#> ${vecLit}) AS score FROM "${sessionsTable}" WHERE message_embedding IS NOT NULL${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
+    const memSemQuery = `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, (summary_embedding <#> ${vecLit}) AS score FROM "${memoryTable}" WHERE ARRAY_LENGTH(summary_embedding, 1) > 0${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
+    const sessSemQuery = `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, (message_embedding <#> ${vecLit}) AS score FROM "${sessionsTable}" WHERE ARRAY_LENGTH(message_embedding, 1) > 0${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
     const parts = [memSemQuery, sessSemQuery];
     if (memLexQuery)
       parts.push(memLexQuery);
diff --git a/claude-code/bundle/session-start.js b/claude-code/bundle/session-start.js
index 3b34266..e0902d5 100755
--- a/claude-code/bundle/session-start.js
+++ b/claude-code/bundle/session-start.js
@@ -564,14 +564,24 @@ var context = `DEEPLAKE MEMORY: You have TWO memory sources. ALWAYS check BOTH w
 1. Your built-in memory (~/.claude/) \u2014 personal per-project notes
 2. Deeplake global memory (~/.deeplake/memory/) \u2014 global memory shared across all sessions, users, and agents in the org
 
-Deeplake memory structure:
-- ~/.deeplake/memory/index.md \u2014 START HERE, table of all sessions
-- ~/.deeplake/memory/summaries/username/*.md \u2014 AI-generated wiki summaries per session
-- ~/.deeplake/memory/sessions/username/*.jsonl \u2014 raw session data (last resort)
+\u26A0\uFE0F CRITICAL: the built-in Grep tool is BROKEN on ~/.deeplake/memory \u2014 always errors "Path does not exist". Use the Bash tool with \`grep -r\`.
 
-SEARCH STRATEGY: Always read index.md first. Then read specific summaries. Only read raw JSONL if summaries don't have enough detail. Do NOT jump straight to JSONL files.
+Deeplake memory has TWO tiers \u2014 search them IN THIS ORDER:
+1. ~/.deeplake/memory/summaries/ \u2014 condensed wiki summaries (~3 KB each). START HERE: the answer to recall questions is usually in a summary.
+2. ~/.deeplake/memory/sessions/  \u2014 raw full-dialogue JSONL (~5 KB each). Use as FALLBACK only if no summary matches.
+3. ~/.deeplake/memory/index.md   \u2014 skip (too large; agents shouldn't read it).
 
-Search command: Grep pattern="keyword" path="~/.deeplake/memory"
+Recall workflow (follow this order):
+  1. Bash \u2192 \`grep -r "keyword" ~/.deeplake/memory/summaries/\`   \u2190 FIRST
+  2. \`cat\` or Read the top-matching summary(ies) to pull the answer
+  3. Only if no summary matches: Bash \u2192 \`grep -r "keyword" ~/.deeplake/memory/sessions/\`
+
+Search shape:
+  \u2705 Bash tool \u2192 command: \`grep -r "keyword" ~/.deeplake/memory/summaries/\`
+  \u274C Grep tool on this path   \u2190 will fail with "Path does not exist"
+  \u274C grep without a \`summaries/\` or \`sessions/\` suffix   \u2190 too noisy, drowns the answer
+
+Never call the Grep tool on this path. Never read index.md.
 
 Organization management \u2014 each argument is SEPARATE (do NOT quote subcommands together):
 - node "HIVEMIND_AUTH_CMD" login                              \u2014 SSO login
diff --git a/claude-code/bundle/shell/deeplake-shell.js b/claude-code/bundle/shell/deeplake-shell.js
index 18e11f9..fa9fcbc 100755
--- a/claude-code/bundle/shell/deeplake-shell.js
+++ b/claude-code/bundle/shell/deeplake-shell.js
@@ -67347,8 +67347,8 @@ async function searchDeeplakeTables(api, memoryTable, sessionsTable, opts) {
     const sessLexFilter = buildContentFilter("message::text", likeOp, filterPatternsForLex);
     const memLexQuery = memLexFilter ? `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, 1.0 AS score FROM "${memoryTable}" WHERE 1=1${pathFilter}${memLexFilter} LIMIT ${lexicalLimit}` : null;
     const sessLexQuery = sessLexFilter ? `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, 1.0 AS score FROM "${sessionsTable}" WHERE 1=1${pathFilter}${sessLexFilter} LIMIT ${lexicalLimit}` : null;
-    const memSemQuery = `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, (summary_embedding <#> ${vecLit}) AS score FROM "${memoryTable}" WHERE summary_embedding IS NOT NULL${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
-    const sessSemQuery = `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, (message_embedding <#> ${vecLit}) AS score FROM "${sessionsTable}" WHERE message_embedding IS NOT NULL${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
+    const memSemQuery = `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, (summary_embedding <#> ${vecLit}) AS score FROM "${memoryTable}" WHERE ARRAY_LENGTH(summary_embedding, 1) > 0${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
+    const sessSemQuery = `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, (message_embedding <#> ${vecLit}) AS score FROM "${sessionsTable}" WHERE ARRAY_LENGTH(message_embedding, 1) > 0${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
     const parts = [memSemQuery, sessSemQuery];
     if (memLexQuery)
       parts.push(memLexQuery);
@@ -67999,15 +67999,20 @@ var DeeplakeFs = class _DeeplakeFs {
   }
   // ── Virtual index.md generation ────────────────────────────────────────────
   async generateVirtualIndex() {
-    const summaryRows = await this.client.query(`SELECT path, project, description, creation_date, last_update_date FROM "${this.table}" WHERE path LIKE '${sqlStr("/summaries/")}%' ORDER BY last_update_date DESC`);
+    const INDEX_LIMIT_PER_SECTION = 50;
+    const summaryRows = await this.client.query(`SELECT path, project, description, creation_date, last_update_date FROM "${this.table}" WHERE path LIKE '${sqlStr("/summaries/")}%' ORDER BY last_update_date DESC LIMIT ${INDEX_LIMIT_PER_SECTION + 1}`);
     let sessionRows = [];
     if (this.sessionsTable) {
       try {
-        sessionRows = await this.client.query(`SELECT path, MAX(description) AS description, MIN(creation_date) AS creation_date, MAX(last_update_date) AS last_update_date FROM "${this.sessionsTable}" WHERE path LIKE '${sqlStr("/sessions/")}%' GROUP BY path ORDER BY path`);
+        sessionRows = await this.client.query(`SELECT path, MAX(description) AS description, MIN(creation_date) AS creation_date, MAX(last_update_date) AS last_update_date FROM "${this.sessionsTable}" WHERE path LIKE '${sqlStr("/sessions/")}%' GROUP BY path ORDER BY MAX(last_update_date) DESC LIMIT ${INDEX_LIMIT_PER_SECTION + 1}`);
       } catch {
         sessionRows = [];
       }
     }
+    const summaryTruncated = summaryRows.length > INDEX_LIMIT_PER_SECTION;
+    const sessionTruncated = sessionRows.length > INDEX_LIMIT_PER_SECTION;
+    const summaryVisible = summaryRows.slice(0, INDEX_LIMIT_PER_SECTION);
+    const sessionVisible = sessionRows.slice(0, INDEX_LIMIT_PER_SECTION);
     const lines = [
       "# Session Index",
       "",
@@ -68021,9 +68026,13 @@ var DeeplakeFs = class _DeeplakeFs {
     } else {
       lines.push("AI-generated summaries per session. Read these first for topic-level overviews.");
       lines.push("");
+      if (summaryTruncated) {
+        lines.push(`_Showing ${INDEX_LIMIT_PER_SECTION} most-recent of many \u2014 older summaries reachable via \`Grep pattern="..." path="~/.deeplake/memory"\`._`);
+        lines.push("");
+      }
       lines.push("| Session | Created | Last Updated | Project | Description |");
       lines.push("|---------|---------|--------------|---------|-------------|");
-      for (const row of summaryRows) {
+      for (const row of summaryVisible) {
         const p22 = row["path"];
         const match2 = p22.match(/\/summaries\/([^/]+)\/([^/]+)\.md$/);
         if (!match2)
@@ -68046,9 +68055,13 @@ var DeeplakeFs = class _DeeplakeFs {
     } else {
       lines.push("Raw session records (dialogue, tool calls). Read for exact detail / quotes.");
       lines.push("");
+      if (sessionTruncated) {
+        lines.push(`_Showing ${INDEX_LIMIT_PER_SECTION} most-recent of many \u2014 older sessions reachable via \`Grep pattern="..." path="~/.deeplake/memory"\`._`);
+        lines.push("");
+      }
       lines.push("| Session | Created | Last Updated | Description |");
       lines.push("|---------|---------|--------------|-------------|");
-      for (const row of sessionRows) {
+      for (const row of sessionVisible) {
         const p22 = row["path"] || "";
         const rel = p22.startsWith("/") ? p22.slice(1) : p22;
         const filename = p22.split("/").pop() ?? p22;
diff --git a/codex/bundle/pre-tool-use.js b/codex/bundle/pre-tool-use.js
index 552b425..a0adb46 100755
--- a/codex/bundle/pre-tool-use.js
+++ b/codex/bundle/pre-tool-use.js
@@ -644,8 +644,8 @@ async function searchDeeplakeTables(api, memoryTable, sessionsTable, opts) {
     const sessLexFilter = buildContentFilter("message::text", likeOp, filterPatternsForLex);
     const memLexQuery = memLexFilter ? `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, 1.0 AS score FROM "${memoryTable}" WHERE 1=1${pathFilter}${memLexFilter} LIMIT ${lexicalLimit}` : null;
     const sessLexQuery = sessLexFilter ? `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, 1.0 AS score FROM "${sessionsTable}" WHERE 1=1${pathFilter}${sessLexFilter} LIMIT ${lexicalLimit}` : null;
-    const memSemQuery = `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, (summary_embedding <#> ${vecLit}) AS score FROM "${memoryTable}" WHERE summary_embedding IS NOT NULL${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
-    const sessSemQuery = `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, (message_embedding <#> ${vecLit}) AS score FROM "${sessionsTable}" WHERE message_embedding IS NOT NULL${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
+    const memSemQuery = `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, (summary_embedding <#> ${vecLit}) AS score FROM "${memoryTable}" WHERE ARRAY_LENGTH(summary_embedding, 1) > 0${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
+    const sessSemQuery = `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, (message_embedding <#> ${vecLit}) AS score FROM "${sessionsTable}" WHERE ARRAY_LENGTH(message_embedding, 1) > 0${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
     const parts = [memSemQuery, sessSemQuery];
     if (memLexQuery)
       parts.push(memLexQuery);
diff --git a/codex/bundle/session-start.js b/codex/bundle/session-start.js
index ea95b2f..fbbcac1 100755
--- a/codex/bundle/session-start.js
+++ b/codex/bundle/session-start.js
@@ -86,10 +86,21 @@ var __bundleDir = dirname2(fileURLToPath(import.meta.url));
 var AUTH_CMD = join4(__bundleDir, "commands", "auth-login.js");
 var context = `DEEPLAKE MEMORY: Persistent memory at ~/.deeplake/memory/ shared across sessions, users, and agents.
 
-Structure: index.md (start here) \u2192 summaries/*.md \u2192 sessions/*.jsonl (last resort). Do NOT jump straight to JSONL.
-Search: grep -r "keyword" ~/.deeplake/memory/
-IMPORTANT: Only use bash commands (cat, ls, grep, echo, jq, head, tail, sed, awk, etc.) to interact with ~/.deeplake/memory/. Do NOT use python, python3, node, curl, or other interpreters \u2014 they are not available in the memory filesystem.
-Do NOT spawn subagents to read deeplake memory.`;
+Deeplake memory has TWO tiers \u2014 search them IN THIS ORDER:
+1. ~/.deeplake/memory/summaries/ \u2014 condensed wiki summaries (~3 KB each). START HERE: the answer to recall questions is usually in a summary.
+2. ~/.deeplake/memory/sessions/  \u2014 raw full-dialogue JSONL (~5 KB each). Use as FALLBACK only if no summary matches.
+3. ~/.deeplake/memory/index.md   \u2014 skip (too large).
+
+Recall workflow:
+1. grep -r "keyword" ~/.deeplake/memory/summaries/   \u2190 FIRST
+2. cat the top-matching summary(ies)
+3. Only if no summary matches: grep -r "keyword" ~/.deeplake/memory/sessions/
+
+\u2705 grep -r "keyword" ~/.deeplake/memory/summaries/
+\u274C grep without a summaries/ or sessions/ suffix \u2014 too noisy
+
+IMPORTANT: Only use bash builtins (cat, ls, grep, echo, jq, head, tail, sed, awk, etc.) on ~/.deeplake/memory/. Do NOT use python, python3, node, curl, or other interpreters \u2014 they are not available in the memory filesystem.
+Do NOT spawn subagents to read deeplake memory. Never read index.md.`;
 async function main() {
   if (process.env.HIVEMIND_WIKI_WORKER === "1")
     return;
diff --git a/codex/bundle/shell/deeplake-shell.js b/codex/bundle/shell/deeplake-shell.js
index 18e11f9..fa9fcbc 100755
--- a/codex/bundle/shell/deeplake-shell.js
+++ b/codex/bundle/shell/deeplake-shell.js
@@ -67347,8 +67347,8 @@ async function searchDeeplakeTables(api, memoryTable, sessionsTable, opts) {
     const sessLexFilter = buildContentFilter("message::text", likeOp, filterPatternsForLex);
     const memLexQuery = memLexFilter ? `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, 1.0 AS score FROM "${memoryTable}" WHERE 1=1${pathFilter}${memLexFilter} LIMIT ${lexicalLimit}` : null;
     const sessLexQuery = sessLexFilter ? `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, 1.0 AS score FROM "${sessionsTable}" WHERE 1=1${pathFilter}${sessLexFilter} LIMIT ${lexicalLimit}` : null;
-    const memSemQuery = `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, (summary_embedding <#> ${vecLit}) AS score FROM "${memoryTable}" WHERE summary_embedding IS NOT NULL${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
-    const sessSemQuery = `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, (message_embedding <#> ${vecLit}) AS score FROM "${sessionsTable}" WHERE message_embedding IS NOT NULL${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
+    const memSemQuery = `SELECT path, summary::text AS content, 0 AS source_order, '' AS creation_date, (summary_embedding <#> ${vecLit}) AS score FROM "${memoryTable}" WHERE ARRAY_LENGTH(summary_embedding, 1) > 0${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
+    const sessSemQuery = `SELECT path, message::text AS content, 1 AS source_order, COALESCE(creation_date::text, '') AS creation_date, (message_embedding <#> ${vecLit}) AS score FROM "${sessionsTable}" WHERE ARRAY_LENGTH(message_embedding, 1) > 0${pathFilter} ORDER BY score DESC LIMIT ${semanticLimit}`;
     const parts = [memSemQuery, sessSemQuery];
     if (memLexQuery)
       parts.push(memLexQuery);
@@ -67999,15 +67999,20 @@ var DeeplakeFs = class _DeeplakeFs {
   }
   // ── Virtual index.md generation ────────────────────────────────────────────
   async generateVirtualIndex() {
-    const summaryRows = await this.client.query(`SELECT path, project, description, creation_date, last_update_date FROM "${this.table}" WHERE path LIKE '${sqlStr("/summaries/")}%' ORDER BY last_update_date DESC`);
+    const INDEX_LIMIT_PER_SECTION = 50;
+    const summaryRows = await this.client.query(`SELECT path, project, description, creation_date, last_update_date FROM "${this.table}" WHERE path LIKE '${sqlStr("/summaries/")}%' ORDER BY last_update_date DESC LIMIT ${INDEX_LIMIT_PER_SECTION + 1}`);
     let sessionRows = [];
     if (this.sessionsTable) {
       try {
-        sessionRows = await this.client.query(`SELECT path, MAX(description) AS description, MIN(creation_date) AS creation_date, MAX(last_update_date) AS last_update_date FROM "${this.sessionsTable}" WHERE path LIKE '${sqlStr("/sessions/")}%' GROUP BY path ORDER BY path`);
+        sessionRows = await this.client.query(`SELECT path, MAX(description) AS description, MIN(creation_date) AS creation_date, MAX(last_update_date) AS last_update_date FROM "${this.sessionsTable}" WHERE path LIKE '${sqlStr("/sessions/")}%' GROUP BY path ORDER BY MAX(last_update_date) DESC LIMIT ${INDEX_LIMIT_PER_SECTION + 1}`);
       } catch {
         sessionRows = [];
       }
     }
+    const summaryTruncated = summaryRows.length > INDEX_LIMIT_PER_SECTION;
+    const sessionTruncated = sessionRows.length > INDEX_LIMIT_PER_SECTION;
+    const summaryVisible = summaryRows.slice(0, INDEX_LIMIT_PER_SECTION);
+    const sessionVisible = sessionRows.slice(0, INDEX_LIMIT_PER_SECTION);
     const lines = [
       "# Session Index",
       "",
@@ -68021,9 +68026,13 @@ var DeeplakeFs = class _DeeplakeFs {
     } else {
       lines.push("AI-generated summaries per session. Read these first for topic-level overviews.");
       lines.push("");
+      if (summaryTruncated) {
+        lines.push(`_Showing ${INDEX_LIMIT_PER_SECTION} most-recent of many \u2014 older summaries reachable via \`Grep pattern="..." path="~/.deeplake/memory"\`._`);
+        lines.push("");
+      }
       lines.push("| Session | Created | Last Updated | Project | Description |");
       lines.push("|---------|---------|--------------|---------|-------------|");
-      for (const row of summaryRows) {
+      for (const row of summaryVisible) {
         const p22 = row["path"];
         const match2 = p22.match(/\/summaries\/([^/]+)\/([^/]+)\.md$/);
         if (!match2)
@@ -68046,9 +68055,13 @@ var DeeplakeFs = class _DeeplakeFs {
     } else {
       lines.push("Raw session records (dialogue, tool calls). Read for exact detail / quotes.");
       lines.push("");
+      if (sessionTruncated) {
+        lines.push(`_Showing ${INDEX_LIMIT_PER_SECTION} most-recent of many \u2014 older sessions reachable via \`Grep pattern="..." path="~/.deeplake/memory"\`._`);
+        lines.push("");
+      }
       lines.push("| Session | Created | Last Updated | Description |");
       lines.push("|---------|---------|--------------|-------------|");
-      for (const row of sessionRows) {
+      for (const row of sessionVisible) {
         const p22 = row["path"] || "";
         const rel = p22.startsWith("/") ? p22.slice(1) : p22;
         const filename = p22.split("/").pop() ?? p22;

From de9893dc8e30f1a9351dce0c7150a0e41b2b4c8b Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Mon, 27 Apr 2026 20:05:00 +0000
Subject: [PATCH 23/30] =?UTF-8?q?fix(embed-client):=20bump=20first-call=20?=
 =?UTF-8?q?timeout=20200ms=20=E2=86=92=202000ms?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

DEFAULT_CLIENT_TIMEOUT_MS was 200ms, which is comfortably below the
~800ms first-inference cost of the nomic-embed-text-v1.5 pipeline
right after the daemon spawns and the ONNX weights finish loading. As
a result, the first embed call from a freshly-spawned daemon would
abort, EmbedClient.embed() returned null, and the row was inserted
with NULL in the embedding column — silently, without logging a
failure. Subsequent calls eventually succeeded (the daemon stays warm
for 15 minutes), but every cold session lost its first N captures'
embeddings.

2000ms keeps headroom for slow disks / first-load ONNX initialisation
without making genuine hangs (network, daemon crash) wait noticeably
longer in the steady state — an embed against a warm daemon returns
in <50ms, well under either ceiling.
---
 src/embeddings/protocol.ts | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/src/embeddings/protocol.ts b/src/embeddings/protocol.ts
index 9959ced..4aa9f12 100644
--- a/src/embeddings/protocol.ts
+++ b/src/embeddings/protocol.ts
@@ -37,7 +37,11 @@ export const DEFAULT_MODEL_REPO = "nomic-ai/nomic-embed-text-v1.5";
 export const DEFAULT_DTYPE = "q8";
 export const DEFAULT_DIMS = 768;
 export const DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1000;
-export const DEFAULT_CLIENT_TIMEOUT_MS = 200;
+// Generous enough that the first embed after a daemon spawn — when the nomic
+// pipeline is still warming up — does not silently time out. A 200ms cap was
+// short enough that any not-yet-warm daemon returned null and the row landed
+// with NULL in the embedding column.
+export const DEFAULT_CLIENT_TIMEOUT_MS = 2000;
 export const DOC_PREFIX = "search_document: ";
 export const QUERY_PREFIX = "search_query: ";
 

From 973dd34e8412136e8e8c72847315bbceb4d1b638 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Mon, 27 Apr 2026 20:05:16 +0000
Subject: [PATCH 24/30] perf(deeplake-api): fail fast on 500 "already exists"
 instead of retrying
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Deeplake returns HTTP 500 (not 409 Conflict) when ADD COLUMN IF NOT
EXISTS or CREATE INDEX IF NOT EXISTS hit an already-present object —
both are deterministic errors that retrying cannot recover from.
RETRYABLE_CODES already includes 500, so until now every such call
went through the full MAX_RETRIES=3 + exponential backoff cycle:
~500ms + ~1000ms + ~2000ms = ~4s of wasted backoff per call, plus the
three actual round-trips.

SessionStart issues several ALTER ADD COLUMN IF NOT EXISTS calls on
every run (one per embedding column on the memory + sessions tables),
so the cumulative cost was ~8s of dead time at the start of every
session — measurable in the hook-debug.log under the "query retry
N/3 (500)" lines.

Reuse the existing isDuplicateIndexError() helper (which already
matches "already exists" / "duplicate key" / "pg_class_relname_nsp_index")
to short-circuit retries for that specific failure mode. The error
still surfaces to the caller — callers wrap these IF NOT EXISTS calls
in try/catch and treat the duplicate as a no-op — but it surfaces in
~30ms instead of ~4s.
---
 src/deeplake-api.ts | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/src/deeplake-api.ts b/src/deeplake-api.ts
index 2933384..8aabfe6 100644
--- a/src/deeplake-api.ts
+++ b/src/deeplake-api.ts
@@ -176,7 +176,12 @@ export class DeeplakeApi {
       const retryable403 =
         isSessionInsertQuery(sql) &&
         (resp.status === 401 || (resp.status === 403 && (text.length === 0 || isTransientHtml403(text))));
-      if (attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
+      // Deeplake returns HTTP 500 (not 409) when ADD COLUMN IF NOT EXISTS / CREATE
+      // INDEX IF NOT EXISTS hit an already-present object. The error is
+      // deterministic — retrying just burns ~4s of exponential backoff per call,
+      // and SessionStart issues several of these on every run. Fail fast.
+      const alreadyExists = resp.status === 500 && isDuplicateIndexError(text);
+      if (!alreadyExists && attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
         const delay = BASE_DELAY_MS * Math.pow(2, attempt) + Math.random() * 200;
         log(`query retry ${attempt + 1}/${MAX_RETRIES} (${resp.status}) in ${delay.toFixed(0)}ms`);
         await sleep(delay);

From 227af980f02ca6e112ea6af2f851c29a7435cf6a Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Mon, 27 Apr 2026 20:05:28 +0000
Subject: [PATCH 25/30] build: rebuild bundles for embed timeout + deeplake-api
 fail-fast
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Pure rebuild from `npm run build` on top of HEAD~2 (de9893d, 973dd34).
Touched bundles are the ones that pull in src/embeddings/protocol.ts
or src/deeplake-api.ts — capture, session-start (+ setup), pre-tool-use,
wiki-worker, auth-login, and the deeplake-shell — across both
claude-code/bundle/ and codex/bundle/.
---
 claude-code/bundle/capture.js              | 5 +++--
 claude-code/bundle/commands/auth-login.js  | 3 ++-
 claude-code/bundle/pre-tool-use.js         | 5 +++--
 claude-code/bundle/session-start-setup.js  | 5 +++--
 claude-code/bundle/session-start.js        | 3 ++-
 claude-code/bundle/shell/deeplake-shell.js | 5 +++--
 claude-code/bundle/wiki-worker.js          | 2 +-
 codex/bundle/capture.js                    | 3 ++-
 codex/bundle/commands/auth-login.js        | 3 ++-
 codex/bundle/pre-tool-use.js               | 5 +++--
 codex/bundle/session-start-setup.js        | 3 ++-
 codex/bundle/shell/deeplake-shell.js       | 5 +++--
 codex/bundle/stop.js                       | 3 ++-
 codex/bundle/wiki-worker.js                | 2 +-
 14 files changed, 32 insertions(+), 20 deletions(-)

diff --git a/claude-code/bundle/capture.js b/claude-code/bundle/capture.js
index 9d8c739..2ca54df 100755
--- a/claude-code/bundle/capture.js
+++ b/claude-code/bundle/capture.js
@@ -214,7 +214,8 @@ var DeeplakeApi = class {
       }
       const text = await resp.text().catch(() => "");
       const retryable403 = isSessionInsertQuery(sql) && (resp.status === 401 || resp.status === 403 && (text.length === 0 || isTransientHtml403(text)));
-      if (attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
+      const alreadyExists = resp.status === 500 && isDuplicateIndexError(text);
+      if (!alreadyExists && attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
         const delay = BASE_DELAY_MS * Math.pow(2, attempt) + Math.random() * 200;
         log2(`query retry ${attempt + 1}/${MAX_RETRIES} (${resp.status}) in ${delay.toFixed(0)}ms`);
         await sleep(delay);
@@ -673,7 +674,7 @@ import { openSync as openSync2, closeSync as closeSync2, writeSync as writeSync2
 // dist/src/embeddings/protocol.js
 var DEFAULT_SOCKET_DIR = "/tmp";
 var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
-var DEFAULT_CLIENT_TIMEOUT_MS = 200;
+var DEFAULT_CLIENT_TIMEOUT_MS = 2e3;
 function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
   return `${dir}/hivemind-embed-${uid}.sock`;
 }
diff --git a/claude-code/bundle/commands/auth-login.js b/claude-code/bundle/commands/auth-login.js
index 8714067..ac09152 100755
--- a/claude-code/bundle/commands/auth-login.js
+++ b/claude-code/bundle/commands/auth-login.js
@@ -395,7 +395,8 @@ var DeeplakeApi = class {
       }
       const text = await resp.text().catch(() => "");
       const retryable403 = isSessionInsertQuery(sql) && (resp.status === 401 || resp.status === 403 && (text.length === 0 || isTransientHtml403(text)));
-      if (attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
+      const alreadyExists = resp.status === 500 && isDuplicateIndexError(text);
+      if (!alreadyExists && attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
         const delay = BASE_DELAY_MS * Math.pow(2, attempt) + Math.random() * 200;
         log2(`query retry ${attempt + 1}/${MAX_RETRIES} (${resp.status}) in ${delay.toFixed(0)}ms`);
         await sleep(delay);
diff --git a/claude-code/bundle/pre-tool-use.js b/claude-code/bundle/pre-tool-use.js
index 27f6dcb..017dd0d 100755
--- a/claude-code/bundle/pre-tool-use.js
+++ b/claude-code/bundle/pre-tool-use.js
@@ -220,7 +220,8 @@ var DeeplakeApi = class {
       }
       const text = await resp.text().catch(() => "");
       const retryable403 = isSessionInsertQuery(sql) && (resp.status === 401 || resp.status === 403 && (text.length === 0 || isTransientHtml403(text)));
-      if (attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
+      const alreadyExists = resp.status === 500 && isDuplicateIndexError(text);
+      if (!alreadyExists && attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
         const delay = BASE_DELAY_MS * Math.pow(2, attempt) + Math.random() * 200;
         log2(`query retry ${attempt + 1}/${MAX_RETRIES} (${resp.status}) in ${delay.toFixed(0)}ms`);
         await sleep(delay);
@@ -920,7 +921,7 @@ import { openSync, closeSync, writeSync, unlinkSync, existsSync as existsSync3,
 // dist/src/embeddings/protocol.js
 var DEFAULT_SOCKET_DIR = "/tmp";
 var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
-var DEFAULT_CLIENT_TIMEOUT_MS = 200;
+var DEFAULT_CLIENT_TIMEOUT_MS = 2e3;
 function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
   return `${dir}/hivemind-embed-${uid}.sock`;
 }
diff --git a/claude-code/bundle/session-start-setup.js b/claude-code/bundle/session-start-setup.js
index 622ddf7..5a92470 100755
--- a/claude-code/bundle/session-start-setup.js
+++ b/claude-code/bundle/session-start-setup.js
@@ -225,7 +225,8 @@ var DeeplakeApi = class {
       }
       const text = await resp.text().catch(() => "");
       const retryable403 = isSessionInsertQuery(sql) && (resp.status === 401 || resp.status === 403 && (text.length === 0 || isTransientHtml403(text)));
-      if (attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
+      const alreadyExists = resp.status === 500 && isDuplicateIndexError(text);
+      if (!alreadyExists && attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
         const delay = BASE_DELAY_MS * Math.pow(2, attempt) + Math.random() * 200;
         log2(`query retry ${attempt + 1}/${MAX_RETRIES} (${resp.status}) in ${delay.toFixed(0)}ms`);
         await sleep(delay);
@@ -563,7 +564,7 @@ import { openSync, closeSync, writeSync, unlinkSync as unlinkSync2, existsSync a
 // dist/src/embeddings/protocol.js
 var DEFAULT_SOCKET_DIR = "/tmp";
 var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
-var DEFAULT_CLIENT_TIMEOUT_MS = 200;
+var DEFAULT_CLIENT_TIMEOUT_MS = 2e3;
 function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
   return `${dir}/hivemind-embed-${uid}.sock`;
 }
diff --git a/claude-code/bundle/session-start.js b/claude-code/bundle/session-start.js
index e0902d5..0280f58 100755
--- a/claude-code/bundle/session-start.js
+++ b/claude-code/bundle/session-start.js
@@ -225,7 +225,8 @@ var DeeplakeApi = class {
       }
       const text = await resp.text().catch(() => "");
       const retryable403 = isSessionInsertQuery(sql) && (resp.status === 401 || resp.status === 403 && (text.length === 0 || isTransientHtml403(text)));
-      if (attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
+      const alreadyExists = resp.status === 500 && isDuplicateIndexError(text);
+      if (!alreadyExists && attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
         const delay = BASE_DELAY_MS * Math.pow(2, attempt) + Math.random() * 200;
         log2(`query retry ${attempt + 1}/${MAX_RETRIES} (${resp.status}) in ${delay.toFixed(0)}ms`);
         await sleep(delay);
diff --git a/claude-code/bundle/shell/deeplake-shell.js b/claude-code/bundle/shell/deeplake-shell.js
index fa9fcbc..171d01b 100755
--- a/claude-code/bundle/shell/deeplake-shell.js
+++ b/claude-code/bundle/shell/deeplake-shell.js
@@ -66917,7 +66917,8 @@ var DeeplakeApi = class {
       }
       const text = await resp.text().catch(() => "");
       const retryable403 = isSessionInsertQuery(sql) && (resp.status === 401 || resp.status === 403 && (text.length === 0 || isTransientHtml403(text)));
-      if (attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
+      const alreadyExists = resp.status === 500 && isDuplicateIndexError(text);
+      if (!alreadyExists && attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
         const delay = BASE_DELAY_MS * Math.pow(2, attempt) + Math.random() * 200;
         log2(`query retry ${attempt + 1}/${MAX_RETRIES} (${resp.status}) in ${delay.toFixed(0)}ms`);
         await sleep(delay);
@@ -67555,7 +67556,7 @@ import { openSync, closeSync, writeSync, unlinkSync, existsSync as existsSync4,
 // dist/src/embeddings/protocol.js
 var DEFAULT_SOCKET_DIR = "/tmp";
 var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
-var DEFAULT_CLIENT_TIMEOUT_MS = 200;
+var DEFAULT_CLIENT_TIMEOUT_MS = 2e3;
 function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
   return `${dir}/hivemind-embed-${uid}.sock`;
 }
diff --git a/claude-code/bundle/wiki-worker.js b/claude-code/bundle/wiki-worker.js
index 8dee999..6536f3a 100755
--- a/claude-code/bundle/wiki-worker.js
+++ b/claude-code/bundle/wiki-worker.js
@@ -155,7 +155,7 @@ import { openSync as openSync2, closeSync as closeSync2, writeSync as writeSync2
 // dist/src/embeddings/protocol.js
 var DEFAULT_SOCKET_DIR = "/tmp";
 var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
-var DEFAULT_CLIENT_TIMEOUT_MS = 200;
+var DEFAULT_CLIENT_TIMEOUT_MS = 2e3;
 function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
   return `${dir}/hivemind-embed-${uid}.sock`;
 }
diff --git a/codex/bundle/capture.js b/codex/bundle/capture.js
index 911d238..ce3a2f6 100755
--- a/codex/bundle/capture.js
+++ b/codex/bundle/capture.js
@@ -214,7 +214,8 @@ var DeeplakeApi = class {
       }
       const text = await resp.text().catch(() => "");
       const retryable403 = isSessionInsertQuery(sql) && (resp.status === 401 || resp.status === 403 && (text.length === 0 || isTransientHtml403(text)));
-      if (attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
+      const alreadyExists = resp.status === 500 && isDuplicateIndexError(text);
+      if (!alreadyExists && attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
         const delay = BASE_DELAY_MS * Math.pow(2, attempt) + Math.random() * 200;
         log2(`query retry ${attempt + 1}/${MAX_RETRIES} (${resp.status}) in ${delay.toFixed(0)}ms`);
         await sleep(delay);
diff --git a/codex/bundle/commands/auth-login.js b/codex/bundle/commands/auth-login.js
index 8714067..ac09152 100755
--- a/codex/bundle/commands/auth-login.js
+++ b/codex/bundle/commands/auth-login.js
@@ -395,7 +395,8 @@ var DeeplakeApi = class {
       }
       const text = await resp.text().catch(() => "");
       const retryable403 = isSessionInsertQuery(sql) && (resp.status === 401 || resp.status === 403 && (text.length === 0 || isTransientHtml403(text)));
-      if (attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
+      const alreadyExists = resp.status === 500 && isDuplicateIndexError(text);
+      if (!alreadyExists && attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
         const delay = BASE_DELAY_MS * Math.pow(2, attempt) + Math.random() * 200;
         log2(`query retry ${attempt + 1}/${MAX_RETRIES} (${resp.status}) in ${delay.toFixed(0)}ms`);
         await sleep(delay);
diff --git a/codex/bundle/pre-tool-use.js b/codex/bundle/pre-tool-use.js
index a0adb46..81f040f 100755
--- a/codex/bundle/pre-tool-use.js
+++ b/codex/bundle/pre-tool-use.js
@@ -220,7 +220,8 @@ var DeeplakeApi = class {
       }
       const text = await resp.text().catch(() => "");
       const retryable403 = isSessionInsertQuery(sql) && (resp.status === 401 || resp.status === 403 && (text.length === 0 || isTransientHtml403(text)));
-      if (attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
+      const alreadyExists = resp.status === 500 && isDuplicateIndexError(text);
+      if (!alreadyExists && attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
         const delay = BASE_DELAY_MS * Math.pow(2, attempt) + Math.random() * 200;
         log2(`query retry ${attempt + 1}/${MAX_RETRIES} (${resp.status}) in ${delay.toFixed(0)}ms`);
         await sleep(delay);
@@ -906,7 +907,7 @@ import { openSync, closeSync, writeSync, unlinkSync, existsSync as existsSync3,
 // dist/src/embeddings/protocol.js
 var DEFAULT_SOCKET_DIR = "/tmp";
 var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
-var DEFAULT_CLIENT_TIMEOUT_MS = 200;
+var DEFAULT_CLIENT_TIMEOUT_MS = 2e3;
 function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
   return `${dir}/hivemind-embed-${uid}.sock`;
 }
diff --git a/codex/bundle/session-start-setup.js b/codex/bundle/session-start-setup.js
index c854fcc..301e948 100755
--- a/codex/bundle/session-start-setup.js
+++ b/codex/bundle/session-start-setup.js
@@ -225,7 +225,8 @@ var DeeplakeApi = class {
       }
       const text = await resp.text().catch(() => "");
       const retryable403 = isSessionInsertQuery(sql) && (resp.status === 401 || resp.status === 403 && (text.length === 0 || isTransientHtml403(text)));
-      if (attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
+      const alreadyExists = resp.status === 500 && isDuplicateIndexError(text);
+      if (!alreadyExists && attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
         const delay = BASE_DELAY_MS * Math.pow(2, attempt) + Math.random() * 200;
         log2(`query retry ${attempt + 1}/${MAX_RETRIES} (${resp.status}) in ${delay.toFixed(0)}ms`);
         await sleep(delay);
diff --git a/codex/bundle/shell/deeplake-shell.js b/codex/bundle/shell/deeplake-shell.js
index fa9fcbc..171d01b 100755
--- a/codex/bundle/shell/deeplake-shell.js
+++ b/codex/bundle/shell/deeplake-shell.js
@@ -66917,7 +66917,8 @@ var DeeplakeApi = class {
       }
       const text = await resp.text().catch(() => "");
       const retryable403 = isSessionInsertQuery(sql) && (resp.status === 401 || resp.status === 403 && (text.length === 0 || isTransientHtml403(text)));
-      if (attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
+      const alreadyExists = resp.status === 500 && isDuplicateIndexError(text);
+      if (!alreadyExists && attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
         const delay = BASE_DELAY_MS * Math.pow(2, attempt) + Math.random() * 200;
         log2(`query retry ${attempt + 1}/${MAX_RETRIES} (${resp.status}) in ${delay.toFixed(0)}ms`);
         await sleep(delay);
@@ -67555,7 +67556,7 @@ import { openSync, closeSync, writeSync, unlinkSync, existsSync as existsSync4,
 // dist/src/embeddings/protocol.js
 var DEFAULT_SOCKET_DIR = "/tmp";
 var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
-var DEFAULT_CLIENT_TIMEOUT_MS = 200;
+var DEFAULT_CLIENT_TIMEOUT_MS = 2e3;
 function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
   return `${dir}/hivemind-embed-${uid}.sock`;
 }
diff --git a/codex/bundle/stop.js b/codex/bundle/stop.js
index 7c86181..7b96903 100755
--- a/codex/bundle/stop.js
+++ b/codex/bundle/stop.js
@@ -217,7 +217,8 @@ var DeeplakeApi = class {
       }
       const text = await resp.text().catch(() => "");
       const retryable403 = isSessionInsertQuery(sql) && (resp.status === 401 || resp.status === 403 && (text.length === 0 || isTransientHtml403(text)));
-      if (attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
+      const alreadyExists = resp.status === 500 && isDuplicateIndexError(text);
+      if (!alreadyExists && attempt < MAX_RETRIES && (RETRYABLE_CODES.has(resp.status) || retryable403)) {
         const delay = BASE_DELAY_MS * Math.pow(2, attempt) + Math.random() * 200;
         log2(`query retry ${attempt + 1}/${MAX_RETRIES} (${resp.status}) in ${delay.toFixed(0)}ms`);
         await sleep(delay);
diff --git a/codex/bundle/wiki-worker.js b/codex/bundle/wiki-worker.js
index 5fffb2e..a1e7e00 100755
--- a/codex/bundle/wiki-worker.js
+++ b/codex/bundle/wiki-worker.js
@@ -154,7 +154,7 @@ import { openSync as openSync2, closeSync as closeSync2, writeSync as writeSync2
 // dist/src/embeddings/protocol.js
 var DEFAULT_SOCKET_DIR = "/tmp";
 var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
-var DEFAULT_CLIENT_TIMEOUT_MS = 200;
+var DEFAULT_CLIENT_TIMEOUT_MS = 2e3;
 function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
   return `${dir}/hivemind-embed-${uid}.sock`;
 }

From 6b77d6d1bd1040506d725bbeb2cd4b62c34c173a Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Mon, 27 Apr 2026 21:32:01 +0000
Subject: [PATCH 26/30] feat(embeddings): degrade to lexical-only when
 transformers is missing
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The plugin's embed daemon dynamically imports `@huggingface/transformers`
at runtime. The package can't be bundled (it depends on
`onnxruntime-node`, which has platform-specific native binaries that
esbuild can't inline), and Claude Code's marketplace install does not
run `npm install` on plugins — so a fresh install has nothing to
resolve. The daemon then crashed on the dynamic import, the embed
client returned `null`, and rows landed with `NULL` in the embedding
column without any user-facing signal.

Detect at runtime whether `@huggingface/transformers` is resolvable from
this bundle's location (same `node_modules` walk Node would do for the
spawned daemon) and, when it isn't, treat embeddings as if
`HIVEMIND_EMBEDDINGS=false`. This:

- skips the SessionStart daemon warmup (no failed-spawn log);
- makes capture / wiki-worker write rows with `NULL` in the embedding
  column instead of crashing the daemon (existing graceful path);
- short-circuits the semantic branch in grep so `Grep` falls back to
  pure BM25 / ILIKE on text columns.

The result is exposed as a three-state `EmbeddingsStatus` (`enabled` /
`env-disabled` / `no-transformers`) so the hook log can surface the
actual reason once at session start.

Also documents the optional install step in the README and the
lexical-only fallback behaviour, plus introduces the
`HIVEMIND_EMBEDDINGS=false` opt-out into the env-var table.

Tests cover both branches:
- env-disabled wins regardless of resolver state, and any non-"false"
  truthy env value is intentionally a no-op (avoid surprise kills).
- resolver throws (MODULE_NOT_FOUND or any other error) → "no-transformers".
- resolver succeeds → "enabled".
- the result is cached for the process lifetime; the resolver is
  invoked at most once even across many `embeddingsStatus()` calls.
- the real resolver is exercised by a smoke test that runs against the
  dev / CI environment (where the package IS installed via npm install)
  and asserts "enabled".
---
 README.md                                    |  34 +++++
 claude-code/tests/embeddings-disable.test.ts | 124 ++++++++++++++++---
 src/embeddings/disable.ts                    |  80 +++++++++---
 3 files changed, 210 insertions(+), 28 deletions(-)

diff --git a/README.md b/README.md
index 1e47b2e..039e638 100644
--- a/README.md
+++ b/README.md
@@ -244,8 +244,42 @@ This plugin captures session activity and stores it in your Deeplake workspace:
 | `HIVEMIND_SESSIONS_TABLE` | `sessions`                | SQL table for per-event session capture    |
 | `HIVEMIND_MEMORY_PATH`    | `~/.deeplake/memory`      | Path that triggers interception            |
 | `HIVEMIND_CAPTURE`        | `true`                    | Set to `false` to disable capture          |
+| `HIVEMIND_EMBEDDINGS`     | `true`                    | Set to `false` to force lexical-only mode  |
 | `HIVEMIND_DEBUG`          | —                         | Set to `1` for verbose hook debug logs     |
 
+## Optional: enable semantic search (embeddings)
+
+Hivemind can run a local embedding daemon (nomic-embed-text-v1.5, ~130 MB)
+so that `Grep` over `~/.deeplake/memory/` uses hybrid semantic + lexical
+ranking instead of pure BM25. This is **off by default** — the daemon
+depends on `@huggingface/transformers`, which has native bindings that
+can't be bundled into the plugin and is therefore not shipped with the
+marketplace install.
+
+To enable:
+
+```bash
+# Install the dependency inside the plugin's cache directory.
+cd ~/.claude/plugins/cache/hivemind/hivemind/<version>
+npm install @huggingface/transformers@^3.0.0
+```
+
+Restart Claude Code afterwards. From the next session, captured messages
+and AI-generated summaries will include a 768-dim embedding, and
+semantic recall queries will route through the local daemon (the model
+is downloaded on first use and cached in `~/.cache/huggingface/`).
+
+If `@huggingface/transformers` is **not** present (or `npm` is unavailable
+on your system), Hivemind silently degrades to lexical-only mode:
+
+- ✅ Capture continues; rows still land in Deeplake.
+- ✅ `Grep` still works via BM25 / `ILIKE` matching on text columns.
+- ⚪ The `message_embedding` / `summary_embedding` columns stay `NULL`.
+- ⚪ The hook log notes `embeddings: no-transformers` once at session start.
+
+You can also force lexical-only mode explicitly with
+`HIVEMIND_EMBEDDINGS=false` (useful for CI or air-gapped environments).
+
 ## Architecture
 
 ### Hook lifecycle (Claude Code)
diff --git a/claude-code/tests/embeddings-disable.test.ts b/claude-code/tests/embeddings-disable.test.ts
index 9a8d527..fb17d31 100644
--- a/claude-code/tests/embeddings-disable.test.ts
+++ b/claude-code/tests/embeddings-disable.test.ts
@@ -1,38 +1,134 @@
 import { describe, it, expect, beforeEach, afterEach } from "vitest";
-import { embeddingsDisabled } from "../../src/embeddings/disable.js";
+import {
+  embeddingsDisabled,
+  embeddingsStatus,
+  _setResolveForTesting,
+  _resetForTesting,
+} from "../../src/embeddings/disable.js";
 
-describe("embeddingsDisabled()", () => {
-  const original = process.env.HIVEMIND_EMBEDDINGS;
+const originalEnv = process.env.HIVEMIND_EMBEDDINGS;
 
+function restoreEnv(): void {
+  if (originalEnv === undefined) delete process.env.HIVEMIND_EMBEDDINGS;
+  else process.env.HIVEMIND_EMBEDDINGS = originalEnv;
+}
+
+describe("embeddingsStatus / embeddingsDisabled — env branch", () => {
   beforeEach(() => {
     delete process.env.HIVEMIND_EMBEDDINGS;
+    _resetForTesting();
   });
 
   afterEach(() => {
-    if (original === undefined) delete process.env.HIVEMIND_EMBEDDINGS;
-    else process.env.HIVEMIND_EMBEDDINGS = original;
+    restoreEnv();
+    _resetForTesting();
   });
 
-  it("returns false when the env var is unset (default behaviour)", () => {
+  it("is 'enabled' when env is unset and the package resolves", () => {
+    _setResolveForTesting(() => { /* no throw → installed */ });
+    expect(embeddingsStatus()).toBe("enabled");
     expect(embeddingsDisabled()).toBe(false);
   });
 
-  it("returns true only when explicitly set to the string 'false'", () => {
+  it("is 'env-disabled' when HIVEMIND_EMBEDDINGS is exactly 'false'", () => {
     process.env.HIVEMIND_EMBEDDINGS = "false";
+    // Resolver should never be consulted — set it to throw so this fails
+    // loudly if the env-check is ever removed.
+    _setResolveForTesting(() => { throw new Error("must not be called"); });
+    expect(embeddingsStatus()).toBe("env-disabled");
     expect(embeddingsDisabled()).toBe(true);
   });
 
-  it("stays off for any non-'false' truthy value (intentional: avoid surprise kills)", () => {
-    process.env.HIVEMIND_EMBEDDINGS = "0";
-    expect(embeddingsDisabled()).toBe(false);
+  it("env-disabled wins over a missing package (single, definitive signal)", () => {
+    process.env.HIVEMIND_EMBEDDINGS = "false";
+    _setResolveForTesting(() => { throw new Error("MODULE_NOT_FOUND"); });
+    expect(embeddingsStatus()).toBe("env-disabled");
+    expect(embeddingsDisabled()).toBe(true);
+  });
 
-    process.env.HIVEMIND_EMBEDDINGS = "no";
-    expect(embeddingsDisabled()).toBe(false);
+  it("stays 'enabled' for any non-'false' truthy env value (avoid surprise kills)", () => {
+    for (const value of ["0", "no", "true", "", "FALSE", "False"]) {
+      process.env.HIVEMIND_EMBEDDINGS = value;
+      _resetForTesting();
+      _setResolveForTesting(() => { /* installed */ });
+      expect(embeddingsStatus()).toBe("enabled");
+      expect(embeddingsDisabled()).toBe(false);
+    }
+  });
+});
+
+describe("embeddingsStatus / embeddingsDisabled — transformers-presence branch", () => {
+  beforeEach(() => {
+    delete process.env.HIVEMIND_EMBEDDINGS;
+    _resetForTesting();
+  });
+
+  afterEach(() => {
+    restoreEnv();
+    _resetForTesting();
+  });
 
-    process.env.HIVEMIND_EMBEDDINGS = "true";
+  it("is 'enabled' when @huggingface/transformers resolves cleanly", () => {
+    _setResolveForTesting(() => { /* resolution OK */ });
+    expect(embeddingsStatus()).toBe("enabled");
     expect(embeddingsDisabled()).toBe(false);
+  });
+
+  it("is 'no-transformers' on MODULE_NOT_FOUND from the resolver", () => {
+    _setResolveForTesting(() => {
+      const err = new Error("Cannot find module '@huggingface/transformers'") as NodeJS.ErrnoException;
+      err.code = "MODULE_NOT_FOUND";
+      throw err;
+    });
+    expect(embeddingsStatus()).toBe("no-transformers");
+    expect(embeddingsDisabled()).toBe(true);
+  });
+
+  it("is 'no-transformers' on any other resolver throw (defensive: never crash)", () => {
+    _setResolveForTesting(() => { throw new Error("permission denied"); });
+    expect(embeddingsStatus()).toBe("no-transformers");
+    expect(embeddingsDisabled()).toBe(true);
+  });
 
-    process.env.HIVEMIND_EMBEDDINGS = "";
+  it("does not re-resolve on every call — first result is cached for the process", () => {
+    let calls = 0;
+    _setResolveForTesting(() => {
+      calls += 1;
+      if (calls > 1) throw new Error("resolver should be called at most once");
+    });
+    expect(embeddingsStatus()).toBe("enabled");
+    expect(embeddingsStatus()).toBe("enabled");
     expect(embeddingsDisabled()).toBe(false);
+    expect(calls).toBe(1);
+  });
+
+  it("caches the disabled result too (a missing package doesn't probe again)", () => {
+    let calls = 0;
+    _setResolveForTesting(() => {
+      calls += 1;
+      throw new Error("MODULE_NOT_FOUND");
+    });
+    expect(embeddingsStatus()).toBe("no-transformers");
+    expect(embeddingsStatus()).toBe("no-transformers");
+    expect(embeddingsDisabled()).toBe(true);
+    expect(calls).toBe(1);
+  });
+
+  it("_resetForTesting clears the cache and restores the real resolver", () => {
+    _setResolveForTesting(() => { throw new Error("simulated missing"); });
+    expect(embeddingsStatus()).toBe("no-transformers");
+    _resetForTesting();
+    // Real resolver runs against this test process, which has the package
+    // installed via the worktree's node_modules → comes back 'enabled'.
+    expect(embeddingsStatus()).toBe("enabled");
+  });
+
+  it("real default resolver finds @huggingface/transformers in this repo", () => {
+    // Smoke check: in the dev / CI environment the package IS installed,
+    // so the actual createRequire-based resolver succeeds. Guards against
+    // a regression in the resolution path itself (wrong base URL, wrong
+    // package name spelling, build-time vs runtime path drift, etc.).
+    _resetForTesting();
+    expect(embeddingsStatus()).toBe("enabled");
   });
 });
diff --git a/src/embeddings/disable.ts b/src/embeddings/disable.ts
index 8c0db83..e832bd4 100644
--- a/src/embeddings/disable.ts
+++ b/src/embeddings/disable.ts
@@ -1,22 +1,74 @@
+import { createRequire } from "node:module";
+
 /**
  * Master opt-out for the embedding feature.
  *
- * `HIVEMIND_EMBEDDINGS=false` short-circuits every call site that would
- * otherwise talk to the nomic daemon: the SessionStart warmup, the
- * capture-side write embed, the batched flush embed in DeeplakeFs, and
- * both grep query-time embed paths (direct + interceptor). The SQL
- * schema still has the embedding columns and existing rows' embeddings
- * remain readable, but no new embedding is computed and no daemon is
- * spawned.
+ * Embeddings are off when EITHER:
  *
- * Intended for: air-gapped / no-network installs, CI / benchmarks that
- * want pure-lexical retrieval, and users who want the plugin's capture
- * + grep without paying the ~110 MB nomic download.
+ * 1. `HIVEMIND_EMBEDDINGS=false` is set — explicit opt-out for air-gapped /
+ *    no-network installs, CI / benchmarks that want pure-lexical retrieval,
+ *    and users who don't want the ~110 MB nomic download.
  *
- * Read-once: honours mutations during the process lifetime; the hooks
- * are short-lived subprocesses so a live toggle via `export` takes
- * effect on the next session.
+ * 2. `@huggingface/transformers` is not resolvable from this bundle — the
+ *    plugin ships without it (it has native deps that can't be bundled into
+ *    the daemon). A fresh marketplace install lacks it; the README documents
+ *    the optional `npm install @huggingface/transformers` step. When absent,
+ *    we degrade silently to lexical-only mode rather than spawning a daemon
+ *    that will crash on `import("@huggingface/transformers")` and emit
+ *    confusing logs.
+ *
+ * In either case: SessionStart skips the warmup, capture / wiki-worker write
+ * rows with NULL in the embedding column, and `Grep` falls back to BM25 /
+ * ILIKE matching on text columns. Existing rows' embeddings remain readable.
+ *
+ * Read-once: cached for the lifetime of the (short-lived) hook process so a
+ * live `export HIVEMIND_EMBEDDINGS=...` takes effect on the next session.
  */
+
+export type EmbeddingsStatus = "enabled" | "env-disabled" | "no-transformers";
+
+let cachedStatus: EmbeddingsStatus | null = null;
+
+function defaultResolveTransformers(): void {
+  // Resolve from this module's location — the same node_modules walk Node
+  // would do for the spawned daemon, since the daemon lives in the same
+  // bundle dir tree.
+  createRequire(import.meta.url).resolve("@huggingface/transformers");
+}
+
+let _resolve: () => void = defaultResolveTransformers;
+
+function detectStatus(): EmbeddingsStatus {
+  if (process.env.HIVEMIND_EMBEDDINGS === "false") return "env-disabled";
+  try {
+    _resolve();
+    return "enabled";
+  } catch {
+    return "no-transformers";
+  }
+}
+
+export function embeddingsStatus(): EmbeddingsStatus {
+  if (cachedStatus !== null) return cachedStatus;
+  cachedStatus = detectStatus();
+  return cachedStatus;
+}
+
 export function embeddingsDisabled(): boolean {
-  return process.env.HIVEMIND_EMBEDDINGS === "false";
+  return embeddingsStatus() !== "enabled";
+}
+
+// ── Test helpers ────────────────────────────────────────────────────────────
+// Exposed so unit tests can simulate "transformers not installed" without
+// actually uninstalling the package. Underscore-prefixed and intentionally
+// not re-exported from any public entry point — runtime never calls these.
+
+export function _setResolveForTesting(fn: () => void): void {
+  _resolve = fn;
+  cachedStatus = null;
+}
+
+export function _resetForTesting(): void {
+  _resolve = defaultResolveTransformers;
+  cachedStatus = null;
 }

From a9c8ffd0ab2fda82b0a1632404740880d5ab8392 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Mon, 27 Apr 2026 21:32:15 +0000
Subject: [PATCH 27/30] build: rebuild bundles for embeddings detection

Pure rebuild from `npm run build` after the disable.ts change in
6b77d6d. Touched bundles are the ones that pull in
`src/embeddings/disable.ts`: capture, session-start-setup, pre-tool-use,
wiki-worker (claude-code) and pre-tool-use, wiki-worker, deeplake-shell
(codex side), plus the shell bundle.
---
 claude-code/bundle/capture.js              | 24 ++++++++++++++++++-
 claude-code/bundle/pre-tool-use.js         | 24 ++++++++++++++++++-
 claude-code/bundle/session-start-setup.js  | 24 ++++++++++++++++++-
 claude-code/bundle/shell/deeplake-shell.js | 28 +++++++++++++++++++---
 claude-code/bundle/wiki-worker.js          | 24 ++++++++++++++++++-
 codex/bundle/pre-tool-use.js               | 24 ++++++++++++++++++-
 codex/bundle/shell/deeplake-shell.js       | 28 +++++++++++++++++++---
 codex/bundle/wiki-worker.js                | 24 ++++++++++++++++++-
 8 files changed, 188 insertions(+), 12 deletions(-)

diff --git a/claude-code/bundle/capture.js b/claude-code/bundle/capture.js
index 2ca54df..a3df769 100755
--- a/claude-code/bundle/capture.js
+++ b/claude-code/bundle/capture.js
@@ -901,8 +901,30 @@ function embeddingSqlLiteral(vec) {
 }
 
 // dist/src/embeddings/disable.js
+import { createRequire } from "node:module";
+var cachedStatus = null;
+function defaultResolveTransformers() {
+  createRequire(import.meta.url).resolve("@huggingface/transformers");
+}
+var _resolve = defaultResolveTransformers;
+function detectStatus() {
+  if (process.env.HIVEMIND_EMBEDDINGS === "false")
+    return "env-disabled";
+  try {
+    _resolve();
+    return "enabled";
+  } catch {
+    return "no-transformers";
+  }
+}
+function embeddingsStatus() {
+  if (cachedStatus !== null)
+    return cachedStatus;
+  cachedStatus = detectStatus();
+  return cachedStatus;
+}
 function embeddingsDisabled() {
-  return process.env.HIVEMIND_EMBEDDINGS === "false";
+  return embeddingsStatus() !== "enabled";
 }
 
 // dist/src/hooks/capture.js
diff --git a/claude-code/bundle/pre-tool-use.js b/claude-code/bundle/pre-tool-use.js
index 017dd0d..e94800d 100755
--- a/claude-code/bundle/pre-tool-use.js
+++ b/claude-code/bundle/pre-tool-use.js
@@ -1135,8 +1135,30 @@ function sleep2(ms) {
 }
 
 // dist/src/embeddings/disable.js
+import { createRequire } from "node:module";
+var cachedStatus = null;
+function defaultResolveTransformers() {
+  createRequire(import.meta.url).resolve("@huggingface/transformers");
+}
+var _resolve = defaultResolveTransformers;
+function detectStatus() {
+  if (process.env.HIVEMIND_EMBEDDINGS === "false")
+    return "env-disabled";
+  try {
+    _resolve();
+    return "enabled";
+  } catch {
+    return "no-transformers";
+  }
+}
+function embeddingsStatus() {
+  if (cachedStatus !== null)
+    return cachedStatus;
+  cachedStatus = detectStatus();
+  return cachedStatus;
+}
 function embeddingsDisabled() {
-  return process.env.HIVEMIND_EMBEDDINGS === "false";
+  return embeddingsStatus() !== "enabled";
 }
 
 // dist/src/hooks/grep-direct.js
diff --git a/claude-code/bundle/session-start-setup.js b/claude-code/bundle/session-start-setup.js
index 5a92470..1730202 100755
--- a/claude-code/bundle/session-start-setup.js
+++ b/claude-code/bundle/session-start-setup.js
@@ -778,8 +778,30 @@ function sleep2(ms) {
 }
 
 // dist/src/embeddings/disable.js
+import { createRequire } from "node:module";
+var cachedStatus = null;
+function defaultResolveTransformers() {
+  createRequire(import.meta.url).resolve("@huggingface/transformers");
+}
+var _resolve = defaultResolveTransformers;
+function detectStatus() {
+  if (process.env.HIVEMIND_EMBEDDINGS === "false")
+    return "env-disabled";
+  try {
+    _resolve();
+    return "enabled";
+  } catch {
+    return "no-transformers";
+  }
+}
+function embeddingsStatus() {
+  if (cachedStatus !== null)
+    return cachedStatus;
+  cachedStatus = detectStatus();
+  return cachedStatus;
+}
 function embeddingsDisabled() {
-  return process.env.HIVEMIND_EMBEDDINGS === "false";
+  return embeddingsStatus() !== "enabled";
 }
 
 // dist/src/hooks/session-start-setup.js
diff --git a/claude-code/bundle/shell/deeplake-shell.js b/claude-code/bundle/shell/deeplake-shell.js
index 171d01b..d1e438c 100755
--- a/claude-code/bundle/shell/deeplake-shell.js
+++ b/claude-code/bundle/shell/deeplake-shell.js
@@ -67783,8 +67783,30 @@ function embeddingSqlLiteral(vec) {
 }
 
 // dist/src/embeddings/disable.js
+import { createRequire } from "node:module";
+var cachedStatus = null;
+function defaultResolveTransformers() {
+  createRequire(import.meta.url).resolve("@huggingface/transformers");
+}
+var _resolve = defaultResolveTransformers;
+function detectStatus() {
+  if (process.env.HIVEMIND_EMBEDDINGS === "false")
+    return "env-disabled";
+  try {
+    _resolve();
+    return "enabled";
+  } catch {
+    return "no-transformers";
+  }
+}
+function embeddingsStatus() {
+  if (cachedStatus !== null)
+    return cachedStatus;
+  cachedStatus = detectStatus();
+  return cachedStatus;
+}
 function embeddingsDisabled() {
-  return process.env.HIVEMIND_EMBEDDINGS === "false";
+  return embeddingsStatus() !== "enabled";
 }
 
 // dist/src/shell/deeplake-fs.js
@@ -69382,7 +69404,7 @@ function stripQuotes(val) {
 
 // node_modules/yargs-parser/build/lib/index.js
 import { readFileSync as readFileSync4 } from "fs";
-import { createRequire } from "node:module";
+import { createRequire as createRequire2 } from "node:module";
 var _a3;
 var _b;
 var _c;
@@ -69395,7 +69417,7 @@ if (nodeVersion) {
   }
 }
 var env = process ? process.env : {};
-var require2 = createRequire ? createRequire(import.meta.url) : void 0;
+var require2 = createRequire2 ? createRequire2(import.meta.url) : void 0;
 var parser = new YargsParser({
   cwd: process.cwd,
   env: () => {
diff --git a/claude-code/bundle/wiki-worker.js b/claude-code/bundle/wiki-worker.js
index 6536f3a..a5a311f 100755
--- a/claude-code/bundle/wiki-worker.js
+++ b/claude-code/bundle/wiki-worker.js
@@ -369,8 +369,30 @@ function sleep(ms) {
 }
 
 // dist/src/embeddings/disable.js
+import { createRequire } from "node:module";
+var cachedStatus = null;
+function defaultResolveTransformers() {
+  createRequire(import.meta.url).resolve("@huggingface/transformers");
+}
+var _resolve = defaultResolveTransformers;
+function detectStatus() {
+  if (process.env.HIVEMIND_EMBEDDINGS === "false")
+    return "env-disabled";
+  try {
+    _resolve();
+    return "enabled";
+  } catch {
+    return "no-transformers";
+  }
+}
+function embeddingsStatus() {
+  if (cachedStatus !== null)
+    return cachedStatus;
+  cachedStatus = detectStatus();
+  return cachedStatus;
+}
 function embeddingsDisabled() {
-  return process.env.HIVEMIND_EMBEDDINGS === "false";
+  return embeddingsStatus() !== "enabled";
 }
 
 // dist/src/hooks/wiki-worker.js
diff --git a/codex/bundle/pre-tool-use.js b/codex/bundle/pre-tool-use.js
index 81f040f..42d020c 100755
--- a/codex/bundle/pre-tool-use.js
+++ b/codex/bundle/pre-tool-use.js
@@ -1121,8 +1121,30 @@ function sleep2(ms) {
 }
 
 // dist/src/embeddings/disable.js
+import { createRequire } from "node:module";
+var cachedStatus = null;
+function defaultResolveTransformers() {
+  createRequire(import.meta.url).resolve("@huggingface/transformers");
+}
+var _resolve = defaultResolveTransformers;
+function detectStatus() {
+  if (process.env.HIVEMIND_EMBEDDINGS === "false")
+    return "env-disabled";
+  try {
+    _resolve();
+    return "enabled";
+  } catch {
+    return "no-transformers";
+  }
+}
+function embeddingsStatus() {
+  if (cachedStatus !== null)
+    return cachedStatus;
+  cachedStatus = detectStatus();
+  return cachedStatus;
+}
 function embeddingsDisabled() {
-  return process.env.HIVEMIND_EMBEDDINGS === "false";
+  return embeddingsStatus() !== "enabled";
 }
 
 // dist/src/hooks/grep-direct.js
diff --git a/codex/bundle/shell/deeplake-shell.js b/codex/bundle/shell/deeplake-shell.js
index 171d01b..d1e438c 100755
--- a/codex/bundle/shell/deeplake-shell.js
+++ b/codex/bundle/shell/deeplake-shell.js
@@ -67783,8 +67783,30 @@ function embeddingSqlLiteral(vec) {
 }
 
 // dist/src/embeddings/disable.js
+import { createRequire } from "node:module";
+var cachedStatus = null;
+function defaultResolveTransformers() {
+  createRequire(import.meta.url).resolve("@huggingface/transformers");
+}
+var _resolve = defaultResolveTransformers;
+function detectStatus() {
+  if (process.env.HIVEMIND_EMBEDDINGS === "false")
+    return "env-disabled";
+  try {
+    _resolve();
+    return "enabled";
+  } catch {
+    return "no-transformers";
+  }
+}
+function embeddingsStatus() {
+  if (cachedStatus !== null)
+    return cachedStatus;
+  cachedStatus = detectStatus();
+  return cachedStatus;
+}
 function embeddingsDisabled() {
-  return process.env.HIVEMIND_EMBEDDINGS === "false";
+  return embeddingsStatus() !== "enabled";
 }
 
 // dist/src/shell/deeplake-fs.js
@@ -69382,7 +69404,7 @@ function stripQuotes(val) {
 
 // node_modules/yargs-parser/build/lib/index.js
 import { readFileSync as readFileSync4 } from "fs";
-import { createRequire } from "node:module";
+import { createRequire as createRequire2 } from "node:module";
 var _a3;
 var _b;
 var _c;
@@ -69395,7 +69417,7 @@ if (nodeVersion) {
   }
 }
 var env = process ? process.env : {};
-var require2 = createRequire ? createRequire(import.meta.url) : void 0;
+var require2 = createRequire2 ? createRequire2(import.meta.url) : void 0;
 var parser = new YargsParser({
   cwd: process.cwd,
   env: () => {
diff --git a/codex/bundle/wiki-worker.js b/codex/bundle/wiki-worker.js
index a1e7e00..ff6de72 100755
--- a/codex/bundle/wiki-worker.js
+++ b/codex/bundle/wiki-worker.js
@@ -368,8 +368,30 @@ function sleep(ms) {
 }
 
 // dist/src/embeddings/disable.js
+import { createRequire } from "node:module";
+var cachedStatus = null;
+function defaultResolveTransformers() {
+  createRequire(import.meta.url).resolve("@huggingface/transformers");
+}
+var _resolve = defaultResolveTransformers;
+function detectStatus() {
+  if (process.env.HIVEMIND_EMBEDDINGS === "false")
+    return "env-disabled";
+  try {
+    _resolve();
+    return "enabled";
+  } catch {
+    return "no-transformers";
+  }
+}
+function embeddingsStatus() {
+  if (cachedStatus !== null)
+    return cachedStatus;
+  cachedStatus = detectStatus();
+  return cachedStatus;
+}
 function embeddingsDisabled() {
-  return process.env.HIVEMIND_EMBEDDINGS === "false";
+  return embeddingsStatus() !== "enabled";
 }
 
 // dist/src/hooks/codex/wiki-worker.js

From 0aef2df7583a70b887bb4b362b913055e611c02c Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Mon, 27 Apr 2026 21:42:29 +0000
Subject: [PATCH 28/30] refactor(session-start): log specific reason embeddings
 are off
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The warmup-skipped log line previously said "skipped via
HIVEMIND_EMBEDDINGS=false" regardless of the actual cause. With
embeddingsDisabled() now also returning true when
@huggingface/transformers is not installed, this message was misleading
on fresh marketplace installs (the user sees "HIVEMIND_EMBEDDINGS=false"
in the log, but they never set that flag).

Branch on embeddingsStatus() and emit the precise reason — pointing
to the README install step in the no-transformers case so users have a
clear next step. The HIVEMIND_EMBED_WARMUP=false message is unchanged.

End-to-end check (bundle copied to /tmp where node_modules is not
reachable, real session-start-setup hook fed synthetic stdin):

  [session-setup] setup complete
  [session-setup] embed daemon warmup skipped:
    @huggingface/transformers not installed
    (see README to enable embeddings)

Test asserting the env-disabled log message is updated to match the
new wording.
---
 claude-code/bundle/session-start-setup.js          | 4 +++-
 claude-code/tests/session-start-setup-hook.test.ts | 2 +-
 src/hooks/session-start-setup.ts                   | 8 ++++++--
 3 files changed, 10 insertions(+), 4 deletions(-)

diff --git a/claude-code/bundle/session-start-setup.js b/claude-code/bundle/session-start-setup.js
index 1730202..fa4f717 100755
--- a/claude-code/bundle/session-start-setup.js
+++ b/claude-code/bundle/session-start-setup.js
@@ -878,7 +878,9 @@ async function main() {
     log4(`version check failed: ${e.message}`);
   }
   if (embeddingsDisabled()) {
-    log4("embed daemon warmup skipped via HIVEMIND_EMBEDDINGS=false");
+    const status = embeddingsStatus();
+    const reason = status === "no-transformers" ? "@huggingface/transformers not installed (see README to enable embeddings)" : "HIVEMIND_EMBEDDINGS=false";
+    log4(`embed daemon warmup skipped: ${reason}`);
   } else if (process.env.HIVEMIND_EMBED_WARMUP !== "false") {
     try {
       const daemonEntry = join8(__bundleDir, "embeddings", "embed-daemon.js");
diff --git a/claude-code/tests/session-start-setup-hook.test.ts b/claude-code/tests/session-start-setup-hook.test.ts
index 9a4484d..48944b2 100644
--- a/claude-code/tests/session-start-setup-hook.test.ts
+++ b/claude-code/tests/session-start-setup-hook.test.ts
@@ -257,7 +257,7 @@ describe("session-start-setup hook — embed daemon warmup", () => {
     await runHook({ HIVEMIND_EMBEDDINGS: "false" });
     expect(embedWarmupMock).not.toHaveBeenCalled();
     expect(debugLogMock).toHaveBeenCalledWith(
-      "embed daemon warmup skipped via HIVEMIND_EMBEDDINGS=false",
+      "embed daemon warmup skipped: HIVEMIND_EMBEDDINGS=false",
     );
   });
 });
diff --git a/src/hooks/session-start-setup.ts b/src/hooks/session-start-setup.ts
index 6c62d9a..1667549 100644
--- a/src/hooks/session-start-setup.ts
+++ b/src/hooks/session-start-setup.ts
@@ -19,7 +19,7 @@ import { getInstalledVersion, getLatestVersion, isNewer } from "../utils/version
 import { makeWikiLogger } from "../utils/wiki-log.js";
 import { resolveVersionedPluginDir, snapshotPluginDir, restoreOrCleanup } from "../utils/plugin-cache.js";
 import { EmbedClient } from "../embeddings/client.js";
-import { embeddingsDisabled } from "../embeddings/disable.js";
+import { embeddingsDisabled, embeddingsStatus } from "../embeddings/disable.js";
 const log = (msg: string) => _log("session-setup", msg);
 
 const __bundleDir = dirname(fileURLToPath(import.meta.url));
@@ -117,7 +117,11 @@ async function main(): Promise<void> {
   // HIVEMIND_EMBED_WARMUP=false for sessions that will never touch the
   // memory path (lightweight CC runs, no-network CI).
   if (embeddingsDisabled()) {
-    log("embed daemon warmup skipped via HIVEMIND_EMBEDDINGS=false");
+    const status = embeddingsStatus();
+    const reason = status === "no-transformers"
+      ? "@huggingface/transformers not installed (see README to enable embeddings)"
+      : "HIVEMIND_EMBEDDINGS=false";
+    log(`embed daemon warmup skipped: ${reason}`);
   } else if (process.env.HIVEMIND_EMBED_WARMUP !== "false") {
     try {
       const daemonEntry = join(__bundleDir, "embeddings", "embed-daemon.js");

From 008fb07e795ae0769f7452f3ef454355414fc1a2 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Mon, 27 Apr 2026 22:14:58 +0000
Subject: [PATCH 29/30] test(schema-scenarios): cover the 7 new-user upgrade
 scenarios
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Adds claude-code/tests/schema-scenarios.test.ts, the unit-level
mirror of the real-table verification in scenario-matrix.sh. Each
scenario corresponds to a (memory, sessions) pair of {missing,
no-emb-column, with-emb-column} starting states and asserts:

  1. The exact SQL ensureTable + ensureSessionsTable issue against
     a mocked query() (network boundary, per CLAUDE.md test rules).
  2. The query count matches what we expect for each branch
     (CREATE only, ALTER only, both, none of either).
  3. ALTER ADD COLUMN failures — including the deterministic
     500 "already exists" returned by Deeplake when the column is
     already there — never bubble up out of ensureTable, so the
     SessionStart hook always completes setup.

Cross-cutting tests pin two invariants:

  - Any 500/503 from ALTER is swallowed (regression guard against
     SessionStart aborting on every run for users on a fully
     migrated workspace).
  - The post-ALTER vector::at INSERT failure DOES reach the caller
     (capture's main catch logs "fatal" + exit 0; not silently
     swallowed by the API client).

Tests use a per-test temp HIVEMIND_INDEX_MARKER_DIR so the lookup
index marker cache does not bleed across scenarios.

The scenario-matrix.sh script (kept untracked in the worktree)
empirically confirms the same 7 cases against real Deeplake test
tables and reports the only post-ALTER bug observed: scenarios
2/4/6 lose the first capture INSERT to the vector::at window
(~30s) after the sessions ALTER.
---
 claude-code/tests/schema-scenarios.test.ts | 274 +++++++++++++++++++++
 1 file changed, 274 insertions(+)
 create mode 100644 claude-code/tests/schema-scenarios.test.ts

diff --git a/claude-code/tests/schema-scenarios.test.ts b/claude-code/tests/schema-scenarios.test.ts
new file mode 100644
index 0000000..1b9cfd9
--- /dev/null
+++ b/claude-code/tests/schema-scenarios.test.ts
@@ -0,0 +1,274 @@
+import { describe, it, expect, vi, beforeEach, afterAll } from "vitest";
+import { mkdtempSync, rmSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import { DeeplakeApi } from "../../src/deeplake-api.js";
+
+// Each test gets a fresh marker dir so the per-table CREATE INDEX cache
+// in ensureLookupIndex() does not bleed between scenarios.
+const ORIG_MARKER_DIR = process.env.HIVEMIND_INDEX_MARKER_DIR;
+let markerDir: string;
+
+/**
+ * Unit-level mirror of the 7 schema/upgrade scenarios exercised in
+ * scenario-matrix.sh against real Deeplake tables. Where the shell
+ * script measures the runtime outcome (post-ALTER vector::at window,
+ * silent reads, etc.), this file pins the SQL the plugin actually
+ * sends in each state and verifies the hooks survive every
+ * combination of "table exists / ALTER outcome" without throwing.
+ *
+ * Mocks only the network boundary (`query`, `listTables`) per
+ * CLAUDE.md's testing philosophy.
+ */
+
+interface QueryRule {
+  match: RegExp;
+  result: "ok" | { errorStatus: number; errorBody: string };
+}
+
+function makeApi(rules: QueryRule[], existingTables: string[]) {
+  const api = new DeeplakeApi("tok", "https://api.example", "org", "ws", "memory");
+  const queryCalls: string[] = [];
+
+  vi.spyOn(api, "listTables").mockResolvedValue(existingTables);
+  vi.spyOn(api, "query").mockImplementation(async (sql: string) => {
+    queryCalls.push(sql);
+    const rule = rules.find(r => r.match.test(sql));
+    if (!rule) throw new Error(`unexpected SQL in test: ${sql}`);
+    if (rule.result === "ok") return [];
+    throw new Error(
+      `Query failed: ${rule.result.errorStatus}: ${rule.result.errorBody}`,
+    );
+  });
+
+  return { api, queryCalls };
+}
+
+const ALTER_MEM     = /^ALTER TABLE "memory" ADD COLUMN IF NOT EXISTS summary_embedding FLOAT4\[\]$/;
+const ALTER_SESS    = /^ALTER TABLE "sessions" ADD COLUMN IF NOT EXISTS message_embedding FLOAT4\[\]$/;
+const CREATE_MEM    = /^CREATE TABLE IF NOT EXISTS "memory" .*summary_embedding FLOAT4\[\]/;
+const CREATE_SESS   = /^CREATE TABLE IF NOT EXISTS "sessions" .*message_embedding FLOAT4\[\]/;
+const CREATE_INDEX  = /^CREATE INDEX IF NOT EXISTS .* ON "sessions"/;
+const ALREADY_EXISTS = (col: string) => ({
+  errorStatus: 500,
+  errorBody: `{"error":"Database error: Failed to add column '${col}' to deeplake dataset: Column '${col}' already exists","code":"QUERY_ERROR"}`,
+});
+const VECTOR_AT = {
+  errorStatus: 500,
+  errorBody: `{"error":"Database error: Failed to insert tuple: vector::at out of range","code":"QUERY_ERROR"}`,
+};
+
+beforeEach(() => {
+  vi.restoreAllMocks();
+  if (markerDir) rmSync(markerDir, { recursive: true, force: true });
+  markerDir = mkdtempSync(join(tmpdir(), "hivemind-test-markers-"));
+  process.env.HIVEMIND_INDEX_MARKER_DIR = markerDir;
+});
+
+afterAll(() => {
+  if (markerDir) rmSync(markerDir, { recursive: true, force: true });
+  if (ORIG_MARKER_DIR === undefined) delete process.env.HIVEMIND_INDEX_MARKER_DIR;
+  else process.env.HIVEMIND_INDEX_MARKER_DIR = ORIG_MARKER_DIR;
+});
+
+// ── Scenarios 1..7 — each mirrors a row of scenario-matrix.sh's summary ─────
+
+describe("scenario 1 — GREENFIELD (memory missing, sessions missing)", () => {
+  it("CREATEs both tables embedding-ready, no ALTER, capture inserts cleanly", async () => {
+    const { api, queryCalls } = makeApi(
+      [
+        { match: CREATE_MEM,   result: "ok" },
+        { match: CREATE_SESS,  result: "ok" },
+        { match: CREATE_INDEX, result: "ok" },
+      ],
+      [], // listTables: nothing exists
+    );
+
+    await api.ensureTable();
+    await api.ensureSessionsTable("sessions");
+
+    // ensureTable: 1 CREATE on memory.
+    // ensureSessionsTable: 1 CREATE on sessions + 1 CREATE INDEX.
+    expect(queryCalls).toHaveLength(3);
+    expect(queryCalls[0]).toMatch(CREATE_MEM);
+    expect(queryCalls[1]).toMatch(CREATE_SESS);
+    expect(queryCalls[2]).toMatch(CREATE_INDEX);
+    // No ALTER attempted on a fresh table → no post-ALTER vector::at window.
+    expect(queryCalls.some(s => /^ALTER TABLE/.test(s))).toBe(false);
+  });
+});
+
+describe("scenario 2 — FULL LEGACY (memory no-emb, sessions no-emb)", () => {
+  it("ALTERs both tables; both succeed, but the post-ALTER window applies to capture", async () => {
+    const { api, queryCalls } = makeApi(
+      [
+        { match: ALTER_MEM,    result: "ok" },
+        { match: ALTER_SESS,   result: "ok" },
+        { match: CREATE_INDEX, result: "ok" },
+      ],
+      ["memory", "sessions"], // both legacy tables already present
+    );
+
+    await api.ensureTable();
+    await api.ensureSessionsTable("sessions");
+
+    expect(queryCalls).toHaveLength(3);
+    expect(queryCalls[0]).toMatch(ALTER_MEM);
+    expect(queryCalls[1]).toMatch(ALTER_SESS);
+    expect(queryCalls[2]).toMatch(CREATE_INDEX);
+    // No CREATE on a table that already exists.
+    expect(queryCalls.some(s => /^CREATE TABLE/.test(s))).toBe(false);
+  });
+});
+
+describe("scenario 3 — HALF LEGACY MEMORY (memory no-emb, sessions missing)", () => {
+  it("ALTERs memory, CREATEs sessions; capture INSERT immediately succeeds in the real run", async () => {
+    const { api, queryCalls } = makeApi(
+      [
+        { match: ALTER_MEM,    result: "ok" },
+        { match: CREATE_SESS,  result: "ok" },
+        { match: CREATE_INDEX, result: "ok" },
+      ],
+      ["memory"],
+    );
+
+    await api.ensureTable();
+    await api.ensureSessionsTable("sessions");
+
+    expect(queryCalls).toHaveLength(3);
+    expect(queryCalls[0]).toMatch(ALTER_MEM);
+    expect(queryCalls[1]).toMatch(CREATE_SESS);
+    expect(queryCalls[2]).toMatch(CREATE_INDEX);
+  });
+});
+
+describe("scenario 4 — HALF LEGACY SESSIONS (memory missing, sessions no-emb)", () => {
+  it("CREATEs memory, ALTERs sessions — sessions ALTER triggers the real-world post-ALTER window", async () => {
+    const { api, queryCalls } = makeApi(
+      [
+        { match: CREATE_MEM,   result: "ok" },
+        { match: ALTER_SESS,   result: "ok" },
+        { match: CREATE_INDEX, result: "ok" },
+      ],
+      ["sessions"],
+    );
+
+    await api.ensureTable();
+    await api.ensureSessionsTable("sessions");
+
+    expect(queryCalls).toHaveLength(3);
+    expect(queryCalls[0]).toMatch(CREATE_MEM);
+    expect(queryCalls[1]).toMatch(ALTER_SESS);
+    expect(queryCalls[2]).toMatch(CREATE_INDEX);
+  });
+});
+
+describe("scenario 5 — FULLY MIGRATED (memory with-emb, sessions with-emb)", () => {
+  it("both ALTERs return 500 'already exists' and are swallowed by try/catch — fast-fail, no retries", async () => {
+    const { api, queryCalls } = makeApi(
+      [
+        { match: ALTER_MEM,    result: ALREADY_EXISTS("summary_embedding") },
+        { match: ALTER_SESS,   result: ALREADY_EXISTS("message_embedding") },
+        { match: CREATE_INDEX, result: "ok" },
+      ],
+      ["memory", "sessions"],
+    );
+
+    // No throw despite both ALTERs failing — the swallowed-error path.
+    await expect(api.ensureTable()).resolves.toBeUndefined();
+    await expect(api.ensureSessionsTable("sessions")).resolves.toBeUndefined();
+
+    expect(queryCalls).toHaveLength(3);
+    // The fail-fast on "already exists" (commit 973dd34) means each ALTER is
+    // sent exactly once — no retries on the deterministic 500.
+    const alterCalls = queryCalls.filter(s => /^ALTER TABLE/.test(s));
+    expect(alterCalls).toHaveLength(2);
+  });
+});
+
+describe("scenario 6 — MIXED MEM-EMB (memory with-emb, sessions no-emb)", () => {
+  it("memory ALTER fast-fails on 'already exists'; sessions ALTER actually adds the column", async () => {
+    const { api, queryCalls } = makeApi(
+      [
+        { match: ALTER_MEM,    result: ALREADY_EXISTS("summary_embedding") },
+        { match: ALTER_SESS,   result: "ok" },
+        { match: CREATE_INDEX, result: "ok" },
+      ],
+      ["memory", "sessions"],
+    );
+
+    await api.ensureTable();
+    await api.ensureSessionsTable("sessions");
+
+    expect(queryCalls).toHaveLength(3);
+    expect(queryCalls[0]).toMatch(ALTER_MEM);
+    expect(queryCalls[1]).toMatch(ALTER_SESS);
+  });
+});
+
+describe("scenario 7 — MIXED SESS-EMB (memory no-emb, sessions with-emb)", () => {
+  it("memory ALTER actually adds the column; sessions ALTER fast-fails on 'already exists'", async () => {
+    const { api, queryCalls } = makeApi(
+      [
+        { match: ALTER_MEM,    result: "ok" },
+        { match: ALTER_SESS,   result: ALREADY_EXISTS("message_embedding") },
+        { match: CREATE_INDEX, result: "ok" },
+      ],
+      ["memory", "sessions"],
+    );
+
+    await api.ensureTable();
+    await api.ensureSessionsTable("sessions");
+
+    expect(queryCalls).toHaveLength(3);
+    expect(queryCalls[0]).toMatch(ALTER_MEM);
+    expect(queryCalls[1]).toMatch(ALTER_SESS);
+  });
+});
+
+// ── Cross-cutting invariants ────────────────────────────────────────────────
+
+describe("schema scenarios — cross-cutting invariants", () => {
+  it("ALTER ADD COLUMN failures NEVER bubble up — ensureTable always resolves", async () => {
+    // The ALTER swallow is what keeps fully-migrated tables from breaking
+    // SessionStart on every run. If this regresses, scenario 5 starts
+    // surfacing a 500 to the hook caller and SessionStart partially aborts.
+    const cases = [
+      ALREADY_EXISTS("summary_embedding"),
+      { errorStatus: 500, errorBody: '{"error":"random transient backend error"}' },
+      { errorStatus: 503, errorBody: "Service Unavailable" },
+    ];
+    for (const errorResult of cases) {
+      vi.restoreAllMocks();
+      const { api } = makeApi(
+        [
+          { match: ALTER_MEM,    result: errorResult },
+          { match: ALTER_SESS,   result: errorResult },
+          { match: CREATE_INDEX, result: "ok" },
+        ],
+        ["memory", "sessions"],
+      );
+      await expect(api.ensureTable()).resolves.toBeUndefined();
+      await expect(api.ensureSessionsTable("sessions")).resolves.toBeUndefined();
+    }
+  });
+
+  it("the post-ALTER vector::at INSERT failure surfaces to the caller (capture's main catch handles it)", async () => {
+    // The capture hook wraps its INSERT in a try/catch + log("fatal: …")
+    // path; we verify here that the API client itself does NOT swallow
+    // INSERT 500s — that's the right behaviour, since the capture flow
+    // wants to know its write was lost (so future retries/observability
+    // can react). Scenario-matrix.sh confirms this end-to-end on
+    // scenarios 2/4/6 where sessions was ALTERed.
+    const api = new DeeplakeApi("tok", "https://api.example", "org", "ws", "memory");
+    vi.spyOn(api, "query").mockImplementation(async (sql: string) => {
+      if (/^INSERT INTO/.test(sql)) {
+        throw new Error(`Query failed: 500: ${VECTOR_AT.errorBody}`);
+      }
+      return [];
+    });
+    await expect(
+      api.query(`INSERT INTO "sessions" (id, message_embedding) VALUES ('x', NULL)`),
+    ).rejects.toThrow(/vector::at out of range/);
+  });
+});

From 4dd1c326cda28ac2a96611a0ea13386010086592 Mon Sep 17 00:00:00 2001
From: Emanuele Fenocchi <emanuele.fenocchi@activeloop.dev>
Date: Mon, 27 Apr 2026 22:26:38 +0000
Subject: [PATCH 30/30] feat(codex): embed message inline before sessions
 INSERT
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Brings codex's capture and stop hooks to parity with the claude-code
capture path (commit bfff7be). Until now codex sessions wrote rows
without ever calling EmbedClient — neither UserPromptSubmit /
PostToolUse via codex/capture.ts nor the assistant-stop event via
codex/stop.ts listed the message_embedding column in their INSERTs,
so semantic recall against codex sessions was permanently lexical-only
even with the daemon running.

The asymmetry was an oversight, not a design decision — codex
wiki-worker DID embed summaries (and was the only codex hook
importing EmbedClient), but capture-time embeddings never landed.

Mirror the claude-code pattern in both hooks:
- import EmbedClient + embeddingsDisabled + embeddingSqlLiteral and
  the resolveEmbedDaemonPath helper;
- compute the embedding best-effort right before the INSERT (returns
  null on disabled / no-transformers / daemon miss → column lands
  NULL via embeddingSqlLiteral, schema-compatible);
- list message_embedding in the INSERT column tuple with the literal
  in matching position.

The two existing codex hook unit tests are updated to mock the
EmbedClient module the same way claude-code's capture-hook test
does — without it, the hook's `await new EmbedClient(...).embed(...)`
threw before the SQL was sent and every SQL-shape assertion failed
with "calls[0] is undefined". The mock returns Promise.resolve(null)
so the existing INSERT-shape assertions can be tightened in a follow
up to also assert message_embedding presence.
---
 claude-code/tests/codex-capture-hook.test.ts |   6 +
 claude-code/tests/codex-stop-hook.test.ts    |   6 +
 codex/bundle/capture.js                      | 330 +++++++++++++++++--
 codex/bundle/stop.js                         | 294 ++++++++++++++++-
 src/hooks/codex/capture.ts                   |  20 +-
 src/hooks/codex/stop.ts                      |  20 +-
 6 files changed, 629 insertions(+), 47 deletions(-)

diff --git a/claude-code/tests/codex-capture-hook.test.ts b/claude-code/tests/codex-capture-hook.test.ts
index 7ad363f..36dd993 100644
--- a/claude-code/tests/codex-capture-hook.test.ts
+++ b/claude-code/tests/codex-capture-hook.test.ts
@@ -44,6 +44,12 @@ vi.mock("../../src/deeplake-api.js", () => ({
     ensureSessionsTable(t: string) { return ensureSessionsTableMock(t); }
   },
 }));
+vi.mock("../../src/embeddings/client.js", () => ({
+  EmbedClient: class {
+    embed(_text: string, _kind?: string) { return Promise.resolve(null); }
+    warmup() { return Promise.resolve(false); }
+  },
+}));
 
 async function runHook(env: Record<string, string | undefined> = {}): Promise<void> {
   delete process.env.HIVEMIND_WIKI_WORKER;
diff --git a/claude-code/tests/codex-stop-hook.test.ts b/claude-code/tests/codex-stop-hook.test.ts
index 46eb283..6b745b6 100644
--- a/claude-code/tests/codex-stop-hook.test.ts
+++ b/claude-code/tests/codex-stop-hook.test.ts
@@ -37,6 +37,12 @@ vi.mock("../../src/utils/debug.js", () => ({
 vi.mock("../../src/deeplake-api.js", () => ({
   DeeplakeApi: class { query(sql: string) { return queryMock(sql); } },
 }));
+vi.mock("../../src/embeddings/client.js", () => ({
+  EmbedClient: class {
+    embed(_text: string, _kind?: string) { return Promise.resolve(null); }
+    warmup() { return Promise.resolve(false); }
+  },
+}));
 
 async function runHook(env: Record<string, string | undefined> = {}): Promise<void> {
   delete process.env.HIVEMIND_WIKI_WORKER;
diff --git a/codex/bundle/capture.js b/codex/bundle/capture.js
index ce3a2f6..c424b34 100755
--- a/codex/bundle/capture.js
+++ b/codex/bundle/capture.js
@@ -409,8 +409,273 @@ function buildSessionPath(config, sessionId) {
   return `/sessions/${config.userName}/${config.userName}_${config.orgName}_${workspace}_${sessionId}.jsonl`;
 }
 
+// dist/src/embeddings/client.js
+import { connect } from "node:net";
+import { spawn } from "node:child_process";
+import { openSync, closeSync, writeSync, unlinkSync, existsSync as existsSync3, readFileSync as readFileSync3 } from "node:fs";
+
+// dist/src/embeddings/protocol.js
+var DEFAULT_SOCKET_DIR = "/tmp";
+var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
+var DEFAULT_CLIENT_TIMEOUT_MS = 2e3;
+function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.sock`;
+}
+function pidPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.pid`;
+}
+
+// dist/src/embeddings/client.js
+var log3 = (m) => log("embed-client", m);
+function getUid() {
+  const uid = typeof process.getuid === "function" ? process.getuid() : void 0;
+  return uid !== void 0 ? String(uid) : process.env.USER ?? "default";
+}
+var EmbedClient = class {
+  socketPath;
+  pidPath;
+  timeoutMs;
+  daemonEntry;
+  autoSpawn;
+  spawnWaitMs;
+  nextId = 0;
+  constructor(opts = {}) {
+    const uid = getUid();
+    const dir = opts.socketDir ?? "/tmp";
+    this.socketPath = socketPathFor(uid, dir);
+    this.pidPath = pidPathFor(uid, dir);
+    this.timeoutMs = opts.timeoutMs ?? DEFAULT_CLIENT_TIMEOUT_MS;
+    this.daemonEntry = opts.daemonEntry ?? process.env.HIVEMIND_EMBED_DAEMON;
+    this.autoSpawn = opts.autoSpawn ?? true;
+    this.spawnWaitMs = opts.spawnWaitMs ?? 5e3;
+  }
+  /**
+   * Returns an embedding vector, or null on timeout/failure. Hooks MUST treat
+   * null as "skip embedding column" — never block the write path on us.
+   *
+   * Fire-and-forget spawn on miss: if the daemon isn't up, this call returns
+   * null AND kicks off a background spawn. The next call finds a ready daemon.
+   */
+  async embed(text, kind = "document") {
+    let sock;
+    try {
+      sock = await this.connectOnce();
+    } catch {
+      if (this.autoSpawn)
+        this.trySpawnDaemon();
+      return null;
+    }
+    try {
+      const id = String(++this.nextId);
+      const req = { op: "embed", id, kind, text };
+      const resp = await this.sendAndWait(sock, req);
+      if (resp.error || !("embedding" in resp) || !resp.embedding) {
+        log3(`embed err: ${resp.error ?? "no embedding"}`);
+        return null;
+      }
+      return resp.embedding;
+    } catch (e) {
+      const err = e instanceof Error ? e.message : String(e);
+      log3(`embed failed: ${err}`);
+      return null;
+    } finally {
+      try {
+        sock.end();
+      } catch {
+      }
+    }
+  }
+  /**
+   * Wait up to spawnWaitMs for the daemon to accept connections, spawning if
+   * necessary. Meant for SessionStart / long-running batches — not the hot path.
+   */
+  async warmup() {
+    try {
+      const s = await this.connectOnce();
+      s.end();
+      return true;
+    } catch {
+      if (!this.autoSpawn)
+        return false;
+      this.trySpawnDaemon();
+      try {
+        const s = await this.waitForSocket();
+        s.end();
+        return true;
+      } catch {
+        return false;
+      }
+    }
+  }
+  connectOnce() {
+    return new Promise((resolve, reject) => {
+      const sock = connect(this.socketPath);
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("connect timeout"));
+      }, this.timeoutMs);
+      sock.once("connect", () => {
+        clearTimeout(to);
+        resolve(sock);
+      });
+      sock.once("error", (e) => {
+        clearTimeout(to);
+        reject(e);
+      });
+    });
+  }
+  trySpawnDaemon() {
+    let fd;
+    try {
+      fd = openSync(this.pidPath, "wx", 384);
+      writeSync(fd, String(process.pid));
+    } catch (e) {
+      if (this.isPidFileStale()) {
+        try {
+          unlinkSync(this.pidPath);
+        } catch {
+        }
+        try {
+          fd = openSync(this.pidPath, "wx", 384);
+          writeSync(fd, String(process.pid));
+        } catch {
+          return;
+        }
+      } else {
+        return;
+      }
+    }
+    if (!this.daemonEntry || !existsSync3(this.daemonEntry)) {
+      log3(`daemonEntry not configured or missing: ${this.daemonEntry}`);
+      try {
+        closeSync(fd);
+        unlinkSync(this.pidPath);
+      } catch {
+      }
+      return;
+    }
+    try {
+      const child = spawn(process.execPath, [this.daemonEntry], {
+        detached: true,
+        stdio: "ignore",
+        env: process.env
+      });
+      child.unref();
+      log3(`spawned daemon pid=${child.pid}`);
+    } finally {
+      closeSync(fd);
+    }
+  }
+  isPidFileStale() {
+    try {
+      const raw = readFileSync3(this.pidPath, "utf-8").trim();
+      const pid = Number(raw);
+      if (!pid || Number.isNaN(pid))
+        return true;
+      try {
+        process.kill(pid, 0);
+        return false;
+      } catch {
+        return true;
+      }
+    } catch {
+      return true;
+    }
+  }
+  async waitForSocket() {
+    const deadline = Date.now() + this.spawnWaitMs;
+    let delay = 30;
+    while (Date.now() < deadline) {
+      await sleep2(delay);
+      delay = Math.min(delay * 1.5, 300);
+      if (!existsSync3(this.socketPath))
+        continue;
+      try {
+        return await this.connectOnce();
+      } catch {
+      }
+    }
+    throw new Error("daemon did not become ready within spawnWaitMs");
+  }
+  sendAndWait(sock, req) {
+    return new Promise((resolve, reject) => {
+      let buf = "";
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("request timeout"));
+      }, this.timeoutMs);
+      sock.setEncoding("utf-8");
+      sock.on("data", (chunk) => {
+        buf += chunk;
+        const nl = buf.indexOf("\n");
+        if (nl === -1)
+          return;
+        const line = buf.slice(0, nl);
+        clearTimeout(to);
+        try {
+          resolve(JSON.parse(line));
+        } catch (e) {
+          reject(e);
+        }
+      });
+      sock.on("error", (e) => {
+        clearTimeout(to);
+        reject(e);
+      });
+      sock.write(JSON.stringify(req) + "\n");
+    });
+  }
+};
+function sleep2(ms) {
+  return new Promise((r) => setTimeout(r, ms));
+}
+
+// dist/src/embeddings/sql.js
+function embeddingSqlLiteral(vec) {
+  if (!vec || vec.length === 0)
+    return "NULL";
+  const parts = [];
+  for (const v of vec) {
+    if (!Number.isFinite(v))
+      return "NULL";
+    parts.push(String(v));
+  }
+  return `ARRAY[${parts.join(",")}]::float4[]`;
+}
+
+// dist/src/embeddings/disable.js
+import { createRequire } from "node:module";
+var cachedStatus = null;
+function defaultResolveTransformers() {
+  createRequire(import.meta.url).resolve("@huggingface/transformers");
+}
+var _resolve = defaultResolveTransformers;
+function detectStatus() {
+  if (process.env.HIVEMIND_EMBEDDINGS === "false")
+    return "env-disabled";
+  try {
+    _resolve();
+    return "enabled";
+  } catch {
+    return "no-transformers";
+  }
+}
+function embeddingsStatus() {
+  if (cachedStatus !== null)
+    return cachedStatus;
+  cachedStatus = detectStatus();
+  return cachedStatus;
+}
+function embeddingsDisabled() {
+  return embeddingsStatus() !== "enabled";
+}
+
+// dist/src/hooks/codex/capture.js
+import { fileURLToPath as fileURLToPath2 } from "node:url";
+import { dirname as dirname2, join as join7 } from "node:path";
+
 // dist/src/hooks/summary-state.js
-import { readFileSync as readFileSync3, writeFileSync as writeFileSync2, writeSync, mkdirSync as mkdirSync2, renameSync, existsSync as existsSync3, unlinkSync, openSync, closeSync } from "node:fs";
+import { readFileSync as readFileSync4, writeFileSync as writeFileSync2, writeSync as writeSync2, mkdirSync as mkdirSync2, renameSync, existsSync as existsSync4, unlinkSync as unlinkSync2, openSync as openSync2, closeSync as closeSync2 } from "node:fs";
 import { homedir as homedir3 } from "node:os";
 import { join as join4 } from "node:path";
 var dlog = (msg) => log("summary-state", msg);
@@ -424,10 +689,10 @@ function lockPath(sessionId) {
 }
 function readState(sessionId) {
   const p = statePath(sessionId);
-  if (!existsSync3(p))
+  if (!existsSync4(p))
     return null;
   try {
-    return JSON.parse(readFileSync3(p, "utf-8"));
+    return JSON.parse(readFileSync4(p, "utf-8"));
   } catch {
     return null;
   }
@@ -446,14 +711,14 @@ function withRmwLock(sessionId, fn) {
   let fd = null;
   while (fd === null) {
     try {
-      fd = openSync(rmwLock, "wx");
+      fd = openSync2(rmwLock, "wx");
     } catch (e) {
       if (e.code !== "EEXIST")
         throw e;
       if (Date.now() > deadline) {
         dlog(`rmw lock deadline exceeded for ${sessionId}, reclaiming stale lock`);
         try {
-          unlinkSync(rmwLock);
+          unlinkSync2(rmwLock);
         } catch (unlinkErr) {
           dlog(`stale rmw lock unlink failed for ${sessionId}: ${unlinkErr.message}`);
         }
@@ -465,9 +730,9 @@ function withRmwLock(sessionId, fn) {
   try {
     return fn();
   } finally {
-    closeSync(fd);
+    closeSync2(fd);
     try {
-      unlinkSync(rmwLock);
+      unlinkSync2(rmwLock);
     } catch (unlinkErr) {
       dlog(`rmw lock cleanup failed for ${sessionId}: ${unlinkErr.message}`);
     }
@@ -504,27 +769,27 @@ function shouldTrigger(state, cfg, now = Date.now()) {
 function tryAcquireLock(sessionId, maxAgeMs = 10 * 60 * 1e3) {
   mkdirSync2(STATE_DIR, { recursive: true });
   const p = lockPath(sessionId);
-  if (existsSync3(p)) {
+  if (existsSync4(p)) {
     try {
-      const ageMs = Date.now() - parseInt(readFileSync3(p, "utf-8"), 10);
+      const ageMs = Date.now() - parseInt(readFileSync4(p, "utf-8"), 10);
       if (Number.isFinite(ageMs) && ageMs < maxAgeMs)
         return false;
     } catch (readErr) {
       dlog(`lock file unreadable for ${sessionId}, treating as stale: ${readErr.message}`);
     }
     try {
-      unlinkSync(p);
+      unlinkSync2(p);
     } catch (unlinkErr) {
       dlog(`could not unlink stale lock for ${sessionId}: ${unlinkErr.message}`);
       return false;
     }
   }
   try {
-    const fd = openSync(p, "wx");
+    const fd = openSync2(p, "wx");
     try {
-      writeSync(fd, String(Date.now()));
+      writeSync2(fd, String(Date.now()));
     } finally {
-      closeSync(fd);
+      closeSync2(fd);
     }
     return true;
   } catch (e) {
@@ -535,7 +800,7 @@ function tryAcquireLock(sessionId, maxAgeMs = 10 * 60 * 1e3) {
 }
 function releaseLock(sessionId) {
   try {
-    unlinkSync(lockPath(sessionId));
+    unlinkSync2(lockPath(sessionId));
   } catch (e) {
     if (e?.code !== "ENOENT") {
       dlog(`releaseLock unlink failed for ${sessionId}: ${e.message}`);
@@ -544,7 +809,7 @@ function releaseLock(sessionId) {
 }
 
 // dist/src/hooks/codex/spawn-wiki-worker.js
-import { spawn, execSync } from "node:child_process";
+import { spawn as spawn2, execSync } from "node:child_process";
 import { fileURLToPath } from "node:url";
 import { dirname, join as join6 } from "node:path";
 import { writeFileSync as writeFileSync3, mkdirSync as mkdirSync4 } from "node:fs";
@@ -653,7 +918,7 @@ function spawnCodexWikiWorker(opts) {
   }));
   wikiLog(`${reason}: spawning summary worker for ${sessionId}`);
   const workerPath = join6(bundleDir, "wiki-worker.js");
-  spawn("nohup", ["node", workerPath, configFile], {
+  spawn2("nohup", ["node", workerPath, configFile], {
     detached: true,
     stdio: ["ignore", "ignore", "ignore"]
   }).unref();
@@ -664,7 +929,10 @@ function bundleDirFromImportMeta(importMetaUrl) {
 }
 
 // dist/src/hooks/codex/capture.js
-var log3 = (msg) => log("codex-capture", msg);
+var log4 = (msg) => log("codex-capture", msg);
+function resolveEmbedDaemonPath() {
+  return join7(dirname2(fileURLToPath2(import.meta.url)), "embeddings", "embed-daemon.js");
+}
 var CAPTURE = process.env.HIVEMIND_CAPTURE !== "false";
 async function main() {
   if (!CAPTURE)
@@ -672,7 +940,7 @@ async function main() {
   const input = await readStdin();
   const config = loadConfig();
   if (!config) {
-    log3("no config");
+    log4("no config");
     return;
   }
   const sessionsTable = config.sessionsTableName;
@@ -689,7 +957,7 @@ async function main() {
   };
   let entry;
   if (input.hook_event_name === "UserPromptSubmit" && input.prompt !== void 0) {
-    log3(`user session=${input.session_id}`);
+    log4(`user session=${input.session_id}`);
     entry = {
       id: crypto.randomUUID(),
       ...meta,
@@ -697,7 +965,7 @@ async function main() {
       content: input.prompt
     };
   } else if (input.hook_event_name === "PostToolUse" && input.tool_name !== void 0) {
-    log3(`tool=${input.tool_name} session=${input.session_id}`);
+    log4(`tool=${input.tool_name} session=${input.session_id}`);
     entry = {
       id: crypto.randomUUID(),
       ...meta,
@@ -708,28 +976,30 @@ async function main() {
       tool_response: JSON.stringify(input.tool_response)
     };
   } else {
-    log3(`unknown event: ${input.hook_event_name}, skipping`);
+    log4(`unknown event: ${input.hook_event_name}, skipping`);
     return;
   }
   const sessionPath = buildSessionPath(config, input.session_id);
   const line = JSON.stringify(entry);
-  log3(`writing to ${sessionPath}`);
+  log4(`writing to ${sessionPath}`);
   const projectName = (input.cwd ?? "").split("/").pop() || "unknown";
   const filename = sessionPath.split("/").pop() ?? "";
   const jsonForSql = line.replace(/'/g, "''");
-  const insertSql = `INSERT INTO "${sessionsTable}" (id, path, filename, message, author, size_bytes, project, description, agent, creation_date, last_update_date) VALUES ('${crypto.randomUUID()}', '${sqlStr(sessionPath)}', '${sqlStr(filename)}', '${jsonForSql}'::jsonb, '${sqlStr(config.userName)}', ${Buffer.byteLength(line, "utf-8")}, '${sqlStr(projectName)}', '${sqlStr(input.hook_event_name ?? "")}', 'codex', '${ts}', '${ts}')`;
+  const embedding = embeddingsDisabled() ? null : await new EmbedClient({ daemonEntry: resolveEmbedDaemonPath() }).embed(line, "document");
+  const embeddingSql = embeddingSqlLiteral(embedding);
+  const insertSql = `INSERT INTO "${sessionsTable}" (id, path, filename, message, message_embedding, author, size_bytes, project, description, agent, creation_date, last_update_date) VALUES ('${crypto.randomUUID()}', '${sqlStr(sessionPath)}', '${sqlStr(filename)}', '${jsonForSql}'::jsonb, ${embeddingSql}, '${sqlStr(config.userName)}', ${Buffer.byteLength(line, "utf-8")}, '${sqlStr(projectName)}', '${sqlStr(input.hook_event_name ?? "")}', 'codex', '${ts}', '${ts}')`;
   try {
     await api.query(insertSql);
   } catch (e) {
     if (e.message?.includes("permission denied") || e.message?.includes("does not exist")) {
-      log3("table missing, creating and retrying");
+      log4("table missing, creating and retrying");
       await api.ensureSessionsTable(sessionsTable);
       await api.query(insertSql);
     } else {
       throw e;
     }
   }
-  log3("capture ok");
+  log4("capture ok");
   maybeTriggerPeriodicSummary(input.session_id, input.cwd ?? "", config);
 }
 function maybeTriggerPeriodicSummary(sessionId, cwd, config) {
@@ -741,7 +1011,7 @@ function maybeTriggerPeriodicSummary(sessionId, cwd, config) {
     if (!shouldTrigger(state, cfg))
       return;
     if (!tryAcquireLock(sessionId)) {
-      log3(`periodic trigger suppressed (lock held) session=${sessionId}`);
+      log4(`periodic trigger suppressed (lock held) session=${sessionId}`);
       return;
     }
     wikiLog(`Periodic: threshold hit (total=${state.totalCount}, since=${state.totalCount - state.lastSummaryCount}, N=${cfg.everyNMessages}, hours=${cfg.everyHours})`);
@@ -754,19 +1024,19 @@ function maybeTriggerPeriodicSummary(sessionId, cwd, config) {
         reason: "Periodic"
       });
     } catch (e) {
-      log3(`periodic spawn failed: ${e.message}`);
+      log4(`periodic spawn failed: ${e.message}`);
       try {
         releaseLock(sessionId);
       } catch (releaseErr) {
-        log3(`releaseLock after periodic spawn failure also failed: ${releaseErr.message}`);
+        log4(`releaseLock after periodic spawn failure also failed: ${releaseErr.message}`);
       }
       throw e;
     }
   } catch (e) {
-    log3(`periodic trigger error: ${e.message}`);
+    log4(`periodic trigger error: ${e.message}`);
   }
 }
 main().catch((e) => {
-  log3(`fatal: ${e.message}`);
+  log4(`fatal: ${e.message}`);
   process.exit(0);
 });
diff --git a/codex/bundle/stop.js b/codex/bundle/stop.js
index 7b96903..66bd150 100755
--- a/codex/bundle/stop.js
+++ b/codex/bundle/stop.js
@@ -1,7 +1,9 @@
 #!/usr/bin/env node
 
 // dist/src/hooks/codex/stop.js
-import { readFileSync as readFileSync4, existsSync as existsSync4 } from "node:fs";
+import { readFileSync as readFileSync5, existsSync as existsSync5 } from "node:fs";
+import { fileURLToPath as fileURLToPath2 } from "node:url";
+import { dirname as dirname2, join as join7 } from "node:path";
 
 // dist/src/utils/stdin.js
 function readStdin() {
@@ -584,8 +586,272 @@ function buildSessionPath(config, sessionId) {
   return `/sessions/${config.userName}/${config.userName}_${config.orgName}_${workspace}_${sessionId}.jsonl`;
 }
 
+// dist/src/embeddings/client.js
+import { connect } from "node:net";
+import { spawn as spawn2 } from "node:child_process";
+import { openSync as openSync2, closeSync as closeSync2, writeSync as writeSync2, unlinkSync as unlinkSync2, existsSync as existsSync4, readFileSync as readFileSync4 } from "node:fs";
+
+// dist/src/embeddings/protocol.js
+var DEFAULT_SOCKET_DIR = "/tmp";
+var DEFAULT_IDLE_TIMEOUT_MS = 15 * 60 * 1e3;
+var DEFAULT_CLIENT_TIMEOUT_MS = 2e3;
+function socketPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.sock`;
+}
+function pidPathFor(uid, dir = DEFAULT_SOCKET_DIR) {
+  return `${dir}/hivemind-embed-${uid}.pid`;
+}
+
+// dist/src/embeddings/client.js
+var log3 = (m) => log("embed-client", m);
+function getUid() {
+  const uid = typeof process.getuid === "function" ? process.getuid() : void 0;
+  return uid !== void 0 ? String(uid) : process.env.USER ?? "default";
+}
+var EmbedClient = class {
+  socketPath;
+  pidPath;
+  timeoutMs;
+  daemonEntry;
+  autoSpawn;
+  spawnWaitMs;
+  nextId = 0;
+  constructor(opts = {}) {
+    const uid = getUid();
+    const dir = opts.socketDir ?? "/tmp";
+    this.socketPath = socketPathFor(uid, dir);
+    this.pidPath = pidPathFor(uid, dir);
+    this.timeoutMs = opts.timeoutMs ?? DEFAULT_CLIENT_TIMEOUT_MS;
+    this.daemonEntry = opts.daemonEntry ?? process.env.HIVEMIND_EMBED_DAEMON;
+    this.autoSpawn = opts.autoSpawn ?? true;
+    this.spawnWaitMs = opts.spawnWaitMs ?? 5e3;
+  }
+  /**
+   * Returns an embedding vector, or null on timeout/failure. Hooks MUST treat
+   * null as "skip embedding column" — never block the write path on us.
+   *
+   * Fire-and-forget spawn on miss: if the daemon isn't up, this call returns
+   * null AND kicks off a background spawn. The next call finds a ready daemon.
+   */
+  async embed(text, kind = "document") {
+    let sock;
+    try {
+      sock = await this.connectOnce();
+    } catch {
+      if (this.autoSpawn)
+        this.trySpawnDaemon();
+      return null;
+    }
+    try {
+      const id = String(++this.nextId);
+      const req = { op: "embed", id, kind, text };
+      const resp = await this.sendAndWait(sock, req);
+      if (resp.error || !("embedding" in resp) || !resp.embedding) {
+        log3(`embed err: ${resp.error ?? "no embedding"}`);
+        return null;
+      }
+      return resp.embedding;
+    } catch (e) {
+      const err = e instanceof Error ? e.message : String(e);
+      log3(`embed failed: ${err}`);
+      return null;
+    } finally {
+      try {
+        sock.end();
+      } catch {
+      }
+    }
+  }
+  /**
+   * Wait up to spawnWaitMs for the daemon to accept connections, spawning if
+   * necessary. Meant for SessionStart / long-running batches — not the hot path.
+   */
+  async warmup() {
+    try {
+      const s = await this.connectOnce();
+      s.end();
+      return true;
+    } catch {
+      if (!this.autoSpawn)
+        return false;
+      this.trySpawnDaemon();
+      try {
+        const s = await this.waitForSocket();
+        s.end();
+        return true;
+      } catch {
+        return false;
+      }
+    }
+  }
+  connectOnce() {
+    return new Promise((resolve, reject) => {
+      const sock = connect(this.socketPath);
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("connect timeout"));
+      }, this.timeoutMs);
+      sock.once("connect", () => {
+        clearTimeout(to);
+        resolve(sock);
+      });
+      sock.once("error", (e) => {
+        clearTimeout(to);
+        reject(e);
+      });
+    });
+  }
+  trySpawnDaemon() {
+    let fd;
+    try {
+      fd = openSync2(this.pidPath, "wx", 384);
+      writeSync2(fd, String(process.pid));
+    } catch (e) {
+      if (this.isPidFileStale()) {
+        try {
+          unlinkSync2(this.pidPath);
+        } catch {
+        }
+        try {
+          fd = openSync2(this.pidPath, "wx", 384);
+          writeSync2(fd, String(process.pid));
+        } catch {
+          return;
+        }
+      } else {
+        return;
+      }
+    }
+    if (!this.daemonEntry || !existsSync4(this.daemonEntry)) {
+      log3(`daemonEntry not configured or missing: ${this.daemonEntry}`);
+      try {
+        closeSync2(fd);
+        unlinkSync2(this.pidPath);
+      } catch {
+      }
+      return;
+    }
+    try {
+      const child = spawn2(process.execPath, [this.daemonEntry], {
+        detached: true,
+        stdio: "ignore",
+        env: process.env
+      });
+      child.unref();
+      log3(`spawned daemon pid=${child.pid}`);
+    } finally {
+      closeSync2(fd);
+    }
+  }
+  isPidFileStale() {
+    try {
+      const raw = readFileSync4(this.pidPath, "utf-8").trim();
+      const pid = Number(raw);
+      if (!pid || Number.isNaN(pid))
+        return true;
+      try {
+        process.kill(pid, 0);
+        return false;
+      } catch {
+        return true;
+      }
+    } catch {
+      return true;
+    }
+  }
+  async waitForSocket() {
+    const deadline = Date.now() + this.spawnWaitMs;
+    let delay = 30;
+    while (Date.now() < deadline) {
+      await sleep2(delay);
+      delay = Math.min(delay * 1.5, 300);
+      if (!existsSync4(this.socketPath))
+        continue;
+      try {
+        return await this.connectOnce();
+      } catch {
+      }
+    }
+    throw new Error("daemon did not become ready within spawnWaitMs");
+  }
+  sendAndWait(sock, req) {
+    return new Promise((resolve, reject) => {
+      let buf = "";
+      const to = setTimeout(() => {
+        sock.destroy();
+        reject(new Error("request timeout"));
+      }, this.timeoutMs);
+      sock.setEncoding("utf-8");
+      sock.on("data", (chunk) => {
+        buf += chunk;
+        const nl = buf.indexOf("\n");
+        if (nl === -1)
+          return;
+        const line = buf.slice(0, nl);
+        clearTimeout(to);
+        try {
+          resolve(JSON.parse(line));
+        } catch (e) {
+          reject(e);
+        }
+      });
+      sock.on("error", (e) => {
+        clearTimeout(to);
+        reject(e);
+      });
+      sock.write(JSON.stringify(req) + "\n");
+    });
+  }
+};
+function sleep2(ms) {
+  return new Promise((r) => setTimeout(r, ms));
+}
+
+// dist/src/embeddings/sql.js
+function embeddingSqlLiteral(vec) {
+  if (!vec || vec.length === 0)
+    return "NULL";
+  const parts = [];
+  for (const v of vec) {
+    if (!Number.isFinite(v))
+      return "NULL";
+    parts.push(String(v));
+  }
+  return `ARRAY[${parts.join(",")}]::float4[]`;
+}
+
+// dist/src/embeddings/disable.js
+import { createRequire } from "node:module";
+var cachedStatus = null;
+function defaultResolveTransformers() {
+  createRequire(import.meta.url).resolve("@huggingface/transformers");
+}
+var _resolve = defaultResolveTransformers;
+function detectStatus() {
+  if (process.env.HIVEMIND_EMBEDDINGS === "false")
+    return "env-disabled";
+  try {
+    _resolve();
+    return "enabled";
+  } catch {
+    return "no-transformers";
+  }
+}
+function embeddingsStatus() {
+  if (cachedStatus !== null)
+    return cachedStatus;
+  cachedStatus = detectStatus();
+  return cachedStatus;
+}
+function embeddingsDisabled() {
+  return embeddingsStatus() !== "enabled";
+}
+
 // dist/src/hooks/codex/stop.js
-var log3 = (msg) => log("codex-stop", msg);
+var log4 = (msg) => log("codex-stop", msg);
+function resolveEmbedDaemonPath() {
+  return join7(dirname2(fileURLToPath2(import.meta.url)), "embeddings", "embed-daemon.js");
+}
 var CAPTURE = process.env.HIVEMIND_CAPTURE !== "false";
 async function main() {
   if (process.env.HIVEMIND_WIKI_WORKER === "1")
@@ -596,7 +862,7 @@ async function main() {
     return;
   const config = loadConfig();
   if (!config) {
-    log3("no config");
+    log4("no config");
     return;
   }
   if (CAPTURE) {
@@ -608,8 +874,8 @@ async function main() {
       if (input.transcript_path) {
         try {
           const transcriptPath = input.transcript_path;
-          if (existsSync4(transcriptPath)) {
-            const transcript = readFileSync4(transcriptPath, "utf-8");
+          if (existsSync5(transcriptPath)) {
+            const transcript = readFileSync5(transcriptPath, "utf-8");
             const lines = transcript.trim().split("\n").reverse();
             for (const line2 of lines) {
               try {
@@ -626,10 +892,10 @@ async function main() {
               }
             }
             if (lastAssistantMessage)
-              log3(`extracted assistant message from transcript (${lastAssistantMessage.length} chars)`);
+              log4(`extracted assistant message from transcript (${lastAssistantMessage.length} chars)`);
           }
         } catch (e) {
-          log3(`transcript read failed: ${e.message}`);
+          log4(`transcript read failed: ${e.message}`);
         }
       }
       const entry = {
@@ -648,11 +914,13 @@ async function main() {
       const projectName = (input.cwd ?? "").split("/").pop() || "unknown";
       const filename = sessionPath.split("/").pop() ?? "";
       const jsonForSql = line.replace(/'/g, "''");
-      const insertSql = `INSERT INTO "${sessionsTable}" (id, path, filename, message, author, size_bytes, project, description, agent, creation_date, last_update_date) VALUES ('${crypto.randomUUID()}', '${sqlStr(sessionPath)}', '${sqlStr(filename)}', '${jsonForSql}'::jsonb, '${sqlStr(config.userName)}', ${Buffer.byteLength(line, "utf-8")}, '${sqlStr(projectName)}', 'Stop', 'codex', '${ts}', '${ts}')`;
+      const embedding = embeddingsDisabled() ? null : await new EmbedClient({ daemonEntry: resolveEmbedDaemonPath() }).embed(line, "document");
+      const embeddingSql = embeddingSqlLiteral(embedding);
+      const insertSql = `INSERT INTO "${sessionsTable}" (id, path, filename, message, message_embedding, author, size_bytes, project, description, agent, creation_date, last_update_date) VALUES ('${crypto.randomUUID()}', '${sqlStr(sessionPath)}', '${sqlStr(filename)}', '${jsonForSql}'::jsonb, ${embeddingSql}, '${sqlStr(config.userName)}', ${Buffer.byteLength(line, "utf-8")}, '${sqlStr(projectName)}', 'Stop', 'codex', '${ts}', '${ts}')`;
       await api.query(insertSql);
-      log3("stop event captured");
+      log4("stop event captured");
     } catch (e) {
-      log3(`capture failed: ${e.message}`);
+      log4(`capture failed: ${e.message}`);
     }
   }
   if (!CAPTURE)
@@ -671,16 +939,16 @@ async function main() {
       reason: "Stop"
     });
   } catch (e) {
-    log3(`spawn failed: ${e.message}`);
+    log4(`spawn failed: ${e.message}`);
     try {
       releaseLock(sessionId);
     } catch (releaseErr) {
-      log3(`releaseLock after spawn failure also failed: ${releaseErr.message}`);
+      log4(`releaseLock after spawn failure also failed: ${releaseErr.message}`);
     }
     throw e;
   }
 }
 main().catch((e) => {
-  log3(`fatal: ${e.message}`);
+  log4(`fatal: ${e.message}`);
   process.exit(0);
 });
diff --git a/src/hooks/codex/capture.ts b/src/hooks/codex/capture.ts
index fc16b01..5358f0e 100644
--- a/src/hooks/codex/capture.ts
+++ b/src/hooks/codex/capture.ts
@@ -18,6 +18,11 @@ import { DeeplakeApi } from "../../deeplake-api.js";
 import { sqlStr } from "../../utils/sql.js";
 import { log as _log } from "../../utils/debug.js";
 import { buildSessionPath } from "../../utils/session-path.js";
+import { EmbedClient } from "../../embeddings/client.js";
+import { embeddingSqlLiteral } from "../../embeddings/sql.js";
+import { embeddingsDisabled } from "../../embeddings/disable.js";
+import { fileURLToPath } from "node:url";
+import { dirname, join } from "node:path";
 import {
   bumpTotalCount,
   loadTriggerConfig,
@@ -28,6 +33,10 @@ import {
 import { bundleDirFromImportMeta, spawnCodexWikiWorker, wikiLog } from "./spawn-wiki-worker.js";
 const log = (msg: string) => _log("codex-capture", msg);
 
+function resolveEmbedDaemonPath(): string {
+  return join(dirname(fileURLToPath(import.meta.url)), "embeddings", "embed-daemon.js");
+}
+
 interface CodexHookInput {
   session_id: string;
   transcript_path?: string | null;
@@ -102,9 +111,16 @@ async function main(): Promise<void> {
   // sqlStr() would also escape backslashes and strip control chars, corrupting the JSON.
   const jsonForSql = line.replace(/'/g, "''");
 
+  // Best-effort embed: if the daemon is unavailable (no @huggingface/transformers
+  // or HIVEMIND_EMBEDDINGS=false), embed() returns null and the column lands NULL.
+  const embedding = embeddingsDisabled()
+    ? null
+    : await new EmbedClient({ daemonEntry: resolveEmbedDaemonPath() }).embed(line, "document");
+  const embeddingSql = embeddingSqlLiteral(embedding);
+
   const insertSql =
-    `INSERT INTO "${sessionsTable}" (id, path, filename, message, author, size_bytes, project, description, agent, creation_date, last_update_date) ` +
-    `VALUES ('${crypto.randomUUID()}', '${sqlStr(sessionPath)}', '${sqlStr(filename)}', '${jsonForSql}'::jsonb, '${sqlStr(config.userName)}', ` +
+    `INSERT INTO "${sessionsTable}" (id, path, filename, message, message_embedding, author, size_bytes, project, description, agent, creation_date, last_update_date) ` +
+    `VALUES ('${crypto.randomUUID()}', '${sqlStr(sessionPath)}', '${sqlStr(filename)}', '${jsonForSql}'::jsonb, ${embeddingSql}, '${sqlStr(config.userName)}', ` +
     `${Buffer.byteLength(line, "utf-8")}, '${sqlStr(projectName)}', '${sqlStr(input.hook_event_name ?? "")}', 'codex', '${ts}', '${ts}')`;
 
   try {
diff --git a/src/hooks/codex/stop.ts b/src/hooks/codex/stop.ts
index f698423..37ff7ba 100644
--- a/src/hooks/codex/stop.ts
+++ b/src/hooks/codex/stop.ts
@@ -12,6 +12,8 @@
  */
 
 import { readFileSync, existsSync } from "node:fs";
+import { fileURLToPath } from "node:url";
+import { dirname, join } from "node:path";
 import { readStdin } from "../../utils/stdin.js";
 import { loadConfig } from "../../config.js";
 import { DeeplakeApi } from "../../deeplake-api.js";
@@ -20,9 +22,16 @@ import { log as _log } from "../../utils/debug.js";
 import { bundleDirFromImportMeta, spawnCodexWikiWorker, wikiLog } from "./spawn-wiki-worker.js";
 import { tryAcquireLock, releaseLock } from "../summary-state.js";
 import { buildSessionPath } from "../../utils/session-path.js";
+import { EmbedClient } from "../../embeddings/client.js";
+import { embeddingSqlLiteral } from "../../embeddings/sql.js";
+import { embeddingsDisabled } from "../../embeddings/disable.js";
 
 const log = (msg: string) => _log("codex-stop", msg);
 
+function resolveEmbedDaemonPath(): string {
+  return join(dirname(fileURLToPath(import.meta.url)), "embeddings", "embed-daemon.js");
+}
+
 interface CodexStopInput {
   session_id: string;
   transcript_path?: string | null;
@@ -105,9 +114,16 @@ async function main(): Promise<void> {
       // sqlStr() would also escape backslashes and strip control chars, corrupting the JSON.
       const jsonForSql = line.replace(/'/g, "''");
 
+      // Best-effort embed: if the daemon is unavailable (no @huggingface/transformers
+      // or HIVEMIND_EMBEDDINGS=false), embed() returns null and the column lands NULL.
+      const embedding = embeddingsDisabled()
+        ? null
+        : await new EmbedClient({ daemonEntry: resolveEmbedDaemonPath() }).embed(line, "document");
+      const embeddingSql = embeddingSqlLiteral(embedding);
+
       const insertSql =
-        `INSERT INTO "${sessionsTable}" (id, path, filename, message, author, size_bytes, project, description, agent, creation_date, last_update_date) ` +
-        `VALUES ('${crypto.randomUUID()}', '${sqlStr(sessionPath)}', '${sqlStr(filename)}', '${jsonForSql}'::jsonb, '${sqlStr(config.userName)}', ` +
+        `INSERT INTO "${sessionsTable}" (id, path, filename, message, message_embedding, author, size_bytes, project, description, agent, creation_date, last_update_date) ` +
+        `VALUES ('${crypto.randomUUID()}', '${sqlStr(sessionPath)}', '${sqlStr(filename)}', '${jsonForSql}'::jsonb, ${embeddingSql}, '${sqlStr(config.userName)}', ` +
         `${Buffer.byteLength(line, "utf-8")}, '${sqlStr(projectName)}', 'Stop', 'codex', '${ts}', '${ts}')`;
 
       await api.query(insertSql);