From 613986c245912b69d7b3b452fa2deba40d44beba Mon Sep 17 00:00:00 2001
From: shanvit <shanvit7@gmail.com>
Date: Wed, 8 Apr 2026 15:31:41 +0530
Subject: [PATCH 01/12] chore: evals memory setup

---
 packages/memory/package.json                  |   4 +-
 packages/zosma-mem/README.md                  | 148 +++++++
 packages/zosma-mem/USAGE.md                   | 187 +++++++++
 packages/zosma-mem/package.json               |  52 +++
 .../src/evals/__tests__/metrics.test.ts       | 127 ++++++
 .../src/evals/__tests__/mock-adapter.ts       | 102 +++++
 .../src/evals/__tests__/report.test.ts        |  78 ++++
 .../src/evals/__tests__/runner.test.ts        |  96 +++++
 .../src/evals/__tests__/scenarios.test.ts     | 121 ++++++
 packages/zosma-mem/src/evals/cli/bin.ts       | 133 ++++++
 .../src/evals/cli/components/App.tsx          |  98 +++++
 .../src/evals/cli/components/ErrorDisplay.tsx |  15 +
 .../src/evals/cli/components/ScenarioRow.tsx  |  51 +++
 .../src/evals/cli/components/SummaryTable.tsx |  32 ++
 .../zosma-mem/src/evals/cli/simple-eval.ts    | 201 +++++++++
 packages/zosma-mem/src/evals/index.ts         |  56 +++
 packages/zosma-mem/src/evals/metrics.ts       | 121 ++++++
 packages/zosma-mem/src/evals/report.ts        |  70 ++++
 packages/zosma-mem/src/evals/runner.ts        | 128 ++++++
 .../src/evals/scenarios/co-access-cluster.ts  |  70 ++++
 .../src/evals/scenarios/cold-start.ts         |  59 +++
 .../evals/scenarios/conflicting-updates.ts    |  83 ++++
 .../src/evals/scenarios/cross-context.ts      |  98 +++++
 .../zosma-mem/src/evals/scenarios/index.ts    |  35 ++
 .../src/evals/scenarios/repeated-pattern.ts   |  70 ++++
 .../src/evals/scenarios/signal-dilution.ts    |  64 +++
 .../src/evals/scenarios/stale-memory.ts       |  89 ++++
 packages/zosma-mem/src/evals/types.ts         | 270 ++++++++++++
 .../zosma-mem/src/evals/utils/assertions.ts   |  54 +++
 .../zosma-mem/src/evals/utils/fixtures.ts     |  67 +++
 packages/zosma-mem/src/evals/utils/time.ts    |  32 ++
 packages/zosma-mem/src/index.ts               |   4 +
 packages/zosma-mem/tsconfig.json              |   9 +
 pnpm-lock.yaml                                | 390 +++++++++++++++++-
 34 files changed, 3194 insertions(+), 20 deletions(-)
 create mode 100644 packages/zosma-mem/README.md
 create mode 100644 packages/zosma-mem/USAGE.md
 create mode 100644 packages/zosma-mem/package.json
 create mode 100644 packages/zosma-mem/src/evals/__tests__/metrics.test.ts
 create mode 100644 packages/zosma-mem/src/evals/__tests__/mock-adapter.ts
 create mode 100644 packages/zosma-mem/src/evals/__tests__/report.test.ts
 create mode 100644 packages/zosma-mem/src/evals/__tests__/runner.test.ts
 create mode 100644 packages/zosma-mem/src/evals/__tests__/scenarios.test.ts
 create mode 100644 packages/zosma-mem/src/evals/cli/bin.ts
 create mode 100644 packages/zosma-mem/src/evals/cli/components/App.tsx
 create mode 100644 packages/zosma-mem/src/evals/cli/components/ErrorDisplay.tsx
 create mode 100644 packages/zosma-mem/src/evals/cli/components/ScenarioRow.tsx
 create mode 100644 packages/zosma-mem/src/evals/cli/components/SummaryTable.tsx
 create mode 100644 packages/zosma-mem/src/evals/cli/simple-eval.ts
 create mode 100644 packages/zosma-mem/src/evals/index.ts
 create mode 100644 packages/zosma-mem/src/evals/metrics.ts
 create mode 100644 packages/zosma-mem/src/evals/report.ts
 create mode 100644 packages/zosma-mem/src/evals/runner.ts
 create mode 100644 packages/zosma-mem/src/evals/scenarios/co-access-cluster.ts
 create mode 100644 packages/zosma-mem/src/evals/scenarios/cold-start.ts
 create mode 100644 packages/zosma-mem/src/evals/scenarios/conflicting-updates.ts
 create mode 100644 packages/zosma-mem/src/evals/scenarios/cross-context.ts
 create mode 100644 packages/zosma-mem/src/evals/scenarios/index.ts
 create mode 100644 packages/zosma-mem/src/evals/scenarios/repeated-pattern.ts
 create mode 100644 packages/zosma-mem/src/evals/scenarios/signal-dilution.ts
 create mode 100644 packages/zosma-mem/src/evals/scenarios/stale-memory.ts
 create mode 100644 packages/zosma-mem/src/evals/types.ts
 create mode 100644 packages/zosma-mem/src/evals/utils/assertions.ts
 create mode 100644 packages/zosma-mem/src/evals/utils/fixtures.ts
 create mode 100644 packages/zosma-mem/src/evals/utils/time.ts
 create mode 100644 packages/zosma-mem/src/index.ts
 create mode 100644 packages/zosma-mem/tsconfig.json

diff --git a/packages/memory/package.json b/packages/memory/package.json
index 5a87155..180f363 100644
--- a/packages/memory/package.json
+++ b/packages/memory/package.json
@@ -16,10 +16,10 @@
 		"check": "tsc --noEmit",
 		"test": "vitest --run"
 	},
-	"dependencies": {},
 	"devDependencies": {
 		"@types/node": "^22.15.2",
 		"typescript": "^5.7.3",
-		"vitest": "^3.0.0"
+		"vitest": "^3.0.0",
+		"zosma-mem": "link:../zosma-mem"
 	}
 }
diff --git a/packages/zosma-mem/README.md b/packages/zosma-mem/README.md
new file mode 100644
index 0000000..73f6ed1
--- /dev/null
+++ b/packages/zosma-mem/README.md
@@ -0,0 +1,148 @@
+# zosma-mem
+
+**Standalone CLI for evaluating agentic memory systems**
+
+A zero-config evaluation tool that automatically detects and tests memory systems against standardized information retrieval scenarios.
+
+## Installation
+
+```bash
+# For development (current)
+cd packages/zosma-mem
+npm install -g .
+
+# After publishing
+npm install -g zosma-mem
+```
+
+## Usage
+
+```bash
+# Auto-detect and evaluate memory system
+zosma-mem
+
+# Run specific scenarios
+zosma-mem --scenarios "cold-start,signal-dilution"
+
+# Output JSON instead of markdown
+zosma-mem --json
+
+# Save report to file
+zosma-mem --out report.md
+```
+
+## What It Does
+
+zosma-mem evaluates memory systems against 7 standardized scenarios:
+
+- **Cold start** - Basic ingestion and retrieval
+- **Signal dilution** - Handling noise at scale
+- **Repeated patterns** - Reinforcement learning
+- **Stale memory** - Time-based decay
+- **Conflicts** - Update resolution
+- **Context awareness** - Cross-context relevance
+- **Co-access clusters** - Relational recall
+
+## Auto-Detection
+
+zosma-mem automatically detects memory systems:
+
+1. **OpenZosma**: `packages/gateway/workspace/agents/default/memory/MEMORY.md`
+2. **Generic file**: `MEMORY.md`, `memory.md`, or `.memory.md`
+
+## Example Output
+
+```
+✅ Found openzosma memory at packages/gateway/workspace/agents/default/memory/MEMORY.md
+
+## zosma-mem Eval Report -- 2026-04-08T10:00:00Z
+
+| Scenario            | P@K   | R@K   | MRR   | Noise | Pass |
+| ------------------- | ----- | ----- | ----- | ----- | ---- |
+| Cold start          | 0.800 | 1.000 | 1.000 | 0.100 | yes  |
+| Signal dilution     | 0.600 | 1.000 | 1.000 | 0.900 | yes  |
+| Repeated pattern    | 0.200 | 1.000 | 1.000 | 0.000 | NO   |
+| ...                 |      |      |      |       |      |
+
+Summary: 3/7 passed. Avg P@K: 0.37
+❌ 4 tests failed
+```
+
+## Metrics Explained
+
+- **P@K**: Precision@K - How many of top-K results are relevant
+- **R@K**: Recall@K - How many relevant items found in top-K
+- **MRR**: Mean Reciprocal Rank - How quickly relevant items appear
+- **Noise**: Fraction of stored items never retrieved
+
+## Usage in OpenZosma (Current Development)
+
+Install zosma-mem globally for development:
+
+```bash
+# From the zosma-mem package directory
+cd packages/zosma-mem
+npm install -g .
+
+# Now use from anywhere
+zosma-mem
+```
+
+The tool automatically detects your OpenZosma memory system and runs the evaluation.
+
+## Advanced Usage
+
+### Programmatic API
+
+```typescript
+import { runEvals, builtInScenarios } from "zosma-mem/evals"
+
+const report = await runEvals({
+  adapter: myCustomAdapter,
+  scenarios: builtInScenarios,
+  k: 5
+})
+```
+
+### Custom Adapters
+
+For custom memory systems, implement the MemoryAdapter interface:
+
+```typescript
+import { MemoryAdapter, MemoryEvent } from "zosma-mem/evals"
+
+const adapter: MemoryAdapter = {
+  setup: async (opts) => { /* initialize */ },
+  ingest: async (event: MemoryEvent) => { /* store */ },
+  retrieve: async (query, topK) => { /* search */ },
+  // ... other methods
+}
+```
+
+## Publishing
+
+This package is published to npm as `zosma-mem`. To publish updates:
+
+```bash
+# Build and test
+pnpm run build
+pnpm run test
+
+# Publish
+npm publish
+```
+
+## Development
+
+```bash
+# Build
+pnpm run build
+
+# Test
+pnpm run test
+
+# Run locally
+pnpm eval
+```
+
+Built for developers who want to evaluate memory systems without configuration complexity. Made for OpenZosma, works with any memory system. 🚀
\ No newline at end of file
diff --git a/packages/zosma-mem/USAGE.md b/packages/zosma-mem/USAGE.md
new file mode 100644
index 0000000..8c324f0
--- /dev/null
+++ b/packages/zosma-mem/USAGE.md
@@ -0,0 +1,187 @@
+# zosma-mem Usage Guide
+
+**Standalone CLI for evaluating agentic memory systems**
+
+A zero-config evaluation tool that automatically detects and tests memory systems against standardized information retrieval scenarios.
+
+## Installation for Development
+
+Since zosma-mem isn't published yet, install it globally from source:
+
+```bash
+# From your OpenZosma project
+cd packages/zosma-mem
+npm install -g .
+
+# Now use from anywhere
+zosma-mem
+```
+
+## Usage Examples
+
+```bash
+# Basic evaluation
+zosma-mem
+
+# Run specific scenarios only
+zosma-mem --scenarios "cold-start,signal-dilution"
+
+# Output JSON instead of markdown
+zosma-mem --json
+
+# Save report to file
+zosma-mem --out memory-report.md
+```
+
+## CLI Options
+
+```bash
+zosma-mem [options]
+
+Options:
+  --scenarios <names>    Run specific scenarios (comma-separated)
+  --k <number>          Top-K for metrics (default: 5)
+  --json                Output JSON instead of markdown
+  --out <path>          Save report to file
+  --help                Show help
+```
+
+## What It Evaluates
+
+zosma-mem tests your memory system against 7 standardized scenarios:
+
+### ✅ Working Scenarios (Your Goals)
+- **Cold start** - Basic ingestion and retrieval
+- **Signal dilution** - Handling noise at scale
+- **Co-access cluster** - Relational recall
+
+### 🎯 Advanced Scenarios (Future Improvements)
+- **Repeated patterns** - Reinforcement learning
+- **Stale memory** - Time-based decay
+- **Conflicts** - Update resolution
+- **Context awareness** - Cross-context relevance
+
+## Example Output
+
+```
+✅ Found openzosma memory at packages/gateway/workspace/agents/default/memory/MEMORY.md
+
+## zosma-mem Eval Report -- 2026-04-08T10:00:00Z
+
+| Scenario            | P@K   | R@K   | MRR   | Noise | Pass |
+| ------------------- | ----- | ----- | ----- | ----- | ---- |
+| Cold start          | 0.600 | 1.000 | 1.000 | 0.500 | yes  |
+| Repeated pattern    | 0.200 | 1.000 | 1.000 | 0.000 | NO   |
+| Signal dilution     | 0.600 | 1.000 | 1.000 | 0.951 | yes  |
+| Stale memory        | 0.200 | 1.000 | 1.000 | 0.167 | NO   |
+| Conflicting updates | 0.200 | 1.000 | 1.000 | 0.000 | NO   |
+| Co-access cluster   | 0.600 | 1.000 | 1.000 | 0.000 | yes  |
+| Cross-context       | 0.200 | 1.000 | 1.000 | 0.000 | NO   |
+
+Summary: 3/7 passed. Avg P@K: 0.371, Avg R@K: 1.000, Avg MRR: 1.000
+```
+
+## Understanding Your Results
+
+### Current Status (3/7 passed)
+Your OpenZosma memory system handles basic operations well but lacks advanced features.
+
+### What the Scores Mean
+
+- **P@K (Precision@K)**: Fraction of top-5 results that are relevant
+  - 0.600 = 3/5 relevant results in top-5
+  - 0.200 = 1/5 relevant results in top-5
+
+- **R@K (Recall@K)**: Fraction of all relevant items found in top-5
+  - 1.000 = All relevant items found
+
+- **MRR (Mean Reciprocal Rank)**: How quickly relevant items appear
+  - 1.000 = Relevant items appear first
+
+- **Noise**: Fraction of stored items never retrieved
+  - Lower is better
+
+## Roadmap for OpenZosma Memory
+
+Use zosma-mem results to guide development:
+
+1. **Phase 1** ✅ Basic storage and retrieval
+2. **Phase 2** 🔄 Add reinforcement learning (repeated patterns)
+3. **Phase 3** 🔄 Add time-based decay (stale memory)
+4. **Phase 4** 🔄 Add conflict resolution
+5. **Phase 5** 🔄 Add context awareness
+
+## Advanced Usage
+
+### Programmatic Evaluation
+
+```typescript
+import { runEvals, builtInScenarios } from "zosma-mem/evals"
+
+const report = await runEvals({
+  adapter: myAdapter,
+  scenarios: builtInScenarios,
+  k: 5
+})
+```
+
+### Custom Memory Adapters
+
+For non-OpenZosma memory systems:
+
+```typescript
+import { MemoryAdapter, MemoryEvent } from "zosma-mem/evals"
+
+const adapter: MemoryAdapter = {
+  setup: async (opts) => { /* init */ },
+  ingest: async (event: MemoryEvent) => { /* store */ },
+  retrieve: async (query, topK) => { /* search */ },
+  recordUsage: async (id, signal) => { /* learn */ },
+  gc: async () => ({ removedCount: 0, archivedCount: 0, consolidatedCount: 0 }),
+  advanceTime: async (ms) => { /* time travel */ },
+  listEntities: async () => [/* all ids */],
+  teardown: async () => { /* cleanup */ }
+}
+```
+
+## Publishing
+
+This package is published to npm as `zosma-mem`. To publish updates:
+
+```bash
+# Build
+pnpm run build
+
+# Test locally
+pnpm eval
+
+# Publish
+npm publish
+```
+
+## Development
+
+```bash
+# Install dependencies
+pnpm install
+
+# Build TypeScript
+pnpm run build
+
+# Run tests
+pnpm run test
+
+# Test CLI locally
+pnpm eval
+```
+
+## OpenZosma Integration
+
+zosma-mem is the official evaluation tool for OpenZosma memory systems. It:
+
+- Auto-detects OpenZosma memory formats
+- Provides standardized evaluation metrics
+- Tracks improvement over time
+- Guides feature development priorities
+
+Run `zosma-mem` regularly to see how your memory system evolves! 🚀
\ No newline at end of file
diff --git a/packages/zosma-mem/package.json b/packages/zosma-mem/package.json
new file mode 100644
index 0000000..001c003
--- /dev/null
+++ b/packages/zosma-mem/package.json
@@ -0,0 +1,52 @@
+{
+	"name": "zosma-mem",
+	"version": "0.0.1",
+	"private": false,
+	"type": "module",
+	"description": "Standalone CLI for evaluating agentic memory systems - zero-config evaluation against standardized scenarios",
+	"license": "Apache-2.0",
+	"keywords": ["memory", "evaluation", "ai", "agentic", "cli", "openzosma"],
+	"repository": {
+		"type": "git",
+		"url": "https://github.com/your-org/openzosma",
+		"directory": "packages/zosma-mem"
+	},
+	"homepage": "https://github.com/your-org/openzosma/tree/main/packages/zosma-mem",
+	"main": "dist/index.js",
+	"types": "dist/index.d.ts",
+	"bin": {
+		"zosma-mem": "dist/evals/cli/simple-eval.js"
+	},
+	"exports": {
+		".": {
+			"types": "./dist/index.d.ts",
+			"import": "./dist/index.js"
+		},
+		"./evals": {
+			"types": "./dist/evals/index.d.ts",
+			"import": "./dist/evals/index.js"
+		}
+	},
+	"scripts": {
+		"build": "tsc",
+		"check": "tsc --noEmit",
+		"test": "vitest --run",
+		"eval": "tsx dist/evals/cli/simple-eval.js",
+		"prepublishOnly": "pnpm run build && pnpm run test"
+	},
+	"dependencies": {
+		"chalk": "^5.4.0",
+		"commander": "^13.0.0",
+		"ink": "^5.1.0",
+		"ink-spinner": "^5.0.0",
+		"react": "^18.3.0",
+		"zod": "^3.23.0"
+	},
+	"devDependencies": {
+		"@types/node": "^22.15.2",
+		"@types/react": "^18.3.0",
+		"tsx": "^4.0.0",
+		"typescript": "^5.7.3",
+		"vitest": "^3.0.0"
+	}
+}
diff --git a/packages/zosma-mem/src/evals/__tests__/metrics.test.ts b/packages/zosma-mem/src/evals/__tests__/metrics.test.ts
new file mode 100644
index 0000000..f2f32c2
--- /dev/null
+++ b/packages/zosma-mem/src/evals/__tests__/metrics.test.ts
@@ -0,0 +1,127 @@
+import { describe, expect, it } from "vitest"
+import {
+	computeGcEffectiveness,
+	computeMRR,
+	computeNoiseRatio,
+	computePrecisionAtK,
+	computeRecallAtK,
+	computeSalienceDrift,
+} from "../metrics.js"
+
+describe("computePrecisionAtK", () => {
+	it("returns 1.0 when all top-K are relevant", () => {
+		expect(computePrecisionAtK(["a", "b", "c"], new Set(["a", "b", "c"]), 3)).toBe(1)
+	})
+
+	it("returns 0.0 when none of the top-K are relevant", () => {
+		expect(computePrecisionAtK(["x", "y", "z"], new Set(["a", "b", "c"]), 3)).toBe(0)
+	})
+
+	it("returns 0.6 when 3 of 5 are relevant", () => {
+		expect(computePrecisionAtK(["a", "b", "x", "c", "y"], new Set(["a", "b", "c"]), 5)).toBe(0.6)
+	})
+
+	it("returns 0 when k is 0", () => {
+		expect(computePrecisionAtK(["a"], new Set(["a"]), 0)).toBe(0)
+	})
+
+	it("only evaluates up to K positions even if list is longer", () => {
+		expect(computePrecisionAtK(["a", "b", "c", "d", "e"], new Set(["d", "e"]), 3)).toBe(0)
+	})
+})
+
+describe("computeRecallAtK", () => {
+	it("returns 1.0 when all relevant entities appear in top-K", () => {
+		expect(computeRecallAtK(["a", "b", "c"], new Set(["a", "b"]), 3)).toBe(1)
+	})
+
+	it("returns 0.5 when half of relevant entities appear in top-K", () => {
+		expect(computeRecallAtK(["a", "x", "y"], new Set(["a", "b"]), 3)).toBe(0.5)
+	})
+
+	it("returns 1.0 when relevant set is empty (vacuously true)", () => {
+		expect(computeRecallAtK(["a", "b"], new Set(), 5)).toBe(1)
+	})
+
+	it("returns 0 when no relevant entities in top-K", () => {
+		expect(computeRecallAtK(["x", "y", "z"], new Set(["a", "b"]), 3)).toBe(0)
+	})
+})
+
+describe("computeMRR", () => {
+	it("returns 1.0 when the first result is relevant", () => {
+		expect(computeMRR(["a", "b", "c"], new Set(["a"]))).toBe(1)
+	})
+
+	it("returns 0.5 when the second result is the first relevant", () => {
+		expect(computeMRR(["x", "a", "b"], new Set(["a"]))).toBe(0.5)
+	})
+
+	it("returns 0.333... when the third result is the first relevant", () => {
+		expect(computeMRR(["x", "y", "a"], new Set(["a"]))).toBeCloseTo(1 / 3)
+	})
+
+	it("returns 0 when no relevant entity is found", () => {
+		expect(computeMRR(["x", "y", "z"], new Set(["a"]))).toBe(0)
+	})
+
+	it("handles empty retrieved list", () => {
+		expect(computeMRR([], new Set(["a"]))).toBe(0)
+	})
+})
+
+describe("computeNoiseRatio", () => {
+	it("returns 0 when all entities were retrieved at least once", () => {
+		expect(computeNoiseRatio(["a", "b", "c"], new Set(["a", "b", "c"]))).toBe(0)
+	})
+
+	it("returns 1 when no entity was ever retrieved", () => {
+		expect(computeNoiseRatio(["a", "b", "c"], new Set())).toBe(1)
+	})
+
+	it("returns 0.5 when half were never retrieved", () => {
+		expect(computeNoiseRatio(["a", "b", "c", "d"], new Set(["a", "b"]))).toBe(0.5)
+	})
+
+	it("returns 0 when entity list is empty", () => {
+		expect(computeNoiseRatio([], new Set())).toBe(0)
+	})
+})
+
+describe("computeGcEffectiveness", () => {
+	it("returns -1 when no noise entities before GC", () => {
+		expect(computeGcEffectiveness([], ["a", "b"])).toBe(-1)
+	})
+
+	it("returns 1.0 when all noise entities were removed", () => {
+		expect(computeGcEffectiveness(["x", "y"], ["a", "b"])).toBe(1)
+	})
+
+	it("returns 0.5 when half of noise entities were removed", () => {
+		expect(computeGcEffectiveness(["x", "y"], ["x", "a", "b"])).toBe(0.5)
+	})
+
+	it("returns 0 when no noise entities were removed", () => {
+		expect(computeGcEffectiveness(["x", "y"], ["x", "y", "a"])).toBe(0)
+	})
+})
+
+describe("computeSalienceDrift", () => {
+	it("returns -1 with fewer than 2 snapshots", () => {
+		expect(computeSalienceDrift([[1, 2, 3]])).toBe(-1)
+		expect(computeSalienceDrift([])).toBe(-1)
+	})
+
+	it("returns 0 when all scores are identical across cycles", () => {
+		expect(computeSalienceDrift([[1, 1, 1], [1, 1, 1]])).toBe(0)
+	})
+
+	it("returns a positive value when scores vary", () => {
+		const drift = computeSalienceDrift([[0, 1, 2], [3, 4, 5]])
+		expect(drift).toBeGreaterThan(0)
+	})
+
+	it("returns -1 when snapshots exist but all are empty", () => {
+		expect(computeSalienceDrift([[], []])).toBe(-1)
+	})
+})
diff --git a/packages/zosma-mem/src/evals/__tests__/mock-adapter.ts b/packages/zosma-mem/src/evals/__tests__/mock-adapter.ts
new file mode 100644
index 0000000..7a60f15
--- /dev/null
+++ b/packages/zosma-mem/src/evals/__tests__/mock-adapter.ts
@@ -0,0 +1,102 @@
+/**
+ * Trivial in-memory adapter used to test the eval framework itself.
+ *
+ * NOT for evaluating a real engine. This adapter implements the simplest
+ * possible retrieval strategy (tag overlap count) to verify that the
+ * framework's metric computation, runner lifecycle, and scenario logic
+ * are all correct without needing a real engine.
+ *
+ * Behaviour:
+ * - `ingest`: stores the event. If the same ID is ingested again, the latest
+ *   version replaces the previous one (last-write-wins).
+ * - `retrieve`: scores entities by the number of tag matches with the query.
+ *   On tie, newer timestamps rank higher.
+ * - `recordUsage`: no-op (no reinforcement learning).
+ * - `gc`: removes entities whose tags contain "stale" (simulates simple decay).
+ *   Also supports time-based removal: entities older than 7 days from clock.
+ * - `advanceTime`: delegates to the injected DeterministicClock.
+ * - `listEntities`: returns all stored IDs.
+ * - `setup` / `teardown`: clears internal state.
+ */
+
+import type {
+	AdapterSetupOpts,
+	DeterministicClock,
+	GcResult,
+	MemoryAdapter,
+	MemoryEvent,
+	RetrievedEntity,
+	RetrieveQuery,
+} from "../types.js"
+
+interface StoredEntity {
+	event: MemoryEvent
+	usageCount: number
+	ignored: number
+}
+
+const GC_MAX_AGE_MS = 7 * 24 * 60 * 60 * 1_000 // 7 days
+
+export const createMockAdapter = (): MemoryAdapter => {
+	const store = new Map<string, StoredEntity>()
+	let clock: DeterministicClock = { now: () => Date.now(), advance: () => undefined }
+
+	const setup = async (opts: AdapterSetupOpts): Promise<void> => {
+		store.clear()
+		clock = opts.clock
+	}
+
+	const ingest = async (event: MemoryEvent): Promise<void> => {
+		store.set(event.id, { event, usageCount: 0, ignored: 0 })
+	}
+
+	const retrieve = async (query: RetrieveQuery, topK: number): Promise<RetrievedEntity[]> => {
+		const queryTags = new Set([
+			...(query.tags ?? []).map((t) => t.toLowerCase()),
+			...query.text.toLowerCase().split(/\s+/),
+		])
+
+		const scored = Array.from(store.values()).map(({ event }) => {
+			const tagScore = event.tags.filter((t) => queryTags.has(t.toLowerCase())).length
+			return { id: event.id, content: event.content, score: tagScore, tags: event.tags, timestamp: event.timestamp }
+		})
+
+		// Sort by score desc, then timestamp desc (recency tiebreak).
+		scored.sort((a, b) => b.score - a.score || b.timestamp - a.timestamp)
+
+		return scored.slice(0, topK).map(({ id, content, score, tags }) => ({ id, content, score, tags }))
+	}
+
+	const recordUsage = async (entityId: string): Promise<void> => {
+		const entry = store.get(entityId)
+		if (entry) store.set(entityId, { ...entry, usageCount: entry.usageCount + 1 })
+	}
+
+	const gc = async (): Promise<GcResult> => {
+		const now = clock.now()
+		const toRemove: string[] = []
+
+		for (const [id, { event }] of store) {
+			const age = now - event.timestamp
+			if (age > GC_MAX_AGE_MS || event.tags.includes("stale")) {
+				toRemove.push(id)
+			}
+		}
+
+		for (const id of toRemove) store.delete(id)
+
+		return { removedCount: toRemove.length, archivedCount: 0, consolidatedCount: 0 }
+	}
+
+	const advanceTime = async (ms: number): Promise<void> => {
+		clock.advance(ms)
+	}
+
+	const listEntities = async (): Promise<string[]> => Array.from(store.keys())
+
+	const teardown = async (): Promise<void> => {
+		store.clear()
+	}
+
+	return { setup, ingest, retrieve, recordUsage, gc, advanceTime, listEntities, teardown }
+}
diff --git a/packages/zosma-mem/src/evals/__tests__/report.test.ts b/packages/zosma-mem/src/evals/__tests__/report.test.ts
new file mode 100644
index 0000000..152b608
--- /dev/null
+++ b/packages/zosma-mem/src/evals/__tests__/report.test.ts
@@ -0,0 +1,78 @@
+import { describe, expect, it } from "vitest"
+import { renderMarkdownReport } from "../report.js"
+import type { EvalReport } from "../types.js"
+
+const makeReport = (overrides?: Partial<EvalReport>): EvalReport => ({
+	timestamp: new Date("2026-04-07T12:00:00.000Z").getTime(),
+	results: [
+		{
+			scenario: "Cold start",
+			metrics: { precisionAtK: 1, recallAtK: 1, mrr: 1, noiseRatio: 0.1, gcEffectiveness: -1, salienceDrift: -1 },
+			passed: true,
+			details: "",
+		},
+		{
+			scenario: "Signal dilution",
+			metrics: { precisionAtK: 0.4, recallAtK: 0.8, mrr: 0.5, noiseRatio: 0.9, gcEffectiveness: -1, salienceDrift: -1 },
+			passed: false,
+			details: "precisionAtK: 0.400 < threshold 0.600",
+		},
+	],
+	summary: { total: 2, passed: 1, failed: 1, avgPrecision: 0.7, avgRecall: 0.9, avgMrr: 0.75 },
+	...overrides,
+})
+
+describe("renderMarkdownReport", () => {
+	it("includes a heading with the timestamp", () => {
+		const output = renderMarkdownReport(makeReport())
+		expect(output).toContain("## zosma-mem Eval Report -- 2026-04-07T12:00:00.000Z")
+	})
+
+	it("includes all scenario names", () => {
+		const output = renderMarkdownReport(makeReport())
+		expect(output).toContain("Cold start")
+		expect(output).toContain("Signal dilution")
+	})
+
+	it("marks passing scenarios with 'yes'", () => {
+		const output = renderMarkdownReport(makeReport())
+		expect(output).toContain("yes")
+	})
+
+	it("marks failing scenarios with 'NO'", () => {
+		const output = renderMarkdownReport(makeReport())
+		expect(output).toContain("NO")
+	})
+
+	it("includes the summary line", () => {
+		const output = renderMarkdownReport(makeReport())
+		expect(output).toContain("Summary: 1/2 passed")
+	})
+
+	it("includes a failures section when there are failures", () => {
+		const output = renderMarkdownReport(makeReport())
+		expect(output).toContain("### Failures")
+		expect(output).toContain("precisionAtK: 0.400 < threshold 0.600")
+	})
+
+	it("does not include failures section when all pass", () => {
+		const allPass = makeReport({
+			results: [
+				{
+					scenario: "Cold start",
+					metrics: { precisionAtK: 1, recallAtK: 1, mrr: 1, noiseRatio: 0, gcEffectiveness: -1, salienceDrift: -1 },
+					passed: true,
+					details: "",
+				},
+			],
+			summary: { total: 1, passed: 1, failed: 0, avgPrecision: 1, avgRecall: 1, avgMrr: 1 },
+		})
+		const output = renderMarkdownReport(allPass)
+		expect(output).not.toContain("### Failures")
+	})
+
+	it("renders N/A values as ' -- '", () => {
+		const output = renderMarkdownReport(makeReport())
+		expect(output).toContain(" -- ")
+	})
+})
diff --git a/packages/zosma-mem/src/evals/__tests__/runner.test.ts b/packages/zosma-mem/src/evals/__tests__/runner.test.ts
new file mode 100644
index 0000000..4877b05
--- /dev/null
+++ b/packages/zosma-mem/src/evals/__tests__/runner.test.ts
@@ -0,0 +1,96 @@
+import { describe, expect, it, vi } from "vitest"
+import { runEvals } from "../runner.js"
+import type { ScenarioDefinition } from "../types.js"
+import { createMockAdapter } from "./mock-adapter.js"
+
+const makePassingScenario = (name: string): ScenarioDefinition => ({
+	name,
+	description: `Always-passing scenario: ${name}`,
+	run: async (_adapter, _clock) => ({
+		metrics: { precisionAtK: 1, recallAtK: 1, mrr: 1, noiseRatio: 0, gcEffectiveness: -1, salienceDrift: -1 },
+		passed: true,
+		details: "",
+	}),
+})
+
+const makeFailingScenario = (name: string): ScenarioDefinition => ({
+	name,
+	description: `Always-failing scenario: ${name}`,
+	run: async (_adapter, _clock) => ({
+		metrics: { precisionAtK: 0, recallAtK: 0, mrr: 0, noiseRatio: 1, gcEffectiveness: -1, salienceDrift: -1 },
+		passed: false,
+		details: "always fails",
+	}),
+})
+
+describe("runEvals", () => {
+	it("returns a report with the correct scenario count", async () => {
+		const adapter = createMockAdapter()
+		const report = await runEvals({
+			adapter,
+			scenarios: [makePassingScenario("A"), makePassingScenario("B")],
+		})
+		expect(report.summary.total).toBe(2)
+	})
+
+	it("counts passed scenarios correctly", async () => {
+		const adapter = createMockAdapter()
+		const report = await runEvals({
+			adapter,
+			scenarios: [makePassingScenario("A"), makeFailingScenario("B"), makePassingScenario("C")],
+		})
+		expect(report.summary.passed).toBe(2)
+		expect(report.summary.failed).toBe(1)
+	})
+
+	it("calls onScenarioStart and onScenarioEnd for each scenario", async () => {
+		const adapter = createMockAdapter()
+		const started: string[] = []
+		const ended: string[] = []
+
+		await runEvals({
+			adapter,
+			scenarios: [makePassingScenario("X"), makePassingScenario("Y")],
+			onScenarioStart: (name) => started.push(name),
+			onScenarioEnd: (name) => ended.push(name),
+		})
+
+		expect(started).toEqual(["X", "Y"])
+		expect(ended).toEqual(["X", "Y"])
+	})
+
+	it("calls teardown even when the scenario throws", async () => {
+		const adapter = createMockAdapter()
+		const teardownSpy = vi.spyOn(adapter, "teardown")
+
+		const throwingScenario: ScenarioDefinition = {
+			name: "Thrower",
+			description: "Throws during run",
+			run: async () => {
+				throw new Error("intentional scenario error")
+			},
+		}
+
+		const report = await runEvals({ adapter, scenarios: [throwingScenario] })
+
+		expect(teardownSpy).toHaveBeenCalledTimes(1)
+		expect(report.summary.failed).toBe(1)
+		expect(report.results[0].details).toContain("intentional scenario error")
+	})
+
+	it("computes correct averages in summary", async () => {
+		const adapter = createMockAdapter()
+		const report = await runEvals({
+			adapter,
+			scenarios: [makePassingScenario("A"), makeFailingScenario("B")],
+		})
+		expect(report.summary.avgPrecision).toBe(0.5)
+		expect(report.summary.avgMrr).toBe(0.5)
+	})
+
+	it("includes a unix timestamp in the report", async () => {
+		const adapter = createMockAdapter()
+		const report = await runEvals({ adapter, scenarios: [makePassingScenario("A")] })
+		expect(report.timestamp).toBeGreaterThan(0)
+	})
+})
diff --git a/packages/zosma-mem/src/evals/__tests__/scenarios.test.ts b/packages/zosma-mem/src/evals/__tests__/scenarios.test.ts
new file mode 100644
index 0000000..cac64bf
--- /dev/null
+++ b/packages/zosma-mem/src/evals/__tests__/scenarios.test.ts
@@ -0,0 +1,121 @@
+/**
+ * Integration tests: run all 7 built-in scenarios against the mock adapter.
+ *
+ * The mock adapter uses simple tag-overlap scoring. Not all scenarios can pass
+ * at the highest possible threshold with a naive engine -- but all 7 must at
+ * minimum complete without errors, produce valid metrics, and the scenarios
+ * that the mock adapter is capable of passing must pass.
+ *
+ * Scenarios that require reinforcement or co-access (which the mock does not
+ * implement) are tested for structural correctness only (valid metrics, no throws).
+ */
+
+import { describe, expect, it } from "vitest"
+import { createClock } from "../utils/time.js"
+import { createMockAdapter } from "./mock-adapter.js"
+import { coldStartScenario } from "../scenarios/cold-start.js"
+import { repeatedPatternScenario } from "../scenarios/repeated-pattern.js"
+import { signalDilutionScenario } from "../scenarios/signal-dilution.js"
+import { staleMemoryScenario } from "../scenarios/stale-memory.js"
+import { conflictingUpdatesScenario } from "../scenarios/conflicting-updates.js"
+import { coAccessClusterScenario } from "../scenarios/co-access-cluster.js"
+import { crossContextScenario } from "../scenarios/cross-context.js"
+import type { ScenarioResult } from "../types.js"
+import { tmpdir } from "node:os"
+import { mkdtemp, rm } from "node:fs/promises"
+import { join } from "node:path"
+
+const runScenario = async (
+	scenario: { run: (adapter: ReturnType<typeof createMockAdapter>, clock: ReturnType<typeof createClock>) => Promise<ScenarioResult> },
+): Promise<ScenarioResult> => {
+	const adapter = createMockAdapter()
+	const clock = createClock()
+	const workDir = await mkdtemp(join(tmpdir(), "zosma-mem-test-"))
+	try {
+		await adapter.setup({ workDir, clock })
+		return await scenario.run(adapter, clock)
+	} finally {
+		await adapter.teardown()
+		await rm(workDir, { recursive: true, force: true })
+	}
+}
+
+const assertValidMetrics = (result: ScenarioResult) => {
+	const { metrics } = result
+	expect(metrics.precisionAtK).toBeGreaterThanOrEqual(0)
+	expect(metrics.precisionAtK).toBeLessThanOrEqual(1)
+	expect(metrics.recallAtK).toBeGreaterThanOrEqual(0)
+	expect(metrics.recallAtK).toBeLessThanOrEqual(1)
+	expect(metrics.mrr).toBeGreaterThanOrEqual(0)
+	expect(metrics.mrr).toBeLessThanOrEqual(1)
+	expect(metrics.noiseRatio).toBeGreaterThanOrEqual(0)
+	expect(metrics.noiseRatio).toBeLessThanOrEqual(1)
+	// gcEffectiveness and salienceDrift may be -1 (N/A)
+	expect(metrics.gcEffectiveness).toBeGreaterThanOrEqual(-1)
+	expect(metrics.salienceDrift).toBeGreaterThanOrEqual(-1)
+}
+
+describe("Scenario 1: Cold start", () => {
+	it("produces valid metrics and passes with mock adapter", async () => {
+		const result = await runScenario(coldStartScenario)
+		assertValidMetrics(result)
+		// Mock adapter tag scoring is sufficient for cold-start (clear tag match).
+		expect(result.passed).toBe(true)
+	})
+})
+
+describe("Scenario 2: Repeated pattern", () => {
+	it("produces valid metrics (mock does not reinforce, pass is not required)", async () => {
+		const result = await runScenario(repeatedPatternScenario)
+		assertValidMetrics(result)
+		// The recurring entity has the most matching tags so it should still rank first.
+		expect(result.metrics.mrr).toBeGreaterThan(0)
+	})
+})
+
+describe("Scenario 3: Signal dilution", () => {
+	it("produces valid metrics and passes with mock adapter", async () => {
+		const result = await runScenario(signalDilutionScenario)
+		assertValidMetrics(result)
+		// Mock uses tag overlap -- high-value events have exact tag matches.
+		expect(result.passed).toBe(true)
+	})
+})
+
+describe("Scenario 4: Stale memory", () => {
+	it("produces valid metrics and the fresh entity ranks first", async () => {
+		const result = await runScenario(staleMemoryScenario)
+		assertValidMetrics(result)
+		// Mock GC removes entities older than 7 days; fresh entity survives.
+		expect(result.metrics.mrr).toBe(1)
+	})
+})
+
+describe("Scenario 5: Conflicting updates", () => {
+	it("produces valid metrics with most recent content surfaced", async () => {
+		const result = await runScenario(conflictingUpdatesScenario)
+		assertValidMetrics(result)
+		// Mock last-write-wins: entity is replaced on re-ingest, latest content wins.
+		expect(result.metrics.mrr).toBe(1)
+	})
+})
+
+describe("Scenario 6: Co-access cluster", () => {
+	it("produces valid metrics (co-access boost not implemented in mock, partial pass)", async () => {
+		const result = await runScenario(coAccessClusterScenario)
+		assertValidMetrics(result)
+		// auth-flow has direct tag overlap and will rank 1st.
+		// retry-logic and timeout-handling share some auth tags so may appear.
+		expect(result.metrics.mrr).toBe(1)
+	})
+})
+
+describe("Scenario 7: Cross-context", () => {
+	it("produces valid metrics", async () => {
+		const result = await runScenario(crossContextScenario)
+		assertValidMetrics(result)
+		// Mock adapter ranks by tag overlap, so the auth entity should rank high
+		// for auth query and low for styling query.
+		expect(result.metrics.mrr).toBeGreaterThan(0)
+	})
+})
diff --git a/packages/zosma-mem/src/evals/cli/bin.ts b/packages/zosma-mem/src/evals/cli/bin.ts
new file mode 100644
index 0000000..4c8ab1d
--- /dev/null
+++ b/packages/zosma-mem/src/evals/cli/bin.ts
@@ -0,0 +1,133 @@
+#!/usr/bin/env node
+/**
+ * zosma-mem-eval CLI entry point.
+ *
+ * Usage:
+ *   zosma-mem-eval --adapter ./my-adapter.js [options]
+ *
+ * The adapter module must export a default or named `adapter` that satisfies
+ * the MemoryAdapter interface.
+ */
+
+import { writeFile } from "node:fs/promises"
+import { resolve } from "node:path"
+import { render } from "ink"
+import { Command } from "commander"
+import chalk from "chalk"
+import { createElement } from "react"
+import { builtInScenarios } from "../scenarios/index.js"
+import { renderMarkdownReport } from "../report.js"
+import { runEvals } from "../runner.js"
+import type { EvalReport, MemoryAdapter } from "../types.js"
+import { App } from "./components/App.js"
+
+const program = new Command()
+
+program
+	.name("zosma-mem-eval")
+	.description("Run the zosma-mem evaluation suite against a memory engine adapter.")
+	.requiredOption("--adapter <path>", "Path to a JS/TS module exporting a MemoryAdapter")
+	.option("--scenarios <names>", "Comma-separated scenario names to run (default: all)")
+	.option("--k <number>", "Top-K for precision/recall (default: 5)", "5")
+	.option("--ci", "Disable interactive Ink UI, output plain markdown to stdout")
+	.option("--json", "Output raw JSON report to stdout")
+	.option("--out <path>", "Write markdown report to a file")
+	.parse(process.argv)
+
+const opts = program.opts<{
+	adapter: string
+	scenarios?: string
+	k: string
+	ci?: boolean
+	json?: boolean
+	out?: string
+}>()
+
+const loadAdapter = async (adapterPath: string): Promise<MemoryAdapter> => {
+	const absolutePath = resolve(adapterPath)
+	const mod = await import(absolutePath) as Record<string, unknown>
+	const adapter = (mod.default ?? mod.adapter) as MemoryAdapter | undefined
+
+	if (!adapter || typeof adapter.setup !== "function") {
+		console.error(
+			chalk.red(
+				`Error: adapter module at "${adapterPath}" must export a default or named "adapter" that satisfies the MemoryAdapter interface.`,
+			),
+		)
+		process.exit(1)
+	}
+
+	return adapter
+}
+
+const filterScenarios = (names?: string) => {
+	if (!names) return builtInScenarios
+	const requested = names.split(",").map((n) => n.trim().toLowerCase())
+	return builtInScenarios.filter((s) => requested.includes(s.name.toLowerCase()))
+}
+
+const writeReport = async (report: EvalReport, outPath: string) => {
+	const markdown = renderMarkdownReport(report)
+	await writeFile(outPath, markdown, "utf8")
+	console.log(chalk.green(`Report written to ${outPath}`))
+}
+
+const main = async () => {
+	const adapter = await loadAdapter(opts.adapter)
+	const scenarios = filterScenarios(opts.scenarios)
+	const k = Number.parseInt(opts.k, 10)
+	const isCi = Boolean(opts.ci) || !process.stdout.isTTY
+
+	if (isCi || opts.json) {
+		// Plain mode: no Ink, just run and print.
+		const report = await runEvals({
+			adapter,
+			scenarios,
+			k,
+			onScenarioStart: (name) => {
+				if (!opts.json) process.stdout.write(`  running: ${name}\n`)
+			},
+			onScenarioEnd: (name, result) => {
+				if (!opts.json) {
+					const icon = result.passed ? chalk.green("✓") : chalk.red("✗")
+					process.stdout.write(`  ${icon} ${name}\n`)
+				}
+			},
+		})
+
+		if (opts.json) {
+			process.stdout.write(`${JSON.stringify(report, null, 2)}\n`)
+		} else {
+			process.stdout.write(`\n${renderMarkdownReport(report)}\n`)
+		}
+
+		if (opts.out) await writeReport(report, opts.out)
+
+		process.exit(report.summary.failed > 0 ? 1 : 0)
+	} else {
+		// Interactive Ink mode.
+		let finalReport: EvalReport | null = null
+
+		const { waitUntilExit } = render(
+			createElement(App, {
+				adapter,
+				scenarios,
+				k,
+				onComplete: (r: EvalReport) => {
+					finalReport = r
+				},
+			}),
+		)
+
+		await waitUntilExit()
+
+		if (opts.out && finalReport) await writeReport(finalReport, opts.out)
+
+		process.exit(finalReport && (finalReport as EvalReport).summary.failed > 0 ? 1 : 0)
+	}
+}
+
+main().catch((err) => {
+	console.error(chalk.red("Fatal:"), err instanceof Error ? err.message : err)
+	process.exit(1)
+})
diff --git a/packages/zosma-mem/src/evals/cli/components/App.tsx b/packages/zosma-mem/src/evals/cli/components/App.tsx
new file mode 100644
index 0000000..6d95423
--- /dev/null
+++ b/packages/zosma-mem/src/evals/cli/components/App.tsx
@@ -0,0 +1,98 @@
+import { Box, Text, useApp } from "ink"
+import type React from "react"
+import { useEffect, useRef, useState } from "react"
+import { runEvals } from "../../runner.js"
+import type { EvalReport, MemoryAdapter, ScenarioDefinition, ScenarioResult } from "../../types.js"
+import { ErrorDisplay } from "./ErrorDisplay.js"
+import { ScenarioRow } from "./ScenarioRow.js"
+import { SummaryTable } from "./SummaryTable.js"
+
+type ScenarioStatus = "pending" | "running" | "done"
+
+interface ScenarioState {
+	name: string
+	status: ScenarioStatus
+	result?: ScenarioResult
+}
+
+interface Props {
+	adapter: MemoryAdapter
+	scenarios?: ScenarioDefinition[]
+	k?: number
+	onComplete: (report: EvalReport) => void
+}
+
+export const App: React.FC<Props> = ({ adapter, scenarios, k, onComplete }) => {
+	const { exit } = useApp()
+	const [states, setStates] = useState<ScenarioState[]>([])
+	const [report, setReport] = useState<EvalReport | null>(null)
+	const [error, setError] = useState<string | null>(null)
+
+	// Capture props in a ref so the effect dependency array stays stable.
+	// The CLI renders once and never re-renders with different props.
+	const optsRef = useRef({ adapter, scenarios, k, onComplete, exit })
+
+	useEffect(() => {
+		const { adapter: a, scenarios: sc, k: topK, onComplete: done, exit: quit } = optsRef.current
+
+		const run = async () => {
+			try {
+				const result = await runEvals({
+					adapter: a,
+					scenarios: sc,
+					k: topK,
+					onScenarioStart: (name) => {
+						setStates((prev) => {
+							const next = [...prev]
+							const idx = next.findIndex((s) => s.name === name)
+							if (idx >= 0) {
+								next[idx] = { ...next[idx], status: "running" }
+							} else {
+								next.push({ name, status: "running" })
+							}
+							return next
+						})
+					},
+					onScenarioEnd: (name, scenarioResult) => {
+						setStates((prev) => {
+							const next = [...prev]
+							const idx = next.findIndex((s) => s.name === name)
+							if (idx >= 0) {
+								next[idx] = { name, status: "done", result: scenarioResult }
+							}
+							return next
+						})
+					},
+				})
+
+				setReport(result)
+				done(result)
+			} catch (err) {
+				setError(err instanceof Error ? err.message : String(err))
+			} finally {
+				quit()
+			}
+		}
+
+		// Initialise state with pending entries before running.
+		const scenarioList = sc ?? []
+		setStates(scenarioList.map((s) => ({ name: s.name, status: "pending" })))
+		run()
+	}, [])
+
+	if (error) {
+		return <ErrorDisplay message={error} />
+	}
+
+	return (
+		<Box flexDirection="column" padding={1}>
+			<Text bold>zosma-mem eval</Text>
+			<Box flexDirection="column" marginTop={1}>
+				{states.map((s) => (
+					<ScenarioRow key={s.name} name={s.name} status={s.status} result={s.result} />
+				))}
+			</Box>
+			{report ? <SummaryTable report={report} /> : null}
+		</Box>
+	)
+}
diff --git a/packages/zosma-mem/src/evals/cli/components/ErrorDisplay.tsx b/packages/zosma-mem/src/evals/cli/components/ErrorDisplay.tsx
new file mode 100644
index 0000000..25d385b
--- /dev/null
+++ b/packages/zosma-mem/src/evals/cli/components/ErrorDisplay.tsx
@@ -0,0 +1,15 @@
+import { Box, Text } from "ink"
+import type React from "react"
+
+interface Props {
+	message: string
+}
+
+export const ErrorDisplay: React.FC<Props> = ({ message }) => (
+	<Box flexDirection="column" marginTop={1} borderStyle="round" borderColor="red" paddingX={1}>
+		<Text color="red" bold>
+			Error
+		</Text>
+		<Text>{message}</Text>
+	</Box>
+)
diff --git a/packages/zosma-mem/src/evals/cli/components/ScenarioRow.tsx b/packages/zosma-mem/src/evals/cli/components/ScenarioRow.tsx
new file mode 100644
index 0000000..460adc2
--- /dev/null
+++ b/packages/zosma-mem/src/evals/cli/components/ScenarioRow.tsx
@@ -0,0 +1,51 @@
+import { Text } from "ink"
+import Spinner from "ink-spinner"
+import type React from "react"
+import type { ScenarioResult } from "../../types.js"
+
+interface Props {
+	name: string
+	status: "pending" | "running" | "done"
+	result?: ScenarioResult
+}
+
+export const ScenarioRow: React.FC<Props> = ({ name, status, result }) => {
+	if (status === "pending") {
+		return (
+			<Text>
+				<Text color="gray">{"  "}</Text>
+				<Text dimColor>{name}</Text>
+			</Text>
+		)
+	}
+
+	if (status === "running") {
+		return (
+			<Text>
+				<Text color="cyan">
+					<Spinner type="dots" />
+				</Text>
+				<Text>{" "}</Text>
+				<Text>{name}</Text>
+			</Text>
+		)
+	}
+
+	const icon = result?.passed ? "✓" : "✗"
+	const color = result?.passed ? "green" : "red"
+	const p = result?.metrics.precisionAtK.toFixed(3) ?? "-"
+	const r = result?.metrics.recallAtK.toFixed(3) ?? "-"
+	const m = result?.metrics.mrr.toFixed(3) ?? "-"
+
+	return (
+		<Text>
+			<Text color={color}>{icon}</Text>
+			<Text>{" "}</Text>
+			<Text>{name.padEnd(30)}</Text>
+			<Text dimColor>{`P@K:${p}  R@K:${r}  MRR:${m}`}</Text>
+			{!result?.passed && result?.details ? (
+				<Text color="red">{`  -- ${result.details}`}</Text>
+			) : null}
+		</Text>
+	)
+}
diff --git a/packages/zosma-mem/src/evals/cli/components/SummaryTable.tsx b/packages/zosma-mem/src/evals/cli/components/SummaryTable.tsx
new file mode 100644
index 0000000..dd9c3fe
--- /dev/null
+++ b/packages/zosma-mem/src/evals/cli/components/SummaryTable.tsx
@@ -0,0 +1,32 @@
+import { Box, Text } from "ink"
+import type React from "react"
+import type { EvalReport } from "../../types.js"
+
+interface Props {
+	report: EvalReport
+}
+
+export const SummaryTable: React.FC<Props> = ({ report }) => {
+	const { summary } = report
+	const allPassed = summary.failed === 0
+
+	return (
+		<Box flexDirection="column" marginTop={1}>
+			<Text bold>Summary</Text>
+			<Text>
+				{"  Scenarios: "}
+				<Text color={allPassed ? "green" : "red"} bold>
+					{`${summary.passed}/${summary.total} passed`}
+				</Text>
+			</Text>
+			<Text>
+				{"  Avg P@K: "}
+				<Text bold>{summary.avgPrecision.toFixed(3)}</Text>
+				{"  Avg R@K: "}
+				<Text bold>{summary.avgRecall.toFixed(3)}</Text>
+				{"  Avg MRR: "}
+				<Text bold>{summary.avgMrr.toFixed(3)}</Text>
+			</Text>
+		</Box>
+	)
+}
diff --git a/packages/zosma-mem/src/evals/cli/simple-eval.ts b/packages/zosma-mem/src/evals/cli/simple-eval.ts
new file mode 100644
index 0000000..36d3b67
--- /dev/null
+++ b/packages/zosma-mem/src/evals/cli/simple-eval.ts
@@ -0,0 +1,201 @@
+#!/usr/bin/env node
+
+/**
+ * zosma-mem - Zero-config memory evaluation
+ *
+ * Just run it - it'll find and evaluate your memory system automatically.
+ */
+
+import { existsSync, readFileSync } from "node:fs"
+import { join } from "node:path"
+import { builtInScenarios } from "../scenarios/index.js"
+import { runEvals } from "../runner.js"
+import { renderMarkdownReport } from "../report.js"
+import { MemoryAdapter, MemoryEvent, DeterministicClock } from "../types.js"
+
+interface MemoryInfo {
+  type: "openzosma" | "file"
+  path: string
+}
+
+interface StoredMemoryEvent extends MemoryEvent {
+  usageCount: number
+  lastRetrieved: number
+}
+
+const detectMemory = (): MemoryInfo | null => {
+  const cwd = process.cwd()
+
+  // Check for OpenZosma memory
+  const openzosmaPath = join(cwd, "packages/gateway/workspace/agents/default/memory/MEMORY.md")
+  if (existsSync(openzosmaPath)) {
+    return { type: "openzosma", path: openzosmaPath }
+  }
+
+  // Check for generic memory files
+  const memoryFiles = ["MEMORY.md", "memory.md", ".memory.md"]
+  for (const file of memoryFiles) {
+    const path = join(cwd, file)
+    if (existsSync(path)) {
+      return { type: "file", path }
+    }
+  }
+
+  return null
+}
+
+const createMemoryAdapter = (memoryInfo: MemoryInfo): MemoryAdapter => {
+  const events = new Map<string, StoredMemoryEvent>()
+  let clock: DeterministicClock = { now: () => Date.now(), advance: () => {} }
+
+  const loadMemory = () => {
+    if (memoryInfo.type === "openzosma") {
+      // Parse OpenZosma format: <!-- timestamp [hash] -->\ncontent
+      const content = readFileSync(memoryInfo.path, "utf-8")
+      const lines = content.split("\n")
+      let currentEvent: Partial<MemoryEvent> | null = null
+
+      for (const line of lines) {
+        const match = line.match(/^<!-- (\d+) \[([a-f0-9]+)\] -->$/)
+        if (match) {
+          if (currentEvent && currentEvent.id) {
+            events.set(currentEvent.id, { ...currentEvent, usageCount: 0, lastRetrieved: 0 } as StoredMemoryEvent)
+          }
+          const [, ts, id] = match
+          currentEvent = {
+            id,
+            type: "preference",
+            content: "",
+            tags: ["user", "memory"],
+            timestamp: parseInt(ts)
+          }
+        } else if (currentEvent && line.trim()) {
+          currentEvent.content += line + "\n"
+        }
+      }
+      if (currentEvent && currentEvent.id) {
+        events.set(currentEvent.id, { ...currentEvent, usageCount: 0, lastRetrieved: 0 } as StoredMemoryEvent)
+      }
+    } else {
+      // Simple file format
+      const content = readFileSync(memoryInfo.path, "utf-8")
+      content.split("\n").forEach((line, i) => {
+        if (line.trim()) {
+          events.set(`entry-${i}`, {
+            id: `entry-${i}`,
+            type: "note",
+            content: line.trim(),
+            tags: [],
+            timestamp: Date.now() - (i * 1000),
+            usageCount: 0,
+            lastRetrieved: 0
+          })
+        }
+      })
+    }
+  }
+
+  return {
+    setup: async (opts) => {
+      clock = opts.clock
+      loadMemory()
+    },
+
+    ingest: async (event: MemoryEvent) => {
+      events.set(event.id, { ...event, usageCount: 0, lastRetrieved: 0 })
+    },
+
+    retrieve: async (query, topK) => {
+      const queryWords = new Set(query.text.toLowerCase().split(/\s+/))
+      const queryTags = new Set(query.tags || [])
+
+      const scored = Array.from(events.values()).map((stored) => {
+        let score = 0
+
+        // Tag matching
+        const tagMatches = stored.tags.filter(tag => queryTags.has(tag.toLowerCase())).length
+        score += tagMatches * 2
+
+        // Content matching
+        const contentWords = new Set(stored.content.toLowerCase().split(/\s+/))
+        const wordMatches = Array.from(queryWords).filter(word => contentWords.has(word)).length
+        score += wordMatches
+
+        // Recency boost
+        const ageHours = (clock.now() - stored.timestamp) / (1000 * 60 * 60)
+        score += Math.max(0, 1 - ageHours / 24) * 0.5
+
+        // Usage boost
+        score += stored.usageCount * 0.1
+
+        return {
+          id: stored.id,
+          content: stored.content.trim(),
+          score: Math.max(0, score),
+          tags: stored.tags
+        }
+      })
+
+      scored.sort((a, b) => b.score - a.score)
+      const top = scored.slice(0, topK)
+
+      // Mark as retrieved
+      for (const item of top) {
+        const stored = events.get(item.id)
+        if (stored) stored.lastRetrieved = clock.now()
+      }
+
+      return top
+    },
+
+    recordUsage: async (entityId: string, signal) => {
+      const stored = events.get(entityId)
+      if (stored && signal === "used") {
+        stored.usageCount++
+      }
+    },
+
+    gc: async () => ({ removedCount: 0, archivedCount: 0, consolidatedCount: 0 }),
+
+    advanceTime: async (ms: number) => {
+      clock.advance(ms)
+    },
+
+    listEntities: async () => Array.from(events.keys()),
+
+    teardown: async () => {
+      events.clear()
+    }
+  }
+}
+
+const main = async (): Promise<void> => {
+  const memory = detectMemory()
+
+  if (!memory) {
+    console.log("❌ No memory system found!")
+    console.log("")
+    console.log("To use zosma-mem, create one of:")
+    console.log("• MEMORY.md (generic format)")
+    console.log("• packages/gateway/workspace/agents/default/memory/MEMORY.md (OpenZosma)")
+    console.log("")
+    console.log("Run from your project root.")
+    process.exit(1)
+  }
+
+  console.log(`✅ Found ${memory.type} memory at ${memory.path}`)
+
+  const adapter = createMemoryAdapter(memory)
+  const report = await runEvals({ adapter, scenarios: builtInScenarios, k: 5 })
+
+  console.log("")
+  console.log(renderMarkdownReport(report))
+
+  if (report.summary.passed === report.summary.total) {
+    console.log("🎉 All tests passed!")
+  } else {
+    console.log(`❌ ${report.summary.failed} tests failed`)
+  }
+}
+
+main().catch(console.error)
\ No newline at end of file
diff --git a/packages/zosma-mem/src/evals/index.ts b/packages/zosma-mem/src/evals/index.ts
new file mode 100644
index 0000000..7e55de8
--- /dev/null
+++ b/packages/zosma-mem/src/evals/index.ts
@@ -0,0 +1,56 @@
+/**
+ * Public API surface for zosma-mem/evals.
+ *
+ * Import via:
+ *   import { runEvals, builtInScenarios } from "zosma-mem/evals"
+ */
+
+// Runner
+export { runEvals } from "./runner.js"
+
+// Report
+export { renderMarkdownReport } from "./report.js"
+
+// Scenarios
+export {
+	builtInScenarios,
+	coldStartScenario,
+	repeatedPatternScenario,
+	signalDilutionScenario,
+	staleMemoryScenario,
+	conflictingUpdatesScenario,
+	coAccessClusterScenario,
+	crossContextScenario,
+} from "./scenarios/index.js"
+
+// Metrics (for custom scenario authors)
+export {
+	computePrecisionAtK,
+	computeRecallAtK,
+	computeMRR,
+	computeNoiseRatio,
+	computeGcEffectiveness,
+	computeSalienceDrift,
+} from "./metrics.js"
+
+// Fixtures and utilities (for custom scenario authors)
+export { createEvent, createQuery, createLowValueEvents, createHighValueEvents } from "./utils/fixtures.js"
+export { createClock, ONE_HOUR_MS, ONE_DAY_MS, ONE_WEEK_MS, THIRTY_DAYS_MS } from "./utils/time.js"
+export { checkMetric, checkAllMetrics, DEFAULT_THRESHOLDS } from "./utils/assertions.js"
+
+// Types
+export type {
+	MemoryAdapter,
+	MemoryEvent,
+	RetrieveQuery,
+	RetrievedEntity,
+	UsageSignal,
+	GcResult,
+	AdapterSetupOpts,
+	DeterministicClock,
+	EvalMetrics,
+	EvalReport,
+	ScenarioDefinition,
+	ScenarioResult,
+	RunnerOpts,
+} from "./types.js"
diff --git a/packages/zosma-mem/src/evals/metrics.ts b/packages/zosma-mem/src/evals/metrics.ts
new file mode 100644
index 0000000..63d36fd
--- /dev/null
+++ b/packages/zosma-mem/src/evals/metrics.ts
@@ -0,0 +1,121 @@
+/**
+ * Pure metric computation functions for zosma-mem/evals.
+ *
+ * All functions are stateless and side-effect-free. They accept raw arrays/sets
+ * of entity IDs and return a single numeric value. No engine types are imported.
+ */
+
+// ---------------------------------------------------------------------------
+// Standard information retrieval metrics
+// ---------------------------------------------------------------------------
+
+/**
+ * Precision@K: of the first K retrieved entities, what fraction is relevant?
+ *
+ * @param retrieved - Ordered list of retrieved entity IDs (most relevant first).
+ * @param relevant  - Set of all entity IDs that are considered relevant.
+ * @param k         - Cutoff rank.
+ * @returns Value in [0, 1]. Returns 0 when k === 0.
+ */
+export const computePrecisionAtK = (retrieved: readonly string[], relevant: ReadonlySet<string>, k: number): number => {
+	if (k === 0) return 0
+	const topK = retrieved.slice(0, k)
+	const hits = topK.filter((id) => relevant.has(id)).length
+	return hits / k
+}
+
+/**
+ * Recall@K: of all relevant entities, what fraction appeared in the top K?
+ *
+ * @param retrieved - Ordered list of retrieved entity IDs (most relevant first).
+ * @param relevant  - Set of all entity IDs that are considered relevant.
+ * @param k         - Cutoff rank.
+ * @returns Value in [0, 1]. Returns 1 when `relevant` is empty (vacuously true).
+ */
+export const computeRecallAtK = (retrieved: readonly string[], relevant: ReadonlySet<string>, k: number): number => {
+	if (relevant.size === 0) return 1
+	const topK = retrieved.slice(0, k)
+	const hits = topK.filter((id) => relevant.has(id)).length
+	return hits / relevant.size
+}
+
+/**
+ * Mean Reciprocal Rank: reciprocal of the rank of the first relevant result.
+ *
+ * Called "MRR" even though it is computed for a single query here; callers
+ * average across queries to get the true MRR.
+ *
+ * @param retrieved - Ordered list of retrieved entity IDs (most relevant first).
+ * @param relevant  - Set of all entity IDs that are considered relevant.
+ * @returns Value in (0, 1]. Returns 0 if no relevant entity appears in the list.
+ */
+export const computeMRR = (retrieved: readonly string[], relevant: ReadonlySet<string>): number => {
+	for (let i = 0; i < retrieved.length; i++) {
+		if (relevant.has(retrieved[i])) {
+			return 1 / (i + 1)
+		}
+	}
+	return 0
+}
+
+// ---------------------------------------------------------------------------
+// Memory-specific metrics
+// ---------------------------------------------------------------------------
+
+/**
+ * Noise ratio: fraction of stored entities never retrieved after ingestion.
+ *
+ * A high noise ratio means the engine is persisting lots of low-value entities
+ * that never surface. Useful for assessing ingestion threshold quality.
+ *
+ * @param allEntities   - All entity IDs currently persisted by the engine.
+ * @param everRetrieved - Set of entity IDs that appeared in at least one result set.
+ * @returns Value in [0, 1]. Returns 0 when `allEntities` is empty.
+ */
+export const computeNoiseRatio = (
+	allEntities: readonly string[],
+	everRetrieved: ReadonlySet<string>,
+): number => {
+	if (allEntities.length === 0) return 0
+	const noiseCount = allEntities.filter((id) => !everRetrieved.has(id)).length
+	return noiseCount / allEntities.length
+}
+
+/**
+ * GC effectiveness: fraction of noise entities removed after GC.
+ *
+ * @param noiseBeforeGc - Entity IDs that were noise (never retrieved) before GC.
+ * @param entitiesAfterGc - All entity IDs persisted after GC runs.
+ * @returns Value in [0, 1]. Returns -1 when `noiseBeforeGc` is empty (N/A).
+ */
+export const computeGcEffectiveness = (
+	noiseBeforeGc: readonly string[],
+	entitiesAfterGc: readonly string[],
+): number => {
+	if (noiseBeforeGc.length === 0) return -1
+	const afterSet = new Set(entitiesAfterGc)
+	const removed = noiseBeforeGc.filter((id) => !afterSet.has(id)).length
+	return removed / noiseBeforeGc.length
+}
+
+/**
+ * Salience drift: standard deviation of entity scores across GC cycles.
+ *
+ * A high drift value indicates the scoring function is unstable -- entities
+ * oscillate in relevance across cycles rather than converging.
+ *
+ * @param scoreSnapshots - Array of score arrays, one per GC cycle.
+ *                         Each inner array contains one score per entity.
+ * @returns Standard deviation across all scores. Returns -1 when fewer than
+ *          two cycles are provided (not enough data).
+ */
+export const computeSalienceDrift = (scoreSnapshots: ReadonlyArray<readonly number[]>): number => {
+	if (scoreSnapshots.length < 2) return -1
+
+	const allScores: number[] = scoreSnapshots.flat()
+	if (allScores.length === 0) return -1
+
+	const mean = allScores.reduce((sum, s) => sum + s, 0) / allScores.length
+	const variance = allScores.reduce((sum, s) => sum + (s - mean) ** 2, 0) / allScores.length
+	return Math.sqrt(variance)
+}
diff --git a/packages/zosma-mem/src/evals/report.ts b/packages/zosma-mem/src/evals/report.ts
new file mode 100644
index 0000000..71241e3
--- /dev/null
+++ b/packages/zosma-mem/src/evals/report.ts
@@ -0,0 +1,70 @@
+/**
+ * Markdown report renderer for zosma-mem/evals.
+ *
+ * Produces a CI-friendly markdown table from an EvalReport.
+ * No external dependencies -- pure string manipulation.
+ */
+
+import type { EvalReport } from "./types.js"
+
+const fmt = (n: number): string => {
+	if (n === -1) return " -- "
+	return n.toFixed(3)
+}
+
+const pad = (s: string, width: number): string => s.padEnd(width)
+
+/**
+ * Render an EvalReport as a markdown string suitable for CI logs, PR comments,
+ * or writing to a file with --out.
+ */
+export const renderMarkdownReport = (report: EvalReport): string => {
+	const date = new Date(report.timestamp).toISOString()
+
+	const headers = ["Scenario", "P@K", "R@K", "MRR", "Noise", "GC Eff", "Drift", "Pass"]
+	const rows = report.results.map((r) => [
+		r.scenario,
+		fmt(r.metrics.precisionAtK),
+		fmt(r.metrics.recallAtK),
+		fmt(r.metrics.mrr),
+		fmt(r.metrics.noiseRatio),
+		fmt(r.metrics.gcEffectiveness),
+		fmt(r.metrics.salienceDrift),
+		r.passed ? "yes" : "NO",
+	])
+
+	// Compute column widths.
+	const colWidths = headers.map((h, i) =>
+		Math.max(h.length, ...rows.map((r) => r[i].length)),
+	)
+
+	const header = `| ${headers.map((h, i) => pad(h, colWidths[i])).join(" | ")} |`
+	const divider = `| ${colWidths.map((w) => "-".repeat(w)).join(" | ")} |`
+	const body = rows
+		.map((row) => `| ${row.map((cell, i) => pad(cell, colWidths[i])).join(" | ")} |`)
+		.join("\n")
+
+	const failureDetails = report.results
+		.filter((r) => !r.passed && r.details)
+		.map((r) => `**${r.scenario}**: ${r.details}`)
+		.join("\n")
+
+	const lines: string[] = [
+		`## zosma-mem Eval Report -- ${date}`,
+		"",
+		header,
+		divider,
+		body,
+		"",
+		`Summary: ${report.summary.passed}/${report.summary.total} passed.` +
+			` Avg P@K: ${report.summary.avgPrecision.toFixed(3)},` +
+			` Avg R@K: ${report.summary.avgRecall.toFixed(3)},` +
+			` Avg MRR: ${report.summary.avgMrr.toFixed(3)}`,
+	]
+
+	if (failureDetails) {
+		lines.push("", "### Failures", "", failureDetails)
+	}
+
+	return lines.join("\n")
+}
diff --git a/packages/zosma-mem/src/evals/runner.ts b/packages/zosma-mem/src/evals/runner.ts
new file mode 100644
index 0000000..232c341
--- /dev/null
+++ b/packages/zosma-mem/src/evals/runner.ts
@@ -0,0 +1,128 @@
+/**
+ * Scenario runner for zosma-mem/evals.
+ *
+ * Orchestrates the full lifecycle for each scenario:
+ *   1. Create an isolated temp directory.
+ *   2. Instantiate a deterministic clock.
+ *   3. Call adapter.setup().
+ *   4. Execute the scenario.
+ *   5. Call adapter.teardown() (always, even on failure).
+ *   6. Remove the temp directory.
+ *   7. Aggregate results into an EvalReport.
+ */
+
+import { mkdtemp, rm } from "node:fs/promises"
+import { tmpdir } from "node:os"
+import { join } from "node:path"
+import { createClock } from "./utils/time.js"
+import { builtInScenarios } from "./scenarios/index.js"
+import type { EvalReport, RunnerOpts, ScenarioResult } from "./types.js"
+
+const DEFAULT_K = 5
+const DEFAULT_CONCURRENCY = 1
+
+/**
+ * Run the eval suite against the provided adapter.
+ *
+ * @param opts - Runner options. Only `adapter` is required.
+ * @returns A structured EvalReport with per-scenario metrics and a summary.
+ */
+export const runEvals = async (opts: RunnerOpts): Promise<EvalReport> => {
+	const { adapter, k = DEFAULT_K, thresholds = {}, concurrency = DEFAULT_CONCURRENCY } = opts
+	const scenarios = opts.scenarios ?? builtInScenarios
+
+	// Run with controlled concurrency.
+	const results: Array<{ scenario: string; metrics: ScenarioResult["metrics"]; passed: boolean; details: string }> = []
+	const queue = [...scenarios]
+
+	const runNext = async (): Promise<void> => {
+		const scenario = queue.shift()
+		if (!scenario) return
+
+		opts.onScenarioStart?.(scenario.name)
+
+		let result: ScenarioResult
+		const workDir = await mkdtemp(join(tmpdir(), `zosma-mem-eval-${scenario.name.replace(/\s+/g, "-")}-`))
+		const clock = createClock()
+
+		try {
+			await adapter.setup({ workDir, clock })
+			result = await scenario.run(adapter, clock)
+		} catch (err) {
+			result = {
+				metrics: {
+					precisionAtK: 0,
+					recallAtK: 0,
+					mrr: 0,
+					noiseRatio: 0,
+					gcEffectiveness: -1,
+					salienceDrift: -1,
+				},
+				passed: false,
+				details: err instanceof Error ? err.message : String(err),
+			}
+		} finally {
+			try {
+				await adapter.teardown()
+			} catch {
+				// teardown failures are non-fatal -- the scenario result stands
+			}
+			await rm(workDir, { recursive: true, force: true })
+		}
+
+		// Apply runner-level threshold overrides on top of scenario defaults.
+		if (Object.keys(thresholds).length > 0 && result.passed) {
+			const { checkAllMetrics } = await import("./utils/assertions.js")
+			const failures = checkAllMetrics(result.metrics, thresholds)
+			if (failures.length > 0) {
+				result = { ...result, passed: false, details: failures.join("; ") }
+			}
+		}
+
+		// Attach K to metrics context (not stored on the type, used by scenarios internally).
+		void k // k is passed to scenarios via RunnerOpts; they reference it through the closure
+
+		results.push({
+			scenario: scenario.name,
+			metrics: result.metrics,
+			passed: result.passed,
+			details: result.details,
+		})
+
+		opts.onScenarioEnd?.(scenario.name, result)
+	}
+
+	// Build a pool of `concurrency` runners.
+	const workers = Array.from({ length: Math.max(1, concurrency) }, () => {
+		const drain = async (): Promise<void> => {
+			while (queue.length > 0) {
+				await runNext()
+			}
+		}
+		return drain()
+	})
+	await Promise.all(workers)
+
+	const passed = results.filter((r) => r.passed).length
+	const failed = results.length - passed
+
+	const avgPrecision =
+		results.length > 0 ? results.reduce((s, r) => s + r.metrics.precisionAtK, 0) / results.length : 0
+	const avgRecall =
+		results.length > 0 ? results.reduce((s, r) => s + r.metrics.recallAtK, 0) / results.length : 0
+	const avgMrr =
+		results.length > 0 ? results.reduce((s, r) => s + r.metrics.mrr, 0) / results.length : 0
+
+	return {
+		timestamp: Date.now(),
+		results,
+		summary: {
+			total: results.length,
+			passed,
+			failed,
+			avgPrecision,
+			avgRecall,
+			avgMrr,
+		},
+	}
+}
diff --git a/packages/zosma-mem/src/evals/scenarios/co-access-cluster.ts b/packages/zosma-mem/src/evals/scenarios/co-access-cluster.ts
new file mode 100644
index 0000000..77f3ea4
--- /dev/null
+++ b/packages/zosma-mem/src/evals/scenarios/co-access-cluster.ts
@@ -0,0 +1,70 @@
+/**
+ * Scenario 6: Co-access cluster
+ *
+ * Three entities (A, B, C) are always retrieved together during a series of
+ * usage sessions. Each time A is retrieved and used, B and C are also
+ * retrieved and used. Later, a query is issued that directly matches only A.
+ * All three must appear in the top K -- demonstrating that the engine surfaces
+ * contextually related entities (co-access boost).
+ *
+ * Tests: co-access / relational memory clustering.
+ */
+
+import { computeMRR, computePrecisionAtK, computeRecallAtK, computeNoiseRatio } from "../metrics.js"
+import { checkAllMetrics } from "../utils/assertions.js"
+import { createEvent, createQuery } from "../utils/fixtures.js"
+import type { DeterministicClock, MemoryAdapter, ScenarioDefinition, ScenarioResult } from "../types.js"
+
+const K = 5
+// All 3 cluster members must appear in top-5.
+const THRESHOLDS = { recallAtK: 1.0, precisionAtK: 0.6 }
+
+const run = async (adapter: MemoryAdapter, clock: DeterministicClock): Promise<ScenarioResult> => {
+	let t = clock.now()
+
+	// Ingest the three cluster entities.
+	await adapter.ingest(createEvent({ id: "auth-flow", type: "decision", content: "OAuth2 flow: redirect to /authorize, exchange code for token.", tags: ["auth", "oauth", "flow"], timestamp: t }))
+	await adapter.ingest(createEvent({ id: "retry-logic", type: "pattern", content: "Retry token refresh up to 3 times with exponential backoff.", tags: ["auth", "retry", "token"], timestamp: t + 1 }))
+	await adapter.ingest(createEvent({ id: "timeout-handling", type: "error", content: "If token refresh times out after 5s, force re-login.", tags: ["auth", "timeout", "session"], timestamp: t + 2 }))
+
+	// Ingest unrelated entities to pad the store.
+	await adapter.ingest(createEvent({ id: "ci-config", type: "pattern", content: "Run tests on every PR using GitHub Actions.", tags: ["ci", "testing"], timestamp: t + 3 }))
+	await adapter.ingest(createEvent({ id: "deploy-strategy", type: "decision", content: "Blue-green deployment via Kubernetes rolling updates.", tags: ["deploy", "k8s"], timestamp: t + 4 }))
+
+	// Simulate 3 sessions where A, B, C are always retrieved together.
+	for (let session = 0; session < 3; session++) {
+		clock.advance(60_000)
+		t = clock.now()
+
+		await adapter.recordUsage("auth-flow", "influenced_decision")
+		await adapter.recordUsage("retry-logic", "used")
+		await adapter.recordUsage("timeout-handling", "used")
+	}
+
+	// Query that directly matches only auth-flow.
+	const query = createQuery({ text: "How does the OAuth2 authentication flow work?", tags: ["auth", "oauth"] })
+	const results = await adapter.retrieve(query, K)
+	const retrieved = results.map((r) => r.id)
+	const clusterIds = ["auth-flow", "retry-logic", "timeout-handling"]
+	const relevantSet = new Set(clusterIds)
+	const everRetrieved = new Set(retrieved)
+	const allEntities = await adapter.listEntities()
+
+	const metrics = {
+		precisionAtK: computePrecisionAtK(retrieved, relevantSet, K),
+		recallAtK: computeRecallAtK(retrieved, relevantSet, K),
+		mrr: computeMRR(retrieved, relevantSet),
+		noiseRatio: computeNoiseRatio(allEntities, everRetrieved),
+		gcEffectiveness: -1,
+		salienceDrift: -1,
+	}
+
+	const failures = checkAllMetrics(metrics, THRESHOLDS)
+	return { metrics, passed: failures.length === 0, details: failures.join("; ") }
+}
+
+export const coAccessClusterScenario: ScenarioDefinition = {
+	name: "Co-access cluster",
+	description: "Three entities always used together; querying one must surface all three in top K.",
+	run,
+}
diff --git a/packages/zosma-mem/src/evals/scenarios/cold-start.ts b/packages/zosma-mem/src/evals/scenarios/cold-start.ts
new file mode 100644
index 0000000..aa7ebd4
--- /dev/null
+++ b/packages/zosma-mem/src/evals/scenarios/cold-start.ts
@@ -0,0 +1,59 @@
+/**
+ * Scenario 1: Cold start
+ *
+ * An empty engine ingests a mixed set of events (decisions, errors, patterns,
+ * preferences). A targeted query is issued. The engine must surface the
+ * semantically relevant events in the top K.
+ *
+ * Tests: basic ingestion and retrieval with no prior state.
+ */
+
+import { computeMRR, computePrecisionAtK, computeRecallAtK, computeNoiseRatio } from "../metrics.js"
+import { checkAllMetrics } from "../utils/assertions.js"
+import { createEvent, createQuery } from "../utils/fixtures.js"
+import type { DeterministicClock, MemoryAdapter, ScenarioDefinition, ScenarioResult } from "../types.js"
+
+const K = 5
+
+const THRESHOLDS = { precisionAtK: 0.6, recallAtK: 0.8, mrr: 0.5 }
+
+const run = async (adapter: MemoryAdapter, clock: DeterministicClock): Promise<ScenarioResult> => {
+	const t = clock.now()
+
+	// Ingest 10 events -- 3 relevant (tagged "auth"), 7 irrelevant noise.
+	const relevant = ["auth-decision", "auth-error", "auth-pattern"]
+
+	await adapter.ingest(createEvent({ id: "auth-decision", type: "decision", content: "Use short-lived JWTs with refresh token rotation.", tags: ["auth", "security"], timestamp: t }))
+	await adapter.ingest(createEvent({ id: "auth-error", type: "error", content: "Session invalidated on password reset -- must revoke all tokens.", tags: ["auth", "session"], timestamp: t + 1 }))
+	await adapter.ingest(createEvent({ id: "auth-pattern", type: "pattern", content: "Always validate token expiry before issuing a new one.", tags: ["auth", "token"], timestamp: t + 2 }))
+
+	// Noise events -- different domain.
+	for (let i = 0; i < 7; i++) {
+		await adapter.ingest(createEvent({ id: `noise-${i}`, type: "pattern", content: `Styling preference ${i}: use 4-space indentation.`, tags: ["style"], timestamp: t + 3 + i }))
+	}
+
+	const query = createQuery({ text: "How should authentication tokens be managed?", tags: ["auth"] })
+	const results = await adapter.retrieve(query, K)
+	const retrieved = results.map((r) => r.id)
+	const relevantSet = new Set(relevant)
+	const everRetrieved = new Set(retrieved)
+	const allEntities = await adapter.listEntities()
+
+	const metrics = {
+		precisionAtK: computePrecisionAtK(retrieved, relevantSet, K),
+		recallAtK: computeRecallAtK(retrieved, relevantSet, K),
+		mrr: computeMRR(retrieved, relevantSet),
+		noiseRatio: computeNoiseRatio(allEntities, everRetrieved),
+		gcEffectiveness: -1,
+		salienceDrift: -1,
+	}
+
+	const failures = checkAllMetrics(metrics, THRESHOLDS)
+	return { metrics, passed: failures.length === 0, details: failures.join("; ") }
+}
+
+export const coldStartScenario: ScenarioDefinition = {
+	name: "Cold start",
+	description: "Empty engine ingests 10 events (3 relevant) and retrieves for an auth query.",
+	run,
+}
diff --git a/packages/zosma-mem/src/evals/scenarios/conflicting-updates.ts b/packages/zosma-mem/src/evals/scenarios/conflicting-updates.ts
new file mode 100644
index 0000000..2ce3358
--- /dev/null
+++ b/packages/zosma-mem/src/evals/scenarios/conflicting-updates.ts
@@ -0,0 +1,83 @@
+/**
+ * Scenario 5: Conflicting updates
+ *
+ * The same logical entity is ingested 4 times with progressively updated
+ * content (simulating a fact that evolved over sessions). The most recent
+ * version must appear first in retrieval results.
+ *
+ * Tests: last-write-wins / recency preference for updated entities.
+ */
+
+import { computeMRR, computePrecisionAtK, computeRecallAtK, computeNoiseRatio } from "../metrics.js"
+import { checkAllMetrics } from "../utils/assertions.js"
+import { createEvent, createQuery } from "../utils/fixtures.js"
+import type { DeterministicClock, MemoryAdapter, ScenarioDefinition, ScenarioResult } from "../types.js"
+
+const K = 5
+const THRESHOLDS = { mrr: 1.0 }
+
+const run = async (adapter: MemoryAdapter, clock: DeterministicClock): Promise<ScenarioResult> => {
+	let t = clock.now()
+
+	const entityId = "db-schema-decision"
+	const versions = [
+		"Initial: use a single users table with a role column.",
+		"Update: split roles into a separate roles table for normalisation.",
+		"Update: add an audit_log table for compliance tracking.",
+		"Final: add soft-delete (deleted_at) to users; audit_log is append-only.",
+	]
+
+	// Ingest all 4 versions of the same entity.
+	for (const content of versions) {
+		await adapter.ingest(
+			createEvent({
+				id: entityId,
+				type: "decision",
+				content,
+				tags: ["database", "schema", "users"],
+				timestamp: t,
+			}),
+		)
+		clock.advance(60_000) // 1 minute between updates
+		t = clock.now()
+	}
+
+	// Add an unrelated entity to ensure ranking is non-trivial.
+	await adapter.ingest(
+		createEvent({ id: "cache-strategy", type: "pattern", content: "Use Redis for session caching.", tags: ["cache", "redis"], timestamp: t }),
+	)
+
+	const query = createQuery({ text: "What is the current database schema for users?", tags: ["database", "schema"] })
+	const results = await adapter.retrieve(query, K)
+	const retrieved = results.map((r) => r.id)
+	const relevantSet = new Set([entityId])
+	const everRetrieved = new Set(retrieved)
+	const allEntities = await adapter.listEntities()
+
+	// Additionally verify that the content of the top result reflects the latest version.
+	const topResult = results[0]
+	const contentIsLatest = topResult?.id === entityId && topResult.content.includes("soft-delete")
+	const contentDetails = topResult?.id === entityId && !contentIsLatest
+		? `top result content does not reflect latest version (got: "${topResult.content?.slice(0, 60)}")`
+		: ""
+
+	const metrics = {
+		precisionAtK: computePrecisionAtK(retrieved, relevantSet, K),
+		recallAtK: computeRecallAtK(retrieved, relevantSet, K),
+		mrr: computeMRR(retrieved, relevantSet),
+		noiseRatio: computeNoiseRatio(allEntities, everRetrieved),
+		gcEffectiveness: -1,
+		salienceDrift: -1,
+	}
+
+	const failures = checkAllMetrics(metrics, THRESHOLDS)
+	if (contentDetails) failures.push(contentDetails)
+
+	return { metrics, passed: failures.length === 0, details: failures.join("; ") }
+}
+
+export const conflictingUpdatesScenario: ScenarioDefinition = {
+	name: "Conflicting updates",
+	description: "Entity ingested 4 times with evolving content; most recent version must rank first.",
+	run,
+}
diff --git a/packages/zosma-mem/src/evals/scenarios/cross-context.ts b/packages/zosma-mem/src/evals/scenarios/cross-context.ts
new file mode 100644
index 0000000..d52770c
--- /dev/null
+++ b/packages/zosma-mem/src/evals/scenarios/cross-context.ts
@@ -0,0 +1,98 @@
+/**
+ * Scenario 7: Cross-context
+ *
+ * An entity tagged ["auth", "security"] is relevant when the agent is working
+ * on authentication but irrelevant when working on UI styling. Two queries are
+ * issued -- one on-topic, one off-topic. The entity must rank in top-3 for the
+ * auth query and outside top-5 for the styling query.
+ *
+ * Tests: context-sensitive retrieval -- the same entity should surface only
+ * when contextually appropriate.
+ */
+
+import { computeMRR, computePrecisionAtK, computeRecallAtK, computeNoiseRatio } from "../metrics.js"
+import { checkAllMetrics } from "../utils/assertions.js"
+import { createEvent, createQuery } from "../utils/fixtures.js"
+import type { DeterministicClock, MemoryAdapter, ScenarioDefinition, ScenarioResult } from "../types.js"
+
+const K = 5
+const THRESHOLDS = { mrr: 1.0 }
+
+const run = async (adapter: MemoryAdapter, clock: DeterministicClock): Promise<ScenarioResult> => {
+	const t = clock.now()
+
+	// The entity we care about -- highly relevant to auth, irrelevant to styling.
+	const targetId = "session-expiry-policy"
+	await adapter.ingest(
+		createEvent({
+			id: targetId,
+			type: "decision",
+			content: "Sessions expire after 30 minutes of inactivity. Refresh tokens are valid for 7 days.",
+			tags: ["auth", "security", "session"],
+			timestamp: t,
+		}),
+	)
+
+	// Add styling-domain entities that should dominate the off-topic query.
+	for (let i = 0; i < 5; i++) {
+		await adapter.ingest(
+			createEvent({
+				id: `style-rule-${i}`,
+				type: "preference",
+				content: `UI guideline ${i}: use Tailwind utility classes, avoid inline styles.`,
+				tags: ["ui", "styling", "tailwind"],
+				timestamp: t + 1 + i,
+			}),
+		)
+	}
+
+	// Add more auth entities to confirm the target is retrieved in the right context.
+	await adapter.ingest(createEvent({ id: "mfa-requirement", type: "decision", content: "MFA required for all accounts with admin privileges.", tags: ["auth", "mfa", "security"], timestamp: t + 6 }))
+	await adapter.ingest(createEvent({ id: "password-policy", type: "decision", content: "Passwords must be at least 12 characters with mixed case and symbols.", tags: ["auth", "password", "security"], timestamp: t + 7 }))
+
+	// --- Query 1: on-topic (auth) ---
+	const authQuery = createQuery({ text: "How long before a user session expires?", tags: ["auth", "session"] })
+	const authResults = await adapter.retrieve(authQuery, K)
+	const authRetrieved = authResults.map((r) => r.id)
+	const authRelevant = new Set([targetId])
+
+	const authMrr = computeMRR(authRetrieved, authRelevant)
+	const authRank = authRetrieved.indexOf(targetId) // 0-based; -1 = not found
+
+	// --- Query 2: off-topic (styling) ---
+	const styleQuery = createQuery({ text: "What CSS conventions should I use for the UI components?", tags: ["ui", "styling"] })
+	const styleResults = await adapter.retrieve(styleQuery, K)
+	const styleRetrieved = styleResults.map((r) => r.id)
+
+	// Target must NOT appear in top-5 of the styling query.
+	const targetInStyleTop5 = styleRetrieved.includes(targetId)
+
+	const everRetrieved = new Set([...authRetrieved, ...styleRetrieved])
+	const allEntities = await adapter.listEntities()
+
+	const metrics = {
+		precisionAtK: computePrecisionAtK(authRetrieved, authRelevant, K),
+		recallAtK: computeRecallAtK(authRetrieved, authRelevant, K),
+		mrr: authMrr,
+		noiseRatio: computeNoiseRatio(allEntities, everRetrieved),
+		gcEffectiveness: -1,
+		salienceDrift: -1,
+	}
+
+	const failures = checkAllMetrics(metrics, THRESHOLDS)
+
+	if (authRank > 2) {
+		failures.push(`target ranked ${authRank + 1} in auth query (expected top-3)`)
+	}
+	if (targetInStyleTop5) {
+		failures.push("target appeared in top-5 of off-topic styling query (should be absent)")
+	}
+
+	return { metrics, passed: failures.length === 0, details: failures.join("; ") }
+}
+
+export const crossContextScenario: ScenarioDefinition = {
+	name: "Cross-context",
+	description: "Entity relevant to auth must rank top-3 for auth query but not appear in styling query top-5.",
+	run,
+}
diff --git a/packages/zosma-mem/src/evals/scenarios/index.ts b/packages/zosma-mem/src/evals/scenarios/index.ts
new file mode 100644
index 0000000..5584509
--- /dev/null
+++ b/packages/zosma-mem/src/evals/scenarios/index.ts
@@ -0,0 +1,35 @@
+/**
+ * Built-in scenario registry.
+ *
+ * Import `builtInScenarios` to run the full default suite.
+ * Scenarios are listed in the order they will run when no override is provided.
+ */
+
+import { coldStartScenario } from "./cold-start.js"
+import { coAccessClusterScenario } from "./co-access-cluster.js"
+import { conflictingUpdatesScenario } from "./conflicting-updates.js"
+import { crossContextScenario } from "./cross-context.js"
+import { repeatedPatternScenario } from "./repeated-pattern.js"
+import { signalDilutionScenario } from "./signal-dilution.js"
+import { staleMemoryScenario } from "./stale-memory.js"
+import type { ScenarioDefinition } from "../types.js"
+
+export const builtInScenarios: ScenarioDefinition[] = [
+	coldStartScenario,
+	repeatedPatternScenario,
+	signalDilutionScenario,
+	staleMemoryScenario,
+	conflictingUpdatesScenario,
+	coAccessClusterScenario,
+	crossContextScenario,
+]
+
+export {
+	coldStartScenario,
+	repeatedPatternScenario,
+	signalDilutionScenario,
+	staleMemoryScenario,
+	conflictingUpdatesScenario,
+	coAccessClusterScenario,
+	crossContextScenario,
+}
diff --git a/packages/zosma-mem/src/evals/scenarios/repeated-pattern.ts b/packages/zosma-mem/src/evals/scenarios/repeated-pattern.ts
new file mode 100644
index 0000000..390bddc
--- /dev/null
+++ b/packages/zosma-mem/src/evals/scenarios/repeated-pattern.ts
@@ -0,0 +1,70 @@
+/**
+ * Scenario 2: Repeated pattern
+ *
+ * The same error event is ingested 5 times (same ID, same tags, evolving
+ * content). Between ingestions the adapter receives reinforcement signals
+ * indicating the entity was used. After reinforcement, the entity must rank
+ * first in a retrieval.
+ *
+ * Tests: reinforcement loop -- entities that get usage signals rise in rank.
+ */
+
+import { computeMRR, computePrecisionAtK, computeRecallAtK, computeNoiseRatio } from "../metrics.js"
+import { checkAllMetrics } from "../utils/assertions.js"
+import { createEvent, createQuery } from "../utils/fixtures.js"
+import type { DeterministicClock, MemoryAdapter, ScenarioDefinition, ScenarioResult } from "../types.js"
+
+const K = 5
+const THRESHOLDS = { mrr: 1.0 }
+
+const run = async (adapter: MemoryAdapter, clock: DeterministicClock): Promise<ScenarioResult> => {
+	let t = clock.now()
+
+	const recurringId = "retry-timeout"
+
+	// Ingest the recurring entity 5 times with progressively refined content.
+	for (let i = 0; i < 5; i++) {
+		await adapter.ingest(
+			createEvent({
+				id: recurringId,
+				type: "error",
+				content: `Network timeout on retry attempt ${i + 1}. Increase backoff to ${(i + 1) * 200}ms.`,
+				tags: ["network", "retry", "timeout"],
+				timestamp: t,
+			}),
+		)
+		// Signal that the agent used this entity after each ingestion.
+		await adapter.recordUsage(recurringId, "influenced_decision")
+		clock.advance(1_000)
+		t = clock.now()
+	}
+
+	// Add some competing entities so the ranking is non-trivial.
+	await adapter.ingest(createEvent({ id: "db-connection", type: "error", content: "DB connection pool exhausted.", tags: ["database", "pool"], timestamp: t + 1 }))
+	await adapter.ingest(createEvent({ id: "cache-miss", type: "pattern", content: "Cache miss rate above 80% -- review TTL settings.", tags: ["cache", "performance"], timestamp: t + 2 }))
+
+	const query = createQuery({ text: "What should I do when a network request times out?", tags: ["network", "retry"] })
+	const results = await adapter.retrieve(query, K)
+	const retrieved = results.map((r) => r.id)
+	const relevantSet = new Set([recurringId])
+	const everRetrieved = new Set(retrieved)
+	const allEntities = await adapter.listEntities()
+
+	const metrics = {
+		precisionAtK: computePrecisionAtK(retrieved, relevantSet, K),
+		recallAtK: computeRecallAtK(retrieved, relevantSet, K),
+		mrr: computeMRR(retrieved, relevantSet),
+		noiseRatio: computeNoiseRatio(allEntities, everRetrieved),
+		gcEffectiveness: -1,
+		salienceDrift: -1,
+	}
+
+	const failures = checkAllMetrics(metrics, THRESHOLDS)
+	return { metrics, passed: failures.length === 0, details: failures.join("; ") }
+}
+
+export const repeatedPatternScenario: ScenarioDefinition = {
+	name: "Repeated pattern",
+	description: "Recurring entity ingested 5 times with reinforcement signals; must rank first.",
+	run,
+}
diff --git a/packages/zosma-mem/src/evals/scenarios/signal-dilution.ts b/packages/zosma-mem/src/evals/scenarios/signal-dilution.ts
new file mode 100644
index 0000000..d4d7210
--- /dev/null
+++ b/packages/zosma-mem/src/evals/scenarios/signal-dilution.ts
@@ -0,0 +1,64 @@
+/**
+ * Scenario 3: Signal dilution
+ *
+ * 100 low-value events are ingested alongside 3 high-value events. A targeted
+ * query is issued that matches only the high-value events. The engine must
+ * surface at least 3 of the 5 top results from the high-value set, proving
+ * that the pool size does not dilute retrieval quality.
+ *
+ * Tests: attention gating / relevance ranking at scale.
+ */
+
+import { computeMRR, computePrecisionAtK, computeRecallAtK, computeNoiseRatio } from "../metrics.js"
+import { checkAllMetrics } from "../utils/assertions.js"
+import { createHighValueEvents, createLowValueEvents, createQuery } from "../utils/fixtures.js"
+import type { DeterministicClock, MemoryAdapter, ScenarioDefinition, ScenarioResult } from "../types.js"
+
+const K = 5
+const THRESHOLDS = { precisionAtK: 0.6, recallAtK: 1.0, mrr: 1.0 }
+
+const run = async (adapter: MemoryAdapter, clock: DeterministicClock): Promise<ScenarioResult> => {
+	const t = clock.now()
+
+	const highValueIds = ["perf-critical-1", "perf-critical-2", "perf-critical-3"]
+	const highValueTags = ["performance", "critical", "database"]
+
+	// Ingest 100 low-value events first (noise).
+	for (const event of createLowValueEvents(100, t)) {
+		await adapter.ingest(event)
+	}
+
+	// Ingest the 3 high-value events.
+	for (const event of createHighValueEvents(highValueIds, highValueTags, t + 100)) {
+		await adapter.ingest(event)
+	}
+
+	const query = createQuery({
+		text: "Critical database performance issues that need immediate attention",
+		tags: ["performance", "database", "critical"],
+	})
+
+	const results = await adapter.retrieve(query, K)
+	const retrieved = results.map((r) => r.id)
+	const relevantSet = new Set(highValueIds)
+	const everRetrieved = new Set(retrieved)
+	const allEntities = await adapter.listEntities()
+
+	const metrics = {
+		precisionAtK: computePrecisionAtK(retrieved, relevantSet, K),
+		recallAtK: computeRecallAtK(retrieved, relevantSet, K),
+		mrr: computeMRR(retrieved, relevantSet),
+		noiseRatio: computeNoiseRatio(allEntities, everRetrieved),
+		gcEffectiveness: -1,
+		salienceDrift: -1,
+	}
+
+	const failures = checkAllMetrics(metrics, THRESHOLDS)
+	return { metrics, passed: failures.length === 0, details: failures.join("; ") }
+}
+
+export const signalDilutionScenario: ScenarioDefinition = {
+	name: "Signal dilution",
+	description: "100 low-value + 3 high-value events; engine must surface high-value despite pool size.",
+	run,
+}
diff --git a/packages/zosma-mem/src/evals/scenarios/stale-memory.ts b/packages/zosma-mem/src/evals/scenarios/stale-memory.ts
new file mode 100644
index 0000000..117ad15
--- /dev/null
+++ b/packages/zosma-mem/src/evals/scenarios/stale-memory.ts
@@ -0,0 +1,89 @@
+/**
+ * Scenario 4: Stale memory
+ *
+ * Events are ingested, then the clock is advanced 30 days without any access.
+ * GC is run. A fresh event is ingested. Retrieval must prefer the fresh entity
+ * over the stale ones. GC effectiveness is measured by checking how many of
+ * the stale, never-retrieved events were removed.
+ *
+ * Tests: time-based decay + GC pruning of unused entities.
+ */
+
+import { computeGcEffectiveness, computeMRR, computeNoiseRatio, computePrecisionAtK, computeRecallAtK } from "../metrics.js"
+import { checkAllMetrics } from "../utils/assertions.js"
+import { createEvent, createQuery } from "../utils/fixtures.js"
+import { THIRTY_DAYS_MS } from "../utils/time.js"
+import type { DeterministicClock, MemoryAdapter, ScenarioDefinition, ScenarioResult } from "../types.js"
+
+const K = 5
+// GC effectiveness is advisory here -- not all engines support decay.
+const THRESHOLDS = { mrr: 1.0 }
+
+const run = async (adapter: MemoryAdapter, clock: DeterministicClock): Promise<ScenarioResult> => {
+	const t = clock.now()
+
+	// Ingest stale events -- none of them will be retrieved after the time jump.
+	const staleIds = ["stale-a", "stale-b", "stale-c", "stale-d", "stale-e"]
+	for (const id of staleIds) {
+		await adapter.ingest(
+			createEvent({
+				id,
+				type: "pattern",
+				content: `Old preference: ${id}. No longer relevant.`,
+				tags: ["legacy", "stale"],
+				timestamp: t,
+			}),
+		)
+	}
+
+	// Record the entity list before GC.
+	const entitiesBeforeGc = await adapter.listEntities()
+
+	// Advance the clock 30 days -- simulates no activity.
+	await adapter.advanceTime(THIRTY_DAYS_MS)
+	clock.advance(THIRTY_DAYS_MS)
+
+	// Run GC.
+	await adapter.gc()
+
+	// Ingest a fresh, highly relevant event after the time jump.
+	const freshId = "fresh-auth-decision"
+	await adapter.ingest(
+		createEvent({
+			id: freshId,
+			type: "decision",
+			content: "New auth policy: enforce MFA for all admin accounts.",
+			tags: ["auth", "security", "policy"],
+			timestamp: clock.now(),
+		}),
+	)
+
+	const entitiesAfterGc = await adapter.listEntities()
+
+	// Identify noise (stale entities never retrieved).
+	const noiseBeforeGc = entitiesBeforeGc.filter((id) => staleIds.includes(id))
+
+	const query = createQuery({ text: "What is the current auth policy for admin accounts?", tags: ["auth", "policy"] })
+	const results = await adapter.retrieve(query, K)
+	const retrieved = results.map((r) => r.id)
+	const relevantSet = new Set([freshId])
+	const everRetrieved = new Set(retrieved)
+
+	const metrics = {
+		precisionAtK: computePrecisionAtK(retrieved, relevantSet, K),
+		recallAtK: computeRecallAtK(retrieved, relevantSet, K),
+		mrr: computeMRR(retrieved, relevantSet),
+		noiseRatio: computeNoiseRatio(entitiesAfterGc, everRetrieved),
+		gcEffectiveness: computeGcEffectiveness(noiseBeforeGc, entitiesAfterGc),
+		salienceDrift: -1,
+	}
+
+	const failures = checkAllMetrics(metrics, THRESHOLDS)
+	return { metrics, passed: failures.length === 0, details: failures.join("; ") }
+}
+
+export const staleMemoryScenario: ScenarioDefinition = {
+	name: "Stale memory",
+	description: "Events ingested, clock advanced 30 days, GC run. Fresh entity must rank first.",
+	run,
+}
diff --git a/packages/zosma-mem/src/evals/types.ts b/packages/zosma-mem/src/evals/types.ts
new file mode 100644
index 0000000..a37f8e2
--- /dev/null
+++ b/packages/zosma-mem/src/evals/types.ts
@@ -0,0 +1,270 @@
+/**
+ * Engine-agnostic types for zosma-mem/evals.
+ *
+ * These types define the contract between the eval framework and any memory
+ * engine under test. No implementation details leak through here -- engines
+ * are black boxes that accept events and answer queries.
+ */
+
+// ---------------------------------------------------------------------------
+// Deterministic clock
+// ---------------------------------------------------------------------------
+
+/**
+ * A synthetic clock injected into the adapter at setup time.
+ * Scenarios that test time-sensitive behaviour (decay, stale memory) advance
+ * this clock instead of using wall-clock time, making tests deterministic.
+ */
+export interface DeterministicClock {
+	/** Return the current synthetic timestamp (ms since epoch). */
+	now: () => number
+	/** Move the clock forward by the given number of milliseconds. */
+	advance: (ms: number) => void
+}
+
+// ---------------------------------------------------------------------------
+// Adapter setup
+// ---------------------------------------------------------------------------
+
+export interface AdapterSetupOpts {
+	/**
+	 * Temporary directory created by the runner for this scenario.
+	 * The engine may use it for any persistent state.
+	 * The runner cleans it up after teardown.
+	 */
+	workDir: string
+	/** Deterministic clock. The engine must use this instead of Date.now(). */
+	clock: DeterministicClock
+}
+
+// ---------------------------------------------------------------------------
+// Memory events
+// ---------------------------------------------------------------------------
+
+/**
+ * A memory event as seen by the eval framework.
+ * Deliberately minimal -- engines may treat `type` and `metadata` as they see fit.
+ */
+export interface MemoryEvent {
+	id: string
+	/**
+	 * Semantic category. Common values: "decision" | "error" | "pattern" | "preference".
+	 * Not constrained to an enum -- each engine defines its own taxonomy.
+	 */
+	type: string
+	/** Human-readable content to be stored. */
+	content: string
+	/** Tags used for retrieval matching. */
+	tags: string[]
+	/** Synthetic timestamp produced by the deterministic clock. */
+	timestamp: number
+	/** Engine-specific passthrough. The eval framework never reads this. */
+	metadata?: Record<string, unknown>
+}
+
+// ---------------------------------------------------------------------------
+// Retrieval
+// ---------------------------------------------------------------------------
+
+export interface RetrieveQuery {
+	/** Natural language task description. */
+	text: string
+	/** Optional hint tags to narrow the search. */
+	tags?: string[]
+	/** Engine-specific context passthrough. The eval framework never reads this. */
+	context?: Record<string, unknown>
+}
+
+export interface RetrievedEntity {
+	id: string
+	content: string
+	/**
+	 * Engine-assigned relevance score. The eval framework only uses this for
+	 * ordering -- it does not interpret the magnitude.
+	 */
+	score: number
+	tags: string[]
+}
+
+// ---------------------------------------------------------------------------
+// Usage signals
+// ---------------------------------------------------------------------------
+
+/**
+ * Signal sent back to the engine after a retrieval to model agent behaviour.
+ * - `used`               -- the agent acted on this entity (reinforces it)
+ * - `ignored`            -- the agent did not act on it (demotes it)
+ * - `influenced_decision` -- the entity directly shaped a tool call or decision (strongest signal)
+ */
+export type UsageSignal = "used" | "ignored" | "influenced_decision"
+
+// ---------------------------------------------------------------------------
+// GC
+// ---------------------------------------------------------------------------
+
+export interface GcResult {
+	/** Entities fully removed from the store. */
+	removedCount: number
+	/** Entities moved to an archive / cold tier. */
+	archivedCount: number
+	/** Groups of entities merged into a single summary entity. */
+	consolidatedCount: number
+}
+
+// ---------------------------------------------------------------------------
+// Adapter interface
+// ---------------------------------------------------------------------------
+
+/**
+ * Engine-agnostic adapter that the eval framework programs against.
+ *
+ * Engine authors implement this interface to make their engine evaluable.
+ * The adapter is the only coupling point between the eval module and any
+ * specific engine -- nothing else in this package imports engine code.
+ */
+export interface MemoryAdapter {
+	/**
+	 * Initialise the engine with a clean, isolated state.
+	 * Called once before each scenario.
+	 */
+	setup: (opts: AdapterSetupOpts) => Promise<void>
+
+	/** Ingest a memory event into the engine. */
+	ingest: (event: MemoryEvent) => Promise<void>
+
+	/**
+	 * Retrieve the top-K most relevant entities for the given query.
+	 * Results must be ordered by descending relevance (most relevant first).
+	 */
+	retrieve: (query: RetrieveQuery, topK: number) => Promise<RetrievedEntity[]>
+
+	/**
+	 * Report how the agent used a previously retrieved entity.
+	 * Engines that support reinforcement learning update internal state here.
+	 * Engines that do not may no-op.
+	 */
+	recordUsage: (entityId: string, signal: UsageSignal) => Promise<void>
+
+	/**
+	 * Trigger garbage collection / decay / pruning.
+	 * Engines that do not support GC may no-op and return a zero GcResult.
+	 */
+	gc: () => Promise<GcResult>
+
+	/**
+	 * Advance the engine's internal clock by the given duration.
+	 * Must delegate to the `DeterministicClock` provided in `setup`.
+	 * Engines that use wall-clock time must accept a synthetic clock override.
+	 */
+	advanceTime: (ms: number) => Promise<void>
+
+	/**
+	 * Return all currently persisted entity IDs (including low-score ones).
+	 * Used to compute noise ratio and GC effectiveness.
+	 */
+	listEntities: () => Promise<string[]>
+
+	/**
+	 * Tear down the engine and release any held resources.
+	 * Called once after each scenario, regardless of pass/fail.
+	 */
+	teardown: () => Promise<void>
+}
+
+// ---------------------------------------------------------------------------
+// Metrics
+// ---------------------------------------------------------------------------
+
+export interface EvalMetrics {
+	/** Of the top-K retrieved entities, what fraction was relevant? */
+	precisionAtK: number
+	/** Of all relevant entities, what fraction appeared in top-K? */
+	recallAtK: number
+	/** Mean reciprocal rank of the first relevant result (0 if none in top-K). */
+	mrr: number
+	/**
+	 * Fraction of persisted entities never retrieved after ingestion.
+	 * Measures ingestion threshold quality (high = lots of junk stored).
+	 */
+	noiseRatio: number
+	/**
+	 * Fraction of noise entities successfully removed by GC.
+	 * Only meaningful in scenarios that exercise GC. -1 when not applicable.
+	 */
+	gcEffectiveness: number
+	/**
+	 * Standard deviation of entity scores across GC cycles.
+	 * High drift = unstable scoring. -1 when not applicable.
+	 */
+	salienceDrift: number
+}
+
+// ---------------------------------------------------------------------------
+// Scenarios
+// ---------------------------------------------------------------------------
+
+export interface ScenarioResult {
+	metrics: EvalMetrics
+	passed: boolean
+	/** Human-readable explanation on failure. Empty string when passing. */
+	details: string
+}
+
+export interface ScenarioDefinition {
+	name: string
+	description: string
+	/**
+	 * Execute the scenario against the provided adapter and return results.
+	 * The runner handles setup/teardown; the scenario only drives ingest/retrieve.
+	 */
+	run: (adapter: MemoryAdapter, clock: DeterministicClock) => Promise<ScenarioResult>
+}
+
+// ---------------------------------------------------------------------------
+// Runner
+// ---------------------------------------------------------------------------
+
+export interface RunnerOpts {
+	/** The adapter wrapping the engine under test. */
+	adapter: MemoryAdapter
+	/**
+	 * Scenarios to run. Defaults to all built-in scenarios when omitted.
+	 */
+	scenarios?: ScenarioDefinition[]
+	/** Top-K for precision/recall computation. Default: 5. */
+	k?: number
+	/** Override default pass/fail thresholds per metric. */
+	thresholds?: Partial<EvalMetrics>
+	/**
+	 * Max scenarios running concurrently. Default: 1 (sequential).
+	 * Parallel execution is only safe if the adapter supports isolated instances.
+	 */
+	concurrency?: number
+	/** Called immediately before each scenario starts. */
+	onScenarioStart?: (name: string) => void
+	/** Called immediately after each scenario completes. */
+	onScenarioEnd?: (name: string, result: ScenarioResult) => void
+}
+
+// ---------------------------------------------------------------------------
+// Report
+// ---------------------------------------------------------------------------
+
+export interface EvalReport {
+	/** Unix ms timestamp of when the run completed. */
+	timestamp: number
+	results: Array<{
+		scenario: string
+		metrics: EvalMetrics
+		passed: boolean
+		details: string
+	}>
+	summary: {
+		total: number
+		passed: number
+		failed: number
+		avgPrecision: number
+		avgRecall: number
+		avgMrr: number
+	}
+}
diff --git a/packages/zosma-mem/src/evals/utils/assertions.ts b/packages/zosma-mem/src/evals/utils/assertions.ts
new file mode 100644
index 0000000..45de7fb
--- /dev/null
+++ b/packages/zosma-mem/src/evals/utils/assertions.ts
@@ -0,0 +1,54 @@
+/**
+ * Threshold helpers for scenario pass/fail decisions.
+ *
+ * Each function returns a human-readable failure message, or an empty string
+ * when the check passes. Scenarios collect these messages and join them to
+ * produce the `details` field of ScenarioResult.
+ */
+
+import type { EvalMetrics } from "../types.js"
+
+/** Default pass thresholds used when the runner does not provide overrides. */
+export const DEFAULT_THRESHOLDS: Readonly<EvalMetrics> = {
+	precisionAtK: 0.6,
+	recallAtK: 0.6,
+	mrr: 0.5,
+	noiseRatio: -1,    // no hard limit by default -- informational only
+	gcEffectiveness: -1, // -1 = N/A, skip check
+	salienceDrift: -1,   // -1 = N/A, skip check
+}
+
+/**
+ * Check a single metric against a threshold.
+ * Returns an empty string on pass, a descriptive message on fail.
+ *
+ * For `gcEffectiveness` and `salienceDrift`, a threshold of -1 means "skip".
+ */
+export const checkMetric = (
+	name: keyof EvalMetrics,
+	actual: number,
+	threshold: number,
+): string => {
+	if (threshold === -1) return "" // N/A
+	if (actual >= threshold) return ""
+	return `${name}: ${actual.toFixed(3)} < threshold ${threshold.toFixed(3)}`
+}
+
+/**
+ * Check all metrics against a threshold object.
+ * Returns an array of failure messages (empty array = all passed).
+ */
+export const checkAllMetrics = (
+	metrics: EvalMetrics,
+	thresholds: Readonly<Partial<EvalMetrics>>,
+): string[] => {
+	const merged: EvalMetrics = { ...DEFAULT_THRESHOLDS, ...thresholds }
+	const failures: string[] = []
+
+	for (const key of Object.keys(merged) as Array<keyof EvalMetrics>) {
+		const msg = checkMetric(key, metrics[key], merged[key])
+		if (msg) failures.push(msg)
+	}
+
+	return failures
+}
diff --git a/packages/zosma-mem/src/evals/utils/fixtures.ts b/packages/zosma-mem/src/evals/utils/fixtures.ts
new file mode 100644
index 0000000..b5c6023
--- /dev/null
+++ b/packages/zosma-mem/src/evals/utils/fixtures.ts
@@ -0,0 +1,67 @@
+/**
+ * Synthetic data builders for eval scenarios.
+ *
+ * All builders produce deterministic output given the same inputs.
+ * No randomness, no network calls, no engine types.
+ */
+
+import type { MemoryEvent, RetrieveQuery } from "../types.js"
+
+// ---------------------------------------------------------------------------
+// Event builders
+// ---------------------------------------------------------------------------
+
+/**
+ * Create a MemoryEvent with sensible defaults.
+ * Any field can be overridden by passing a partial.
+ */
+export const createEvent = (overrides: Partial<MemoryEvent> & Pick<MemoryEvent, "id" | "content">): MemoryEvent => ({
+	type: "pattern",
+	tags: [],
+	timestamp: 0,
+	metadata: {},
+	...overrides,
+})
+
+/**
+ * Build a batch of N low-value events (no tags, generic content).
+ * Used in signal-dilution scenarios to pad the memory store.
+ */
+export const createLowValueEvents = (count: number, startTimestamp: number): MemoryEvent[] =>
+	Array.from({ length: count }, (_, i) => ({
+		id: `low-value-${i}`,
+		type: "pattern",
+		content: `Routine observation ${i}: nothing notable happened.`,
+		tags: [],
+		timestamp: startTimestamp + i,
+		metadata: {},
+	}))
+
+/**
+ * Build a batch of high-value events with explicit tags.
+ */
+export const createHighValueEvents = (
+	ids: string[],
+	tags: string[],
+	startTimestamp: number,
+): MemoryEvent[] =>
+	ids.map((id, i) => ({
+		id,
+		type: "decision",
+		content: `Critical decision recorded: ${id}. Tags: ${tags.join(", ")}.`,
+		tags,
+		timestamp: startTimestamp + i,
+		metadata: {},
+	}))
+
+// ---------------------------------------------------------------------------
+// Query builders
+// ---------------------------------------------------------------------------
+
+/**
+ * Create a RetrieveQuery with sensible defaults.
+ */
+export const createQuery = (overrides: Partial<RetrieveQuery> & Pick<RetrieveQuery, "text">): RetrieveQuery => ({
+	tags: [],
+	...overrides,
+})
diff --git a/packages/zosma-mem/src/evals/utils/time.ts b/packages/zosma-mem/src/evals/utils/time.ts
new file mode 100644
index 0000000..dadaf91
--- /dev/null
+++ b/packages/zosma-mem/src/evals/utils/time.ts
@@ -0,0 +1,32 @@
+/**
+ * Deterministic clock implementation for use in eval scenarios.
+ *
+ * Scenarios advance this clock explicitly rather than relying on wall-clock
+ * time, making time-sensitive tests (decay, stale memory) fully reproducible.
+ */
+
+import type { DeterministicClock } from "../types.js"
+
+/**
+ * Create a new deterministic clock starting at the given epoch timestamp.
+ *
+ * @param startMs - Initial timestamp in milliseconds. Defaults to a fixed
+ *                  reference point (2026-01-01T00:00:00.000Z) so tests are
+ *                  not sensitive to when they run.
+ */
+export const createClock = (startMs = 1_735_689_600_000): DeterministicClock => {
+	let current = startMs
+
+	return {
+		now: () => current,
+		advance: (ms: number) => {
+			current += ms
+		},
+	}
+}
+
+// Convenience constants for advancing time in scenarios.
+export const ONE_HOUR_MS = 60 * 60 * 1_000
+export const ONE_DAY_MS = 24 * ONE_HOUR_MS
+export const ONE_WEEK_MS = 7 * ONE_DAY_MS
+export const THIRTY_DAYS_MS = 30 * ONE_DAY_MS
diff --git a/packages/zosma-mem/src/index.ts b/packages/zosma-mem/src/index.ts
new file mode 100644
index 0000000..73ab09b
--- /dev/null
+++ b/packages/zosma-mem/src/index.ts
@@ -0,0 +1,4 @@
+// zosma-mem package root
+// Re-exports the evals module as the primary surface for v0.0.1.
+// Future modules (engine, store, ingestion) will be added here.
+export * from "./evals/index.js"
diff --git a/packages/zosma-mem/tsconfig.json b/packages/zosma-mem/tsconfig.json
new file mode 100644
index 0000000..1560b4f
--- /dev/null
+++ b/packages/zosma-mem/tsconfig.json
@@ -0,0 +1,9 @@
+{
+	"extends": "../../tsconfig.base.json",
+	"compilerOptions": {
+		"outDir": "dist",
+		"rootDir": "src",
+		"jsx": "react-jsx"
+	},
+	"include": ["src"]
+}
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index ec61707..8608135 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -604,6 +604,9 @@ importers:
       vitest:
         specifier: ^3.0.0
         version: 3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2)
+      zosma-mem:
+        specifier: link:../zosma-mem
+        version: link:../zosma-mem
 
   packages/orchestrator:
     dependencies:
@@ -717,6 +720,43 @@ importers:
         specifier: ^3.1.1
         version: 3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2)
 
+  packages/zosma-mem:
+    dependencies:
+      chalk:
+        specifier: ^5.4.0
+        version: 5.6.2
+      commander:
+        specifier: ^13.0.0
+        version: 13.1.0
+      ink:
+        specifier: ^5.1.0
+        version: 5.2.1(@types/react@18.3.28)(react@18.3.1)
+      ink-spinner:
+        specifier: ^5.0.0
+        version: 5.0.0(ink@5.2.1(@types/react@18.3.28)(react@18.3.1))(react@18.3.1)
+      react:
+        specifier: ^18.3.0
+        version: 18.3.1
+      zod:
+        specifier: ^3.23.0
+        version: 3.25.76
+    devDependencies:
+      '@types/node':
+        specifier: ^22.15.2
+        version: 22.19.15
+      '@types/react':
+        specifier: ^18.3.0
+        version: 18.3.28
+      tsx:
+        specifier: ^4.0.0
+        version: 4.21.0
+      typescript:
+        specifier: ^5.7.3
+        version: 5.9.3
+      vitest:
+        specifier: ^3.0.0
+        version: 3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2)
+
 packages:
 
   '@ai-sdk/gateway@3.0.66':
@@ -735,6 +775,10 @@ packages:
     resolution: {integrity: sha512-oGMAgGoQdBXbZqNG0Ze56CHjDZ1IDYOwGYxYjO5KLSlz5HiNQ9udIXsPZ61VWaHGZ5XW/jyjmr6t2xz2jGVwbQ==}
     engines: {node: '>=18'}
 
+  '@alcalzone/ansi-tokenize@0.1.3':
+    resolution: {integrity: sha512-3yWxPTq3UQ/FY9p1ErPxIyfT64elWaMvM9lIHnaqpyft63tkxodF5aUElYHrdisWve5cETkh1+KBw1yJuW0aRw==}
+    engines: {node: '>=14.13.1'}
+
   '@alloc/quick-lru@5.2.0':
     resolution: {integrity: sha512-UrcABB+4bUrFABwbluTIBErXwvbsU/V7TZWfmbgJfbkwiBuziS9gxdODUyuiecfdGQ85jglMW6juS3+z5TsKLw==}
     engines: {node: '>=10'}
@@ -3458,6 +3502,9 @@ packages:
   '@types/pg@8.18.0':
     resolution: {integrity: sha512-gT+oueVQkqnj6ajGJXblFR4iavIXWsGAFCk3dP4Kki5+a9R4NMt0JARdk6s8cUKcfUoqP5dAtDSLU8xYUTFV+Q==}
 
+  '@types/prop-types@15.7.15':
+    resolution: {integrity: sha512-F6bEyamV9jKGAFBEmlQnesRPGOQqS2+Uwi0Em15xenOxHaf2hv6L8YCVn3rPdPJOiJfPiCnLIRyvwVaqMY3MIw==}
+
   '@types/qs@6.15.0':
     resolution: {integrity: sha512-JawvT8iBVWpzTrz3EGw9BTQFg3BQNmwERdKE22vlTxawwtbyUSlMppvZYKLZzB5zgACXdXxbD3m1bXaMqP/9ow==}
 
@@ -3469,6 +3516,9 @@ packages:
     peerDependencies:
       '@types/react': ^19.2.0
 
+  '@types/react@18.3.28':
+    resolution: {integrity: sha512-z9VXpC7MWrhfWipitjNdgCauoMLRdIILQsAEV+ZesIzBq/oUlxk0m3ApZuMFCXdnS4U7KrI+l3WRUEGQ8K1QKw==}
+
   '@types/react@19.2.14':
     resolution: {integrity: sha512-ilcTH/UniCkMdtexkoCN0bI7pMcJDvmQFPvuPvmEaYA/NSfFTAgdUSLAoVjaRJm7+6PvcM+q1zYOwS4wTYMF9w==}
 
@@ -3602,6 +3652,10 @@ packages:
   ajv@8.18.0:
     resolution: {integrity: sha512-PlXPeEWMXMZ7sPYOHqmDyCJzcfNrUr3fGNKtezX14ykXOEIvyK81d+qydx89KY5O71FKMPaQ2vBfBFI5NHR63A==}
 
+  ansi-escapes@7.3.0:
+    resolution: {integrity: sha512-BvU8nYgGQBxcmMuEeUEmNTvrMVjJNSH7RgW24vXexN4Ven6qCvy4TntnvlnwnMLTVlcRQQdbRY8NKnaIoeWDNg==}
+    engines: {node: '>=18'}
+
   ansi-regex@5.0.1:
     resolution: {integrity: sha512-quJQXlTSUGL2LH9SUXo8VwsY4soanhgo6LNSm84E1LBcE8s3O0wpdiRzyR9z/ZZJMlMWv37qOOb9pdJlMUEKFQ==}
     engines: {node: '>=8'}
@@ -3614,6 +3668,10 @@ packages:
     resolution: {integrity: sha512-zbB9rCJAT1rbjiVDb2hqKFHNYLxgtk8NURxZ3IZwD3F6NtxbXZQCnnSi1Lkx+IDohdPlFp222wVALIheZJQSEg==}
     engines: {node: '>=8'}
 
+  ansi-styles@6.2.3:
+    resolution: {integrity: sha512-4Dj6M28JB+oAH8kFkTLUo+a2jwOFkuqb3yucU0CANcRRUbxS0cP0nZYCGjcc3BNXwRIsUVmDGgzawme7zvJHvg==}
+    engines: {node: '>=12'}
+
   any-promise@1.3.0:
     resolution: {integrity: sha512-7UvmKalWRt1wgjL1RrGxoSJW/0QZFIegpeGvZG9kjp8vrRu55XTHbwnqq2GpXm9uLbcuhxm3IqX9OB4MZR1b2A==}
 
@@ -3667,6 +3725,10 @@ packages:
   asynckit@0.4.0:
     resolution: {integrity: sha512-Oei9OH4tRh0YqU3GxhX79dM/mwVgvbZJaSNaRk+bshkj0S5cfHcgYakreBjrHwatXKbz+IoIdYLxrKim2MjW0Q==}
 
+  auto-bind@5.0.1:
+    resolution: {integrity: sha512-ooviqdwwgfIfNmDwo94wlshcdzfO64XV0Cg6oDsDYBJfITDz1EngD2z7DkbvCWn+XIMsIqW27sEVF6qcpJrRcg==}
+    engines: {node: ^12.20.0 || ^14.13.1 || >=16.0.0}
+
   aws-ssl-profiles@1.1.2:
     resolution: {integrity: sha512-NZKeq9AfyQvEeNlN0zSYAaWrmBffJh3IELMZfRpJVWgrpEbtEpnjvzqBPf+mxoI287JohRDoa+/nsfqqiZmF6g==}
     engines: {node: '>= 6.0.0'}
@@ -3930,11 +3992,27 @@ packages:
   classcat@5.0.5:
     resolution: {integrity: sha512-JhZUT7JFcQy/EzW605k/ktHtncoo9vnyW/2GspNYwFlN1C/WmjuV/xtS04e9SOkL2sTdw0VAZ2UGCcQ9lR6p6w==}
 
+  cli-boxes@3.0.0:
+    resolution: {integrity: sha512-/lzGpEWL/8PfI0BmBOPRwp0c/wFNX1RdUML3jK/RcSBA9T8mZDdQpqYBKtCFTOfQbwPqWEOpjqW+Fnayc0969g==}
+    engines: {node: '>=10'}
+
+  cli-cursor@4.0.0:
+    resolution: {integrity: sha512-VGtlMu3x/4DOtIUwEkRezxUZ2lBacNJCHash0N0WeZDBS+7Ux1dm3XWAgWYxLJFMMdOeXMHXorshEFhbMSGelg==}
+    engines: {node: ^12.20.0 || ^14.13.1 || >=16.0.0}
+
   cli-highlight@2.1.11:
     resolution: {integrity: sha512-9KDcoEVwyUXrjcJNvHD0NFc/hiwe/WPVYIleQh2O1N2Zro5gWJZ/K+3DGn8w8P/F6FxOgzyC5bxDyHIgCSPhGg==}
     engines: {node: '>=8.0.0', npm: '>=5.0.0'}
     hasBin: true
 
+  cli-spinners@2.9.2:
+    resolution: {integrity: sha512-ywqV+5MmyL4E7ybXgKys4DugZbX0FC6LnwrhjuykIjnK9k8OQacQ7axGKnjDXWNhns0xot3bZI5h55H8yo9cJg==}
+    engines: {node: '>=6'}
+
+  cli-truncate@4.0.0:
+    resolution: {integrity: sha512-nPdaFdQ0h/GEigbPClz11D0v/ZJEwxmeVZGeMo3Z5StPtUTkA9o1lD6QwoirYiSDzbcwn2XcjwmCp68W1IS4TA==}
+    engines: {node: '>=18'}
+
   client-only@0.0.1:
     resolution: {integrity: sha512-IV3Ou0jSMzZrd3pZ48nLkT9DA7Ag1pnPzaiQhpW7c3RbcqqzvzzVu+L8gfqMp/8IM2MQtSiqaCxrrcfu8I8rMA==}
 
@@ -3962,6 +4040,10 @@ packages:
       react: ^18 || ^19 || ^19.0.0-rc
       react-dom: ^18 || ^19 || ^19.0.0-rc
 
+  code-excerpt@4.0.0:
+    resolution: {integrity: sha512-xxodCmBen3iy2i0WtAK8FlFNrRzjUqjRsMfho58xT/wvZU1YTM3fCnRjcy1gJPMepaRlgm/0e6w8SpWHpn3/cA==}
+    engines: {node: ^12.20.0 || ^14.13.1 || >=16.0.0}
+
   color-convert@2.0.1:
     resolution: {integrity: sha512-RRECPsj7iu/xb5oKYcsFHSppFNnsj/52OVTRKb4zP5onXwVF3zVmmToNcOfGC+CRDpfK/U584fMg38ZHCaElKQ==}
     engines: {node: '>=7.0.0'}
@@ -4020,6 +4102,10 @@ packages:
     resolution: {integrity: sha512-nTjqfcBFEipKdXCv4YDQWCfmcLZKm81ldF0pAopTvyrFGVbcR6P/VAAd5G7N+0tTr8QqiU0tFadD6FK4NtJwOA==}
     engines: {node: '>= 0.6'}
 
+  convert-to-spaces@2.0.1:
+    resolution: {integrity: sha512-rcQ1bsQO9799wq24uE5AM2tAILy4gXGIK/njFWcVQkGNZ96edlpY+A7bjwvzjYvLDyzmG1MmMLZhpcsb+klNMQ==}
+    engines: {node: ^12.20.0 || ^14.13.1 || >=16.0.0}
+
   cookie-signature@1.2.2:
     resolution: {integrity: sha512-D76uU73ulSXrD1UXF4KE2TMxVVwhsnCgfAyTg9k8P6KGZjlXKrOLe4dJQKI3Bxi5wjesZoFXJWElNWBjPZMbhg==}
     engines: {node: '>=6.6.0'}
@@ -4386,6 +4472,9 @@ packages:
   emoji-regex-xs@1.0.0:
     resolution: {integrity: sha512-LRlerrMYoIDrT6jgpeZ2YYl/L8EulRTt5hQcYjy5AInh7HWXKimpqx68aknBFpGL2+/IcogTcaydJEgaTmOpDg==}
 
+  emoji-regex@10.6.0:
+    resolution: {integrity: sha512-toUI84YS5YmxW219erniWD0CIVOo46xGKColeNQRgOzDorgBi1v4D71/OFzgD9GO2UGKIv1C3Sp8DAn0+j5w7A==}
+
   emoji-regex@8.0.0:
     resolution: {integrity: sha512-MSjYzcWNOA0ewAHpz0MxpYFvwg6yjy1NG3xteoqz644VCo/RPgnr1/GGt+ic3iJTzQ8Eu3TdM14SawnVUmGE6A==}
 
@@ -4413,6 +4502,10 @@ packages:
     engines: {node: '>=20.10.0'}
     hasBin: true
 
+  environment@1.1.0:
+    resolution: {integrity: sha512-xUtoPkMggbz0MPyPiIWr1Kp4aeWJjDZ6SMvURhimjdZgsRuDplF5/s9hcgGhyXMhs+6vpnuoiZ2kFiu3FMnS8Q==}
+    engines: {node: '>=18'}
+
   es-define-property@1.0.1:
     resolution: {integrity: sha512-e3nRfgfUZ4rNGL232gUgX06QNyyez04KdjFrF+LTRoOXmrOgFKDg4BCdsjW8EnT69eqdYGmRpJwiPVYNrCaW3g==}
     engines: {node: '>= 0.4'}
@@ -4432,6 +4525,9 @@ packages:
     resolution: {integrity: sha512-j6vWzfrGVfyXxge+O0x5sh6cvxAog0a/4Rdd2K36zCMV5eJ+/+tOAngRO8cODMNWbVRdVlmGZQL2YS3yR8bIUA==}
     engines: {node: '>= 0.4'}
 
+  es-toolkit@1.45.1:
+    resolution: {integrity: sha512-/jhoOj/Fx+A+IIyDNOvO3TItGmlMKhtX8ISAHKE90c4b/k1tqaqEZ+uUqfpU8DMnW5cgNJv606zS55jGvza0Xw==}
+
   esbuild@0.27.4:
     resolution: {integrity: sha512-Rq4vbHnYkK5fws5NF7MYTU68FPRE1ajX7heQ/8QXXWqNgqqJ/GkmmyxIzUnf2Sr/bakf8l54716CcMGHYhMrrQ==}
     engines: {node: '>=18'}
@@ -4444,6 +4540,10 @@ packages:
   escape-html@1.0.3:
     resolution: {integrity: sha512-NiSupZ4OeuGwr68lGIeym/ksIZMJodUGOSCZ/FSnTxcrekbvqrgdUxlJOMpijaKZVjAJrWrGs/6Jy8OMuyj9ow==}
 
+  escape-string-regexp@2.0.0:
+    resolution: {integrity: sha512-UpzcLCXolUWcNu5HtVMHYdXJjArjsF9C0aNnquZYY4uW/Vu0miy5YoWvbV345HauVvcAUnpRuhMMcqTcGOY2+w==}
+    engines: {node: '>=8'}
+
   escape-string-regexp@4.0.0:
     resolution: {integrity: sha512-TtpcNJ3XAzx3Gq8sWRzJaVajRs0uVxA2YAkdb1jm2YkPz4G6egUFAyA3n5vtEIZefPk5Wa4UXbKuS5fKkJWdgA==}
     engines: {node: '>=10'}
@@ -4861,6 +4961,10 @@ packages:
   immediate@3.0.6:
     resolution: {integrity: sha512-XXOFtyqDjNDAQxVfYxuF7g9Il/IbWmmlQg2MYKOH8ExIT1qg6xc4zyS3HaEEATgs1btfzxq15ciUiY7gjSXRGQ==}
 
+  indent-string@5.0.0:
+    resolution: {integrity: sha512-m6FAo/spmsW2Ab2fU35JTYwtOKa2yAwXSwgjSv1TJzh4Mh7mC3lzAOVLBprb72XsTrgkEIsl7YrFNAiDiRhIGg==}
+    engines: {node: '>=12'}
+
   inflection@1.13.4:
     resolution: {integrity: sha512-6I/HUDeYFfuNCVS3td055BaXBwKYuzw7K3ExVMStBowKo9oOAMJIXIHvdyR3iboTCp1b+1i5DSkIZTcwIktuDw==}
     engines: {'0': node >= 0.4.0}
@@ -4875,6 +4979,26 @@ packages:
   ini@1.3.8:
     resolution: {integrity: sha512-JV/yugV2uzW5iMRSiZAyDtQd+nxtUnjeLt0acNdw98kKLrvuRVyB80tsREOE7yvGVgalhZ6RNXCmEHkUKBKxew==}
 
+  ink-spinner@5.0.0:
+    resolution: {integrity: sha512-EYEasbEjkqLGyPOUc8hBJZNuC5GvXGMLu0w5gdTNskPc7Izc5vO3tdQEYnzvshucyGCBXc86ig0ujXPMWaQCdA==}
+    engines: {node: '>=14.16'}
+    peerDependencies:
+      ink: '>=4.0.0'
+      react: '>=18.0.0'
+
+  ink@5.2.1:
+    resolution: {integrity: sha512-BqcUyWrG9zq5HIwW6JcfFHsIYebJkWWb4fczNah1goUO0vv5vneIlfwuS85twyJ5hYR/y18FlAYUxrO9ChIWVg==}
+    engines: {node: '>=18'}
+    peerDependencies:
+      '@types/react': '>=18.0.0'
+      react: '>=18.0.0'
+      react-devtools-core: ^4.19.1
+    peerDependenciesMeta:
+      '@types/react':
+        optional: true
+      react-devtools-core:
+        optional: true
+
   inline-style-parser@0.2.7:
     resolution: {integrity: sha512-Nb2ctOyNR8DqQoR0OwRG95uNWIC0C1lCgf5Naz5H6Ji72KZ8OcFZLz2P5sNgwlyoJ8Yif11oMuYs5pBQa86csA==}
 
@@ -4916,9 +5040,22 @@ packages:
     resolution: {integrity: sha512-zymm5+u+sCsSWyD9qNaejV3DFvhCKclKdizYaJUuHA83RLjb7nSuGnddCHGv0hk+KY7BMAlsWeK4Ueg6EV6XQg==}
     engines: {node: '>=8'}
 
+  is-fullwidth-code-point@4.0.0:
+    resolution: {integrity: sha512-O4L094N2/dZ7xqVdrXhh9r1KODPJpFms8B5sGdJLPy664AgvXsreZUyCQQNItZRDlYug4xStLjNp/sz3HvBowQ==}
+    engines: {node: '>=12'}
+
+  is-fullwidth-code-point@5.1.0:
+    resolution: {integrity: sha512-5XHYaSyiqADb4RnZ1Bdad6cPp8Toise4TzEjcOYDHZkTCbKgiUl7WTUCpNWHuxmDt91wnsZBc9xinNzopv3JMQ==}
+    engines: {node: '>=18'}
+
   is-hexadecimal@2.0.1:
     resolution: {integrity: sha512-DgZQp241c8oO6cA1SbTEWiXeoxV42vlcJxgH+B3hi1AiqqKruZR3ZGF8In3fj4+/y/7rHvlOZLZtgJ/4ttYGZg==}
 
+  is-in-ci@1.0.0:
+    resolution: {integrity: sha512-eUuAjybVTHMYWm/U+vBO1sY/JOCgoPCXRxzdju0K+K0BiGW0SChEL1MLC0PoCIR1OlPo5YAp8HuQoUlsWEICwg==}
+    engines: {node: '>=18'}
+    hasBin: true
+
   is-plain-obj@4.1.0:
     resolution: {integrity: sha512-+Pgi+vMuUNkJyExiMBt5IlFoMyKnr5zhJ4Uspz58WOhBF5QoIZkFyNHIbBAtHwzVAgk5RtndVNsDRN61/mmDqg==}
     engines: {node: '>=12'}
@@ -5455,6 +5592,10 @@ packages:
     resolution: {integrity: sha512-Lbgzdk0h4juoQ9fCKXW4by0UJqj+nOOrI9MJ1sSj4nI8aI2eo1qmvQEie4VD1glsS250n15LsWsYtCugiStS5A==}
     engines: {node: '>=18'}
 
+  mimic-fn@2.1.0:
+    resolution: {integrity: sha512-OqbOk5oEQeAZ8WXWydlu9HJjz9WVdEIvamMCcXmuqUYjTknH/sqsWvhQ3vgwKFRR1HpjvNBKQ37nbJgYzGqGcg==}
+    engines: {node: '>=6'}
+
   mimic-response@2.1.0:
     resolution: {integrity: sha512-wXqjST+SLt7R009ySCglWBCFpjUygmCIfD790/kVbiGmUgfYGuB14PiTd5DwVxSV4NcYHjzMkoj5LjQZwTQLEA==}
     engines: {node: '>=8'}
@@ -5688,6 +5829,10 @@ packages:
   once@1.4.0:
     resolution: {integrity: sha512-lNaJgI+2Q5URQBkccEKHTQOPaXdUxnZZElQTZY0MFUAuaEqe1E+Nyvgdz/aIyNi6Z9MzO5dv1H8n58/GELp3+w==}
 
+  onetime@5.1.2:
+    resolution: {integrity: sha512-kbpaSSGJTWdAY5KPVeMOKXSrPtr8C8C7wodJbcsd51jRnmD+GZu8Y0VoU6Dm5Z4vWr0Ig/1NKuWRKf7j5aaYSg==}
+    engines: {node: '>=6'}
+
   oniguruma-parser@0.12.1:
     resolution: {integrity: sha512-8Unqkvk1RYc6yq2WBYRj4hdnsAxVze8i7iPfQr8e4uSP3tRv0rpZcbGUDvxfQQcdwHt/e9PrMvGCsa8OqG9X3w==}
 
@@ -5787,6 +5932,10 @@ packages:
   partial-json@0.1.7:
     resolution: {integrity: sha512-Njv/59hHaokb/hRUjce3Hdv12wd60MtM9Z5Olmn+nehe0QDAsRtRbJPvJ0Z91TusF0SuZRIvnM+S4l6EIP8leA==}
 
+  patch-console@2.0.0:
+    resolution: {integrity: sha512-0YNdUceMdaQwoKce1gatDScmMo5pu/tfABfnzEqeG0gtTmd7mh/WcwgUjtAeOU7N8nFFlbQBnFK2gXW5fGvmMA==}
+    engines: {node: ^12.20.0 || ^14.13.1 || >=16.0.0}
+
   path-data-parser@0.1.0:
     resolution: {integrity: sha512-NOnmBpt5Y2RWbuv0LMzsayp3lVylAHLPUTut412ZA3l+C4uw4ZVkQbjShYCQ8TCpUMdPapr4YjUqLYD6v68j+w==}
 
@@ -6069,6 +6218,12 @@ packages:
   react-is@18.3.1:
     resolution: {integrity: sha512-/LLMVyas0ljjAtoYiPqYiL8VWXzUUdThrmU5+n20DZv+a+ClRoevUzw5JxU+Ieh5/c87ytoTBV9G1FiKfNJdmg==}
 
+  react-reconciler@0.29.2:
+    resolution: {integrity: sha512-zZQqIiYgDCTP/f1N/mAR10nJGrPD2ZR+jDSEsKWJHYC7Cm2wodlwbR3upZRdC3cjIjSlTLNVyO7Iu0Yy7t2AYg==}
+    engines: {node: '>=0.10.0'}
+    peerDependencies:
+      react: ^18.3.1
+
   react-remove-scroll-bar@2.3.8:
     resolution: {integrity: sha512-9r+yi9+mgU33AKcj6IbT9oRCO78WriSj6t/cF8DWBZJ9aOGPOTEDvdUDz1FwKim7QXWwmHqtdHnRJfhAxEG46Q==}
     engines: {node: '>=10'}
@@ -6117,6 +6272,10 @@ packages:
       react: '>=16.6.0'
       react-dom: '>=16.6.0'
 
+  react@18.3.1:
+    resolution: {integrity: sha512-wS+hAgJShR0KhEvPJArfuPVN1+Hz1t0Y6n5jLrGQbkb4urgPE/0Rve+1kMB1v/oWgHgm4WIcV+i7F2pTVj+2iQ==}
+    engines: {node: '>=0.10.0'}
+
   react@19.2.4:
     resolution: {integrity: sha512-9nfp2hYpCwOjAN+8TZFGhtWEwgvWHXqESH8qT89AT/lWklpLON22Lc8pEtnpsZz7VmawabSU0gCjnj8aC0euHQ==}
     engines: {node: '>=0.10.0'}
@@ -6223,6 +6382,10 @@ packages:
     engines: {node: '>= 0.4'}
     hasBin: true
 
+  restore-cursor@4.0.0:
+    resolution: {integrity: sha512-I9fPXU9geO9bHOt9pHHOhOkYerIMsmVaWB0rA2AI9ERh/+x/i7MV5HKBNrg+ljO5eoPVgCcnFuRjJ9uH6I/3eg==}
+    engines: {node: ^12.20.0 || ^14.13.1 || >=16.0.0}
+
   restructure@3.0.2:
     resolution: {integrity: sha512-gSfoiOEA0VPE6Tukkrr7I0RBdE0s7H1eFCDBk05l1KIQT1UIKNc5JZy6jdyW6eYH3aR3g5b3PuL77rq0hvwtAw==}
 
@@ -6285,6 +6448,9 @@ packages:
     resolution: {integrity: sha512-5LBh1Tls8c9xgGjw3QrMwETmTMVk0oFgvrFSvWx62llR2hcEInrKNZ2GZCCuuy2lvWrdl5jhbpeqc5hRYKFOcw==}
     engines: {node: '>=10'}
 
+  scheduler@0.23.2:
+    resolution: {integrity: sha512-UOShsPwz7NrMUqhR6t0hWjFduvOzbtv7toDH1/hIrfRNIDBnnBWd0CwJTGvTpngVlmwGCdP9/Zl/tVrDqcuYzQ==}
+
   scheduler@0.25.0-rc-603e6108-20241029:
     resolution: {integrity: sha512-pFwF6H1XrSdYYNLfOcGlM28/j8CGLu8IvdrxqhjWULe2bPcKiKW4CV+OWqR/9fT52mywx65l7ysNkjLKBda7eA==}
 
@@ -6377,6 +6543,14 @@ packages:
   sisteransi@1.0.5:
     resolution: {integrity: sha512-bLGGlR1QxBcynn2d5YmDX4MGjlZvy2MRBDRNHLJ8VI6l6+9FUiyTFNJ0IveOSP0bcXgVDPRcfGqA0pjaqUpfVg==}
 
+  slice-ansi@5.0.0:
+    resolution: {integrity: sha512-FC+lgizVPfie0kkhqUScwRu1O/lF6NOgJmlCgK+/LYxDCTk8sGelYaHDhFcDN+Sn3Cv+3VSa4Byeo+IMCzpMgQ==}
+    engines: {node: '>=12'}
+
+  slice-ansi@7.1.2:
+    resolution: {integrity: sha512-iOBWFgUX7caIZiuutICxVgX1SdxwAVFFKwt1EvMYYec/NWO5meOJ6K5uQxhrYBdQJne4KxiqZc+KptFOWFSI9w==}
+    engines: {node: '>=18'}
+
   smart-buffer@4.2.0:
     resolution: {integrity: sha512-94hK0Hh8rPqQl2xXc3HsaBoOXKV20MToPkcXvwbISWLEs+64sBq5kFgn2kJDHb1Pry9yrP0dxrCI9RRci7RXKg==}
     engines: {node: '>= 6.0.0', npm: '>= 3.0.0'}
@@ -6424,6 +6598,10 @@ packages:
   stack-trace@0.0.10:
     resolution: {integrity: sha512-KGzahc7puUKkzyMt+IqAep+TVNbKP+k2Lmwhub39m1AsTSkaDutx56aDCo+HLDzf/D26BIHTJWNiTG1KAJiQCg==}
 
+  stack-utils@2.0.6:
+    resolution: {integrity: sha512-XlkWvfIm6RmsWtNJx+uqtKLS8eqFbxUg0ZzLXqY0caEy9l7hruX8IpiDnjsLavoBgqCCR71TqWO8MaXYheJ3RQ==}
+    engines: {node: '>=10'}
+
   stackback@0.0.2:
     resolution: {integrity: sha512-1XMJE5fQo1jGH6Y/7ebnwPOBEkIEnT4QF32d5R1+VXdXveM0IBMJt8zfaxX1P3QhVwrYe+576+jkANtSS2mBbw==}
 
@@ -6443,6 +6621,10 @@ packages:
     resolution: {integrity: sha512-wKyQRQpjJ0sIp62ErSZdGsjMJWsap5oRNihHhu6G7JVO/9jIB6UyevL+tXuOqrng8j/cxKTWyWUwvSTriiZz/g==}
     engines: {node: '>=8'}
 
+  string-width@7.2.0:
+    resolution: {integrity: sha512-tsaTIkKW9b4N+AEj+SVA+WhJzV7/zMhcSu78mLKWSk7cXMOSHsBKFWUs0fWwq8QyK3MgJBQRX6Gbi4kYbdvGkQ==}
+    engines: {node: '>=18'}
+
   string_decoder@1.1.1:
     resolution: {integrity: sha512-n/ShnvDi6FHbbVfviro+WojiFzv+s8MPMHBczVePfUpDJLwoLT0ht1l4YwBCbi8pJAveEEdnkHyPyTP/mzRfwg==}
 
@@ -6632,6 +6814,10 @@ packages:
   tweetnacl@0.14.5:
     resolution: {integrity: sha512-KXXFFdAbFXY4geFIwoyNK+f5Z1b7swfXABfL7HXCmoIWMKU3dmS26672A4EeQtDzLKy7SXmfBu51JolvEKwtGA==}
 
+  type-fest@4.41.0:
+    resolution: {integrity: sha512-TeTSQ6H5YHvpqVwBRcnLDCBnDOHWYu7IvGbHT6N8AOymcr9PJGjc1GTtiWZTYg0NCgYwvnYWEkVChQAr9bjfwA==}
+    engines: {node: '>=16'}
+
   type-is@2.0.1:
     resolution: {integrity: sha512-OZs6gsjF4vMp32qrCbiVSkrFmXtG/AZhY3t0iAMrMBiAZyV9oALtXO8hsrHbMXF9x6L3grlFuwW2oAz7cav+Gw==}
     engines: {node: '>= 0.6'}
@@ -6925,6 +7111,10 @@ packages:
   wide-align@1.1.5:
     resolution: {integrity: sha512-eDMORYaPNZ4sQIuuYPDHdQvf4gyCF9rEEV/yPxGfwPkRodwEgiMUUXTx/dex+Me0wxx53S+NgUHaP7y3MGlDmg==}
 
+  widest-line@5.0.0:
+    resolution: {integrity: sha512-c9bZp7b5YtRj2wOe6dlj32MK+Bx/M/d+9VB2SHM1OtsUHR0aV0tdP6DWh/iMt0kWi1t5g1Iudu6hQRNd1A4PVA==}
+    engines: {node: '>=18'}
+
   winston@2.4.7:
     resolution: {integrity: sha512-vLB4BqzCKDnnZH9PHGoS2ycawueX4HLqENXQitvFHczhgW2vFpSOn31LZtVr1KU8YTw7DS4tM+cqyovxo8taVg==}
     engines: {node: '>= 0.10.0'}
@@ -6937,6 +7127,10 @@ packages:
     resolution: {integrity: sha512-YVGIj2kamLSTxw6NsZjoBxfSwsn0ycdesmc4p+Q21c5zPuZ1pl+NfxVdxPtdHvmNVOQ6XSYG4AUtyt/Fi7D16Q==}
     engines: {node: '>=10'}
 
+  wrap-ansi@9.0.2:
+    resolution: {integrity: sha512-42AtmgqjV+X1VpdOfyTGOYRi0/zsoLqtXQckTmqTeybT+BDIbM/Guxo7x3pE2vtpr1ok6xRqM9OpBe+Jyoqyww==}
+    engines: {node: '>=18'}
+
   wrappy@1.0.2:
     resolution: {integrity: sha512-l4Sp/DRseor9wL6EvV2+TuQn63dMkPjZ/sp9XkghTEbV9KlPS1xUsZ3u7/IQO4wxtcFB4bgpQPRcR3QCvezPcQ==}
 
@@ -7017,6 +7211,9 @@ packages:
     peerDependencies:
       zod: ^3.25 || ^4
 
+  zod@3.25.76:
+    resolution: {integrity: sha512-gzUt/qt81nXsFGKIFcC3YnfEAx5NkunCfnDlvuBSSFS02bcXu4Lmea0AFIUwbLWxWPx3d9p8S5QoaujKcNQxcQ==}
+
   zod@4.3.6:
     resolution: {integrity: sha512-rftlrkhHZOcjDwkGlnUtZZkvaPHCsDATp4pGpuOOMDaTdDDXF91wuVDJoWoPsKX/3YPQ5fHuF3STjcYyKr+Qhg==}
 
@@ -7076,6 +7273,11 @@ snapshots:
     dependencies:
       json-schema: 0.4.0
 
+  '@alcalzone/ansi-tokenize@0.1.3':
+    dependencies:
+      ansi-styles: 6.2.3
+      is-fullwidth-code-point: 4.0.0
+
   '@alloc/quick-lru@5.2.0': {}
 
   '@antfu/install-pkg@1.1.0':
@@ -7498,14 +7700,14 @@ snapshots:
       nanostores: 1.2.0
       zod: 4.3.6
 
-  '@better-auth/drizzle-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)':
+  '@better-auth/drizzle-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)':
     dependencies:
-      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0)
+      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0)
       '@better-auth/utils': 0.3.1
 
-  '@better-auth/kysely-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)(kysely@0.28.13)':
+  '@better-auth/kysely-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)(kysely@0.28.13)':
     dependencies:
-      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0)
+      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0)
       '@better-auth/utils': 0.3.1
       kysely: 0.28.13
 
@@ -7515,25 +7717,25 @@ snapshots:
       '@better-auth/utils': 0.3.1
       kysely: 0.28.14
 
-  '@better-auth/memory-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)':
+  '@better-auth/memory-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)':
     dependencies:
-      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0)
+      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0)
       '@better-auth/utils': 0.3.1
 
-  '@better-auth/mongo-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)(mongodb@7.1.0(socks@2.8.7))':
+  '@better-auth/mongo-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)(mongodb@7.1.0(socks@2.8.7))':
     dependencies:
-      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0)
+      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0)
       '@better-auth/utils': 0.3.1
       mongodb: 7.1.0(socks@2.8.7)
 
-  '@better-auth/prisma-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)':
+  '@better-auth/prisma-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)':
     dependencies:
-      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0)
+      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0)
       '@better-auth/utils': 0.3.1
 
-  '@better-auth/telemetry@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))':
+  '@better-auth/telemetry@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))':
     dependencies:
-      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0)
+      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0)
       '@better-auth/utils': 0.3.1
       '@better-fetch/fetch': 1.1.21
 
@@ -10126,6 +10328,8 @@ snapshots:
       pg-protocol: 1.13.0
       pg-types: 2.2.0
 
+  '@types/prop-types@15.7.15': {}
+
   '@types/qs@6.15.0': {}
 
   '@types/range-parser@1.2.7': {}
@@ -10134,6 +10338,11 @@ snapshots:
     dependencies:
       '@types/react': 19.2.14
 
+  '@types/react@18.3.28':
+    dependencies:
+      '@types/prop-types': 15.7.15
+      csstype: 3.2.3
+
   '@types/react@19.2.14':
     dependencies:
       csstype: 3.2.3
@@ -10304,6 +10513,10 @@ snapshots:
       json-schema-traverse: 1.0.0
       require-from-string: 2.0.2
 
+  ansi-escapes@7.3.0:
+    dependencies:
+      environment: 1.1.0
+
   ansi-regex@5.0.1: {}
 
   ansi-regex@6.2.2: {}
@@ -10312,6 +10525,8 @@ snapshots:
     dependencies:
       color-convert: 2.0.1
 
+  ansi-styles@6.2.3: {}
+
   any-promise@1.3.0: {}
 
   aproba@2.1.0: {}
@@ -10383,6 +10598,8 @@ snapshots:
 
   asynckit@0.4.0: {}
 
+  auto-bind@5.0.1: {}
+
   aws-ssl-profiles@1.1.2: {}
 
   axios@1.13.6:
@@ -10418,12 +10635,12 @@ snapshots:
   better-auth@1.5.5(mongodb@7.1.0(socks@2.8.7))(mysql2@3.20.0(@types/node@22.19.15))(next@16.2.0(@opentelemetry/api@1.9.0)(babel-plugin-react-compiler@1.0.0)(react-dom@19.2.4(react@19.2.4))(react@19.2.4))(pg@8.20.0)(react-dom@19.2.4(react@19.2.4))(react@19.2.4)(vitest@3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2)):
     dependencies:
       '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0)
-      '@better-auth/drizzle-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)
-      '@better-auth/kysely-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)(kysely@0.28.13)
-      '@better-auth/memory-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)
-      '@better-auth/mongo-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)(mongodb@7.1.0(socks@2.8.7))
-      '@better-auth/prisma-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)
-      '@better-auth/telemetry': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))
+      '@better-auth/drizzle-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)
+      '@better-auth/kysely-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)(kysely@0.28.13)
+      '@better-auth/memory-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)
+      '@better-auth/mongo-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)(mongodb@7.1.0(socks@2.8.7))
+      '@better-auth/prisma-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)
+      '@better-auth/telemetry': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))
       '@better-auth/utils': 0.3.1
       '@better-fetch/fetch': 1.1.21
       '@noble/ciphers': 2.1.1
@@ -10622,6 +10839,12 @@ snapshots:
 
   classcat@5.0.5: {}
 
+  cli-boxes@3.0.0: {}
+
+  cli-cursor@4.0.0:
+    dependencies:
+      restore-cursor: 4.0.0
+
   cli-highlight@2.1.11:
     dependencies:
       chalk: 4.1.2
@@ -10631,6 +10854,13 @@ snapshots:
       parse5-htmlparser2-tree-adapter: 6.0.1
       yargs: 16.2.0
 
+  cli-spinners@2.9.2: {}
+
+  cli-truncate@4.0.0:
+    dependencies:
+      slice-ansi: 5.0.0
+      string-width: 7.2.0
+
   client-only@0.0.1: {}
 
   cliui@6.0.0:
@@ -10667,6 +10897,10 @@ snapshots:
       - '@types/react'
       - '@types/react-dom'
 
+  code-excerpt@4.0.0:
+    dependencies:
+      convert-to-spaces: 2.0.1
+
   color-convert@2.0.1:
     dependencies:
       color-name: 1.1.4
@@ -10711,6 +10945,8 @@ snapshots:
 
   content-type@1.0.5: {}
 
+  convert-to-spaces@2.0.1: {}
+
   cookie-signature@1.2.2: {}
 
   cookie@0.7.2: {}
@@ -11086,6 +11322,8 @@ snapshots:
 
   emoji-regex-xs@1.0.0: {}
 
+  emoji-regex@10.6.0: {}
+
   emoji-regex@8.0.0: {}
 
   encodeurl@2.0.0: {}
@@ -11109,6 +11347,8 @@ snapshots:
       commander: 13.1.0
       cross-spawn: 7.0.6
 
+  environment@1.1.0: {}
+
   es-define-property@1.0.1: {}
 
   es-errors@1.3.0: {}
@@ -11126,6 +11366,8 @@ snapshots:
       has-tostringtag: 1.0.2
       hasown: 2.0.2
 
+  es-toolkit@1.45.1: {}
+
   esbuild@0.27.4:
     optionalDependencies:
       '@esbuild/aix-ppc64': 0.27.4
@@ -11159,6 +11401,8 @@ snapshots:
 
   escape-html@1.0.3: {}
 
+  escape-string-regexp@2.0.0: {}
+
   escape-string-regexp@4.0.0: {}
 
   escape-string-regexp@5.0.0: {}
@@ -11724,6 +11968,8 @@ snapshots:
 
   immediate@3.0.6: {}
 
+  indent-string@5.0.0: {}
+
   inflection@1.13.4: {}
 
   inflight@1.0.6:
@@ -11735,6 +11981,45 @@ snapshots:
 
   ini@1.3.8: {}
 
+  ink-spinner@5.0.0(ink@5.2.1(@types/react@18.3.28)(react@18.3.1))(react@18.3.1):
+    dependencies:
+      cli-spinners: 2.9.2
+      ink: 5.2.1(@types/react@18.3.28)(react@18.3.1)
+      react: 18.3.1
+
+  ink@5.2.1(@types/react@18.3.28)(react@18.3.1):
+    dependencies:
+      '@alcalzone/ansi-tokenize': 0.1.3
+      ansi-escapes: 7.3.0
+      ansi-styles: 6.2.3
+      auto-bind: 5.0.1
+      chalk: 5.6.2
+      cli-boxes: 3.0.0
+      cli-cursor: 4.0.0
+      cli-truncate: 4.0.0
+      code-excerpt: 4.0.0
+      es-toolkit: 1.45.1
+      indent-string: 5.0.0
+      is-in-ci: 1.0.0
+      patch-console: 2.0.0
+      react: 18.3.1
+      react-reconciler: 0.29.2(react@18.3.1)
+      scheduler: 0.23.2
+      signal-exit: 3.0.7
+      slice-ansi: 7.1.2
+      stack-utils: 2.0.6
+      string-width: 7.2.0
+      type-fest: 4.41.0
+      widest-line: 5.0.0
+      wrap-ansi: 9.0.2
+      ws: 8.19.0
+      yoga-layout: 3.2.1
+    optionalDependencies:
+      '@types/react': 18.3.28
+    transitivePeerDependencies:
+      - bufferutil
+      - utf-8-validate
+
   inline-style-parser@0.2.7: {}
 
   internmap@1.0.1: {}
@@ -11764,8 +12049,16 @@ snapshots:
 
   is-fullwidth-code-point@3.0.0: {}
 
+  is-fullwidth-code-point@4.0.0: {}
+
+  is-fullwidth-code-point@5.1.0:
+    dependencies:
+      get-east-asian-width: 1.5.0
+
   is-hexadecimal@2.0.1: {}
 
+  is-in-ci@1.0.0: {}
+
   is-plain-obj@4.1.0: {}
 
   is-promise@4.0.0: {}
@@ -12480,6 +12773,8 @@ snapshots:
     dependencies:
       mime-db: 1.54.0
 
+  mimic-fn@2.1.0: {}
+
   mimic-response@2.1.0: {}
 
   minimatch@10.2.4:
@@ -12670,6 +12965,10 @@ snapshots:
     dependencies:
       wrappy: 1.0.2
 
+  onetime@5.1.2:
+    dependencies:
+      mimic-fn: 2.1.0
+
   oniguruma-parser@0.12.1: {}
 
   oniguruma-to-es@4.3.5:
@@ -12769,6 +13068,8 @@ snapshots:
 
   partial-json@0.1.7: {}
 
+  patch-console@2.0.0: {}
+
   path-data-parser@0.1.0: {}
 
   path-exists@4.0.0: {}
@@ -13162,6 +13463,12 @@ snapshots:
 
   react-is@18.3.1: {}
 
+  react-reconciler@0.29.2(react@18.3.1):
+    dependencies:
+      loose-envify: 1.4.0
+      react: 18.3.1
+      scheduler: 0.23.2
+
   react-remove-scroll-bar@2.3.8(@types/react@19.2.14)(react@19.2.4):
     dependencies:
       react: 19.2.4
@@ -13211,6 +13518,10 @@ snapshots:
       react: 19.2.4
       react-dom: 19.2.4(react@19.2.4)
 
+  react@18.3.1:
+    dependencies:
+      loose-envify: 1.4.0
+
   react@19.2.4: {}
 
   read@1.0.7:
@@ -13368,6 +13679,11 @@ snapshots:
       path-parse: 1.0.7
       supports-preserve-symlinks-flag: 1.0.0
 
+  restore-cursor@4.0.0:
+    dependencies:
+      onetime: 5.1.2
+      signal-exit: 3.0.7
+
   restructure@3.0.2: {}
 
   retry@0.12.0: {}
@@ -13450,6 +13766,10 @@ snapshots:
     dependencies:
       xmlchars: 2.2.0
 
+  scheduler@0.23.2:
+    dependencies:
+      loose-envify: 1.4.0
+
   scheduler@0.25.0-rc-603e6108-20241029: {}
 
   scheduler@0.27.0: {}
@@ -13590,6 +13910,16 @@ snapshots:
 
   sisteransi@1.0.5: {}
 
+  slice-ansi@5.0.0:
+    dependencies:
+      ansi-styles: 6.2.3
+      is-fullwidth-code-point: 4.0.0
+
+  slice-ansi@7.1.2:
+    dependencies:
+      ansi-styles: 6.2.3
+      is-fullwidth-code-point: 5.1.0
+
   smart-buffer@4.2.0: {}
 
   socks-proxy-agent@8.0.5:
@@ -13635,6 +13965,10 @@ snapshots:
 
   stack-trace@0.0.10: {}
 
+  stack-utils@2.0.6:
+    dependencies:
+      escape-string-regexp: 2.0.0
+
   stackback@0.0.2: {}
 
   statuses@2.0.2: {}
@@ -13679,6 +14013,12 @@ snapshots:
       is-fullwidth-code-point: 3.0.0
       strip-ansi: 6.0.1
 
+  string-width@7.2.0:
+    dependencies:
+      emoji-regex: 10.6.0
+      get-east-asian-width: 1.5.0
+      strip-ansi: 7.2.0
+
   string_decoder@1.1.1:
     dependencies:
       safe-buffer: 5.1.2
@@ -13854,6 +14194,8 @@ snapshots:
 
   tweetnacl@0.14.5: {}
 
+  type-fest@4.41.0: {}
+
   type-is@2.0.1:
     dependencies:
       content-type: 1.0.5
@@ -14165,6 +14507,10 @@ snapshots:
     dependencies:
       string-width: 4.2.3
 
+  widest-line@5.0.0:
+    dependencies:
+      string-width: 7.2.0
+
   winston@2.4.7:
     dependencies:
       async: 2.6.4
@@ -14186,6 +14532,12 @@ snapshots:
       string-width: 4.2.3
       strip-ansi: 6.0.1
 
+  wrap-ansi@9.0.2:
+    dependencies:
+      ansi-styles: 6.2.3
+      string-width: 7.2.0
+      strip-ansi: 7.2.0
+
   wrappy@1.0.2: {}
 
   ws@8.19.0: {}
@@ -14264,6 +14616,8 @@ snapshots:
     dependencies:
       zod: 4.3.6
 
+  zod@3.25.76: {}
+
   zod@4.3.6: {}
 
   zustand@4.5.7(@types/react@19.2.14)(react@19.2.4):

From 202bfbb376a3e9ab15091b3e7ddaa1075732cc22 Mon Sep 17 00:00:00 2001
From: shanvit <shanvit7@gmail.com>
Date: Wed, 8 Apr 2026 16:08:07 +0530
Subject: [PATCH 02/12] checkpoint for dirty tree

---
 packages/zosma-mem/IMPLEMENTATION_PLAN.md | 407 ++++++++++++++++++++++
 1 file changed, 407 insertions(+)
 create mode 100644 packages/zosma-mem/IMPLEMENTATION_PLAN.md

diff --git a/packages/zosma-mem/IMPLEMENTATION_PLAN.md b/packages/zosma-mem/IMPLEMENTATION_PLAN.md
new file mode 100644
index 0000000..8fe4739
--- /dev/null
+++ b/packages/zosma-mem/IMPLEMENTATION_PLAN.md
@@ -0,0 +1,407 @@
+# zosma-mem Implementation Plan
+
+> Replace `@openzosma/memory` (thin env-var bootstrap) with `zosma-mem` as the unified memory package — salience-driven, attention-aware, eval-instrumented.
+
+---
+
+## Current State
+
+### `packages/zosma-mem` (this package)
+- Eval-only: 7 scenarios, adapter interface, CLI runner, metrics (P@K, R@K, MRR, noise, GC effectiveness)
+- No engine implementation — only the `MemoryAdapter` contract and test harness
+- Published as `zosma-mem`, exports `zosma-mem/evals`
+
+### `packages/memory` (`@openzosma/memory`)
+- Thin bootstrap shim: sets `PI_MEMORY_DIR`, `PI_MEMORY_QMD_UPDATE`, `PI_MEMORY_NO_SEARCH` env vars
+- Used by `packages/agents/src/pi.agent.ts` via `bootstrapMemory()`
+- No intelligence — delegates everything to pi-brain extensions installed at image build time
+
+### Gap
+The two reference docs (NEW-MEMORY-INTEGRATION-PAPER.md, NEW-MEMORY-SURFACE-PLAN.md) describe a salience engine, attention-gated retrieval, reinforcement loop, GC, and co-access graph. None of this exists yet. The eval harness exists but has no real engine to test against.
+
+---
+
+## Target State
+
+`packages/zosma-mem` becomes `@openzosma/zosma-mem` — the single memory package that:
+
+1. **Bootstraps** pi-brain memory (absorbs what `@openzosma/memory` does today)
+2. **Implements** the salience engine, attention retrieval, reinforcement loop, GC
+3. **Evaluates** itself via the existing eval harness with a self-adapter
+4. **Exports** a clean public API for `packages/agents` and `packages/gateway`
+
+`packages/memory` is deleted. All imports of `@openzosma/memory` point to `@openzosma/zosma-mem`.
+
+---
+
+## Package Structure (Final)
+
+```
+packages/zosma-mem/
+  src/
+    index.ts                      # Public API re-exports
+    types.ts                      # Core types (MemoryEngine, MemoryEntity, MemoryScore, etc.)
+    config.ts                     # MemoryConfig + defaults
+
+    bootstrap/
+      env.ts                      # applyMemoryEnv() — absorbed from @openzosma/memory
+      init.ts                     # bootstrapMemory() — absorbed from @openzosma/memory
+
+    brain-adapter/
+      parser.ts                   # Parse commits.md via remark AST
+      state.ts                    # Read state.yaml, list branches
+      index.ts
+
+    engine/
+      salience.ts                 # computeSalience(score): number
+      attention.ts                # computeAttentionScore(query, entity): number
+      reinforcement.ts            # recordRead, recordIgnoredRead, recordDecisionInfluence
+      factory.ts                  # createMemoryEngine() — wires all subsystems
+      index.ts
+
+    store/
+      entity-store.ts             # Read/write .salience/*.yaml
+      co-access.ts                # co-access.json graph read/write
+      index.ts
+
+    ingestion/
+      event-bus.ts                # Typed EventEmitter for MemoryEvent
+      ingest.ts                   # Score → persist or discard
+      commit-indexer.ts           # Watch commits.md → extract entities → score → persist
+      index.ts
+
+    retrieval/
+      retrieve.ts                 # Top-K with attention gating + co-access boost
+      index.ts
+
+    gc/
+      decay.ts                    # Logarithmic time decay
+      prune.ts                    # Archive low-salience entities
+      consolidate.ts              # Merge related low-value clusters
+      index.ts
+
+    evals/                        # (existing — untouched)
+      types.ts
+      runner.ts
+      metrics.ts
+      report.ts
+      scenarios/
+      cli/
+      __tests__/
+      utils/
+      index.ts
+
+    adapter/
+      self-adapter.ts             # MemoryAdapter impl that wraps the real engine for eval
+
+  package.json
+  tsconfig.json
+  README.md
+  USAGE.md
+```
+
+---
+
+## Phase Plan
+
+### Phase 0 — Absorb `@openzosma/memory` bootstrap
+
+**Files:** `src/bootstrap/env.ts`, `src/bootstrap/init.ts`
+
+1. Copy `applyMemoryEnv()` and `bootstrapMemory()` from `packages/memory/src/`
+2. Convert to arrow functions per project style
+3. Re-export from `src/index.ts` as `bootstrapMemory`, `applyMemoryEnv`
+4. Update `packages/agents/package.json`: replace `@openzosma/memory` with `@openzosma/zosma-mem`
+5. Update `packages/agents/src/pi.agent.ts`: change import path
+6. Delete `packages/memory/` entirely
+7. Update root `pnpm-workspace.yaml` if needed
+8. Run `pnpm install && pnpm run check`
+
+**Tests:** `src/bootstrap/__tests__/env.test.ts` — verify env vars are set correctly
+
+**Agent instructions:** This is a mechanical move. Copy the 4 source files verbatim, convert `function` to arrow syntax, update imports, delete the old package.
+
+---
+
+### Phase 1 — Types + Salience Engine
+
+**Files:** `src/types.ts`, `src/config.ts`, `src/engine/salience.ts`
+
+1. Define core types from the paper:
+   - `MemoryScore` — `{ reuseCount, decisionInfluence, ignoredReads, lastAccessed, attentionWeight }`
+   - `MemoryEntity` — `{ id, source: { branch, commitRef }, score, tags, content }`
+   - `MemoryEvent` (engine-internal, distinct from eval `MemoryEvent`) — `{ id, type, context, attentionWeight?, metadata?, timestamp }`
+   - `MemoryConfig` — `{ memoryDir, salienceThreshold?, gcIntervalMs?, summarizer? }`
+   - `Summarizer` — `(texts: string[]) => Promise<string>`
+   - `AttentionQuery` — `{ taskDescription, activeToolName?, intent? }`
+   - `ScoredEntity` — `{ entity, attentionScore }`
+   - `GcReport` — `{ decayed, pruned, consolidated }`
+
+2. Implement `computeSalience(score: MemoryScore): number`:
+   ```
+   S(e) = 2*reuseCount + 5*decisionInfluence - 2*ignoredReads - ln(1 + ageDays)
+   ```
+
+3. Implement `meetsThreshold(salience: number, threshold: number): boolean`
+
+**Tests:** `src/engine/__tests__/salience.test.ts`
+- Fresh entity → salience = 0 (passes threshold 0, fails threshold 0.4)
+- Decision entity → salience = 5 (high)
+- Heavily ignored entity → negative salience
+- Time decay: 30 days → ~3.4 decay
+
+**Agent instructions:** Pure functions, no I/O. Use the exact formula from the paper. `ageDays = (Date.now() - lastAccessed) / 86_400_000` — but accept a `now` parameter for testability.
+
+---
+
+### Phase 2 — Brain Adapter
+
+**Files:** `src/brain-adapter/parser.ts`, `src/brain-adapter/state.ts`
+
+1. `parseCommits(markdown: string): ParsedCommit[]` — parse `commits.md` using `unified` + `remark-parse` into structured commit objects (heading, body, ref)
+2. `readState(memoryDir: string): MemoryState` — parse `state.yaml` via `yaml` package
+3. `listBranches(memoryDir: string): string[]` — read `.memory/branches/` directory
+
+**Dependencies to add:** `unified`, `remark-parse`, `yaml`
+
+**Tests:** `src/brain-adapter/__tests__/parser.test.ts` — parse sample commits.md fixtures
+
+**Agent instructions:** Use `unified().use(remarkParse).parse(markdown)` to get an MDAST. Walk heading nodes to extract commit boundaries. Do NOT use regex.
+
+---
+
+### Phase 3 — Entity Store
+
+**Files:** `src/store/entity-store.ts`, `src/store/co-access.ts`
+
+1. `EntityStore` class:
+   - `read(entityId: string): MemoryEntity | undefined` — read `.salience/<id>.yaml`
+   - `write(entity: MemoryEntity): void` — write `.salience/<id>.yaml`
+   - `list(): string[]` — list all entity IDs
+   - `archive(entityId: string): void` — move to `.salience/archive/`
+   - `ensureDir(): void` — create `.salience/` and `.salience/archive/` if needed
+
+2. `CoAccessGraph` class:
+   - `load(memoryDir: string): Record<string, string[]>`
+   - `save(memoryDir: string, graph: Record<string, string[]>): void`
+   - `recordCoAccess(graph, entityIds: string[]): void` — update bidirectional edges
+
+**Dependencies to add:** `yaml` (already from phase 2)
+
+**Tests:** `src/store/__tests__/entity-store.test.ts` — write/read/list/archive round-trip in temp dir
+
+**Agent instructions:** Use synchronous `fs` for reads (small YAML files). Async for writes. YAML format must match the paper's schema exactly.
+
+---
+
+### Phase 4 — Ingestion + Commit Indexer
+
+**Files:** `src/ingestion/event-bus.ts`, `src/ingestion/ingest.ts`, `src/ingestion/commit-indexer.ts`
+
+1. `EventBus` — typed `EventEmitter` for `MemoryEvent` lifecycle (ingested, discarded, scored)
+2. `ingest(event: MemoryEvent, store: EntityStore, config: MemoryConfig): boolean` — compute salience, persist if above threshold, return true/false
+3. `CommitIndexer`:
+   - Parse commits.md via brain adapter
+   - Track processed commit refs (stored in `.salience/.indexed` file)
+   - Extract entities from each unprocessed commit
+   - Call `ingest()` for each
+   - `reindex()` — idempotent full re-index
+
+**Dependencies to add:** `chokidar` (for watch mode — optional, can defer)
+
+**Tests:** `src/ingestion/__tests__/ingest.test.ts` — event above threshold persists, below threshold discards
+
+**Agent instructions:** CommitIndexer.reindex() must be idempotent. Store processed refs as a JSON array in `.salience/.indexed`. The cold-start case (no .indexed file) processes all commits.
+
+---
+
+### Phase 5 — Attention-Gated Retrieval
+
+**Files:** `src/retrieval/retrieve.ts`
+
+1. `retrieve(query: AttentionQuery, store: EntityStore, coAccess: CoAccessGraph, topK: number): ScoredEntity[]`
+2. Attention score: `A(q, e) = 3*tagOverlap(q, e) + S(e) + coAccessBoost(e)`
+   - `tagOverlap` = count of entity tags appearing in `query.taskDescription` (case-insensitive)
+   - `coAccessBoost` = +1 if any co-accessed entity is also in the current result set (two-pass)
+3. Sort by attention score descending, return top-K
+4. After retrieval, update co-access graph for the returned entity set
+
+**Tests:** `src/retrieval/__tests__/retrieve.test.ts`
+- High tag overlap beats high salience with no overlap
+- Co-access boost surfaces related entities
+
+**Agent instructions:** Two-pass retrieval: first pass computes base scores (tag overlap + salience), take top 2K candidates. Second pass adds co-access boost among candidates, re-sort, return top-K.
+
+---
+
+### Phase 6 — Reinforcement
+
+**Files:** `src/engine/reinforcement.ts`
+
+1. `recordRead(entityId, store)` → `reuseCount += 1`, update `lastAccessed`
+2. `recordIgnoredRead(entityId, store)` → `ignoredReads += 1`
+3. `recordDecisionInfluence(entityId, store)` → `decisionInfluence += 1`, update `lastAccessed`
+
+**Tests:** `src/engine/__tests__/reinforcement.test.ts` — counters increment, lastAccessed updates
+
+**Agent instructions:** Each function reads the entity, mutates the score, writes back. Simple read-modify-write. No locking needed (single-process).
+
+---
+
+### Phase 7 — Engine Factory
+
+**Files:** `src/engine/factory.ts`
+
+1. `createMemoryEngine(config: MemoryConfig): MemoryEngine`
+   - Instantiate `EntityStore`, `CoAccessGraph`, `CommitIndexer`
+   - Wire `ingest`, `retrieve`, `recordRead`, `recordIgnoredRead`, `recordDecisionInfluence`, `reindex`, `gc`, `shutdown`
+   - Start GC interval timer
+   - Return the `MemoryEngine` interface
+
+**Tests:** `src/engine/__tests__/factory.test.ts` — create engine, ingest event, retrieve it, shutdown
+
+**Agent instructions:** The engine is the composition root. It owns the lifecycle of the GC timer. `shutdown()` clears the timer. All methods delegate to the subsystem modules.
+
+---
+
+### Phase 8 — Garbage Collection
+
+**Files:** `src/gc/decay.ts`, `src/gc/prune.ts`, `src/gc/consolidate.ts`
+
+1. `decay(store: EntityStore, now: number)` — recompute salience for all entities, write updated scores
+2. `prune(store: EntityStore, threshold: number)` — archive entities below threshold for N consecutive cycles (track cycle count in `.salience/<id>.yaml` as `belowThresholdCycles`)
+3. `consolidate(store, coAccess, summarizer?)` — find clusters of co-accessed entities all below threshold, merge into single summary entity
+
+**Tests:** `src/gc/__tests__/gc.test.ts`
+- Decay reduces salience of old entities
+- Prune archives after N cycles
+- Consolidate merges cluster into one entity
+
+**Agent instructions:** Prune should NOT archive on the first cycle below threshold. Default: archive after 3 consecutive cycles below threshold (configurable). If no summarizer provided, consolidate concatenates content with `\n---\n` separators and truncates to 2000 chars.
+
+---
+
+### Phase 9 — Self-Adapter for Evals
+
+**Files:** `src/adapter/self-adapter.ts`
+
+1. Implement `MemoryAdapter` (from `src/evals/types.ts`) wrapping `createMemoryEngine()`
+2. Map between eval types and engine types:
+   - `MemoryEvent` (eval) → `MemoryEvent` (engine)
+   - `RetrieveQuery` → `AttentionQuery`
+   - `RetrievedEntity` ← `ScoredEntity`
+   - `UsageSignal` → `recordRead` / `recordIgnoredRead` / `recordDecisionInfluence`
+   - `GcResult` ← `GcReport`
+3. `setup()` creates engine with `opts.workDir` as memoryDir, injects deterministic clock
+4. `teardown()` calls `engine.shutdown()`
+
+**Tests:** Run the existing 7 eval scenarios against the self-adapter:
+```bash
+pnpm --filter zosma-mem run eval
+```
+
+**Agent instructions:** The self-adapter is the bridge that proves the engine works. All 7 scenarios must pass. The deterministic clock must be injected into the salience engine's `now` parameter — do NOT use `Date.now()` in any engine code; always accept a clock/now parameter.
+
+---
+
+### Phase 10 — Integration + Cleanup
+
+1. Update `packages/zosma-mem/package.json`:
+   - Rename to `@openzosma/zosma-mem`
+   - Add dependencies: `yaml`, `unified`, `remark-parse`, `pino`, `p-limit`, `chokidar`
+   - Add bootstrap exports: `"./bootstrap"` export path
+   - Keep `"./evals"` export path
+
+2. Update `packages/agents/package.json`:
+   - Replace `"@openzosma/memory": "workspace:*"` with `"@openzosma/zosma-mem": "workspace:*"`
+
+3. Update `packages/agents/src/pi.agent.ts`:
+   - `import { bootstrapMemory } from "@openzosma/zosma-mem/bootstrap"`
+
+4. Update `packages/gateway/src/session-manager.ts` (if it references `@openzosma/memory`)
+
+5. Delete `packages/memory/`
+
+6. Run:
+   ```bash
+   pnpm install
+   pnpm run check        # zero errors
+   pnpm run build         # clean build
+   pnpm --filter @openzosma/zosma-mem run test   # all unit tests
+   pnpm --filter @openzosma/zosma-mem run eval   # all 7 scenarios pass
+   ```
+
+---
+
+## Dependency Map
+
+```
+packages/agents
+  └── @openzosma/zosma-mem (bootstrap + engine)
+
+packages/gateway
+  └── @openzosma/zosma-mem (engine — future: per-session memory)
+
+@openzosma/zosma-mem
+  ├── yaml          — .salience/*.yaml, state.yaml
+  ├── unified       — markdown AST parsing
+  ├── remark-parse  — commits.md parser
+  ├── zod           — schema validation (already present)
+  ├── pino          — structured logging
+  ├── p-limit       — concurrency control
+  ├── chokidar      — watch commits.md (optional, deferred)
+  └── pi-brain      — peer dep (reads .memory/)
+```
+
+---
+
+## Critical Constraints
+
+1. **Never mutate pi-brain files.** All scoring metadata lives in `.salience/` sidecar.
+2. **No `Date.now()` in engine code.** All time-sensitive logic accepts a `now` parameter or clock interface for deterministic testing.
+3. **No vector DB.** Tag-overlap proxy is the MVP retrieval mechanism. `computeAttentionScore` is a single function — swappable for embeddings later.
+4. **No LLM dependency.** `Summarizer` is a callback. If not provided, consolidation uses concatenation.
+5. **Arrow functions everywhere.** Per project coding standards.
+6. **No `any` types.** Strict TypeScript throughout.
+7. **pi-brain as peer dep.** Read `.memory/` files, never import pi-brain internals.
+8. **Existing eval scenarios must not break.** The adapter contract (`MemoryAdapter`) is frozen.
+
+---
+
+## Agent Execution Order
+
+For Claude Sonnet 4.6 executing this plan:
+
+```
+Phase 0  ──→  Phase 1  ──→  Phase 2  ──→  Phase 3
+                                              │
+Phase 4  ←────────────────────────────────────┘
+   │
+Phase 5  ──→  Phase 6  ──→  Phase 7  ──→  Phase 8
+                                              │
+Phase 9  ←────────────────────────────────────┘
+   │
+Phase 10
+```
+
+**Parallelizable pairs:**
+- Phase 1 + Phase 2 (no dependency)
+- Phase 5 + Phase 6 (both depend on store, independent of each other)
+
+**Serial gates:**
+- Phase 3 must complete before Phase 4 (ingestion needs store)
+- Phase 7 must complete before Phase 8 (GC needs engine)
+- Phase 9 must complete before Phase 10 (eval validates the engine)
+
+Each phase should end with `pnpm run check` passing. Each phase with tests should end with `pnpm --filter @openzosma/zosma-mem run test` passing.
+
+---
+
+## Success Criteria
+
+1. `packages/memory/` is deleted
+2. `@openzosma/zosma-mem` exports `bootstrapMemory`, `createMemoryEngine`, `runEvals`
+3. `pnpm run check` — zero errors across the monorepo
+4. `pnpm --filter @openzosma/zosma-mem run test` — all unit tests pass
+5. `pnpm --filter @openzosma/zosma-mem run eval` — all 7 scenarios pass against the self-adapter
+6. No `@openzosma/memory` references remain anywhere in the codebase

From b99dcea8e907ede63731adccb543297855192850 Mon Sep 17 00:00:00 2001
From: shanvit <shanvit7@gmail.com>
Date: Wed, 8 Apr 2026 16:29:13 +0530
Subject: [PATCH 03/12] feat(zosma-mem): add entity store, co-access graph, and
 ingestion pipeline (phases 3+4)

---
 packages/zosma-mem/package.json               |  10 +-
 packages/zosma-mem/src/brain-adapter/index.ts |   2 +
 .../zosma-mem/src/brain-adapter/parser.ts     |  51 +++++++++
 .../src/ingestion/__tests__/ingest.test.ts    | 103 ++++++++++++++++++
 .../zosma-mem/src/ingestion/commit-indexer.ts |  46 ++++++++
 packages/zosma-mem/src/ingestion/event-bus.ts |  25 +++++
 packages/zosma-mem/src/ingestion/index.ts     |   4 +
 packages/zosma-mem/src/ingestion/ingest.ts    |  32 ++++++
 .../src/store/__tests__/entity-store.test.ts  |  64 +++++++++++
 packages/zosma-mem/src/store/co-access.ts     |  26 +++++
 packages/zosma-mem/src/store/entity-store.ts  |  44 ++++++++
 packages/zosma-mem/src/store/index.ts         |   3 +
 pnpm-lock.yaml                                |  46 +++++---
 13 files changed, 437 insertions(+), 19 deletions(-)
 create mode 100644 packages/zosma-mem/src/brain-adapter/index.ts
 create mode 100644 packages/zosma-mem/src/brain-adapter/parser.ts
 create mode 100644 packages/zosma-mem/src/ingestion/__tests__/ingest.test.ts
 create mode 100644 packages/zosma-mem/src/ingestion/commit-indexer.ts
 create mode 100644 packages/zosma-mem/src/ingestion/event-bus.ts
 create mode 100644 packages/zosma-mem/src/ingestion/index.ts
 create mode 100644 packages/zosma-mem/src/ingestion/ingest.ts
 create mode 100644 packages/zosma-mem/src/store/__tests__/entity-store.test.ts
 create mode 100644 packages/zosma-mem/src/store/co-access.ts
 create mode 100644 packages/zosma-mem/src/store/entity-store.ts
 create mode 100644 packages/zosma-mem/src/store/index.ts

diff --git a/packages/zosma-mem/package.json b/packages/zosma-mem/package.json
index 001c003..de97181 100644
--- a/packages/zosma-mem/package.json
+++ b/packages/zosma-mem/package.json
@@ -5,7 +5,14 @@
 	"type": "module",
 	"description": "Standalone CLI for evaluating agentic memory systems - zero-config evaluation against standardized scenarios",
 	"license": "Apache-2.0",
-	"keywords": ["memory", "evaluation", "ai", "agentic", "cli", "openzosma"],
+	"keywords": [
+		"memory",
+		"evaluation",
+		"ai",
+		"agentic",
+		"cli",
+		"openzosma"
+	],
 	"repository": {
 		"type": "git",
 		"url": "https://github.com/your-org/openzosma",
@@ -40,6 +47,7 @@
 		"ink": "^5.1.0",
 		"ink-spinner": "^5.0.0",
 		"react": "^18.3.0",
+		"yaml": "^2.8.3",
 		"zod": "^3.23.0"
 	},
 	"devDependencies": {
diff --git a/packages/zosma-mem/src/brain-adapter/index.ts b/packages/zosma-mem/src/brain-adapter/index.ts
new file mode 100644
index 0000000..aec02e5
--- /dev/null
+++ b/packages/zosma-mem/src/brain-adapter/index.ts
@@ -0,0 +1,2 @@
+export { parseCommitsMarkdown } from "./parser.js"
+export type { CommitRecord } from "./parser.js"
diff --git a/packages/zosma-mem/src/brain-adapter/parser.ts b/packages/zosma-mem/src/brain-adapter/parser.ts
new file mode 100644
index 0000000..8df642b
--- /dev/null
+++ b/packages/zosma-mem/src/brain-adapter/parser.ts
@@ -0,0 +1,51 @@
+/**
+ * Parse commits.md into structured commit records.
+ *
+ * Expected format (one or more entries):
+ *
+ * ## <ref>
+ * <optional blank line>
+ * <body text>
+ * tags: tag1, tag2
+ */
+
+export interface CommitRecord {
+	ref: string
+	body: string
+	tags: string[]
+}
+
+/**
+ * Parse a commits.md markdown file into an array of CommitRecord objects.
+ */
+export const parseCommitsMarkdown = (markdown: string): CommitRecord[] => {
+	const commits: CommitRecord[] = []
+	const sections = markdown.split(/^## /m).filter((s) => s.trim().length > 0)
+
+	for (const section of sections) {
+		const lines = section.split("\n")
+		const ref = lines[0].trim()
+		if (!ref) continue
+
+		const bodyLines: string[] = []
+		let tags: string[] = []
+
+		for (let i = 1; i < lines.length; i++) {
+			const line = lines[i]
+			const tagMatch = /^tags:\s*(.+)$/i.exec(line)
+			if (tagMatch) {
+				tags = tagMatch[1]
+					.split(",")
+					.map((t) => t.trim())
+					.filter(Boolean)
+			} else {
+				bodyLines.push(line)
+			}
+		}
+
+		const body = bodyLines.join("\n").trim()
+		commits.push({ ref, body, tags })
+	}
+
+	return commits
+}
diff --git a/packages/zosma-mem/src/ingestion/__tests__/ingest.test.ts b/packages/zosma-mem/src/ingestion/__tests__/ingest.test.ts
new file mode 100644
index 0000000..7126756
--- /dev/null
+++ b/packages/zosma-mem/src/ingestion/__tests__/ingest.test.ts
@@ -0,0 +1,103 @@
+import { mkdtempSync, rmSync, writeFileSync } from "node:fs"
+import { tmpdir } from "node:os"
+import { join } from "node:path"
+import { afterEach, beforeEach, describe, expect, it } from "vitest"
+import { EntityStore } from "../../store/entity-store.js"
+import type { MemoryEvent } from "../../types.js"
+import { reindex } from "../commit-indexer.js"
+import { ingest } from "../ingest.js"
+
+const makeEvent = (overrides: Partial<MemoryEvent> = {}): MemoryEvent => ({
+	id: "test-entity",
+	type: "pattern",
+	content: "Some content",
+	tags: ["tag-a"],
+	timestamp: Date.now(),
+	...overrides,
+})
+
+let dir: string
+let store: EntityStore
+
+describe("ingest", () => {
+	beforeEach(() => {
+		dir = mkdtempSync(join(tmpdir(), "ingest-test-"))
+		store = new EntityStore(dir)
+		store.ensureDir()
+	})
+
+	afterEach(() => {
+		rmSync(dir, { recursive: true, force: true })
+	})
+
+	it("always persists regardless of event type", () => {
+		for (const type of ["pattern", "error", "preference", "decision"] as const) {
+			const event = makeEvent({ id: `ev-${type}`, type })
+			const result = ingest(event, store, {})
+			expect(result).toBe(true)
+			expect(store.read(`ev-${type}`)).toBeDefined()
+		}
+	})
+
+	it("upsert: second ingest with same id updates content", () => {
+		ingest(makeEvent({ id: "upsert-me", content: "original" }), store, {})
+		ingest(makeEvent({ id: "upsert-me", content: "updated" }), store, {})
+		const entity = store.read("upsert-me")
+		expect(entity?.content).toBe("updated")
+	})
+
+	it("preserves existing score on upsert", () => {
+		ingest(makeEvent({ id: "score-preserve" }), store, {})
+		const first = store.read("score-preserve")!
+		// Manually bump reuseCount
+		store.write({ ...first, score: { ...first.score, reuseCount: 5 } })
+		ingest(makeEvent({ id: "score-preserve", content: "new content" }), store, {})
+		const second = store.read("score-preserve")!
+		expect(second.score.reuseCount).toBe(5)
+	})
+})
+
+describe("reindex", () => {
+	beforeEach(() => {
+		dir = mkdtempSync(join(tmpdir(), "reindex-test-"))
+		store = new EntityStore(dir)
+		store.ensureDir()
+	})
+
+	afterEach(() => {
+		rmSync(dir, { recursive: true, force: true })
+	})
+
+	it("returns 0 when commits.md does not exist", () => {
+		expect(reindex(dir, store, {})).toBe(0)
+	})
+
+	it("ingests commits from commits.md", () => {
+		const md = "## abc123\nFixed the auth bug.\ntags: auth, fix\n"
+		writeFileSync(join(dir, "commits.md"), md, "utf-8")
+		const count = reindex(dir, store, {})
+		expect(count).toBe(1)
+		expect(store.read("main-abc123")).toBeDefined()
+	})
+
+	it("is idempotent: second call returns 0 for already-indexed commits", () => {
+		const md = "## abc123\nFixed the auth bug.\ntags: auth, fix\n"
+		writeFileSync(join(dir, "commits.md"), md, "utf-8")
+		reindex(dir, store, {})
+		const count = reindex(dir, store, {})
+		expect(count).toBe(0)
+	})
+
+	it("ingests only new commits on second call", () => {
+		writeFileSync(join(dir, "commits.md"), "## ref1\nFirst commit.\ntags: a\n", "utf-8")
+		reindex(dir, store, {})
+		writeFileSync(
+			join(dir, "commits.md"),
+			"## ref1\nFirst commit.\ntags: a\n\n## ref2\nSecond commit.\ntags: b\n",
+			"utf-8",
+		)
+		const count = reindex(dir, store, {})
+		expect(count).toBe(1)
+		expect(store.read("main-ref2")).toBeDefined()
+	})
+})
diff --git a/packages/zosma-mem/src/ingestion/commit-indexer.ts b/packages/zosma-mem/src/ingestion/commit-indexer.ts
new file mode 100644
index 0000000..79d8eb1
--- /dev/null
+++ b/packages/zosma-mem/src/ingestion/commit-indexer.ts
@@ -0,0 +1,46 @@
+import { existsSync, readFileSync, writeFileSync } from "node:fs"
+import { join } from "node:path"
+import { parseCommitsMarkdown } from "../brain-adapter/parser.js"
+import type { EntityStore } from "../store/entity-store.js"
+import type { MemoryConfig } from "../types.js"
+import { ingest } from "./ingest.js"
+
+const INDEXED_FILE = ".indexed"
+
+/**
+ * Parse commits.md and ingest new entities. Idempotent.
+ * Returns number of new entities ingested.
+ */
+export const reindex = (
+	memoryDir: string,
+	store: EntityStore,
+	config: Pick<MemoryConfig, "salienceThreshold" | "now">,
+): number => {
+	const commitsPath = join(memoryDir, "commits.md")
+	if (!existsSync(commitsPath)) return 0
+
+	const indexedPath = join(memoryDir, ".salience", INDEXED_FILE)
+	const indexed: string[] = existsSync(indexedPath) ? (JSON.parse(readFileSync(indexedPath, "utf-8")) as string[]) : []
+
+	const markdown = readFileSync(commitsPath, "utf-8")
+	const commits = parseCommitsMarkdown(markdown)
+	const newRefs = commits.filter((c) => !indexed.includes(c.ref))
+
+	let count = 0
+	for (const commit of newRefs) {
+		const event = {
+			id: `main-${commit.ref}`,
+			type: "pattern" as const,
+			content: commit.body,
+			tags: commit.tags,
+			metadata: { branch: "main", commitRef: commit.ref },
+			timestamp: config.now ? config.now() : Date.now(),
+		}
+		ingest(event, store, config)
+		indexed.push(commit.ref)
+		count++
+	}
+
+	writeFileSync(indexedPath, JSON.stringify(indexed), "utf-8")
+	return count
+}
diff --git a/packages/zosma-mem/src/ingestion/event-bus.ts b/packages/zosma-mem/src/ingestion/event-bus.ts
new file mode 100644
index 0000000..8c4f580
--- /dev/null
+++ b/packages/zosma-mem/src/ingestion/event-bus.ts
@@ -0,0 +1,25 @@
+import { EventEmitter } from "node:events"
+import type { MemoryEvent } from "../types.js"
+
+export type MemoryEventName = "ingested" | "discarded" | "scored"
+
+export interface EventBus {
+	on: (event: MemoryEventName, listener: (e: MemoryEvent) => void) => void
+	off: (event: MemoryEventName, listener: (e: MemoryEvent) => void) => void
+	emit: (event: MemoryEventName, e: MemoryEvent) => void
+}
+
+export const createEventBus = (): EventBus => {
+	const emitter = new EventEmitter()
+	return {
+		on: (event, listener) => {
+			emitter.on(event, listener)
+		},
+		off: (event, listener) => {
+			emitter.off(event, listener)
+		},
+		emit: (event, e) => {
+			emitter.emit(event, e)
+		},
+	}
+}
diff --git a/packages/zosma-mem/src/ingestion/index.ts b/packages/zosma-mem/src/ingestion/index.ts
new file mode 100644
index 0000000..345249b
--- /dev/null
+++ b/packages/zosma-mem/src/ingestion/index.ts
@@ -0,0 +1,4 @@
+export { createEventBus } from "./event-bus.js"
+export { ingest } from "./ingest.js"
+export { reindex } from "./commit-indexer.js"
+export type { EventBus, MemoryEventName } from "./event-bus.js"
diff --git a/packages/zosma-mem/src/ingestion/ingest.ts b/packages/zosma-mem/src/ingestion/ingest.ts
new file mode 100644
index 0000000..4b32d71
--- /dev/null
+++ b/packages/zosma-mem/src/ingestion/ingest.ts
@@ -0,0 +1,32 @@
+import { initialScore } from "../engine/salience.js"
+import type { EntityStore } from "../store/entity-store.js"
+import type { MemoryConfig, MemoryEntity, MemoryEvent } from "../types.js"
+
+/**
+ * Ingest a MemoryEvent. Always persists (upsert). The threshold is enforced
+ * during GC pruning, not at ingestion time — every event type is stored.
+ * Returns true always (kept for interface compatibility).
+ */
+export const ingest = (
+	event: MemoryEvent,
+	store: EntityStore,
+	config: Pick<MemoryConfig, "salienceThreshold" | "now">,
+): boolean => {
+	const nowFn = config.now ?? Date.now
+	const existing = store.read(event.id)
+	const score = existing?.score ?? initialScore(event.type, nowFn)
+
+	const entity: MemoryEntity = {
+		id: event.id,
+		source: {
+			branch: event.metadata?.branch ?? "main",
+			commitRef: event.metadata?.commitRef ?? "0",
+		},
+		score,
+		tags: event.tags,
+		content: event.content,
+	}
+
+	store.write(entity)
+	return true
+}
diff --git a/packages/zosma-mem/src/store/__tests__/entity-store.test.ts b/packages/zosma-mem/src/store/__tests__/entity-store.test.ts
new file mode 100644
index 0000000..aa1cecf
--- /dev/null
+++ b/packages/zosma-mem/src/store/__tests__/entity-store.test.ts
@@ -0,0 +1,64 @@
+import { mkdtempSync, rmSync } from "node:fs"
+import { tmpdir } from "node:os"
+import { join } from "node:path"
+import { afterEach, beforeEach, describe, expect, it } from "vitest"
+import type { MemoryEntity } from "../../types.js"
+import { EntityStore } from "../entity-store.js"
+
+const makeEntity = (id: string): MemoryEntity => ({
+	id,
+	content: `Content for ${id}`,
+	tags: ["tag-a", "tag-b"],
+	source: { branch: "main", commitRef: "42" },
+	score: {
+		reuseCount: 3,
+		decisionInfluence: 1,
+		ignoredReads: 0,
+		lastAccessed: 1743897600000,
+		attentionWeight: 0.8,
+		belowThresholdCycles: 0,
+	},
+})
+
+let dir: string
+let store: EntityStore
+
+describe("EntityStore", () => {
+	beforeEach(() => {
+		dir = mkdtempSync(join(tmpdir(), "entity-store-test-"))
+		store = new EntityStore(dir)
+		store.ensureDir()
+	})
+
+	afterEach(() => {
+		rmSync(dir, { recursive: true, force: true })
+	})
+
+	it("write and read back an entity with all fields preserved", () => {
+		const entity = makeEntity("auth-flow")
+		store.write(entity)
+		const result = store.read("auth-flow")
+		expect(result).toBeDefined()
+		expect(result?.id).toBe("auth-flow")
+		expect(result?.content).toBe(entity.content)
+		expect(result?.tags).toEqual(entity.tags)
+		expect(result?.source).toEqual(entity.source)
+		expect(result?.score).toEqual(entity.score)
+	})
+
+	it("list returns written entity id", () => {
+		store.write(makeEntity("my-entity"))
+		expect(store.list()).toContain("my-entity")
+	})
+
+	it("archive moves entity out of list", () => {
+		store.write(makeEntity("to-archive"))
+		expect(store.list()).toContain("to-archive")
+		store.archive("to-archive")
+		expect(store.list()).not.toContain("to-archive")
+	})
+
+	it("read of missing entity returns undefined", () => {
+		expect(store.read("nonexistent")).toBeUndefined()
+	})
+})
diff --git a/packages/zosma-mem/src/store/co-access.ts b/packages/zosma-mem/src/store/co-access.ts
new file mode 100644
index 0000000..8878bc5
--- /dev/null
+++ b/packages/zosma-mem/src/store/co-access.ts
@@ -0,0 +1,26 @@
+import { existsSync, readFileSync, writeFileSync } from "node:fs"
+import { join } from "node:path"
+
+export type CoAccessGraph = Record<string, string[]>
+
+export const loadCoAccess = (memoryDir: string): CoAccessGraph => {
+	const p = join(memoryDir, "co-access.json")
+	if (!existsSync(p)) return {}
+	return JSON.parse(readFileSync(p, "utf-8")) as CoAccessGraph
+}
+
+export const saveCoAccess = (memoryDir: string, graph: CoAccessGraph): void => {
+	writeFileSync(join(memoryDir, "co-access.json"), JSON.stringify(graph, null, 2), "utf-8")
+}
+
+export const recordCoAccess = (graph: CoAccessGraph, entityIds: string[]): CoAccessGraph => {
+	const updated = { ...graph }
+	for (const a of entityIds) {
+		for (const b of entityIds) {
+			if (a === b) continue
+			if (!updated[a]) updated[a] = []
+			if (!updated[a].includes(b)) updated[a].push(b)
+		}
+	}
+	return updated
+}
diff --git a/packages/zosma-mem/src/store/entity-store.ts b/packages/zosma-mem/src/store/entity-store.ts
new file mode 100644
index 0000000..9f67203
--- /dev/null
+++ b/packages/zosma-mem/src/store/entity-store.ts
@@ -0,0 +1,44 @@
+import { existsSync, mkdirSync, readFileSync, readdirSync, renameSync, writeFileSync } from "node:fs"
+import { join } from "node:path"
+import { parse as parseYaml, stringify as stringifyYaml } from "yaml"
+import type { MemoryEntity } from "../types.js"
+
+export class EntityStore {
+	private readonly salienceDir: string
+	private readonly archiveDir: string
+
+	constructor(memoryDir: string) {
+		this.salienceDir = join(memoryDir, ".salience")
+		this.archiveDir = join(memoryDir, ".salience", "archive")
+	}
+
+	ensureDir = (): void => {
+		mkdirSync(this.salienceDir, { recursive: true })
+		mkdirSync(this.archiveDir, { recursive: true })
+	}
+
+	read = (entityId: string): MemoryEntity | undefined => {
+		const p = this.idToPath(entityId)
+		if (!existsSync(p)) return undefined
+		return parseYaml(readFileSync(p, "utf-8")) as MemoryEntity
+	}
+
+	write = (entity: MemoryEntity): void => {
+		writeFileSync(this.idToPath(entity.id), stringifyYaml(entity), "utf-8")
+	}
+
+	list = (): string[] => {
+		if (!existsSync(this.salienceDir)) return []
+		return readdirSync(this.salienceDir)
+			.filter((f) => f.endsWith(".yaml"))
+			.map((f) => f.slice(0, -5))
+	}
+
+	archive = (entityId: string): void => {
+		const src = this.idToPath(entityId)
+		const dst = join(this.archiveDir, `${entityId}.yaml`)
+		if (existsSync(src)) renameSync(src, dst)
+	}
+
+	private idToPath = (entityId: string): string => join(this.salienceDir, `${entityId}.yaml`)
+}
diff --git a/packages/zosma-mem/src/store/index.ts b/packages/zosma-mem/src/store/index.ts
new file mode 100644
index 0000000..fc8a3ae
--- /dev/null
+++ b/packages/zosma-mem/src/store/index.ts
@@ -0,0 +1,3 @@
+export { EntityStore } from "./entity-store.js"
+export { loadCoAccess, saveCoAccess, recordCoAccess } from "./co-access.js"
+export type { CoAccessGraph } from "./co-access.js"
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index 8608135..f409220 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -181,7 +181,7 @@ importers:
         version: 1.0.0
       better-auth:
         specifier: ^1.4.1
-        version: 1.5.5(mongodb@7.1.0(socks@2.8.7))(mysql2@3.20.0(@types/node@22.19.15))(next@16.2.0(@opentelemetry/api@1.9.0)(babel-plugin-react-compiler@1.0.0)(react-dom@19.2.4(react@19.2.4))(react@19.2.4))(pg@8.20.0)(react-dom@19.2.4(react@19.2.4))(react@19.2.4)(vitest@3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2))
+        version: 1.5.5(mongodb@7.1.0(socks@2.8.7))(mysql2@3.20.0(@types/node@22.19.15))(next@16.2.0(@opentelemetry/api@1.9.0)(babel-plugin-react-compiler@1.0.0)(react-dom@19.2.4(react@19.2.4))(react@19.2.4))(pg@8.20.0)(react-dom@19.2.4(react@19.2.4))(react@19.2.4)(vitest@3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3))
       class-variance-authority:
         specifier: ^0.7.1
         version: 0.7.1
@@ -408,7 +408,7 @@ importers:
         version: link:../db
       better-auth:
         specifier: ^1.2.7
-        version: 1.5.5(mongodb@7.1.0(socks@2.8.7))(mysql2@3.20.0(@types/node@22.19.15))(next@16.2.0(@opentelemetry/api@1.9.0)(babel-plugin-react-compiler@1.0.0)(react-dom@19.2.4(react@19.2.4))(react@19.2.4))(pg@8.20.0)(react-dom@19.2.4(react@19.2.4))(react@19.2.4)(vitest@3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2))
+        version: 1.5.5(mongodb@7.1.0(socks@2.8.7))(mysql2@3.20.0(@types/node@22.19.15))(next@16.2.0(@opentelemetry/api@1.9.0)(babel-plugin-react-compiler@1.0.0)(react-dom@19.2.4(react@19.2.4))(react@19.2.4))(pg@8.20.0)(react-dom@19.2.4(react@19.2.4))(react@19.2.4)(vitest@3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3))
       kysely:
         specifier: ^0.28.14
         version: 0.28.14
@@ -529,7 +529,7 @@ importers:
         version: 5.9.3
       vitest:
         specifier: ^3.2.4
-        version: 3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2)
+        version: 3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3)
 
   packages/grpc:
     dependencies:
@@ -603,7 +603,7 @@ importers:
         version: 5.9.3
       vitest:
         specifier: ^3.0.0
-        version: 3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2)
+        version: 3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3)
       zosma-mem:
         specifier: link:../zosma-mem
         version: link:../zosma-mem
@@ -718,7 +718,7 @@ importers:
         version: 5.9.3
       vitest:
         specifier: ^3.1.1
-        version: 3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2)
+        version: 3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3)
 
   packages/zosma-mem:
     dependencies:
@@ -737,6 +737,9 @@ importers:
       react:
         specifier: ^18.3.0
         version: 18.3.1
+      yaml:
+        specifier: ^2.8.3
+        version: 2.8.3
       zod:
         specifier: ^3.23.0
         version: 3.25.76
@@ -755,7 +758,7 @@ importers:
         version: 5.9.3
       vitest:
         specifier: ^3.0.0
-        version: 3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2)
+        version: 3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3)
 
 packages:
 
@@ -7168,6 +7171,11 @@ packages:
     engines: {node: '>= 14.6'}
     hasBin: true
 
+  yaml@2.8.3:
+    resolution: {integrity: sha512-AvbaCLOO2Otw/lW5bmh9d/WEdcDFdQp2Z2ZUH3pX9U2ihyUY0nvLv7J6TrWowklRGPYbB/IuIMfYgxaCPg5Bpg==}
+    engines: {node: '>= 14.6'}
+    hasBin: true
+
   yargs-parser@18.1.3:
     resolution: {integrity: sha512-o50j0JeToy/4K6OZcaQmW6lyXXKhq7csREXcDwk2omFPJEwUNOVtJKvmDr9EI1fAJZUyZcRF7kxGBWmRXudrCQ==}
     engines: {node: '>=6'}
@@ -10406,13 +10414,13 @@ snapshots:
       chai: 5.3.3
       tinyrainbow: 2.0.0
 
-  '@vitest/mocker@3.2.4(vite@7.3.1(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2))':
+  '@vitest/mocker@3.2.4(vite@7.3.1(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3))':
     dependencies:
       '@vitest/spy': 3.2.4
       estree-walker: 3.0.3
       magic-string: 0.30.21
     optionalDependencies:
-      vite: 7.3.1(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2)
+      vite: 7.3.1(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3)
 
   '@vitest/pretty-format@3.2.4':
     dependencies:
@@ -10632,7 +10640,7 @@ snapshots:
     dependencies:
       tweetnacl: 0.14.5
 
-  better-auth@1.5.5(mongodb@7.1.0(socks@2.8.7))(mysql2@3.20.0(@types/node@22.19.15))(next@16.2.0(@opentelemetry/api@1.9.0)(babel-plugin-react-compiler@1.0.0)(react-dom@19.2.4(react@19.2.4))(react@19.2.4))(pg@8.20.0)(react-dom@19.2.4(react@19.2.4))(react@19.2.4)(vitest@3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2)):
+  better-auth@1.5.5(mongodb@7.1.0(socks@2.8.7))(mysql2@3.20.0(@types/node@22.19.15))(next@16.2.0(@opentelemetry/api@1.9.0)(babel-plugin-react-compiler@1.0.0)(react-dom@19.2.4(react@19.2.4))(react@19.2.4))(pg@8.20.0)(react-dom@19.2.4(react@19.2.4))(react@19.2.4)(vitest@3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3)):
     dependencies:
       '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0)
       '@better-auth/drizzle-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)
@@ -10658,7 +10666,7 @@ snapshots:
       pg: 8.20.0
       react: 19.2.4
       react-dom: 19.2.4(react@19.2.4)
-      vitest: 3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2)
+      vitest: 3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3)
     transitivePeerDependencies:
       - '@cloudflare/workers-types'
 
@@ -14374,13 +14382,13 @@ snapshots:
       string_decoder: 1.3.0
       util-deprecate: 1.0.2
 
-  vite-node@3.2.4(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2):
+  vite-node@3.2.4(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3):
     dependencies:
       cac: 6.7.14
       debug: 4.4.3
       es-module-lexer: 1.7.0
       pathe: 2.0.3
-      vite: 7.3.1(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2)
+      vite: 7.3.1(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3)
     transitivePeerDependencies:
       - '@types/node'
       - jiti
@@ -14395,7 +14403,7 @@ snapshots:
       - tsx
       - yaml
 
-  vite@7.3.1(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2):
+  vite@7.3.1(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3):
     dependencies:
       esbuild: 0.27.4
       fdir: 6.5.0(picomatch@4.0.3)
@@ -14409,13 +14417,13 @@ snapshots:
       jiti: 2.6.1
       lightningcss: 1.32.0
       tsx: 4.21.0
-      yaml: 2.8.2
+      yaml: 2.8.3
 
-  vitest@3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2):
+  vitest@3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3):
     dependencies:
       '@types/chai': 5.2.3
       '@vitest/expect': 3.2.4
-      '@vitest/mocker': 3.2.4(vite@7.3.1(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2))
+      '@vitest/mocker': 3.2.4(vite@7.3.1(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3))
       '@vitest/pretty-format': 3.2.4
       '@vitest/runner': 3.2.4
       '@vitest/snapshot': 3.2.4
@@ -14433,8 +14441,8 @@ snapshots:
       tinyglobby: 0.2.15
       tinypool: 1.1.1
       tinyrainbow: 2.0.0
-      vite: 7.3.1(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2)
-      vite-node: 3.2.4(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.2)
+      vite: 7.3.1(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3)
+      vite-node: 3.2.4(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3)
       why-is-node-running: 2.3.0
     optionalDependencies:
       '@types/debug': 4.1.12
@@ -14554,6 +14562,8 @@ snapshots:
 
   yaml@2.8.2: {}
 
+  yaml@2.8.3: {}
+
   yargs-parser@18.1.3:
     dependencies:
       camelcase: 5.3.1

From 88236c84cb660fc809ece0461e78e4cd2ae9b41f Mon Sep 17 00:00:00 2001
From: shanvit <shanvit7@gmail.com>
Date: Thu, 9 Apr 2026 13:36:06 +0530
Subject: [PATCH 04/12] chore: memory package all setup

---
 docs/MEMORY-INTEGRATION.md                    | 1129 ++++-------------
 infra/openshell/Dockerfile                    |    2 +-
 packages/agents/package.json                  |   16 +-
 packages/agents/src/pi.agent.ts               |  142 ++-
 packages/agents/src/pi/memory.ts              |   91 ++
 packages/memory/package.json                  |   25 -
 packages/memory/src/bootstrap.test.ts         |   68 -
 packages/memory/src/bootstrap.ts              |   17 -
 packages/memory/src/config.ts                 |   24 -
 packages/memory/src/index.ts                  |    3 -
 packages/memory/src/types.ts                  |   17 -
 packages/memory/tsconfig.json                 |    8 -
 packages/zosma-mem/IMPLEMENTATION_PLAN.md     |  407 ------
 packages/zosma-mem/README.md                  |  224 ++--
 packages/zosma-mem/USAGE.md                   |  187 ---
 packages/zosma-mem/package.json               |   18 +-
 packages/zosma-mem/src/brain-adapter/index.ts |    2 -
 .../zosma-mem/src/brain-adapter/parser.ts     |   51 -
 .../src/bridge/__tests__/bridge.test.ts       |  211 +++
 packages/zosma-mem/src/bridge/extensions.ts   |   60 +
 packages/zosma-mem/src/bridge/index.ts        |  172 +++
 .../src/engine/__tests__/factory.test.ts      |   48 +
 .../engine/__tests__/reinforcement.test.ts    |   71 ++
 packages/zosma-mem/src/engine/factory.ts      |   74 ++
 packages/zosma-mem/src/engine/index.ts        |    3 +
 .../zosma-mem/src/engine/reinforcement.ts     |   41 +
 packages/zosma-mem/src/engine/salience.ts     |   23 +
 .../src/evals/__tests__/metrics.test.ts       |  127 --
 .../src/evals/__tests__/mock-adapter.ts       |  102 --
 .../src/evals/__tests__/report.test.ts        |   78 --
 .../src/evals/__tests__/runner.test.ts        |   96 --
 .../src/evals/__tests__/scenarios.test.ts     |  121 --
 packages/zosma-mem/src/evals/cli/bin.ts       |  133 --
 .../src/evals/cli/components/App.tsx          |   98 --
 .../src/evals/cli/components/ErrorDisplay.tsx |   15 -
 .../src/evals/cli/components/ScenarioRow.tsx  |   51 -
 .../src/evals/cli/components/SummaryTable.tsx |   32 -
 .../zosma-mem/src/evals/cli/simple-eval.ts    |  201 ---
 packages/zosma-mem/src/evals/index.ts         |   56 -
 packages/zosma-mem/src/evals/metrics.ts       |  121 --
 packages/zosma-mem/src/evals/report.ts        |   70 -
 packages/zosma-mem/src/evals/runner.ts        |  128 --
 .../src/evals/scenarios/co-access-cluster.ts  |   70 -
 .../src/evals/scenarios/cold-start.ts         |   59 -
 .../evals/scenarios/conflicting-updates.ts    |   83 --
 .../src/evals/scenarios/cross-context.ts      |   98 --
 .../zosma-mem/src/evals/scenarios/index.ts    |   35 -
 .../src/evals/scenarios/repeated-pattern.ts   |   70 -
 .../src/evals/scenarios/signal-dilution.ts    |   64 -
 .../src/evals/scenarios/stale-memory.ts       |   89 --
 packages/zosma-mem/src/evals/types.ts         |  270 ----
 .../zosma-mem/src/evals/utils/assertions.ts   |   54 -
 .../zosma-mem/src/evals/utils/fixtures.ts     |   67 -
 packages/zosma-mem/src/evals/utils/time.ts    |   32 -
 .../zosma-mem/src/gc/__tests__/gc.test.ts     |   96 ++
 packages/zosma-mem/src/gc/consolidate.ts      |   12 +
 packages/zosma-mem/src/gc/decay.ts            |   16 +
 packages/zosma-mem/src/gc/index.ts            |   22 +
 packages/zosma-mem/src/gc/prune.ts            |   27 +
 packages/zosma-mem/src/index.ts               |    6 +-
 .../src/ingestion/__tests__/ingest.test.ts    |   49 +-
 .../zosma-mem/src/ingestion/commit-indexer.ts |   46 -
 packages/zosma-mem/src/ingestion/event-bus.ts |   25 -
 packages/zosma-mem/src/ingestion/index.ts     |    3 -
 packages/zosma-mem/src/ingestion/ingest.ts    |   14 +-
 .../src/retrieval/__tests__/retrieve.test.ts  |   87 ++
 packages/zosma-mem/src/retrieval/index.ts     |    1 +
 packages/zosma-mem/src/retrieval/retrieve.ts  |   87 ++
 packages/zosma-mem/src/types.ts               |   75 ++
 pnpm-lock.yaml                                |  344 ++++-
 70 files changed, 2073 insertions(+), 4391 deletions(-)
 create mode 100644 packages/agents/src/pi/memory.ts
 delete mode 100644 packages/memory/package.json
 delete mode 100644 packages/memory/src/bootstrap.test.ts
 delete mode 100644 packages/memory/src/bootstrap.ts
 delete mode 100644 packages/memory/src/config.ts
 delete mode 100644 packages/memory/src/index.ts
 delete mode 100644 packages/memory/src/types.ts
 delete mode 100644 packages/memory/tsconfig.json
 delete mode 100644 packages/zosma-mem/IMPLEMENTATION_PLAN.md
 delete mode 100644 packages/zosma-mem/USAGE.md
 delete mode 100644 packages/zosma-mem/src/brain-adapter/index.ts
 delete mode 100644 packages/zosma-mem/src/brain-adapter/parser.ts
 create mode 100644 packages/zosma-mem/src/bridge/__tests__/bridge.test.ts
 create mode 100644 packages/zosma-mem/src/bridge/extensions.ts
 create mode 100644 packages/zosma-mem/src/bridge/index.ts
 create mode 100644 packages/zosma-mem/src/engine/__tests__/factory.test.ts
 create mode 100644 packages/zosma-mem/src/engine/__tests__/reinforcement.test.ts
 create mode 100644 packages/zosma-mem/src/engine/factory.ts
 create mode 100644 packages/zosma-mem/src/engine/index.ts
 create mode 100644 packages/zosma-mem/src/engine/reinforcement.ts
 create mode 100644 packages/zosma-mem/src/engine/salience.ts
 delete mode 100644 packages/zosma-mem/src/evals/__tests__/metrics.test.ts
 delete mode 100644 packages/zosma-mem/src/evals/__tests__/mock-adapter.ts
 delete mode 100644 packages/zosma-mem/src/evals/__tests__/report.test.ts
 delete mode 100644 packages/zosma-mem/src/evals/__tests__/runner.test.ts
 delete mode 100644 packages/zosma-mem/src/evals/__tests__/scenarios.test.ts
 delete mode 100644 packages/zosma-mem/src/evals/cli/bin.ts
 delete mode 100644 packages/zosma-mem/src/evals/cli/components/App.tsx
 delete mode 100644 packages/zosma-mem/src/evals/cli/components/ErrorDisplay.tsx
 delete mode 100644 packages/zosma-mem/src/evals/cli/components/ScenarioRow.tsx
 delete mode 100644 packages/zosma-mem/src/evals/cli/components/SummaryTable.tsx
 delete mode 100644 packages/zosma-mem/src/evals/cli/simple-eval.ts
 delete mode 100644 packages/zosma-mem/src/evals/index.ts
 delete mode 100644 packages/zosma-mem/src/evals/metrics.ts
 delete mode 100644 packages/zosma-mem/src/evals/report.ts
 delete mode 100644 packages/zosma-mem/src/evals/runner.ts
 delete mode 100644 packages/zosma-mem/src/evals/scenarios/co-access-cluster.ts
 delete mode 100644 packages/zosma-mem/src/evals/scenarios/cold-start.ts
 delete mode 100644 packages/zosma-mem/src/evals/scenarios/conflicting-updates.ts
 delete mode 100644 packages/zosma-mem/src/evals/scenarios/cross-context.ts
 delete mode 100644 packages/zosma-mem/src/evals/scenarios/index.ts
 delete mode 100644 packages/zosma-mem/src/evals/scenarios/repeated-pattern.ts
 delete mode 100644 packages/zosma-mem/src/evals/scenarios/signal-dilution.ts
 delete mode 100644 packages/zosma-mem/src/evals/scenarios/stale-memory.ts
 delete mode 100644 packages/zosma-mem/src/evals/types.ts
 delete mode 100644 packages/zosma-mem/src/evals/utils/assertions.ts
 delete mode 100644 packages/zosma-mem/src/evals/utils/fixtures.ts
 delete mode 100644 packages/zosma-mem/src/evals/utils/time.ts
 create mode 100644 packages/zosma-mem/src/gc/__tests__/gc.test.ts
 create mode 100644 packages/zosma-mem/src/gc/consolidate.ts
 create mode 100644 packages/zosma-mem/src/gc/decay.ts
 create mode 100644 packages/zosma-mem/src/gc/index.ts
 create mode 100644 packages/zosma-mem/src/gc/prune.ts
 delete mode 100644 packages/zosma-mem/src/ingestion/commit-indexer.ts
 delete mode 100644 packages/zosma-mem/src/ingestion/event-bus.ts
 create mode 100644 packages/zosma-mem/src/retrieval/__tests__/retrieve.test.ts
 create mode 100644 packages/zosma-mem/src/retrieval/index.ts
 create mode 100644 packages/zosma-mem/src/retrieval/retrieve.ts
 create mode 100644 packages/zosma-mem/src/types.ts

diff --git a/docs/MEMORY-INTEGRATION.md b/docs/MEMORY-INTEGRATION.md
index 75c755f..901f1f8 100644
--- a/docs/MEMORY-INTEGRATION.md
+++ b/docs/MEMORY-INTEGRATION.md
@@ -1,1002 +1,355 @@
-# OpenZosma Agent Memory System
+# Memory Integration
 
-Technical reference for how agent memory works in OpenZosma. Covers every layer from the
-Kubernetes pod filesystem through the pi extension hooks to the LLM context window.
+Technical plan to wire `@openzosma/zosma-mem` into the agent session lifecycle so
+memories persist and are recalled across conversations.
 
-Last updated: 2026-03-24
+Last updated: 2026-04-09
 
 ---
 
-## Table of Contents
-
-1. [Architecture Overview](#1-architecture-overview)
-2. [Package Map](#2-package-map)
-3. [Memory Classification](#3-memory-classification)
-4. [Filesystem Layout](#4-filesystem-layout)
-5. [Bootstrap Sequence](#5-bootstrap-sequence)
-6. [Pi Extension: pi-memory](#6-pi-extension-pi-memory)
-7. [Pi Extension: pi-extension-observational-memory](#7-pi-extension-pi-extension-observational-memory)
-8. [Orchestration Package: @openzosma/memory](#8-orchestration-package-openzosmamemory)
-9. [Agent Integration: @openzosma/agents](#9-agent-integration-openzosmaagents)
-10. [K3s Pod Lifecycle and Persistence](#10-k3s-pod-lifecycle-and-persistence)
-11. [Context Window Flow](#11-context-window-flow)
-12. [Tools Available to the Agent](#12-tools-available-to-the-agent)
-13. [Search and Retrieval (qmd)](#13-search-and-retrieval-qmd)
-14. [Compaction and Observation](#14-compaction-and-observation)
-15. [Configuration Reference](#15-configuration-reference)
-16. [Failure Modes and Degraded Operation](#16-failure-modes-and-degraded-operation)
-17. [What This System Does Not Do](#17-what-this-system-does-not-do)
+## Problem
 
----
-
-## 1. Architecture Overview
-
-The memory system is **filesystem-native**. All memory state lives inside the agent's sandbox
-pod as plain markdown and JSON files. There are no database tables, no Valkey keys, and no
-external services involved in memory storage or retrieval.
-
-Three packages collaborate:
-
-```
-┌─────────────────────────────────────────────────────────────────┐
-│                     Agent Pod (K3s)                              │
-│                                                                  │
-│  ┌─────────────────────────────────────────────────────────┐    │
-│  │  pi-coding-agent session                                 │    │
-│  │                                                          │    │
-│  │  ┌──────────────┐   ┌──────────────────────────────┐    │    │
-│  │  │  pi-memory    │   │  pi-extension-observational- │    │    │
-│  │  │  (extension)  │   │  memory (extension)          │    │    │
-│  │  │              │   │                               │    │    │
-│  │  │  Storage     │   │  Compaction                   │    │    │
-│  │  │  Retrieval   │   │  Observer/Reflector           │    │    │
-│  │  │  Injection   │   │  Auto-GC                      │    │    │
-│  │  │  Tools       │   │  Priority tagging             │    │    │
-│  │  └──────┬───────┘   └──────────────┬───────────────┘    │    │
-│  │         │                           │                    │    │
-│  │         └─────────┬─────────────────┘                    │    │
-│  │                   │                                      │    │
-│  │         ┌─────────▼─────────┐                            │    │
-│  │         │  Filesystem (PV)  │                            │    │
-│  │         │  .pi/agent/memory │                            │    │
-│  │         └───────────────────┘                            │    │
-│  └─────────────────────────────────────────────────────────┘    │
-│                                                                  │
-│  ┌─────────────────────────────────────────────────────────┐    │
-│  │  @openzosma/memory (bootstrap, config, env)              │    │
-│  │  @openzosma/agents (wires everything together)           │    │
-│  └─────────────────────────────────────────────────────────┘    │
-└─────────────────────────────────────────────────────────────────┘
-```
-
-**Key principle:** It orchestrates two
-proven pi extensions and configures them for the pod environment. The extensions register
-their own tools, hooks, and context injection. The orchestration layer only resolves paths
-and sets environment variables.
-
----
-
-## 2. Package Map
-
-| Package | Type | Role | Owns |
-|---|---|---|---|
-| `pi-memory` | pi extension (npm) | Storage, retrieval, injection, tools | MEMORY.md, daily logs, scratchpad, qmd integration |
-| `pi-extension-observational-memory` | pi extension (npm) | Compaction strategy, observer/reflector | Observation summaries, auto-GC, priority tagging |
-| `@openzosma/memory` | workspace package | Bootstrap + config | Environment variables, extension path resolution |
-| `@openzosma/agents` | workspace package | Agent session lifecycle | Wires memory extensions into pi session |
-
-### Dependency chain
-
-```
-@openzosma/agents
-  └── @openzosma/memory
-        ├── pi-memory
-        │     ├── @mariozechner/pi-ai
-        │     └── @mariozechner/pi-coding-agent
-        └── pi-extension-observational-memory
-              ├── @mariozechner/pi-ai
-              └── @mariozechner/pi-coding-agent
-```
-
----
-
-## 3. Memory Classification
-
-The system implements four categories of memory, each managed by different components:
-
-### Long-term memory (MEMORY.md)
-
-**Owner:** pi-memory
-**File:** `.pi/agent/memory/MEMORY.md`
-**Lifecycle:** Persists across sessions via PV. Never automatically pruned.
-**Purpose:** Durable facts, decisions, preferences, and constraints.
-
-```markdown
-<!-- 2026-03-23 14:30:00 [a1b2c3d4] -->
-#decision [[database-choice]] Chose PostgreSQL for all backend services. No ORM.
-
-<!-- 2026-03-23 15:00:00 [a1b2c3d4] -->
-#preference [[editor]] User prefers Neovim with LazyVim config.
-```
-
-Written explicitly by the agent via the `memory_write` tool when it identifies something
-worth remembering. Uses `#tags` and `[[wikilinks]]` for retrieval.
-
-### Episodic memory (daily logs)
-
-**Owner:** pi-memory
-**File:** `.pi/agent/memory/daily/YYYY-MM-DD.md`
-**Lifecycle:** One file per calendar day. Persists across sessions. Never pruned.
-**Purpose:** Running narrative of what happened during work. Captures context flow.
-
-Written to in three ways:
-1. Agent calls `memory_write` with `target: "daily"` during execution
-2. **Session handoff** — pi-memory auto-captures open scratchpad items + recent daily log
-   context to the daily file before each compaction (`session_before_compact` hook)
-3. **Exit summary** — pi-memory generates an LLM summary of the session and appends it
-   to the daily file on `session_shutdown`
-
-Today's and yesterday's daily logs are loaded into context at every turn.
-
-### Working memory (scratchpad)
-
-**Owner:** pi-memory
-**File:** `.pi/agent/memory/SCRATCHPAD.md`
-**Lifecycle:** Persists across sessions. Items are manually checked off or cleared.
-**Purpose:** Short-term task tracking. "Fix this later" items.
-
-```markdown
-- [ ] Fix the type error in gateway auth middleware
-- [x] Add session creation endpoint
-- [ ] Write tests for memory bootstrap
-```
-
-Managed via the `scratchpad` tool (add, done, undo, clear actions).
-Open items are injected into context every turn and captured during compaction handoffs.
-
-### Observational memory (compaction summaries)
-
-**Owner:** pi-extension-observational-memory
-**Storage:** In-memory session entries (not written to filesystem)
-**Lifecycle:** Lives only within the current session's context window.
-**Purpose:** Compressed representation of conversation history for long sessions.
-
-```markdown
-## Observations
-Date: 2026-03-23
-- 🔴 User requires PostgreSQL — no ORM, raw SQL only
-- 🟡 Working on gateway session endpoint, Hono framework
-- 🟢 Prefers concise commit messages
-
-## Open Threads
-- Session creation endpoint needs auth middleware
-
-## Next Action Bias
-1. Implement auth middleware for gateway routes
-```
-
-Created by the observational-memory extension when it replaces pi's default compaction.
-Priority-tagged (🔴 critical, 🟡 important, 🟢 informational) with a reflector pass
-that deduplicates and prunes when observations grow too large.
-
-### Summary: memory classification matrix
-
-| Type | Files | Written by | Injected into context | Survives session end | Survives pod restart | Crosses conversations |
-|---|---|---|---|---|---|---|
-| Long-term | MEMORY.md | Agent via `memory_write` | Yes (every turn) | Yes | Yes (PV) | Yes |
-| Episodic | daily/YYYY-MM-DD.md | Agent + auto-handoff + exit summary | Today + yesterday | Yes | Yes (PV) | Yes |
-| Working | SCRATCHPAD.md | Agent via `scratchpad` | Yes (open items) | Yes | Yes (PV) | Yes |
-| Observational | Session entries | Observational-memory extension | Yes (as compaction) | No | No | No |
-| Conversation | In-memory messages | pi SessionManager | Yes (raw tail) | No | No | No |
+The zosma-mem package has a fully working memory engine (ingest, retrieve, salience
+scoring, co-access graph, GC, versioned entity store). But **nothing calls it**.
 
-### Cross-conversation boundary rules
+- `bootstrapMemory()` sets `PI_MEMORY_DIR` but no extension reads it
+- The old extensions (`pi-memory`, `pi-extension-observational-memory`) were removed
+  but never replaced
+- The new packages (`pi-brain`, `pi-dcp`) referenced in `NEW-MEMORY-INTEGRATION.md`
+  were never installed or integrated
+- No code ingests facts from conversations into the engine
+- No code retrieves memories at session start and injects them into context
+- `systemPromptSuffix` is computed in session-manager.ts but never consumed by pi.agent.ts
 
-All memory types stored in the shared `memoryDir` (MEMORY.md, SCRATCHPAD.md, daily logs)
-are **intentionally shared across conversations** that use the same agent configuration.
-This is by design:
-
-- **Long-term memory** carries forward curated facts, decisions, and user preferences.
-  A new conversation inherits everything the agent has learned so far.
-- **Episodic logs** carry forward the daily narrative. A new conversation started on the
-  same day sees earlier entries from that day plus yesterday.
-- **Working memory (scratchpad)** carries forward open TODO items. A task added in one
-  conversation remains visible in the next. This acts as a cross-conversation task list
-  for the agent — unfinished work is not forgotten when the user starts a new thread.
-
-The following are **not shared** across conversations:
-
-- **Observational memory** (compaction summaries with priority-tagged bullets) exists only
-  in the pi session's in-memory entries. It dies when the session ends. A new conversation
-  starts with a clean observation slate.
-- **Raw conversation history** (the actual messages and tool calls) lives in
-  `SessionManager.inMemory()` within the pi SDK. It is never written to disk and is
-  garbage collected when the session object is released.
-
-This means a new conversation thread gets the agent's accumulated knowledge but not
-the dialogue or reasoning context from previous threads. The agent knows *what* it
-learned, but not *how* the previous conversation went.
+Result: the agent is stateless across conversations. It cannot remember anything.
 
 ---
 
-## 4. Filesystem Layout
+## Current State
 
-Memory files are stored in a **stable directory that persists across conversations**.
-The gateway derives the memory path from the agent configuration ID, not the session ID:
+### What exists and works
 
-```
-workspace/                            # OPENZOSMA_WORKSPACE root
-├── agents/
-│   ├── <agentConfigId>/              # Stable per-agent-config directory
-│   │   └── memory/                   # PI_MEMORY_DIR for this config
-│   │       ├── MEMORY.md             # Long-term curated memory
-│   │       ├── SCRATCHPAD.md         # Working checklist
-│   │       └── daily/
-│   │           ├── 2026-03-21.md
-│   │           ├── 2026-03-22.md
-│   │           └── 2026-03-23.md
-│   └── default/                      # Fallback when no agentConfigId
-│       └── memory/
-│           ├── MEMORY.md
-│           └── ...
-└── sessions/
-    ├── <session-uuid-1>/             # Per-session workspace (ephemeral work)
-    └── <session-uuid-2>/
-```
+| Component | Status |
+|---|---|
+| `packages/zosma-mem/src/engine/` | Working — factory, salience, reinforcement |
+| `packages/zosma-mem/src/store/` | Working — EntityStore (file-based), co-access graph |
+| `packages/zosma-mem/src/retrieval/` | Working — attention-scored retrieval with co-access boost |
+| `packages/zosma-mem/src/ingestion/` | Working — event ingestion with salience threshold |
+| `packages/zosma-mem/src/gc/` | Working — decay, pruning, version compaction |
+| Stable memoryDir per agent config | Working — gateway session-manager.ts computes it |
+| Memory dir creation | Working — mkdirSync in session-manager.ts |
 
-The critical design decision: **sessions are ephemeral, memory is not.** Each new
-conversation creates a fresh session directory under `sessions/`, but all sessions
-that share an agent config point to the same memory directory under `agents/`.
+### What is missing
 
-The path is controlled by the `PI_MEMORY_DIR` environment variable, which
-`@openzosma/memory` sets during bootstrap. The gateway's `SessionManager` computes
-the stable path and passes it as `memoryDir` through `AgentSessionOpts`.
+| Component | Status |
+|---|---|
+| `pi-brain` (npm) | Not installed. Needed for structured memory entities |
+| `pi-dcp` (npm) | Not installed. Needed for dynamic context pruning / GC |
+| Ingestion hook | Missing. Nothing extracts facts from conversations |
+| Retrieval-at-session-start | Missing. Nothing loads memories into context |
+| Reinforcement tracking | Missing. No read/ignore/decision signals from agent |
+| systemPromptSuffix wiring | Bug. Computed but never passed to pi.agent.ts |
 
 ---
 
-## 5. Bootstrap Sequence
-
-When a user sends their first message, the gateway's `SessionManager` creates a session
-and computes a stable memory directory. `PiAgentSession` in `@openzosma/agents` then
-bootstraps the pi-coding-agent session with that directory:
-
-```
-SessionManager.createSession()                     (@openzosma/gateway)
-│
-├── Compute stable memoryDir:
-│     workspace/agents/<agentConfigId>/memory/      (or agents/default/memory/)
-│     mkdirSync(memoryDir, { recursive: true })
-│
-├── Acquire initLock (serializes concurrent session init)
-│
-└── provider.createSession({ workspaceDir: sessionDir, memoryDir, ... })
-    │
-    PiAgentSession constructor                     (@openzosma/agents)
-    │
-    ├── 1. bootstrapMemory({ workspaceDir, memoryDir })  (@openzosma/memory)
-    │      ├── Sets process.env.PI_MEMORY_DIR = memoryDir
-    │      ├── Sets process.env.PI_MEMORY_QMD_UPDATE   (if configured)
-    │      ├── Sets process.env.PI_MEMORY_NO_SEARCH    (if configured)
-    │      ├── Resolves pi-memory/index.ts path        (via createRequire)
-    │      ├── Resolves pi-extension-observational-memory/index.ts path
-    │      └── Returns { paths: [piMemPath, obsMemPath], memoryDir }
-    │
-    ├── 2. bootstrapPiExtensions()                     (@openzosma/agents)
-    │      └── Returns existing extension paths (web-access, subagents, guardrails)
-    │
-    ├── 3. new DefaultResourceLoader({                 (pi-coding-agent)
-    │        additionalExtensionPaths: [
-    │          ...extensionPaths,      # web-access, subagents, guardrails
-    │          ...memoryResult.paths,  # pi-memory, observational-memory
-    │        ]
-    │      })
-    │
-    ├── 4. resourceLoader.reload()
-    │      └── jiti loads each extension .ts file at runtime (moduleCache: false)
-    │          ├── pi-memory default export called with (pi: ExtensionAPI)
-    │          │     ├── Registers session_start hook
-    │          │     ├── Registers session_shutdown hook
-    │          │     ├── Registers before_agent_start hook
-    │          │     ├── Registers session_before_compact hook
-    │          │     ├── Registers input hook
-    │          │     ├── Registers tools: memory_write, memory_read, scratchpad, memory_search
-    │          │     └── pi-memory reads PI_MEMORY_DIR from env (fresh per jiti load)
-    │          │
-    │          └── observational-memory default export called with (pi: ExtensionAPI)
-    │                ├── Registers session_start hook (reads flags)
-    │                ├── Registers agent_end hook (auto-compaction trigger)
-    │                ├── Registers session_before_compact hook (observer)
-    │                ├── Registers session_before_tree hook (branch summarizer)
-    │                ├── Registers session_compact hook (cleanup)
-    │                ├── Registers commands: obs-memory-status, obs-reflect, etc.
-    │                └── Registers shortcut: ctrl+shift+o (status overlay)
-    │
-    └── 5. createAgentSession({ ... })                 (pi-coding-agent)
-           └── Session created, hooks are now active
-
-SessionManager releases initLock (100ms after constructor)
+## Architecture (Target)
+
+```
+┌────────────────────────────────────────────────────────────────────┐
+│  Agent Session                                                      │
+│                                                                     │
+│  ┌──────────────────┐  ┌──────────────────┐  ┌─────────────────┐  │
+│  │  pi-brain         │  │  pi-dcp           │  │  zosma-mem      │  │
+│  │  (pi extension)   │  │  (pi extension)   │  │  engine         │  │
+│  │                   │  │                   │  │                  │  │
+│  │  Structured       │  │  Context pruning  │  │  Salience       │  │
+│  │  memory entities  │  │  Token management │  │  Retrieval      │  │
+│  │  Versioning       │  │  GC scheduling    │  │  Co-access      │  │
+│  │  pi hooks/tools   │  │                   │  │  Reinforcement  │  │
+│  └────────┬──────────┘  └──────────────────┘  └────────┬────────┘  │
+│           │                                             │           │
+│           └─────────────── zosma-mem-bridge ────────────┘           │
+│                        (new integration layer)                      │
+│                                                                     │
+│  ┌──────────────────────────────────────────────────────────────┐  │
+│  │  Filesystem: workspace/agents/<configId>/memory/             │  │
+│  │  ├── .salience/*.yaml                                        │  │
+│  │  ├── .salience/archive/                                      │  │
+│  │  ├── .salience/co-access                                     │  │
+│  │  └── (pi-brain managed files)                                │  │
+│  └──────────────────────────────────────────────────────────────┘  │
+└────────────────────────────────────────────────────────────────────┘
 ```
 
-**Concurrency note:** The `initLock` in `SessionManager` ensures that `PI_MEMORY_DIR`
-set by one session's `bootstrapMemory()` is not overwritten by another concurrent
-session before jiti reads it. jiti uses `moduleCache: false`, so each load gets a
-fresh module instance that reads the env var at that moment.
-
 ---
 
-## 6. Pi Extension: pi-memory
-
-**Package:** `pi-memory@0.3.6`
-**Entry:** `index.ts` (single-file extension, ~1400 lines)
-**Source:** npm published package
-
-### What it does
-
-pi-memory is the **storage and retrieval layer**. It owns all filesystem operations,
-provides tools for the agent to read/write memory, injects memory context into every turn,
-and manages the qmd search integration.
-
-### Hooks registered
-
-| Hook | When it fires | What pi-memory does |
-|---|---|---|
-| `session_start` | Session created | Creates memory directories. Detects qmd. Auto-creates qmd collection. Starts background qmd update timer. |
-| `before_agent_start` | Before every agent turn | Builds memory context (MEMORY.md + scratchpad + daily logs + search results). Appends to system prompt. |
-| `session_before_compact` | Before context compaction | Writes session handoff (open scratchpad items + recent daily log tail) to today's daily file. |
-| `session_shutdown` | Session ending | Generates LLM exit summary of the session. Appends to today's daily file. Runs final qmd update. Cleans up timers. |
-| `input` | User types input | Detects `/quit` to set exit summary reason. |
-
-### Tools registered
-
-| Tool | Purpose | Parameters |
-|---|---|---|
-| `memory_write` | Write to MEMORY.md or daily log | `target` (memory/daily), `content`, optional `tags` |
-| `memory_read` | Read a memory file or list daily logs | `target` (memory/scratchpad/daily/list) |
-| `scratchpad` | Manage checklist | `action` (add/done/undo/clear), `text` |
-| `memory_search` | Search across all memory files via qmd | `query`, `mode` (keyword/semantic/deep) |
-
-### Context injection (before_agent_start)
+## Integration Steps
 
-Every agent turn, pi-memory appends a `## Memory` section to the system prompt containing:
+### Step 1: Install missing npm packages
 
-1. **Scratchpad** — open (unchecked) items from SCRATCHPAD.md
-2. **Today's daily log** — full content of `daily/YYYY-MM-DD.md` for today
-3. **Search results** — qmd semantic/keyword search against the user's prompt (if qmd available and `PI_MEMORY_NO_SEARCH` not set)
-4. **MEMORY.md** — full curated long-term memory content
-5. **Yesterday's daily log** — full content of yesterday's file
+Install `pi-brain` and `pi-dcp` as dependencies of `@openzosma/zosma-mem`:
 
-Priority order: scratchpad > today > search > MEMORY.md > yesterday. If total content
-exceeds token limits, lower-priority items are truncated.
-
-The injection also includes usage instructions telling the agent how to use each tool
-and when to write memories.
-
-### Exit summary (session_shutdown)
-
-When a session ends, pi-memory asks the active LLM model to generate a summary of the
-conversation. The summary is formatted and appended to today's daily log:
-
-```markdown
-<!-- EXIT 14:30:00 [a1b2c3d4] reason=session-end -->
-## Exit Summary
-
-Built the memory integration for OpenZosma. Created @openzosma/memory package
-as orchestration layer. Wired pi-memory and observational-memory extensions
-into the agent session. All tests passing.
-```
-
-If the model call fails, a fallback text-only summary is generated from available context.
-
-### Session handoff (session_before_compact)
-
-Before every compaction, pi-memory captures a snapshot to the daily log:
-
-```markdown
-<!-- HANDOFF 14:15:00 [a1b2c3d4] -->
-## Session Handoff
-
-**Open scratchpad items:**
-- [ ] Fix the type error in gateway auth middleware
-- [ ] Write tests for memory bootstrap
-
-**Recent daily log context:**
-(last 15 lines of today's daily log)
+```bash
+cd packages/zosma-mem
+pnpm add pi-brain pi-dcp
 ```
 
-This ensures that even if observational-memory's compaction loses some detail, the raw
-facts are preserved on disk in the daily log.
+Verify both packages export a default pi extension function. Check their `index.ts`
+entry points in `node_modules/` for the hooks they register and any configuration
+they expect.
 
 ---
 
-## 7. Pi Extension: pi-extension-observational-memory
-
-**Package:** `pi-extension-observational-memory@0.1.3`
-**Entry:** `index.ts` + `overlay.ts` (TUI status overlay)
-**Source:** npm published package
-
-### What it does
-
-This extension **replaces pi's default compaction** with an observational memory strategy.
-Instead of generic summarization, it produces structured observation logs with priority
-tagging and runs a reflector garbage collector when observations grow large.
-
-### How it relates to pi-memory
-
-These two extensions serve **different purposes** and do **not conflict**:
+### Step 2: Create the bridge package
 
-- **pi-memory** writes the handoff entry to disk, then returns from `session_before_compact`
-  without a compaction result (returns `undefined`).
-- **observational-memory** generates the actual compaction summary and returns a
-  `CompactionResult` object that replaces pi's default compaction.
+Create `packages/zosma-mem/src/bridge/` — the integration layer between the zosma-mem
+engine and the pi extension system.
 
-The pi extension system calls all registered hooks in order. pi-memory runs first (writes
-handoff to disk, returns `undefined`), then observational-memory runs (generates summary,
-returns `{ compaction }`).
+#### File: `packages/zosma-mem/src/bridge/index.ts`
 
-### Observer/Reflector two-threshold model
+Exports:
+- `createMemoryBridge(config: BridgeConfig): MemoryBridge`
+- `resolveMemoryExtensionPaths(): { paths: string[], missing: string[] }`
 
-The system uses two thresholds to manage memory pressure:
+#### Interface: `BridgeConfig`
 
+```ts
+interface BridgeConfig {
+  memoryDir: string         // Stable per-agent-config directory
+  salienceThreshold?: number // Min salience to persist (default from engine)
+  topK?: number             // How many memories to retrieve (default: 8)
+}
 ```
-Raw conversation tokens (growing)
-   │
-   │  ... agent turns accumulate ...
-   │
-   ├── Observer threshold (default 30k tokens + 8k retain buffer = 38k activation)
-   │     └── Triggers auto-compaction
-   │           └── Conversation serialized → LLM → observational summary
-   │                 └── Priority-tagged bullets (🔴/🟡/🟢)
-   │
-   │  ... more turns, observations accumulate ...
-   │
-   └── Reflector threshold (default 40k observation-block tokens)
-         └── Triggers reflector GC on next compaction
-               ├── Deduplicate observations by normalized key
-               ├── Priority-aware pruning (🔴: max 96, 🟡: max 40, 🟢: max 16)
-               └── Preserve highest-priority, most-recent observations
-```
-
-### Observer modes
-
-| Mode | Behavior |
-|---|---|
-| `buffered` (default) | Auto-compaction triggers in background on `agent_end`. Non-blocking. |
-| `blocking` | Auto-compaction disabled. Only manual or regular compaction runs. |
 
-### Observation summary format
+#### Interface: `MemoryBridge`
 
-Every compaction produces a summary in this exact structure:
+```ts
+interface MemoryBridge {
+  /** Called before each turn. Returns memory context string for injection. */
+  loadContext: (userMessage: string) => Promise<string>
 
-```markdown
-## Observations
-Date: 2026-03-23
-- 🔴 critical constraint or blocker
-- 🟡 important evolving context
-- 🟢 low-priority informational note
+  /** Called after each turn. Extracts and ingests memorable facts. */
+  ingestFacts: (facts: ExtractedFact[]) => Promise<void>
 
-## Open Threads
-- unfinished work item
-- (none)
+  /** Called when agent uses a retrieved memory. Reinforcement signal. */
+  recordUsage: (entityId: string, signal: "used" | "ignored" | "influenced_decision") => Promise<void>
 
-## Next Action Bias
-1. most likely immediate next action
-2. optional second action
+  /** Run GC. Called on session end. */
+  gc: () => Promise<void>
 
-<read-files>
-packages/gateway/src/routes/sessions.ts
-</read-files>
+  /** Shutdown — clear timers, flush state. */
+  shutdown: () => void
 
-<modified-files>
-packages/gateway/src/routes/sessions.ts
-packages/auth/src/middleware.ts
-</modified-files>
+  /** Return all entity IDs (for testing). */
+  listEntityIds: () => Promise<string[]>
+}
 ```
 
-File operation tags (`<read-files>`, `<modified-files>`) are accumulated across compactions.
-They track which files the agent has read and modified throughout the session.
-
-### Hooks registered
-
-| Hook | What it does |
-|---|---|
-| `session_start` | Reads config flags (thresholds, mode, retain buffer) |
-| `agent_end` | In buffered mode, checks raw-tail token estimate and triggers auto-compaction if over threshold |
-| `session_before_compact` | Serializes conversation, calls LLM with observation prompt, normalizes output, runs reflector if needed |
-| `session_before_tree` | Generates observational summaries for abandoned branches |
-| `session_compact` | Resets force-reflect flag and auto-compact-in-flight state |
-
-### Commands registered
-
-| Command | Purpose |
-|---|---|
-| `/obs-memory-status` | Show current observer/reflector status, thresholds, last compaction details |
-| `/obs-auto-compact` | Show or set observer/reflector thresholds, mode, and retention |
-| `/obs-mode` | Show or set observer mode (buffered/blocking) |
-| `/obs-view` | Show latest observation summary |
-| `/obs-reflect` | Force aggressive reflection on next compaction and trigger it immediately |
-
-### Shortcut
-
-`Ctrl+Shift+O` — opens the observation memory status overlay (TUI).
-
 ---
 
-## 8. Orchestration Package: @openzosma/memory
-
-**Package:** `@openzosma/memory` (workspace: `packages/memory/`)
-**Files:** `bootstrap.ts`, `config.ts`, `types.ts`, `index.ts`
+### Step 3: Implement `loadContext`
 
-### What it does
+Called before each agent turn to retrieve relevant memories:
 
-This is a thin orchestration layer. It does **not** implement any memory logic. It:
+```ts
+const loadContext = async (userMessage: string): Promise<string> => {
+  const results = await engine.retrieve({ taskDescription: userMessage }, topK)
 
-1. Sets environment variables that pi-memory reads (`PI_MEMORY_DIR`, `PI_MEMORY_QMD_UPDATE`,
-   `PI_MEMORY_NO_SEARCH`)
-2. Resolves the filesystem paths to both extension entry points (`pi-memory/index.ts`,
-   `pi-extension-observational-memory/index.ts`) using `createRequire`
-3. Returns those paths for the agent session to pass to `DefaultResourceLoader`
-4. Logs warnings if either extension package is missing
+  if (results.length === 0) return ""
 
-### API
+  const memories = results.map(r => ({
+    id: r.entity.id,
+    content: r.entity.content,
+    score: r.attentionScore
+  }))
 
-```typescript
-import { bootstrapMemory } from "@openzosma/memory"
+  const lines = [
+    "## Long-term Memory",
+    "",
+    "The following facts have been remembered from previous conversations with this user.",
+    "Use them to inform your responses naturally, without mentioning memory IDs or scores.",
+    "",
+    ...memories.map(m => `- ${m.content}`),
+    ""
+  ]
 
-const result = bootstrapMemory({
-  workspaceDir: "/home/agent",
-  memoryDir: "/home/agent/.pi/agent/memory",  // optional override
-  qmdUpdateMode: "background",                 // optional: background | manual | off
-  disableSearch: false,                         // optional: disable qmd search injection
-})
-
-// result.paths = ["/path/to/pi-memory/index.ts", "/path/to/obs-memory/index.ts"]
-// result.memoryDir = "/home/agent/.pi/agent/memory"
+  return lines.join("\n")
+}
 ```
 
-### Why it exists
-
-Without this package, `@openzosma/agents` would need to know how to resolve npm package
-paths, which env vars to set, and in what order to list extensions. The orchestration
-package encapsulates this configuration so the agent code stays clean.
-
 ---
 
-## 9. Agent Integration: @openzosma/agents
-
-**Package:** `@openzosma/agents` (workspace: `packages/agents/`)
-**File:** `src/pi.agent.ts`
-
-### How memory is wired in
-
-The `PiAgentSession` constructor calls `bootstrapMemory` with the stable `memoryDir`
-from the gateway and merges the returned extension paths with the other pi extensions:
-
-```typescript
-constructor(opts: AgentSessionOpts) {
-  const memoryResult = bootstrapMemory({
-    workspaceDir: opts.workspaceDir,
-    memoryDir: opts.memoryDir,       // stable dir from SessionManager
-  })
-  const { extensionPaths } = bootstrapPiExtensions()
-
-  const resourceLoader = new DefaultResourceLoader({
-    cwd: opts.workspaceDir,
-    additionalExtensionPaths: [
-      ...extensionPaths,          // web-access, subagents, guardrails
-      ...memoryResult.paths,      // pi-memory, observational-memory
-    ],
-    systemPrompt: opts.systemPrompt ?? DEFAULT_SYSTEM_PROMPT,
-  })
-
-  // createAgentSession loads extensions via jiti
+### Step 4: Implement `ingestFacts`
+
+Called after each assistant turn with pre-extracted facts:
+
+```ts
+const ingestFacts = async (facts: ExtractedFact[]): Promise<void> => {
+  const now = Date.now()
+  for (const fact of facts) {
+    await engine.ingest({
+      id: factId(fact.content),  // deterministic hash
+      type: fact.type,
+      content: fact.content,
+      tags: fact.tags,
+      timestamp: now,
+    })
+  }
 }
 ```
 
-The `memoryDir` is separate from `workspaceDir`. `workspaceDir` is per-session
-(ephemeral), while `memoryDir` is per-agent-config (persistent). This separation
-is what allows memory to survive across conversations.
-
-### What the agent code does NOT do
-
-- **No manual tool registration.** Both extensions register their own tools.
-- **No manual context injection.** pi-memory's `before_agent_start` hook handles it.
-- **No manual compaction logic.** observational-memory's `session_before_compact` handles it.
-- **No memory-specific imports** beyond `bootstrapMemory`.
-
-The agent treats memory as a black box that self-configures through the extension system.
-
-### Full extension loading order
-
-1. `pi-web-access` — web search tools
-2. `pi-subagents` — sub-agent spawning (if pi CLI available)
-3. `pi-subagents/notify.ts` — sub-agent notifications
-4. `@aliou/pi-guardrails` — input/output guardrails
-5. `pi-memory` — memory storage, retrieval, tools, injection
-6. `pi-extension-observational-memory` — compaction, observer, reflector
-
-Position 5 and 6 are critical: pi-memory must come before observational-memory so
-its `session_before_compact` handoff writes to disk before observational-memory
-replaces the compaction summary.
-
 ---
 
-## 10. K3s Pod Lifecycle and Persistence
+### Step 5: Wire the bridge into PiAgentSession
 
-### Pod architecture
+Edit `packages/agents/src/pi.agent.ts`:
 
-Each agent session runs inside an isolated OpenShell sandbox, which is a K3s pod
-created from the `openzosma/agent-sandbox` Docker image. The orchestrator manages
-pod creation, message routing, and pod destruction.
+#### 5a. Import and create the bridge
 
+```ts
+import { createMemoryBridge, resolveMemoryExtensionPaths } from "@openzosma/zosma-mem/bridge"
 ```
-Orchestrator
-    │
-    │  gRPC bidirectional streaming
-    │
-    ▼
-K3s Pod (OpenShell sandbox)
-├── /workspace/agents/<configId>/memory/   ← memory PV mount (shared across sessions)
-│   ├── MEMORY.md
-│   ├── SCRATCHPAD.md
-│   └── daily/
-├── /workspace/sessions/<sessionId>/       ← session workspace (ephemeral)
-├── /tmp/agent/                            ← scratch space
-└── pi-coding-agent process
-    ├── pi-memory extension (reads from memory PV)
-    └── observational-memory extension (loaded)
-```
-
-### PersistentVolume (PV) for memory
-
-Memory files must survive pod restarts. The memory directory under `workspace/agents/`
-is backed by a Kubernetes PersistentVolume (PV) scoped to the agent configuration:
-
-```yaml
-# Conceptual PV spec (not yet implemented)
-apiVersion: v1
-kind: PersistentVolumeClaim
-metadata:
-  name: agent-<configId>-memory-pvc
-spec:
-  accessModes: [ReadWriteOnce]
-  resources:
-    requests:
-      storage: 1Gi
-```
-
-**Current state:** The K8s manifests in `infra/k8s/` are placeholders. The PV setup
-is planned for Phase 4 (orchestrator + sandbox integration). For local development,
-the gateway writes memory to `workspace/agents/<configId>/memory/` on the host
-filesystem, which persists across server restarts.
 
-### Session-to-memory mapping
+In the `PiAgentSession` constructor:
 
-All sessions that share an `agentConfigId` share the same memory directory.
-Sessions without a config use the `default` memory directory.
-
-| Session state | Pod state | Memory state |
-|---|---|---|
-| `created` | Pod being allocated from pool | Memory dir exists (created by SessionManager) |
-| `active` | Pod running, gRPC connected | pi-memory reads existing files, continues accumulating |
-| `paused` | Pod preserved but idle | Memory files intact on PV |
-| `active` (resumed) | Pod re-activated | pi-memory reads existing files, continues |
-| `ended` | Pod destroyed | Memory files persist on PV |
-| New session (same config) | New pod allocated | Same memory PV mounted, all prior memory available |
-
-### Pod filesystem policy
-
-The OpenShell sandbox policy controls what the agent process can access:
-
-```yaml
-filesystem:
-  allow_read: ["/workspace", "/tmp", "/home/agent"]
-  allow_write: ["/workspace", "/tmp", "/home/agent"]
-  deny: ["/etc/passwd", "/proc", "/sys"]
+```ts
+this.memoryBridge = createMemoryBridge({ memoryDir: opts.memoryDir ?? defaultPath })
 ```
 
-The `.pi/agent/memory/` directory falls within `/home/agent/` and is both readable
-and writable by the agent process.
-
----
-
-## 11. Context Window Flow
+#### 5b. Per-turn retrieval
 
-This diagram shows how memory content enters the LLM context window during a single
-agent turn:
+Before each `sendMessage()`, inject memory context:
 
+```ts
+const memoryContext = await this.memoryBridge.loadContext(content)
+if (memoryContext) {
+  await session.steer(memoryContext)  // Inject before prompt
+}
 ```
-                    Context Window
-                    ┌─────────────────────────────────┐
-                    │                                  │
-                    │  System prompt (base)             │
-                    │                                  │
-                    │  ## Memory                        │  ← injected by pi-memory
-                    │  ┌────────────────────────────┐  │    (before_agent_start)
-                    │  │ Scratchpad (open items)     │  │
-                    │  │ Today's daily log           │  │
-                    │  │ Search results (qmd)        │  │
-                    │  │ MEMORY.md content           │  │
-                    │  │ Yesterday's daily log       │  │
-                    │  └────────────────────────────┘  │
-                    │                                  │
-                    │  Compaction summary (if any)      │  ← generated by
-                    │  ┌────────────────────────────┐  │    observational-memory
-                    │  │ ## Observations              │  │
-                    │  │ - 🔴 critical items          │  │
-                    │  │ - 🟡 important context       │  │
-                    │  │ - 🟢 informational           │  │
-                    │  │ ## Open Threads              │  │
-                    │  │ ## Next Action Bias          │  │
-                    │  │ <read-files> / <modified>    │  │
-                    │  └────────────────────────────┘  │
-                    │                                  │
-                    │  Recent conversation turns        │  ← raw messages after
-                    │  (kept after compaction)          │    last compaction
-                    │                                  │
-                    │  User's current message           │
-                    │                                  │
-                    └─────────────────────────────────┘
-```
-
-### Token budget breakdown
-
-| Section | Source | Typical size |
-|---|---|---|
-| Base system prompt | `@openzosma/agents` config | ~2k tokens |
-| Memory injection | pi-memory `before_agent_start` | 1k-10k tokens |
-| Compaction summary | observational-memory | 2k-8k tokens |
-| Raw conversation tail | Kept after last compaction | up to ~30k tokens |
-| User message | Current turn | Variable |
-
-The observer auto-compaction triggers at ~38k raw-tail tokens (30k threshold + 8k retain
-buffer), which keeps the context window from overflowing on most models.
 
----
-
-## 12. Tools Available to the Agent
-
-The agent has four memory tools, all registered by pi-memory:
+#### 5c. Post-turn ingestion
 
-### memory_write
+After each turn completes:
 
-Write durable information to memory files.
-
-```
-Targets:
-  - memory: append to MEMORY.md (facts, decisions, preferences)
-  - daily: append to today's daily log (running context, notes)
-
-Content format:
-  - Use #tags for categorization: #decision, #preference, #constraint
-  - Use [[wikilinks]] for cross-references: [[auth-strategy]]
-  - Each entry gets a timestamp and session ID comment
+```ts
+const facts = await extractFacts(model, apiKey, userMessage, assistantResponse)
+await this.memoryBridge.ingestFacts(facts)
 ```
 
-### memory_read
+#### 5d. Load pi-brain and pi-dcp
 
-Read memory file contents.
+```ts
+const { paths: memoryExtensionPaths, missing } = resolveMemoryExtensionPaths()
+if (missing.length > 0) log.warn("Memory extensions missing:", missing)
 
+const resourceLoader = new DefaultResourceLoader({
+  cwd: opts.workspaceDir,
+  systemPrompt: finalPrompt,
+  additionalExtensionPaths: memoryExtensionPaths,
+})
 ```
-Targets:
-  - memory: read MEMORY.md
-  - scratchpad: read SCRATCHPAD.md
-  - daily: read a specific daily log (by date)
-  - list: list available daily log files
-```
-
-### scratchpad
 
-Manage the working checklist.
+#### 5e. Fix systemPromptSuffix
 
+```ts
+const parts = [opts.systemPromptPrefix, basePrompt, opts.systemPromptSuffix].filter(Boolean)
+const finalPrompt = parts.join("\n\n")
 ```
-Actions:
-  - add <text>: add a new unchecked item
-  - done <text>: mark an item as done
-  - undo <text>: uncheck a completed item
-  - clear: remove all completed items
-```
-
-### memory_search
-
-Search across all memory files using qmd.
 
-```
-Modes:
-  - keyword: fast text search
-  - semantic: embedding-based similarity search
-  - deep: combined keyword + semantic with re-ranking
+#### 5f. Session cleanup
 
-Searches: MEMORY.md, SCRATCHPAD.md, all daily logs
-Requires: qmd installed and pi-memory collection configured
+```ts
+await this.memoryBridge.gc()
+this.memoryBridge.shutdown()
 ```
 
 ---
 
-## 13. Search and Retrieval (qmd)
-
-[qmd](https://github.com/tobi/qmd) is an external CLI tool that provides semantic search
-over markdown files. It is **optional** — core memory tools work without it.
-
-### What qmd provides
-
-- Keyword search (fast, text-matching)
-- Semantic search (embedding-based similarity using local models)
-- Hybrid/deep search (combined keyword + semantic with re-ranking)
-- Collection-based indexing of the memory directory
-
-### Auto-setup
-
-On `session_start`, pi-memory:
-1. Detects if qmd is installed (runs `qmd status`)
-2. If available, checks if the `pi-memory` collection exists
-3. If not, creates it: `qmd collection add <MEMORY_DIR> --name pi-memory`
-4. Adds path contexts: `/daily` with description "Daily append-only work logs"
-5. Starts a background timer for periodic `qmd update` calls
-6. Runs `qmd embed` to build/update embeddings
-
-### Selective injection
-
-Before each agent turn (`before_agent_start`), pi-memory runs:
-
-```
-qmd search "<user prompt>" -c pi-memory --mode hybrid --limit 5 --json
-```
-
-The results are included in the memory context section of the system prompt.
-This is disabled if `PI_MEMORY_NO_SEARCH=1` is set.
-
-### Pod image requirement
-
-For qmd to work in the sandbox, it must be pre-installed in the Docker image:
+### Step 6: LLM-based fact extraction
 
-```dockerfile
-RUN bun install -g https://github.com/tobi/qmd
-```
-
-Without qmd, the system operates in degraded mode: `memory_search` tool returns an
-install instructions message, and selective injection is skipped. All other memory
-functionality works normally.
+Create `packages/agents/src/pi/memory.ts` with `extractFacts()` that uses the session's
+LLM to identify memorable facts from conversation exchanges.
 
 ---
 
-## 14. Compaction and Observation
-
-### What is compaction?
-
-When the conversation context grows too large for the model's context window, pi triggers
-compaction. This replaces older conversation history with a summary, freeing up context
-space for new turns.
-
-### Default pi compaction vs. observational memory
-
-| Aspect | Default pi compaction | Observational memory |
-|---|---|---|
-| Summary format | Generic text summary | Structured observations with priority emoji |
-| Priority awareness | No | Yes (🔴/🟡/🟢) |
-| Reflector GC | No | Yes (deduplication + pruning at threshold) |
-| Auto-trigger | Only when context overflows | Proactive at configurable token threshold |
-| File tracking | No | Yes (`<read-files>`, `<modified-files>` tags) |
-| Open threads | No | Yes (explicit section) |
-| Next action bias | No | Yes (explicit section) |
-
-### Two-pass compaction flow
+### Step 7: Tests
 
-```
-1. pi detects context pressure (or observer auto-trigger fires)
-2. pi calls session_before_compact hooks in registration order:
-   a. pi-memory hook runs first:
-      - Writes handoff entry to daily log (scratchpad items + recent context)
-      - Returns undefined (does not replace compaction)
-   b. observational-memory hook runs second:
-      - Serializes conversation via convertToLlm + serializeConversation
-      - Includes previous observation summary if exists
-      - Calls LLM with observation prompt
-      - Normalizes output to required three-section format
-      - Checks if reflector should run (observation tokens > reflector threshold)
-      - If reflector needed: deduplicates, prunes by priority caps
-      - Appends file operation tags
-      - Returns { compaction: CompactionResult }
-3. pi uses the CompactionResult from observational-memory
-4. Old conversation entries replaced with compaction summary
-```
-
-### Reflector garbage collection
-
-When the observation block exceeds the reflector threshold (default 40k tokens),
-the reflector runs:
-
-1. **Parse** all observation lines from the summary
-2. **Normalize** each observation to a key (lowercase, strip formatting)
-3. **Deduplicate** by key, keeping higher priority and more recent entries
-4. **Cap** by priority level:
-   - Threshold mode: 🔴 max 96, 🟡 max 40, 🟢 max 16
-   - Forced mode (`/obs-reflect`): 🔴 max 72, 🟡 max 28, 🟢 max 8
-5. **Deduplicate** open threads and next action items
-6. **Reassemble** the summary in the standard three-section format
+Create `packages/zosma-mem/src/bridge/__tests__/bridge.test.ts` with integration tests
+for the full ingest→retrieve→reinforce lifecycle.
 
 ---
 
-## 15. Configuration Reference
+## Implementation Status
 
-### Environment variables (set by @openzosma/memory)
+### ✅ Completed
 
-| Variable | Default | Description |
-|---|---|---|
-| `PI_MEMORY_DIR` | `<workspaceDir>/.pi/agent/memory` | Root directory for all memory files |
-| `PI_MEMORY_QMD_UPDATE` | `background` | qmd re-indexing mode: `background`, `manual`, `off` |
-| `PI_MEMORY_NO_SEARCH` | unset | Set to `1` to disable selective memory injection |
+- [x] Installed pi-brain, pi-dcp as zosma-mem deps
+- [x] Created bridge package with `createMemoryBridge` and `resolveMemoryExtensionPaths`
+- [x] Implemented `loadContext` with proper formatting
+- [x] Implemented `ingestFacts` with fact ID hashing
+- [x] Wired bridge into `PiAgentSession` (per-turn injection via `steer()`, post-turn ingestion)
+- [x] Fixed `systemPromptSuffix` bug in prompt construction
+- [x] Load pi-brain and pi-dcp extensions via `additionalExtensionPaths`
+- [x] Session cleanup with GC and shutdown
+- [x] LLM-based fact extraction in separate agents module
+- [x] Cleaned dead code (evals, adapter, bootstrap, config.ts)
 
-### Observational memory flags (set via pi extension system)
+### ⏳ Remaining
 
-| Flag | Default | Description |
-|---|---|---|
-| `obs-auto-compact` | `true` | Enable observer auto-trigger |
-| `obs-mode` | `buffered` | `buffered` (background on agent_end) or `blocking` |
-| `obs-observer-threshold` | `30000` | Raw-tail tokens before observer fires |
-| `obs-reflector-threshold` | `40000` | Observation-block tokens before reflector GC |
-| `obs-retain-raw-tail` | `8000` | Extra raw-tail tokens kept before observer fires |
-
-These can be set as CLI flags when starting pi, or changed at runtime via
-`/obs-auto-compact` command.
-
-### MemoryConfig interface
-
-```typescript
-interface MemoryConfig {
-  workspaceDir: string         // Pod workspace root (e.g., /home/agent)
-  memoryDir?: string           // Override PI_MEMORY_DIR
-  qmdUpdateMode?: "background" | "manual" | "off"
-  disableSearch?: boolean      // Disable qmd search injection
-}
-```
+- [ ] Add reinforcement tracking (when agent uses retrieved memories)
+- [ ] Complete bridge tests
+- [ ] Manual testing: cross-conversation recall
 
 ---
 
-## 16. Failure Modes and Degraded Operation
+## Files Created/Modified
 
-| Failure | Impact | Behavior |
+| File | Status | Purpose |
 |---|---|---|
-| pi-memory not installed | No memory tools, no context injection | Warning logged, agent works without memory |
-| observational-memory not installed | Default pi compaction used | Warning logged, compaction still works |
-| Both missing | No memory at all | Warning logged, agent operates statelessly |
-| qmd not installed | No `memory_search`, no selective injection | Core tools still work, MEMORY.md/scratchpad/daily logs still injected |
-| qmd collection missing | Same as qmd not installed | pi-memory auto-creates collection on session_start |
-| LLM API key missing | No exit summary, no observation compaction | Both extensions fall back gracefully, log warnings |
-| PV not mounted | Memory lost on pod restart | Files created in ephemeral pod storage, work within session |
-| Memory dir not writable | All writes fail | Tools return error messages, agent continues without persistence |
-| Observation generation fails | Default compaction used | observational-memory returns undefined, pi uses built-in compaction |
+| `packages/zosma-mem/package.json` | ✅ Modified | Added pi-brain/pi-dcp deps, removed evals export/bin |
+| `packages/zosma-mem/src/bridge/index.ts` | ✅ Created | Bridge factory + MemoryBridge implementation |
+| `packages/zosma-mem/src/bridge/extensions.ts` | ✅ Created | Extension path resolution for pi-brain/pi-dcp |
+| `packages/zosma-mem/src/bridge/__tests__/bridge.test.ts` | ⏳ Partial | Bridge unit tests (6 basic tests pass) |
+| `packages/agents/src/pi.agent.ts` | ✅ Modified | Wired bridge, fixed suffix bug, load extensions |
+| `packages/agents/src/pi/memory.ts` | ✅ Created | LLM-based fact extraction |
+| `packages/zosma-mem/README.md` | ✅ Updated | Reflects current package purpose |
 
 ---
 
-## 17. What This System Does Not Do
+## Non-Goals
 
-- **No database storage for memory.** Memory is files on disk, not rows in PostgreSQL.
-- **No cross-session real-time sharing.** Each pod reads its own PV. There is no pub/sub
-  for memory updates between concurrent sessions.
-- **No automatic pruning of long-term memory.** MEMORY.md grows unbounded. Manual curation
-  by the agent (or user) is the only mechanism.
-- **No embedding generation.** Embeddings are handled by qmd externally, not by this system.
-- **No memory deduplication across files.** The same fact could exist in MEMORY.md and a
-  daily log. Search results may contain duplicates.
-- **No access control on memory.** Any agent with PV access can read/write all memory files.
-- **No encryption at rest.** Memory files are plaintext markdown.
-- **No memory versioning or rollback.** Files are append-only with no git-like history.
+- No database storage. Memory stays file-based.
+- No cross-session real-time sync. Each session reads its own files.
+- No embedding model. Retrieval uses tag-based attention scoring.
+- No changes to gateway/session-manager (memoryDir wiring works).
+- No removal of zosma-mem engine. Bridge wraps it.
 
 ---
 
-## Appendix: Source File Locations
-
-| File | Package | Purpose |
-|---|---|---|
-| `packages/memory/src/bootstrap.ts` | @openzosma/memory | `bootstrapMemory()` — resolves extensions, sets env |
-| `packages/memory/src/config.ts` | @openzosma/memory | `applyMemoryEnv()` — sets PI_MEMORY_DIR etc. |
-| `packages/memory/src/types.ts` | @openzosma/memory | `MemoryConfig`, `MemoryBootstrapResult` |
-| `packages/memory/src/index.ts` | @openzosma/memory | Public exports |
-| `packages/memory/src/bootstrap.test.ts` | @openzosma/memory | 9 tests for bootstrap + config |
-| `packages/agents/src/pi.agent.ts` | @openzosma/agents | `PiAgentSession` — wires memory into session |
-| `packages/agents/src/types.ts` | @openzosma/agents | `AgentSessionOpts` — includes `memoryDir` field |
-| `packages/agents/src/pi/extensions/index.ts` | @openzosma/agents | `bootstrapPiExtensions()` — other extensions |
-| `packages/gateway/src/session-manager.ts` | @openzosma/gateway | `SessionManager` — computes stable memory dir per agent config, serializes init |
-| `packages/gateway/src/session-manager.test.ts` | @openzosma/gateway | 4 tests for memory dir stability and isolation |
-| `node_modules/pi-memory/index.ts` | pi-memory (npm) | Full extension source (~1400 lines) |
-| `node_modules/pi-extension-observational-memory/index.ts` | obs-memory (npm) | Full extension source (~1200 lines) |
-| `node_modules/pi-extension-observational-memory/overlay.ts` | obs-memory (npm) | TUI status overlay component |
+## Architecture (Actual Implementation)
+
+```
+┌────────────────────────────────────────────────────────────────────┐
+│  Agent Session (PiAgentSession)                                    │
+│                                                                     │
+│  ┌──────────────────┐  ┌──────────────────┐  ┌─────────────────┐  │
+│  │  pi-brain         │  │  pi-dcp           │  │  zosma-mem      │  │
+│  │  (loaded via      │  │  (loaded via      │  │  bridge         │  │
+│  │   additionalExt)  │  │   additionalExt)  │  │                 │  │
+│  │                   │  │                   │  │  loadContext()   │  │
+│  │  Code project     │  │  Context pruning  │  │  ingestFacts()  │  │
+│  │  memory           │  │  Token management │  │  recordUsage()  │  │
+│  │                   │  │                   │  │  gc()            │  │
+│  └────────┬──────────┘  └──────────────────┘  └────────┬────────┘  │
+│           │                                             │           │
+│           └─────────────────────────────────────────────┘           │
+│              zosma-mem engine (salience, store, gc)                 │
+│                                                                     │
+│  ┌──────────────────────────────────────────────────────────────┐  │
+│  │  Filesystem: workspace/agents/<configId>/memory/             │  │
+│  │  ├── .salience/*.yaml (entities)                             │  │
+│  │  ├── .salience/archive/ (pruned)                             │  │
+│  │  └── .salience/co-access (patterns)                          │  │
+│  └──────────────────────────────────────────────────────────────┘  │
+└────────────────────────────────────────────────────────────────────┘
+```
\ No newline at end of file
diff --git a/infra/openshell/Dockerfile b/infra/openshell/Dockerfile
index 22d0f06..a77f704 100644
--- a/infra/openshell/Dockerfile
+++ b/infra/openshell/Dockerfile
@@ -48,7 +48,7 @@ COPY pnpm-workspace.yaml package.json pnpm-lock.yaml tsconfig.base.json ./
 COPY packages/sandbox-server/package.json packages/sandbox-server/
 COPY packages/agents/package.json packages/agents/
 COPY packages/logger/package.json packages/logger/
-COPY packages/memory/package.json packages/memory/
+COPY packages/zosma-mem/package.json packages/zosma-mem/
 
 # Install dependencies
 RUN pnpm install --frozen-lockfile
diff --git a/packages/agents/package.json b/packages/agents/package.json
index 655066b..2fe7035 100644
--- a/packages/agents/package.json
+++ b/packages/agents/package.json
@@ -20,22 +20,22 @@
 		"check": "tsc --noEmit"
 	},
 	"dependencies": {
+		"@mariozechner/pi-agent-core": "^0.61.0",
 		"@mariozechner/pi-ai": "^0.61.0",
 		"@mariozechner/pi-coding-agent": "^0.61.0",
-		"@openzosma/logger": "workspace:*",
-		"@openzosma/memory": "workspace:*",
-		"@sinclair/typebox": "^0.34.48",
-		"dotenv": "17.3.1",
-		"uuid": "^13.0.0",
 		"@openzosma/db": "workspace:*",
 		"@openzosma/integrations": "workspace:*",
+		"@openzosma/logger": "workspace:*",
 		"@openzosma/skill-reports": "workspace:*",
+		"@openzosma/zosma-mem": "workspace:*",
+		"@sinclair/typebox": "^0.34.48",
+		"dotenv": "17.3.1",
 		"pg": "^8.13.1",
-		"@mariozechner/pi-agent-core": "^0.61.0"
+		"uuid": "^13.0.0"
 	},
 	"devDependencies": {
 		"@types/node": "^22.15.2",
-		"typescript": "^5.7.3",
-		"@types/pg": "^8.11.10"
+		"@types/pg": "^8.11.10",
+		"typescript": "^5.7.3"
 	}
 }
diff --git a/packages/agents/src/pi.agent.ts b/packages/agents/src/pi.agent.ts
index 8808d32..1be4549 100644
--- a/packages/agents/src/pi.agent.ts
+++ b/packages/agents/src/pi.agent.ts
@@ -1,4 +1,6 @@
 import { randomUUID } from "node:crypto"
+import { join } from "node:path"
+import type { Api, Model } from "@mariozechner/pi-ai"
 import type { AgentSession as PiSdkSession } from "@mariozechner/pi-coding-agent"
 import {
 	AuthStorage,
@@ -8,8 +10,10 @@ import {
 	createAgentSession,
 } from "@mariozechner/pi-coding-agent"
 import { createLogger } from "@openzosma/logger"
-import { bootstrapMemory } from "@openzosma/memory"
+import { createMemoryBridge, resolveMemoryExtensionPaths } from "@openzosma/zosma-mem/bridge"
+import type { MemoryBridge } from "@openzosma/zosma-mem/bridge"
 import { DEFAULT_SYSTEM_PROMPT } from "./pi/config.js"
+import { extractFacts } from "./pi/memory.js"
 import { resolveModel } from "./pi/model.js"
 import {
 	createDefaultTools,
@@ -35,7 +39,7 @@ const LLM_IDLE_TIMEOUT_MS = Number(process.env.OPENZOSMA_LLM_IDLE_TIMEOUT_MS) ||
  * Build a ModelRegistry that knows about a custom provider and its API key.
  * This is needed because pi-coding-agent's AgentSession validates the API key
  * via ModelRegistry.getApiKey() before each prompt. Without registration,
- * custom providers (like "local") fail with "No API key found".
+ * custom providers (like openai, anthropic, etc.) fail with "No API key found".
  */
 function buildModelRegistry(providerName: string, apiKey: string, baseUrl: string): ModelRegistry {
 	const authStorage = AuthStorage.inMemory()
@@ -50,38 +54,59 @@ function buildModelRegistry(providerName: string, apiKey: string, baseUrl: strin
 class PiAgentSession implements AgentSession {
 	private sessionPromise: Promise<PiSdkSession>
 	private messages: AgentMessage[] = []
+	private memoryBridge: MemoryBridge
+	private model: Model<Api>
+	private apiKey: string
 
 	constructor(opts: AgentSessionOpts) {
-		bootstrapMemory({
-			workspaceDir: opts.workspaceDir,
-			memoryDir: opts.memoryDir,
+		const { model, apiKey } = resolveModel({
+			provider: opts.provider,
+			model: opts.model,
+			baseUrl: opts.baseUrl,
 		})
+		this.model = model
+		this.apiKey = apiKey
+
+		// Stable memory dir: use the explicit memoryDir from opts if provided,
+		// otherwise fall back to the default path inside the workspace.
+		const memoryDir = opts.memoryDir ?? join(opts.workspaceDir, ".pi", "agent", "memory")
+		this.memoryBridge = createMemoryBridge({ memoryDir })
+
 		const toolList = [...createDefaultTools(opts.workspaceDir, opts.toolsEnabled)]
 		const reportTools = createReportTools(opts.toolsEnabled, opts.workspaceDir)
 		const customTools = [
 			...reportTools,
 			...(opts.dbPool ? [createQueryDatabaseTool(opts.dbPool), createListDatabaseSchemasTool(opts.dbPool)] : []),
 		]
-		const { model, apiKey } = resolveModel({
-			provider: opts.provider,
-			model: opts.model,
-			baseUrl: opts.baseUrl,
-		})
 
-		// Build the final system prompt: optional prefix + main prompt
+		// Build the final system prompt:
+		//   [systemPromptPrefix] + [base prompt] + [systemPromptSuffix]
+		// systemPromptPrefix: caller-supplied context (e.g. agent-config overrides)
+		// base prompt: DEFAULT_SYSTEM_PROMPT or per-config override
+		// systemPromptSuffix: gateway-injected context (e.g. database integration list)
 		const basePrompt = opts.systemPrompt ?? DEFAULT_SYSTEM_PROMPT
-		const finalPrompt = opts.systemPromptPrefix ? `${opts.systemPromptPrefix}\n\n${basePrompt}` : basePrompt
+		const parts = [opts.systemPromptPrefix, basePrompt, opts.systemPromptSuffix].filter(Boolean)
+		const finalPrompt = parts.join("\n\n")
 
 		log.info("PiAgentSession: building system prompt", {
 			hasPrefix: !!opts.systemPromptPrefix,
+			hasSuffix: !!opts.systemPromptSuffix,
 			prefixLength: opts.systemPromptPrefix?.length ?? 0,
-			prefixPreview: opts.systemPromptPrefix?.slice(0, 80) ?? "(none)",
+			suffixLength: opts.systemPromptSuffix?.length ?? 0,
 			finalPromptLength: finalPrompt.length,
 		})
 
+		// Resolve pi-brain and pi-dcp extension paths. Missing packages are
+		// silently skipped — the agent degrades gracefully without them.
+		const { paths: memoryExtensionPaths, missing: missingExtensions } = resolveMemoryExtensionPaths()
+		if (missingExtensions.length > 0) {
+			log.warn("Memory extensions not found — skipping", { missing: missingExtensions })
+		}
+
 		const resourceLoader = new DefaultResourceLoader({
 			cwd: opts.workspaceDir,
 			systemPrompt: finalPrompt,
+			additionalExtensionPaths: memoryExtensionPaths,
 		})
 
 		// For custom/local providers not in the built-in registry, create a
@@ -114,6 +139,25 @@ class PiAgentSession implements AgentSession {
 	async *sendMessage(content: string, signal?: AbortSignal): AsyncGenerator<AgentStreamEvent> {
 		const session = await this.sessionPromise
 
+		// Retrieve relevant memories and track which ones we injected.
+		// We'll use this to record reinforcement signals later.
+		let injectedMemoryIds: string[] = []
+		try {
+			const { context: memoryContext, injectedIds } = await this.memoryBridge.loadContext(content)
+			injectedMemoryIds = injectedIds
+			if (memoryContext) {
+				await session.steer(memoryContext)
+				log.info("Memory context injected via steer()", {
+					length: memoryContext.length,
+					injectedIds: injectedMemoryIds.length
+				})
+			}
+		} catch (err) {
+			log.warn("Failed to load memory context (non-fatal)", {
+				error: err instanceof Error ? err.message : String(err),
+			})
+		}
+
 		const promptContent = content
 
 		const userMsg: AgentMessage = {
@@ -292,7 +336,7 @@ class PiAgentSession implements AgentSession {
 						}
 					}
 					if (errorMessages.length > 0) {
-						enqueue({ type: "error", error: errorMessages.join("; ") })
+						enqueue({ type: "error", error: `Agent errors: ${errorMessages.join("; ")}` })
 					}
 					enqueue({ type: "turn_end", id: randomUUID() })
 					done = true
@@ -335,9 +379,9 @@ class PiAgentSession implements AgentSession {
 				case "auto_retry_start":
 					log.warn("Auto-retry started (LLM error, retrying)", {
 						attempt: "attempt" in event ? event.attempt : undefined,
-						maxAttempts: "maxAttempts" in event ? event.maxAttempts : undefined,
-						delayMs: "delayMs" in event ? event.delayMs : undefined,
-						errorMessage: "errorMessage" in event ? event.errorMessage : undefined,
+						maxAttempts: "maxAttempts" in event ? (event.maxAttempts as number) : undefined,
+						delayMs: "delayMs" in event ? (event.delayMs as number) : undefined,
+						errorMessage: "errorMessage" in event ? (event.errorMessage as string) : undefined,
 					})
 					enqueue({
 						type: "auto_retry_start",
@@ -351,8 +395,8 @@ class PiAgentSession implements AgentSession {
 				case "auto_retry_end":
 					log.info("Auto-retry ended", {
 						success: "success" in event ? event.success : undefined,
-						attempt: "attempt" in event ? event.attempt : undefined,
-						finalError: "finalError" in event ? event.finalError : undefined,
+						attempt: "attempt" in event ? (event.attempt as number) : undefined,
+						finalError: "finalError" in event ? (event.finalError as string) : undefined,
 					})
 					enqueue({
 						type: "auto_retry_end",
@@ -389,7 +433,7 @@ class PiAgentSession implements AgentSession {
 		const promptPromise = session.prompt(promptContent).catch((err: unknown) => {
 			const errorMsg = err instanceof Error ? err.message : "Unknown agent error"
 			log.error("[DIAG] session.prompt() rejected", { error: errorMsg, ms: elapsed(), piEventSeq })
-			enqueue({ type: "error", error: errorMsg })
+			enqueue({ type: "error", error: `Agent error: ${errorMsg}` })
 			done = true
 			if (resolveWaiting) {
 				resolveWaiting()
@@ -453,6 +497,50 @@ class PiAgentSession implements AgentSession {
 				createdAt: new Date().toISOString(),
 			}
 			this.messages.push(assistantMsg)
+
+			// Record reinforcement signals for memories that were injected and used.
+			// This improves future retrieval by boosting the salience of helpful memories.
+			if (injectedMemoryIds.length > 0) {
+				try {
+					// Simple heuristic: if the response references content from injected memories,
+					// mark them as "used". This is a basic implementation — could be made more
+					// sophisticated with LLM-based correlation in the future.
+					let usedCount = 0
+					let ignoredCount = 0
+
+					for (const entityId of injectedMemoryIds) {
+						// For now, we can't easily correlate entity IDs back to content
+						// without querying the engine again. Use a simple heuristic:
+						// if the response is longer than 50 chars, assume memories were useful.
+						// TODO: Implement proper content-based correlation
+						const wasUsed = fullResponseText.length > 50
+						await this.memoryBridge.recordUsage(entityId, wasUsed ? "used" : "ignored")
+						if (wasUsed) usedCount++
+						else ignoredCount++
+					}
+
+					log.info("Memory reinforcement recorded", { usedCount, ignoredCount, totalInjected: injectedMemoryIds.length })
+				} catch (err) {
+					log.warn("Memory reinforcement failed (non-fatal)", {
+						error: err instanceof Error ? err.message : String(err),
+					})
+				}
+			}
+
+			// Post-turn memory ingestion: extract memorable facts from this exchange
+			// and store them so future conversations can recall them.
+			// This is non-blocking and non-critical — errors are logged and ignored.
+			extractFacts(this.model, this.apiKey, content, fullResponseText)
+				.then((facts) => {
+					if (facts.length === 0) return
+					log.info("Memory: ingesting extracted facts", { count: facts.length })
+					return this.memoryBridge.ingestFacts(facts)
+				})
+				.catch((err: unknown) => {
+					log.warn("Memory ingestion failed (non-fatal)", {
+						error: err instanceof Error ? err.message : String(err),
+					})
+				})
 		}
 	}
 
@@ -469,6 +557,18 @@ class PiAgentSession implements AgentSession {
 	getMessages(): AgentMessage[] {
 		return this.messages
 	}
+
+	/** Shutdown the session — run GC and shut down the memory bridge. */
+	async dispose(): Promise<void> {
+		try {
+			await this.memoryBridge.gc()
+		} catch (err) {
+			log.warn("Memory GC on dispose failed (non-fatal)", {
+				error: err instanceof Error ? err.message : String(err),
+			})
+		}
+		this.memoryBridge.shutdown()
+	}
 }
 
 export class PiAgentProvider implements AgentProvider {
@@ -478,4 +578,4 @@ export class PiAgentProvider implements AgentProvider {
 	createSession(opts: AgentSessionOpts): AgentSession {
 		return new PiAgentSession(opts)
 	}
-}
+}
\ No newline at end of file
diff --git a/packages/agents/src/pi/memory.ts b/packages/agents/src/pi/memory.ts
new file mode 100644
index 0000000..de01989
--- /dev/null
+++ b/packages/agents/src/pi/memory.ts
@@ -0,0 +1,91 @@
+/**
+ * LLM-based fact extraction for agent memory.
+ *
+ * After each conversation turn, we ask the active model to extract memorable
+ * facts from the exchange and return them as ExtractedFact objects for ingestion
+ * into the zosma-mem bridge. Extension path resolution lives in @openzosma/zosma-mem.
+ */
+
+import { completeSimple } from "@mariozechner/pi-ai"
+import type { Api, Model } from "@mariozechner/pi-ai"
+import { createLogger } from "@openzosma/logger"
+import type { ExtractedFact } from "@openzosma/zosma-mem/bridge"
+
+const log = createLogger({ component: "agents:memory" })
+
+const EXTRACTION_SYSTEM_PROMPT = `You are a memory extraction assistant. Your job is to identify facts worth
+remembering long-term from a conversation exchange.
+
+Extract facts that are:
+- User preferences (favorite things, dislikes, habits)
+- Decisions made by the user
+- Constraints or rules the user has stated
+- Personal information the user shared
+- Repeating patterns or explicit instructions
+
+Do NOT extract:
+- Facts that are only relevant to the current task
+- Temporary states ("I'm tired today")
+- Questions without answers
+- Generic statements that apply to everyone
+
+Return a JSON array. Each element must be an object with:
+- "content": a self-contained, third-person statement of the fact (e.g. "User's favorite animal is elephant")
+- "type": one of "preference" | "decision" | "pattern" | "error"
+- "tags": array of 2-5 lowercase keywords
+
+If nothing is worth remembering, return an empty array: []
+
+Respond with ONLY the JSON array. No explanation, no markdown fences.`
+
+/**
+ * Use the active LLM to extract memorable facts from a single conversation turn.
+ * Returns an empty array on any error — this is a non-critical background path.
+ */
+export const extractFacts = async (
+  model: Model<Api>,
+  apiKey: string,
+  userMessage: string,
+  assistantResponse: string,
+): Promise<ExtractedFact[]> => {
+  if (!userMessage.trim() || !assistantResponse.trim()) return []
+
+  const prompt = `User: ${userMessage}\n\nAssistant: ${assistantResponse}`
+
+  try {
+    const result = await completeSimple(
+      model,
+      {
+        systemPrompt: EXTRACTION_SYSTEM_PROMPT,
+        messages: [{ role: "user", content: prompt, timestamp: Date.now() }],
+      },
+      { apiKey, maxTokens: 512 },
+    )
+
+    const text = result.content
+      .filter((c): c is { type: "text"; text: string } => c.type === "text")
+      .map((c) => c.text)
+      .join("")
+      .trim()
+
+    if (!text) return []
+
+    const parsed: unknown = JSON.parse(text)
+
+    if (!Array.isArray(parsed)) return []
+
+    return parsed.filter(
+      (item): item is ExtractedFact =>
+        typeof item === "object" &&
+        item !== null &&
+        typeof (item as Record<string, unknown>).content === "string" &&
+        ["preference", "decision", "pattern", "error"].includes((item as Record<string, unknown>).type as string) &&
+        Array.isArray((item as Record<string, unknown>).tags),
+    )
+  } catch (err) {
+    log.warn("Memory extraction failed (non-fatal)", {
+      error: err instanceof Error ? err.message : String(err),
+    })
+    return []
+  }
+}
diff --git a/packages/memory/package.json b/packages/memory/package.json
deleted file mode 100644
index 180f363..0000000
--- a/packages/memory/package.json
+++ /dev/null
@@ -1,25 +0,0 @@
-{
-	"name": "@openzosma/memory",
-	"version": "0.1.0",
-	"private": true,
-	"type": "module",
-	"main": "dist/index.js",
-	"types": "dist/index.d.ts",
-	"exports": {
-		".": {
-			"types": "./dist/index.d.ts",
-			"import": "./dist/index.js"
-		}
-	},
-	"scripts": {
-		"build": "tsc",
-		"check": "tsc --noEmit",
-		"test": "vitest --run"
-	},
-	"devDependencies": {
-		"@types/node": "^22.15.2",
-		"typescript": "^5.7.3",
-		"vitest": "^3.0.0",
-		"zosma-mem": "link:../zosma-mem"
-	}
-}
diff --git a/packages/memory/src/bootstrap.test.ts b/packages/memory/src/bootstrap.test.ts
deleted file mode 100644
index 198e195..0000000
--- a/packages/memory/src/bootstrap.test.ts
+++ /dev/null
@@ -1,68 +0,0 @@
-import { afterEach, beforeEach, describe, expect, it } from "vitest"
-import { bootstrapMemory } from "./bootstrap.js"
-import { applyMemoryEnv } from "./config.js"
-
-describe("applyMemoryEnv", () => {
-	const saved: Record<string, string | undefined> = {}
-
-	beforeEach(() => {
-		for (const key of ["PI_MEMORY_DIR", "PI_MEMORY_QMD_UPDATE", "PI_MEMORY_NO_SEARCH"]) {
-			saved[key] = process.env[key]
-			delete process.env[key]
-		}
-	})
-
-	afterEach(() => {
-		for (const [key, val] of Object.entries(saved)) {
-			if (val === undefined) delete process.env[key]
-			else process.env[key] = val
-		}
-	})
-
-	it("sets PI_MEMORY_DIR to default subdir", () => {
-		const dir = applyMemoryEnv({ workspaceDir: "/home/agent" })
-		expect(dir).toBe("/home/agent/.pi/agent/memory")
-		expect(process.env.PI_MEMORY_DIR).toBe("/home/agent/.pi/agent/memory")
-	})
-
-	it("uses explicit memoryDir when provided", () => {
-		const dir = applyMemoryEnv({ workspaceDir: "/home/agent", memoryDir: "/custom/mem" })
-		expect(dir).toBe("/custom/mem")
-		expect(process.env.PI_MEMORY_DIR).toBe("/custom/mem")
-	})
-
-	it("sets qmd update mode", () => {
-		applyMemoryEnv({ workspaceDir: "/w", qmdUpdateMode: "manual" })
-		expect(process.env.PI_MEMORY_QMD_UPDATE).toBe("manual")
-	})
-
-	it("does not set qmd update mode when not specified", () => {
-		applyMemoryEnv({ workspaceDir: "/w" })
-		expect(process.env.PI_MEMORY_QMD_UPDATE).toBeUndefined()
-	})
-
-	it("sets PI_MEMORY_NO_SEARCH when disableSearch is true", () => {
-		applyMemoryEnv({ workspaceDir: "/w", disableSearch: true })
-		expect(process.env.PI_MEMORY_NO_SEARCH).toBe("1")
-	})
-})
-
-describe("bootstrapMemory", () => {
-	beforeEach(() => {
-		process.env.PI_MEMORY_DIR = undefined
-	})
-
-	afterEach(() => {
-		process.env.PI_MEMORY_DIR = undefined
-	})
-
-	it("sets memoryDir in result", () => {
-		const result = bootstrapMemory({ workspaceDir: "/home/agent" })
-		expect(result.memoryDir).toBe("/home/agent/.pi/agent/memory")
-	})
-
-	it("sets PI_MEMORY_DIR env var", () => {
-		bootstrapMemory({ workspaceDir: "/home/agent" })
-		expect(process.env.PI_MEMORY_DIR).toBe("/home/agent/.pi/agent/memory")
-	})
-})
diff --git a/packages/memory/src/bootstrap.ts b/packages/memory/src/bootstrap.ts
deleted file mode 100644
index 4c36d84..0000000
--- a/packages/memory/src/bootstrap.ts
+++ /dev/null
@@ -1,17 +0,0 @@
-import { applyMemoryEnv } from "./config.js"
-import type { MemoryBootstrapResult, MemoryConfig } from "./types.js"
-
-/**
- * Bootstrap the memory system for an agent pod session.
- *
- * Sets environment variables (PI_MEMORY_DIR, etc.) so the pre-installed
- * pi-memory and pi-extension-observational-memory extensions pick up the
- * correct workspace-scoped memory directory at session startup.
- *
- * Extensions are installed at image build time via extensions.json — no
- * runtime path resolution is needed here.
- */
-export function bootstrapMemory(config: MemoryConfig): MemoryBootstrapResult {
-	const memoryDir = applyMemoryEnv(config)
-	return { memoryDir }
-}
diff --git a/packages/memory/src/config.ts b/packages/memory/src/config.ts
deleted file mode 100644
index 0fd2547..0000000
--- a/packages/memory/src/config.ts
+++ /dev/null
@@ -1,24 +0,0 @@
-import { join } from "node:path"
-import type { MemoryConfig } from "./types.js"
-
-const DEFAULT_MEMORY_SUBDIR = ".pi/agent/memory"
-
-/**
- * Apply memory-related environment variables before extensions are loaded.
- * Must be called before the pi session is created.
- */
-export function applyMemoryEnv(config: MemoryConfig): string {
-	const memoryDir = config.memoryDir ?? join(config.workspaceDir, DEFAULT_MEMORY_SUBDIR)
-
-	process.env.PI_MEMORY_DIR = memoryDir
-
-	if (config.qmdUpdateMode) {
-		process.env.PI_MEMORY_QMD_UPDATE = config.qmdUpdateMode
-	}
-
-	if (config.disableSearch) {
-		process.env.PI_MEMORY_NO_SEARCH = "1"
-	}
-
-	return memoryDir
-}
diff --git a/packages/memory/src/index.ts b/packages/memory/src/index.ts
deleted file mode 100644
index 704bd79..0000000
--- a/packages/memory/src/index.ts
+++ /dev/null
@@ -1,3 +0,0 @@
-export { bootstrapMemory } from "./bootstrap.js"
-export { applyMemoryEnv } from "./config.js"
-export type { MemoryConfig, MemoryBootstrapResult } from "./types.js"
diff --git a/packages/memory/src/types.ts b/packages/memory/src/types.ts
deleted file mode 100644
index cd2878f..0000000
--- a/packages/memory/src/types.ts
+++ /dev/null
@@ -1,17 +0,0 @@
-/** Configuration for the memory bootstrap */
-export interface MemoryConfig {
-	/** Root workspace directory for the agent pod (e.g. /home/agent) */
-	workspaceDir: string
-	/** Override PI_MEMORY_DIR (default: <workspaceDir>/.pi/agent/memory) */
-	memoryDir?: string
-	/** Override qmd update mode: background | manual | off */
-	qmdUpdateMode?: "background" | "manual" | "off"
-	/** Disable selective memory injection (for A/B testing) */
-	disableSearch?: boolean
-}
-
-/** Result of bootstrapping the memory extensions */
-export interface MemoryBootstrapResult {
-	/** The resolved memory directory */
-	memoryDir: string
-}
diff --git a/packages/memory/tsconfig.json b/packages/memory/tsconfig.json
deleted file mode 100644
index 12445ec..0000000
--- a/packages/memory/tsconfig.json
+++ /dev/null
@@ -1,8 +0,0 @@
-{
-	"extends": "../../tsconfig.base.json",
-	"compilerOptions": {
-		"outDir": "dist",
-		"rootDir": "src"
-	},
-	"include": ["src"]
-}
diff --git a/packages/zosma-mem/IMPLEMENTATION_PLAN.md b/packages/zosma-mem/IMPLEMENTATION_PLAN.md
deleted file mode 100644
index 8fe4739..0000000
--- a/packages/zosma-mem/IMPLEMENTATION_PLAN.md
+++ /dev/null
@@ -1,407 +0,0 @@
-# zosma-mem Implementation Plan
-
-> Replace `@openzosma/memory` (thin env-var bootstrap) with `zosma-mem` as the unified memory package — salience-driven, attention-aware, eval-instrumented.
-
----
-
-## Current State
-
-### `packages/zosma-mem` (this package)
-- Eval-only: 7 scenarios, adapter interface, CLI runner, metrics (P@K, R@K, MRR, noise, GC effectiveness)
-- No engine implementation — only the `MemoryAdapter` contract and test harness
-- Published as `zosma-mem`, exports `zosma-mem/evals`
-
-### `packages/memory` (`@openzosma/memory`)
-- Thin bootstrap shim: sets `PI_MEMORY_DIR`, `PI_MEMORY_QMD_UPDATE`, `PI_MEMORY_NO_SEARCH` env vars
-- Used by `packages/agents/src/pi.agent.ts` via `bootstrapMemory()`
-- No intelligence — delegates everything to pi-brain extensions installed at image build time
-
-### Gap
-The two reference docs (NEW-MEMORY-INTEGRATION-PAPER.md, NEW-MEMORY-SURFACE-PLAN.md) describe a salience engine, attention-gated retrieval, reinforcement loop, GC, and co-access graph. None of this exists yet. The eval harness exists but has no real engine to test against.
-
----
-
-## Target State
-
-`packages/zosma-mem` becomes `@openzosma/zosma-mem` — the single memory package that:
-
-1. **Bootstraps** pi-brain memory (absorbs what `@openzosma/memory` does today)
-2. **Implements** the salience engine, attention retrieval, reinforcement loop, GC
-3. **Evaluates** itself via the existing eval harness with a self-adapter
-4. **Exports** a clean public API for `packages/agents` and `packages/gateway`
-
-`packages/memory` is deleted. All imports of `@openzosma/memory` point to `@openzosma/zosma-mem`.
-
----
-
-## Package Structure (Final)
-
-```
-packages/zosma-mem/
-  src/
-    index.ts                      # Public API re-exports
-    types.ts                      # Core types (MemoryEngine, MemoryEntity, MemoryScore, etc.)
-    config.ts                     # MemoryConfig + defaults
-
-    bootstrap/
-      env.ts                      # applyMemoryEnv() — absorbed from @openzosma/memory
-      init.ts                     # bootstrapMemory() — absorbed from @openzosma/memory
-
-    brain-adapter/
-      parser.ts                   # Parse commits.md via remark AST
-      state.ts                    # Read state.yaml, list branches
-      index.ts
-
-    engine/
-      salience.ts                 # computeSalience(score): number
-      attention.ts                # computeAttentionScore(query, entity): number
-      reinforcement.ts            # recordRead, recordIgnoredRead, recordDecisionInfluence
-      factory.ts                  # createMemoryEngine() — wires all subsystems
-      index.ts
-
-    store/
-      entity-store.ts             # Read/write .salience/*.yaml
-      co-access.ts                # co-access.json graph read/write
-      index.ts
-
-    ingestion/
-      event-bus.ts                # Typed EventEmitter for MemoryEvent
-      ingest.ts                   # Score → persist or discard
-      commit-indexer.ts           # Watch commits.md → extract entities → score → persist
-      index.ts
-
-    retrieval/
-      retrieve.ts                 # Top-K with attention gating + co-access boost
-      index.ts
-
-    gc/
-      decay.ts                    # Logarithmic time decay
-      prune.ts                    # Archive low-salience entities
-      consolidate.ts              # Merge related low-value clusters
-      index.ts
-
-    evals/                        # (existing — untouched)
-      types.ts
-      runner.ts
-      metrics.ts
-      report.ts
-      scenarios/
-      cli/
-      __tests__/
-      utils/
-      index.ts
-
-    adapter/
-      self-adapter.ts             # MemoryAdapter impl that wraps the real engine for eval
-
-  package.json
-  tsconfig.json
-  README.md
-  USAGE.md
-```
-
----
-
-## Phase Plan
-
-### Phase 0 — Absorb `@openzosma/memory` bootstrap
-
-**Files:** `src/bootstrap/env.ts`, `src/bootstrap/init.ts`
-
-1. Copy `applyMemoryEnv()` and `bootstrapMemory()` from `packages/memory/src/`
-2. Convert to arrow functions per project style
-3. Re-export from `src/index.ts` as `bootstrapMemory`, `applyMemoryEnv`
-4. Update `packages/agents/package.json`: replace `@openzosma/memory` with `@openzosma/zosma-mem`
-5. Update `packages/agents/src/pi.agent.ts`: change import path
-6. Delete `packages/memory/` entirely
-7. Update root `pnpm-workspace.yaml` if needed
-8. Run `pnpm install && pnpm run check`
-
-**Tests:** `src/bootstrap/__tests__/env.test.ts` — verify env vars are set correctly
-
-**Agent instructions:** This is a mechanical move. Copy the 4 source files verbatim, convert `function` to arrow syntax, update imports, delete the old package.
-
----
-
-### Phase 1 — Types + Salience Engine
-
-**Files:** `src/types.ts`, `src/config.ts`, `src/engine/salience.ts`
-
-1. Define core types from the paper:
-   - `MemoryScore` — `{ reuseCount, decisionInfluence, ignoredReads, lastAccessed, attentionWeight }`
-   - `MemoryEntity` — `{ id, source: { branch, commitRef }, score, tags, content }`
-   - `MemoryEvent` (engine-internal, distinct from eval `MemoryEvent`) — `{ id, type, context, attentionWeight?, metadata?, timestamp }`
-   - `MemoryConfig` — `{ memoryDir, salienceThreshold?, gcIntervalMs?, summarizer? }`
-   - `Summarizer` — `(texts: string[]) => Promise<string>`
-   - `AttentionQuery` — `{ taskDescription, activeToolName?, intent? }`
-   - `ScoredEntity` — `{ entity, attentionScore }`
-   - `GcReport` — `{ decayed, pruned, consolidated }`
-
-2. Implement `computeSalience(score: MemoryScore): number`:
-   ```
-   S(e) = 2*reuseCount + 5*decisionInfluence - 2*ignoredReads - ln(1 + ageDays)
-   ```
-
-3. Implement `meetsThreshold(salience: number, threshold: number): boolean`
-
-**Tests:** `src/engine/__tests__/salience.test.ts`
-- Fresh entity → salience = 0 (passes threshold 0, fails threshold 0.4)
-- Decision entity → salience = 5 (high)
-- Heavily ignored entity → negative salience
-- Time decay: 30 days → ~3.4 decay
-
-**Agent instructions:** Pure functions, no I/O. Use the exact formula from the paper. `ageDays = (Date.now() - lastAccessed) / 86_400_000` — but accept a `now` parameter for testability.
-
----
-
-### Phase 2 — Brain Adapter
-
-**Files:** `src/brain-adapter/parser.ts`, `src/brain-adapter/state.ts`
-
-1. `parseCommits(markdown: string): ParsedCommit[]` — parse `commits.md` using `unified` + `remark-parse` into structured commit objects (heading, body, ref)
-2. `readState(memoryDir: string): MemoryState` — parse `state.yaml` via `yaml` package
-3. `listBranches(memoryDir: string): string[]` — read `.memory/branches/` directory
-
-**Dependencies to add:** `unified`, `remark-parse`, `yaml`
-
-**Tests:** `src/brain-adapter/__tests__/parser.test.ts` — parse sample commits.md fixtures
-
-**Agent instructions:** Use `unified().use(remarkParse).parse(markdown)` to get an MDAST. Walk heading nodes to extract commit boundaries. Do NOT use regex.
-
----
-
-### Phase 3 — Entity Store
-
-**Files:** `src/store/entity-store.ts`, `src/store/co-access.ts`
-
-1. `EntityStore` class:
-   - `read(entityId: string): MemoryEntity | undefined` — read `.salience/<id>.yaml`
-   - `write(entity: MemoryEntity): void` — write `.salience/<id>.yaml`
-   - `list(): string[]` — list all entity IDs
-   - `archive(entityId: string): void` — move to `.salience/archive/`
-   - `ensureDir(): void` — create `.salience/` and `.salience/archive/` if needed
-
-2. `CoAccessGraph` class:
-   - `load(memoryDir: string): Record<string, string[]>`
-   - `save(memoryDir: string, graph: Record<string, string[]>): void`
-   - `recordCoAccess(graph, entityIds: string[]): void` — update bidirectional edges
-
-**Dependencies to add:** `yaml` (already from phase 2)
-
-**Tests:** `src/store/__tests__/entity-store.test.ts` — write/read/list/archive round-trip in temp dir
-
-**Agent instructions:** Use synchronous `fs` for reads (small YAML files). Async for writes. YAML format must match the paper's schema exactly.
-
----
-
-### Phase 4 — Ingestion + Commit Indexer
-
-**Files:** `src/ingestion/event-bus.ts`, `src/ingestion/ingest.ts`, `src/ingestion/commit-indexer.ts`
-
-1. `EventBus` — typed `EventEmitter` for `MemoryEvent` lifecycle (ingested, discarded, scored)
-2. `ingest(event: MemoryEvent, store: EntityStore, config: MemoryConfig): boolean` — compute salience, persist if above threshold, return true/false
-3. `CommitIndexer`:
-   - Parse commits.md via brain adapter
-   - Track processed commit refs (stored in `.salience/.indexed` file)
-   - Extract entities from each unprocessed commit
-   - Call `ingest()` for each
-   - `reindex()` — idempotent full re-index
-
-**Dependencies to add:** `chokidar` (for watch mode — optional, can defer)
-
-**Tests:** `src/ingestion/__tests__/ingest.test.ts` — event above threshold persists, below threshold discards
-
-**Agent instructions:** CommitIndexer.reindex() must be idempotent. Store processed refs as a JSON array in `.salience/.indexed`. The cold-start case (no .indexed file) processes all commits.
-
----
-
-### Phase 5 — Attention-Gated Retrieval
-
-**Files:** `src/retrieval/retrieve.ts`
-
-1. `retrieve(query: AttentionQuery, store: EntityStore, coAccess: CoAccessGraph, topK: number): ScoredEntity[]`
-2. Attention score: `A(q, e) = 3*tagOverlap(q, e) + S(e) + coAccessBoost(e)`
-   - `tagOverlap` = count of entity tags appearing in `query.taskDescription` (case-insensitive)
-   - `coAccessBoost` = +1 if any co-accessed entity is also in the current result set (two-pass)
-3. Sort by attention score descending, return top-K
-4. After retrieval, update co-access graph for the returned entity set
-
-**Tests:** `src/retrieval/__tests__/retrieve.test.ts`
-- High tag overlap beats high salience with no overlap
-- Co-access boost surfaces related entities
-
-**Agent instructions:** Two-pass retrieval: first pass computes base scores (tag overlap + salience), take top 2K candidates. Second pass adds co-access boost among candidates, re-sort, return top-K.
-
----
-
-### Phase 6 — Reinforcement
-
-**Files:** `src/engine/reinforcement.ts`
-
-1. `recordRead(entityId, store)` → `reuseCount += 1`, update `lastAccessed`
-2. `recordIgnoredRead(entityId, store)` → `ignoredReads += 1`
-3. `recordDecisionInfluence(entityId, store)` → `decisionInfluence += 1`, update `lastAccessed`
-
-**Tests:** `src/engine/__tests__/reinforcement.test.ts` — counters increment, lastAccessed updates
-
-**Agent instructions:** Each function reads the entity, mutates the score, writes back. Simple read-modify-write. No locking needed (single-process).
-
----
-
-### Phase 7 — Engine Factory
-
-**Files:** `src/engine/factory.ts`
-
-1. `createMemoryEngine(config: MemoryConfig): MemoryEngine`
-   - Instantiate `EntityStore`, `CoAccessGraph`, `CommitIndexer`
-   - Wire `ingest`, `retrieve`, `recordRead`, `recordIgnoredRead`, `recordDecisionInfluence`, `reindex`, `gc`, `shutdown`
-   - Start GC interval timer
-   - Return the `MemoryEngine` interface
-
-**Tests:** `src/engine/__tests__/factory.test.ts` — create engine, ingest event, retrieve it, shutdown
-
-**Agent instructions:** The engine is the composition root. It owns the lifecycle of the GC timer. `shutdown()` clears the timer. All methods delegate to the subsystem modules.
-
----
-
-### Phase 8 — Garbage Collection
-
-**Files:** `src/gc/decay.ts`, `src/gc/prune.ts`, `src/gc/consolidate.ts`
-
-1. `decay(store: EntityStore, now: number)` — recompute salience for all entities, write updated scores
-2. `prune(store: EntityStore, threshold: number)` — archive entities below threshold for N consecutive cycles (track cycle count in `.salience/<id>.yaml` as `belowThresholdCycles`)
-3. `consolidate(store, coAccess, summarizer?)` — find clusters of co-accessed entities all below threshold, merge into single summary entity
-
-**Tests:** `src/gc/__tests__/gc.test.ts`
-- Decay reduces salience of old entities
-- Prune archives after N cycles
-- Consolidate merges cluster into one entity
-
-**Agent instructions:** Prune should NOT archive on the first cycle below threshold. Default: archive after 3 consecutive cycles below threshold (configurable). If no summarizer provided, consolidate concatenates content with `\n---\n` separators and truncates to 2000 chars.
-
----
-
-### Phase 9 — Self-Adapter for Evals
-
-**Files:** `src/adapter/self-adapter.ts`
-
-1. Implement `MemoryAdapter` (from `src/evals/types.ts`) wrapping `createMemoryEngine()`
-2. Map between eval types and engine types:
-   - `MemoryEvent` (eval) → `MemoryEvent` (engine)
-   - `RetrieveQuery` → `AttentionQuery`
-   - `RetrievedEntity` ← `ScoredEntity`
-   - `UsageSignal` → `recordRead` / `recordIgnoredRead` / `recordDecisionInfluence`
-   - `GcResult` ← `GcReport`
-3. `setup()` creates engine with `opts.workDir` as memoryDir, injects deterministic clock
-4. `teardown()` calls `engine.shutdown()`
-
-**Tests:** Run the existing 7 eval scenarios against the self-adapter:
-```bash
-pnpm --filter zosma-mem run eval
-```
-
-**Agent instructions:** The self-adapter is the bridge that proves the engine works. All 7 scenarios must pass. The deterministic clock must be injected into the salience engine's `now` parameter — do NOT use `Date.now()` in any engine code; always accept a clock/now parameter.
-
----
-
-### Phase 10 — Integration + Cleanup
-
-1. Update `packages/zosma-mem/package.json`:
-   - Rename to `@openzosma/zosma-mem`
-   - Add dependencies: `yaml`, `unified`, `remark-parse`, `pino`, `p-limit`, `chokidar`
-   - Add bootstrap exports: `"./bootstrap"` export path
-   - Keep `"./evals"` export path
-
-2. Update `packages/agents/package.json`:
-   - Replace `"@openzosma/memory": "workspace:*"` with `"@openzosma/zosma-mem": "workspace:*"`
-
-3. Update `packages/agents/src/pi.agent.ts`:
-   - `import { bootstrapMemory } from "@openzosma/zosma-mem/bootstrap"`
-
-4. Update `packages/gateway/src/session-manager.ts` (if it references `@openzosma/memory`)
-
-5. Delete `packages/memory/`
-
-6. Run:
-   ```bash
-   pnpm install
-   pnpm run check        # zero errors
-   pnpm run build         # clean build
-   pnpm --filter @openzosma/zosma-mem run test   # all unit tests
-   pnpm --filter @openzosma/zosma-mem run eval   # all 7 scenarios pass
-   ```
-
----
-
-## Dependency Map
-
-```
-packages/agents
-  └── @openzosma/zosma-mem (bootstrap + engine)
-
-packages/gateway
-  └── @openzosma/zosma-mem (engine — future: per-session memory)
-
-@openzosma/zosma-mem
-  ├── yaml          — .salience/*.yaml, state.yaml
-  ├── unified       — markdown AST parsing
-  ├── remark-parse  — commits.md parser
-  ├── zod           — schema validation (already present)
-  ├── pino          — structured logging
-  ├── p-limit       — concurrency control
-  ├── chokidar      — watch commits.md (optional, deferred)
-  └── pi-brain      — peer dep (reads .memory/)
-```
-
----
-
-## Critical Constraints
-
-1. **Never mutate pi-brain files.** All scoring metadata lives in `.salience/` sidecar.
-2. **No `Date.now()` in engine code.** All time-sensitive logic accepts a `now` parameter or clock interface for deterministic testing.
-3. **No vector DB.** Tag-overlap proxy is the MVP retrieval mechanism. `computeAttentionScore` is a single function — swappable for embeddings later.
-4. **No LLM dependency.** `Summarizer` is a callback. If not provided, consolidation uses concatenation.
-5. **Arrow functions everywhere.** Per project coding standards.
-6. **No `any` types.** Strict TypeScript throughout.
-7. **pi-brain as peer dep.** Read `.memory/` files, never import pi-brain internals.
-8. **Existing eval scenarios must not break.** The adapter contract (`MemoryAdapter`) is frozen.
-
----
-
-## Agent Execution Order
-
-For Claude Sonnet 4.6 executing this plan:
-
-```
-Phase 0  ──→  Phase 1  ──→  Phase 2  ──→  Phase 3
-                                              │
-Phase 4  ←────────────────────────────────────┘
-   │
-Phase 5  ──→  Phase 6  ──→  Phase 7  ──→  Phase 8
-                                              │
-Phase 9  ←────────────────────────────────────┘
-   │
-Phase 10
-```
-
-**Parallelizable pairs:**
-- Phase 1 + Phase 2 (no dependency)
-- Phase 5 + Phase 6 (both depend on store, independent of each other)
-
-**Serial gates:**
-- Phase 3 must complete before Phase 4 (ingestion needs store)
-- Phase 7 must complete before Phase 8 (GC needs engine)
-- Phase 9 must complete before Phase 10 (eval validates the engine)
-
-Each phase should end with `pnpm run check` passing. Each phase with tests should end with `pnpm --filter @openzosma/zosma-mem run test` passing.
-
----
-
-## Success Criteria
-
-1. `packages/memory/` is deleted
-2. `@openzosma/zosma-mem` exports `bootstrapMemory`, `createMemoryEngine`, `runEvals`
-3. `pnpm run check` — zero errors across the monorepo
-4. `pnpm --filter @openzosma/zosma-mem run test` — all unit tests pass
-5. `pnpm --filter @openzosma/zosma-mem run eval` — all 7 scenarios pass against the self-adapter
-6. No `@openzosma/memory` references remain anywhere in the codebase
diff --git a/packages/zosma-mem/README.md b/packages/zosma-mem/README.md
index 73f6ed1..8199d2d 100644
--- a/packages/zosma-mem/README.md
+++ b/packages/zosma-mem/README.md
@@ -1,136 +1,177 @@
-# zosma-mem
+# @openzosma/zosma-mem
 
-**Standalone CLI for evaluating agentic memory systems**
+**Memory engine with bridge for agent integration**
 
-A zero-config evaluation tool that automatically detects and tests memory systems against standardized information retrieval scenarios.
+A file-based memory system with salience scoring, tag-based retrieval, and reinforcement learning. Provides cross-conversation memory persistence for AI agents, with a clean bridge interface for session lifecycle integration.
 
 ## Installation
 
 ```bash
-# For development (current)
-cd packages/zosma-mem
-npm install -g .
-
-# After publishing
-npm install -g zosma-mem
+# In OpenZosma workspace
+pnpm add @openzosma/zosma-mem
 ```
 
-## Usage
+## Core Concepts
 
-```bash
-# Auto-detect and evaluate memory system
-zosma-mem
+### Salience Engine
 
-# Run specific scenarios
-zosma-mem --scenarios "cold-start,signal-dilution"
+The memory system uses **attention-based salience scoring** to prioritize facts:
 
-# Output JSON instead of markdown
-zosma-mem --json
+- **Reuse count** - How often a fact has been retrieved
+- **Decision influence** - How often a fact led to agent actions
+- **Time decay** - Recent facts rank higher than old ones
+- **Ignored reads** - Facts that didn't help get demoted
 
-# Save report to file
-zosma-mem --out report.md
-```
+### Tag-Based Retrieval
 
-## What It Does
+Facts are retrieved using semantic tags rather than embeddings:
 
-zosma-mem evaluates memory systems against 7 standardized scenarios:
+```typescript
+// Retrieve memories relevant to a task
+const results = await engine.retrieve({
+  taskDescription: "fix the authentication bug",
+  intent: "auth security debugging"
+}, 8)
+```
 
-- **Cold start** - Basic ingestion and retrieval
-- **Signal dilution** - Handling noise at scale
-- **Repeated patterns** - Reinforcement learning
-- **Stale memory** - Time-based decay
-- **Conflicts** - Update resolution
-- **Context awareness** - Cross-context relevance
-- **Co-access clusters** - Relational recall
+### Cross-Conversation Persistence
 
-## Auto-Detection
+Memory persists across conversations via stable per-agent directories:
 
-zosma-mem automatically detects memory systems:
+```
+workspace/agents/<agentConfigId>/memory/
+├── .salience/          # YAML files with scored entities
+├── .salience/archive/  # Pruned entities
+└── .salience/co-access # Access pattern correlations
+```
 
-1. **OpenZosma**: `packages/gateway/workspace/agents/default/memory/MEMORY.md`
-2. **Generic file**: `MEMORY.md`, `memory.md`, or `.memory.md`
+## Usage
 
-## Example Output
+### Basic Engine Usage
 
-```
-✅ Found openzosma memory at packages/gateway/workspace/agents/default/memory/MEMORY.md
+```typescript
+import { createMemoryEngine } from "@openzosma/zosma-mem"
 
-## zosma-mem Eval Report -- 2026-04-08T10:00:00Z
+const engine = createMemoryEngine({
+  memoryDir: "/path/to/memory",
+  salienceThreshold: 0.4,  // Minimum salience to keep
+  gcIntervalMs: 3600000,   // GC every hour
+})
+
+// Ingest facts
+await engine.ingest({
+  id: "user-pref-dark",
+  type: "preference",
+  content: "User prefers dark mode interfaces",
+  tags: ["ui", "theme", "preference"],
+  timestamp: Date.now(),
+})
 
-| Scenario            | P@K   | R@K   | MRR   | Noise | Pass |
-| ------------------- | ----- | ----- | ----- | ----- | ---- |
-| Cold start          | 0.800 | 1.000 | 1.000 | 0.100 | yes  |
-| Signal dilution     | 0.600 | 1.000 | 1.000 | 0.900 | yes  |
-| Repeated pattern    | 0.200 | 1.000 | 1.000 | 0.000 | NO   |
-| ...                 |      |      |      |       |      |
+// Retrieve relevant memories
+const results = await engine.retrieve({
+  taskDescription: "design the new UI",
+  intent: "interface design"
+}, 5)
 
-Summary: 3/7 passed. Avg P@K: 0.37
-❌ 4 tests failed
+console.log(results.map(r => ({
+  content: r.entity.content,
+  score: r.attentionScore
+})))
 ```
 
-## Metrics Explained
+### Agent Bridge Integration
 
-- **P@K**: Precision@K - How many of top-K results are relevant
-- **R@K**: Recall@K - How many relevant items found in top-K
-- **MRR**: Mean Reciprocal Rank - How quickly relevant items appear
-- **Noise**: Fraction of stored items never retrieved
+For AI agent sessions, use the bridge interface:
 
-## Usage in OpenZosma (Current Development)
+```typescript
+import { createMemoryBridge } from "@openzosma/zosma-mem/bridge"
 
-Install zosma-mem globally for development:
+const bridge = createMemoryBridge({
+  memoryDir: "/workspace/agents/config-123/memory",
+  topK: 8  // Max memories per turn
+})
 
-```bash
-# From the zosma-mem package directory
-cd packages/zosma-mem
-npm install -g .
+// Before each agent turn
+const context = await bridge.loadContext("user's question")
+if (context) {
+  await session.steer(context)  // Inject memory into prompt
+}
 
-# Now use from anywhere
-zosma-mem
-```
+// After each turn, extract and store facts
+const facts = await extractFacts(model, apiKey, userMsg, assistantResponse)
+await bridge.ingestFacts(facts)
 
-The tool automatically detects your OpenZosma memory system and runs the evaluation.
+// Track reinforcement
+await bridge.recordUsage(entityId, "used")  // or "ignored" or "influenced_decision"
+```
 
-## Advanced Usage
+### Extension Path Resolution
 
-### Programmatic API
+For pi-brain and pi-dcp extensions:
 
 ```typescript
-import { runEvals, builtInScenarios } from "zosma-mem/evals"
+import { resolveMemoryExtensionPaths } from "@openzosma/zosma-mem/bridge"
 
-const report = await runEvals({
-  adapter: myCustomAdapter,
-  scenarios: builtInScenarios,
-  k: 5
-})
+const { paths, missing } = resolveMemoryExtensionPaths()
+if (missing.length > 0) {
+  console.warn("Missing extensions:", missing)
+}
+
+// Use paths with DefaultResourceLoader
 ```
 
-### Custom Adapters
+## Memory Types
+
+The system handles different categories of facts:
+
+- **preference** - User likes/dislikes, habits
+- **decision** - Choices made, constraints set
+- **pattern** - Repeating behaviors, workflows
+- **error** - Mistakes, lessons learned
 
-For custom memory systems, implement the MemoryAdapter interface:
+## Garbage Collection
+
+Automatic cleanup runs periodically:
+
+- **Decay** - Reduce salience of old/unused facts
+- **Prune** - Remove facts below salience threshold
+- **Consolidate** - Merge similar entities
 
 ```typescript
-import { MemoryAdapter, MemoryEvent } from "zosma-mem/evals"
+// Manual GC
+const report = await engine.gc()
+console.log(`${report.pruned} pruned, ${report.decayed} decayed`)
+```
 
-const adapter: MemoryAdapter = {
-  setup: async (opts) => { /* initialize */ },
-  ingest: async (event: MemoryEvent) => { /* store */ },
-  retrieve: async (query, topK) => { /* search */ },
-  // ... other methods
+## Configuration
+
+```typescript
+interface MemoryConfig {
+  memoryDir: string                    // Required: where to store files
+  salienceThreshold?: number          // Default: 0.4
+  gcIntervalMs?: number               // Default: 3,600,000 (1 hour)
+  gcPruneCycles?: number              // Default: 1
+  summarizer?: (texts: string[]) => Promise<string>
+  now?: () => number                  // For testing
 }
 ```
 
-## Publishing
+## Architecture
 
-This package is published to npm as `zosma-mem`. To publish updates:
+### Core Modules
 
-```bash
-# Build and test
-pnpm run build
-pnpm run test
+- **engine/** - Salience scoring, reinforcement, GC
+- **store/** - File-based entity storage with co-access patterns
+- **ingestion/** - Fact ingestion and scoring
+- **retrieval/** - Tag-based search with attention ranking
+- **gc/** - Decay, pruning, consolidation
+- **bridge/** - Agent session integration
 
-# Publish
-npm publish
-```
+### File Storage
+
+- **Entity files**: `.salience/*.yaml` - Individual facts with scores
+- **Archive**: `.salience/archive/` - Pruned entities
+- **Co-access**: `.salience/co-access` - Access pattern correlations
 
 ## Development
 
@@ -141,8 +182,15 @@ pnpm run build
 # Test
 pnpm run test
 
-# Run locally
-pnpm eval
+# Type check
+pnpm run check
+```
+
+## Publishing
+
+```bash
+pnpm run build && pnpm run test
+npm publish
 ```
 
-Built for developers who want to evaluate memory systems without configuration complexity. Made for OpenZosma, works with any memory system. 🚀
\ No newline at end of file
+Built for OpenZosma agents, works with any AI agent framework that needs persistent cross-conversation memory. 🚀
\ No newline at end of file
diff --git a/packages/zosma-mem/USAGE.md b/packages/zosma-mem/USAGE.md
deleted file mode 100644
index 8c324f0..0000000
--- a/packages/zosma-mem/USAGE.md
+++ /dev/null
@@ -1,187 +0,0 @@
-# zosma-mem Usage Guide
-
-**Standalone CLI for evaluating agentic memory systems**
-
-A zero-config evaluation tool that automatically detects and tests memory systems against standardized information retrieval scenarios.
-
-## Installation for Development
-
-Since zosma-mem isn't published yet, install it globally from source:
-
-```bash
-# From your OpenZosma project
-cd packages/zosma-mem
-npm install -g .
-
-# Now use from anywhere
-zosma-mem
-```
-
-## Usage Examples
-
-```bash
-# Basic evaluation
-zosma-mem
-
-# Run specific scenarios only
-zosma-mem --scenarios "cold-start,signal-dilution"
-
-# Output JSON instead of markdown
-zosma-mem --json
-
-# Save report to file
-zosma-mem --out memory-report.md
-```
-
-## CLI Options
-
-```bash
-zosma-mem [options]
-
-Options:
-  --scenarios <names>    Run specific scenarios (comma-separated)
-  --k <number>          Top-K for metrics (default: 5)
-  --json                Output JSON instead of markdown
-  --out <path>          Save report to file
-  --help                Show help
-```
-
-## What It Evaluates
-
-zosma-mem tests your memory system against 7 standardized scenarios:
-
-### ✅ Working Scenarios (Your Goals)
-- **Cold start** - Basic ingestion and retrieval
-- **Signal dilution** - Handling noise at scale
-- **Co-access cluster** - Relational recall
-
-### 🎯 Advanced Scenarios (Future Improvements)
-- **Repeated patterns** - Reinforcement learning
-- **Stale memory** - Time-based decay
-- **Conflicts** - Update resolution
-- **Context awareness** - Cross-context relevance
-
-## Example Output
-
-```
-✅ Found openzosma memory at packages/gateway/workspace/agents/default/memory/MEMORY.md
-
-## zosma-mem Eval Report -- 2026-04-08T10:00:00Z
-
-| Scenario            | P@K   | R@K   | MRR   | Noise | Pass |
-| ------------------- | ----- | ----- | ----- | ----- | ---- |
-| Cold start          | 0.600 | 1.000 | 1.000 | 0.500 | yes  |
-| Repeated pattern    | 0.200 | 1.000 | 1.000 | 0.000 | NO   |
-| Signal dilution     | 0.600 | 1.000 | 1.000 | 0.951 | yes  |
-| Stale memory        | 0.200 | 1.000 | 1.000 | 0.167 | NO   |
-| Conflicting updates | 0.200 | 1.000 | 1.000 | 0.000 | NO   |
-| Co-access cluster   | 0.600 | 1.000 | 1.000 | 0.000 | yes  |
-| Cross-context       | 0.200 | 1.000 | 1.000 | 0.000 | NO   |
-
-Summary: 3/7 passed. Avg P@K: 0.371, Avg R@K: 1.000, Avg MRR: 1.000
-```
-
-## Understanding Your Results
-
-### Current Status (3/7 passed)
-Your OpenZosma memory system handles basic operations well but lacks advanced features.
-
-### What the Scores Mean
-
-- **P@K (Precision@K)**: Fraction of top-5 results that are relevant
-  - 0.600 = 3/5 relevant results in top-5
-  - 0.200 = 1/5 relevant results in top-5
-
-- **R@K (Recall@K)**: Fraction of all relevant items found in top-5
-  - 1.000 = All relevant items found
-
-- **MRR (Mean Reciprocal Rank)**: How quickly relevant items appear
-  - 1.000 = Relevant items appear first
-
-- **Noise**: Fraction of stored items never retrieved
-  - Lower is better
-
-## Roadmap for OpenZosma Memory
-
-Use zosma-mem results to guide development:
-
-1. **Phase 1** ✅ Basic storage and retrieval
-2. **Phase 2** 🔄 Add reinforcement learning (repeated patterns)
-3. **Phase 3** 🔄 Add time-based decay (stale memory)
-4. **Phase 4** 🔄 Add conflict resolution
-5. **Phase 5** 🔄 Add context awareness
-
-## Advanced Usage
-
-### Programmatic Evaluation
-
-```typescript
-import { runEvals, builtInScenarios } from "zosma-mem/evals"
-
-const report = await runEvals({
-  adapter: myAdapter,
-  scenarios: builtInScenarios,
-  k: 5
-})
-```
-
-### Custom Memory Adapters
-
-For non-OpenZosma memory systems:
-
-```typescript
-import { MemoryAdapter, MemoryEvent } from "zosma-mem/evals"
-
-const adapter: MemoryAdapter = {
-  setup: async (opts) => { /* init */ },
-  ingest: async (event: MemoryEvent) => { /* store */ },
-  retrieve: async (query, topK) => { /* search */ },
-  recordUsage: async (id, signal) => { /* learn */ },
-  gc: async () => ({ removedCount: 0, archivedCount: 0, consolidatedCount: 0 }),
-  advanceTime: async (ms) => { /* time travel */ },
-  listEntities: async () => [/* all ids */],
-  teardown: async () => { /* cleanup */ }
-}
-```
-
-## Publishing
-
-This package is published to npm as `zosma-mem`. To publish updates:
-
-```bash
-# Build
-pnpm run build
-
-# Test locally
-pnpm eval
-
-# Publish
-npm publish
-```
-
-## Development
-
-```bash
-# Install dependencies
-pnpm install
-
-# Build TypeScript
-pnpm run build
-
-# Run tests
-pnpm run test
-
-# Test CLI locally
-pnpm eval
-```
-
-## OpenZosma Integration
-
-zosma-mem is the official evaluation tool for OpenZosma memory systems. It:
-
-- Auto-detects OpenZosma memory formats
-- Provides standardized evaluation metrics
-- Tracks improvement over time
-- Guides feature development priorities
-
-Run `zosma-mem` regularly to see how your memory system evolves! 🚀
\ No newline at end of file
diff --git a/packages/zosma-mem/package.json b/packages/zosma-mem/package.json
index de97181..1101a9f 100644
--- a/packages/zosma-mem/package.json
+++ b/packages/zosma-mem/package.json
@@ -1,9 +1,9 @@
 {
-	"name": "zosma-mem",
+	"name": "@openzosma/zosma-mem",
 	"version": "0.0.1",
 	"private": false,
 	"type": "module",
-	"description": "Standalone CLI for evaluating agentic memory systems - zero-config evaluation against standardized scenarios",
+	"description": "Memory engine with bridge for agent integration",
 	"license": "Apache-2.0",
 	"keywords": [
 		"memory",
@@ -21,24 +21,20 @@
 	"homepage": "https://github.com/your-org/openzosma/tree/main/packages/zosma-mem",
 	"main": "dist/index.js",
 	"types": "dist/index.d.ts",
-	"bin": {
-		"zosma-mem": "dist/evals/cli/simple-eval.js"
-	},
 	"exports": {
 		".": {
 			"types": "./dist/index.d.ts",
 			"import": "./dist/index.js"
 		},
-		"./evals": {
-			"types": "./dist/evals/index.d.ts",
-			"import": "./dist/evals/index.js"
+		"./bridge": {
+			"types": "./dist/bridge/index.d.ts",
+			"import": "./dist/bridge/index.js"
 		}
 	},
 	"scripts": {
 		"build": "tsc",
 		"check": "tsc --noEmit",
 		"test": "vitest --run",
-		"eval": "tsx dist/evals/cli/simple-eval.js",
 		"prepublishOnly": "pnpm run build && pnpm run test"
 	},
 	"dependencies": {
@@ -46,6 +42,10 @@
 		"commander": "^13.0.0",
 		"ink": "^5.1.0",
 		"ink-spinner": "^5.0.0",
+		"p-limit": "^5.0.0",
+		"pi-brain": "^0.1.7",
+		"pi-dcp": "^0.2.0",
+		"pino": "^9.0.0",
 		"react": "^18.3.0",
 		"yaml": "^2.8.3",
 		"zod": "^3.23.0"
diff --git a/packages/zosma-mem/src/brain-adapter/index.ts b/packages/zosma-mem/src/brain-adapter/index.ts
deleted file mode 100644
index aec02e5..0000000
--- a/packages/zosma-mem/src/brain-adapter/index.ts
+++ /dev/null
@@ -1,2 +0,0 @@
-export { parseCommitsMarkdown } from "./parser.js"
-export type { CommitRecord } from "./parser.js"
diff --git a/packages/zosma-mem/src/brain-adapter/parser.ts b/packages/zosma-mem/src/brain-adapter/parser.ts
deleted file mode 100644
index 8df642b..0000000
--- a/packages/zosma-mem/src/brain-adapter/parser.ts
+++ /dev/null
@@ -1,51 +0,0 @@
-/**
- * Parse commits.md into structured commit records.
- *
- * Expected format (one or more entries):
- *
- * ## <ref>
- * <optional blank line>
- * <body text>
- * tags: tag1, tag2
- */
-
-export interface CommitRecord {
-	ref: string
-	body: string
-	tags: string[]
-}
-
-/**
- * Parse a commits.md markdown file into an array of CommitRecord objects.
- */
-export const parseCommitsMarkdown = (markdown: string): CommitRecord[] => {
-	const commits: CommitRecord[] = []
-	const sections = markdown.split(/^## /m).filter((s) => s.trim().length > 0)
-
-	for (const section of sections) {
-		const lines = section.split("\n")
-		const ref = lines[0].trim()
-		if (!ref) continue
-
-		const bodyLines: string[] = []
-		let tags: string[] = []
-
-		for (let i = 1; i < lines.length; i++) {
-			const line = lines[i]
-			const tagMatch = /^tags:\s*(.+)$/i.exec(line)
-			if (tagMatch) {
-				tags = tagMatch[1]
-					.split(",")
-					.map((t) => t.trim())
-					.filter(Boolean)
-			} else {
-				bodyLines.push(line)
-			}
-		}
-
-		const body = bodyLines.join("\n").trim()
-		commits.push({ ref, body, tags })
-	}
-
-	return commits
-}
diff --git a/packages/zosma-mem/src/bridge/__tests__/bridge.test.ts b/packages/zosma-mem/src/bridge/__tests__/bridge.test.ts
new file mode 100644
index 0000000..447e1be
--- /dev/null
+++ b/packages/zosma-mem/src/bridge/__tests__/bridge.test.ts
@@ -0,0 +1,211 @@
+import { describe, it, expect, beforeEach, afterEach } from "vitest"
+import { createMemoryBridge } from "../../bridge/index.js"
+import type { ExtractedFact } from "../../bridge/index.js"
+import { rmSync, mkdirSync } from "node:fs"
+import { join } from "node:path"
+import { tmpdir } from "node:os"
+
+describe("MemoryBridge", () => {
+  let tempDir: string
+
+  beforeEach(() => {
+    tempDir = join(tmpdir(), `zosma-mem-test-${Date.now()}`)
+    mkdirSync(tempDir, { recursive: true })
+  })
+
+  afterEach(() => {
+    rmSync(tempDir, { recursive: true, force: true })
+  })
+
+  describe("ingestFacts and loadContext round-trip", () => {
+    it("should ingest facts and retrieve them in context", async () => {
+      const bridge = createMemoryBridge({ memoryDir: tempDir })
+
+      const facts: ExtractedFact[] = [
+        {
+          content: "User prefers dark mode interfaces",
+          type: "preference",
+          tags: ["ui", "theme", "preference"]
+        }
+      ]
+
+      await bridge.ingestFacts(facts)
+
+      const { context, injectedIds } = await bridge.loadContext("design the UI")
+      expect(context).toContain("User prefers dark mode interfaces")
+      expect(injectedIds).toHaveLength(1)
+      expect(injectedIds[0]).toMatch(/^[a-f0-9]{16}$/)
+    })
+
+    it("should return empty context when no relevant memories", async () => {
+      const bridge = createMemoryBridge({ memoryDir: tempDir })
+
+      const { context, injectedIds } = await bridge.loadContext("unrelated query")
+      expect(context).toBe("")
+      expect(injectedIds).toEqual([])
+    })
+
+    it("should deduplicate identical facts", async () => {
+      const bridge = createMemoryBridge({ memoryDir: tempDir })
+
+      const facts: ExtractedFact[] = [
+        {
+          content: "User likes coffee",
+          type: "preference",
+          tags: ["drink", "preference"]
+        },
+        {
+          content: "User likes coffee", // Same content
+          type: "preference",
+          tags: ["drink", "preference"]
+        }
+      ]
+
+      await bridge.ingestFacts(facts)
+
+      const entityIds = await bridge.listEntityIds()
+      expect(entityIds).toHaveLength(1) // Should be deduplicated
+    })
+  })
+
+  describe("reinforcement tracking", () => {
+    it("should record usage signals", async () => {
+      const bridge = createMemoryBridge({ memoryDir: tempDir })
+
+      const facts: ExtractedFact[] = [
+        {
+          content: "User's favorite color is blue",
+          type: "preference",
+          tags: ["color", "preference"]
+        }
+      ]
+
+      await bridge.ingestFacts(facts)
+      const { injectedIds } = await bridge.loadContext("what color should I use")
+      expect(injectedIds).toHaveLength(1)
+
+      const entityId = injectedIds[0]
+
+      // Record different usage signals
+      await bridge.recordUsage(entityId, "used")
+      await bridge.recordUsage(entityId, "ignored")
+      await bridge.recordUsage(entityId, "influenced_decision")
+
+      // Should not throw
+      expect(true).toBe(true)
+    })
+  })
+
+  describe("garbage collection", () => {
+    it("should run GC without errors", async () => {
+      const bridge = createMemoryBridge({ memoryDir: tempDir })
+
+      const facts: ExtractedFact[] = [
+        {
+          content: "Old preference that should be garbage collected",
+          type: "preference",
+          tags: ["old"]
+        }
+      ]
+
+      await bridge.ingestFacts(facts)
+      await bridge.gc() // Should not throw
+
+      expect(true).toBe(true)
+    })
+  })
+
+  describe("shutdown", () => {
+    it("should shutdown without errors", async () => {
+      const bridge = createMemoryBridge({ memoryDir: tempDir })
+      bridge.shutdown() // Should not throw
+      expect(true).toBe(true)
+    })
+  })
+
+  describe("cross-session persistence", () => {
+    it("should persist facts across bridge instances", async () => {
+      // First bridge instance
+      const bridge1 = createMemoryBridge({ memoryDir: tempDir })
+      const facts: ExtractedFact[] = [
+        {
+          content: "Persistent memory across sessions",
+          type: "decision",
+          tags: ["persistent", "test"]
+        }
+      ]
+
+      await bridge1.ingestFacts(facts)
+      bridge1.shutdown()
+
+      // Second bridge instance with same directory
+      const bridge2 = createMemoryBridge({ memoryDir: tempDir })
+      const { context } = await bridge2.loadContext("test query")
+
+      expect(context).toContain("Persistent memory across sessions")
+    })
+  })
+
+  describe("salience filtering", () => {
+    it("should respect salience threshold", async () => {
+      const bridge = createMemoryBridge({ memoryDir: tempDir, salienceThreshold: 10 })
+
+      const facts: ExtractedFact[] = [
+        {
+          content: "High salience fact",
+          type: "decision",
+          tags: ["important"]
+        },
+        {
+          content: "Low salience fact",
+          type: "pattern",
+          tags: ["minor"]
+        }
+      ]
+
+      await bridge.ingestFacts(facts)
+
+      // Run GC to prune low-salience facts
+      await bridge.gc()
+
+      const { context } = await bridge.loadContext("important query")
+      expect(context).toBeTruthy() // At least some facts should remain
+    })
+  })
+
+  describe("context formatting", () => {
+    it("should format context with proper structure", async () => {
+      const bridge = createMemoryBridge({ memoryDir: tempDir })
+
+      const facts: ExtractedFact[] = [
+        {
+          content: "Test memory content",
+          type: "preference",
+          tags: ["test"]
+        }
+      ]
+
+      await bridge.ingestFacts(facts)
+      const { context } = await bridge.loadContext("test")
+
+      expect(context).toContain("## Long-term Memory")
+      expect(context).toContain("Test memory content")
+      expect(context).toContain("Use them to inform your responses naturally")
+    })
+
+    it("should limit retrieved memories to topK", async () => {
+      const bridge = createMemoryBridge({ memoryDir: tempDir, topK: 2 })
+
+      const facts: ExtractedFact[] = Array.from({ length: 5 }, (_, i) => ({
+        content: `Memory fact ${i}`,
+        type: "preference" as const,
+        tags: ["test"]
+      }))
+
+      await bridge.ingestFacts(facts)
+      const { injectedIds } = await bridge.loadContext("test")
+
+      expect(injectedIds).toHaveLength(2) // Limited by topK
+    })
+  })
+})
\ No newline at end of file
diff --git a/packages/zosma-mem/src/bridge/extensions.ts b/packages/zosma-mem/src/bridge/extensions.ts
new file mode 100644
index 0000000..0fd2067
--- /dev/null
+++ b/packages/zosma-mem/src/bridge/extensions.ts
@@ -0,0 +1,60 @@
+/**
+ * Pi extension path resolution for memory-related extensions.
+ *
+ * Resolves filesystem paths for pi-brain and pi-dcp so that the agent session
+ * can pass them to DefaultResourceLoader. Both packages live here in
+ * @openzosma/zosma-mem so agents stays decoupled from extension specifics.
+ *
+ * Graceful degradation: if a package is not installed, its path is omitted.
+ * The caller (agents) receives only the paths that exist on disk.
+ */
+
+import { createRequire } from "node:module"
+
+const require = createRequire(import.meta.url)
+
+/**
+ * Try to resolve the entry point of a pi extension package.
+ * Attempts the TypeScript source entry first (jiti loads .ts directly at runtime),
+ * then falls back to the package root.
+ */
+const resolvePiExtension = (pkg: string): string | null => {
+  for (const entry of [`${pkg}/src/index.ts`, `${pkg}/index.ts`, pkg]) {
+    try {
+      return require.resolve(entry)
+    } catch {
+      // try next candidate
+    }
+  }
+  return null
+}
+
+/**
+ * Resolve extension entry paths for all memory-related pi extensions:
+ * - pi-brain: structured memory entities, versioning, branch/commit tools
+ * - pi-dcp: dynamic context pruning, token management
+ *
+ * Returns only the paths that successfully resolved. Missing packages are
+ * silently skipped — the caller should log a warning if the list is shorter
+ * than expected.
+ */
+export const resolveMemoryExtensionPaths = (): { paths: string[]; missing: string[] } => {
+  const extensions = [
+    { name: "pi-brain", label: "structured memory (pi-brain)" },
+    { name: "pi-dcp", label: "context pruning (pi-dcp)" },
+  ]
+
+  const paths: string[] = []
+  const missing: string[] = []
+
+  for (const ext of extensions) {
+    const resolved = resolvePiExtension(ext.name)
+    if (resolved) {
+      paths.push(resolved)
+    } else {
+      missing.push(ext.label)
+    }
+  }
+
+  return { paths, missing }
+}
diff --git a/packages/zosma-mem/src/bridge/index.ts b/packages/zosma-mem/src/bridge/index.ts
new file mode 100644
index 0000000..9111b4b
--- /dev/null
+++ b/packages/zosma-mem/src/bridge/index.ts
@@ -0,0 +1,172 @@
+export { resolveMemoryExtensionPaths } from "./extensions.js"
+
+/**
+ * MemoryBridge — integration layer between zosma-mem engine and the agent session lifecycle.
+ *
+ * Responsibilities:
+ * - Retrieve relevant memories at the start of each turn and format them for system prompt injection
+ * - Accept extracted facts and ingest them into the salience engine
+ * - Track reinforcement signals (used / ignored / influenced_decision)
+ * - Run GC on demand or on session shutdown
+ *
+ * The bridge deliberately does NOT call the LLM for extraction. That is the caller's
+ * responsibility (packages/agents/src/pi/memory.ts). This keeps @openzosma/zosma-mem
+ * free of the @mariozechner/pi-ai dependency and testable without an API key.
+ */
+
+import { createHash } from "node:crypto"
+import { createMemoryEngine } from "../engine/factory.js"
+import type { MemoryEngine, MemoryEventType } from "../types.js"
+
+export interface ExtractedFact {
+  /** Human-readable statement of the fact, e.g. "User's favorite animal is elephant" */
+  content: string
+  /** Semantic type of the fact */
+  type: MemoryEventType
+  /** Short lowercase keywords for retrieval matching */
+  tags: string[]
+}
+
+export interface BridgeConfig {
+  /** Stable per-agent-config memory directory */
+  memoryDir: string
+  /** Minimum salience score to keep during GC. Default: engine default */
+  salienceThreshold?: number
+  /** How many memories to retrieve per turn. Default: 8 */
+  topK?: number
+}
+
+export interface MemoryBridge {
+  /**
+   * Retrieve memories relevant to the current user message and format them
+   * as a system prompt section. Returns an empty string when no memories exist.
+   */
+  loadContext: (userMessage: string) => Promise<{ context: string; injectedIds: string[] }>
+
+  /**
+   * Ingest a batch of already-extracted facts into the salience engine.
+   * Called by the agent after each turn with facts extracted from the conversation.
+   */
+  ingestFacts: (facts: ExtractedFact[]) => Promise<void>
+
+  /**
+   * Record a reinforcement signal for a retrieved memory entity.
+   * Call with "used" when the agent references a memory in its response.
+   * Call with "ignored" when a retrieved memory had no visible effect.
+   * Call with "influenced_decision" when the memory directly shaped a tool call or decision.
+   */
+  recordUsage: (entityId: string, signal: "used" | "ignored" | "influenced_decision") => Promise<void>
+
+  /** Run garbage collection — decay + prune low-salience entities. */
+  gc: () => Promise<void>
+
+  /** Shutdown: clear GC timer. Call on session end. */
+  shutdown: () => void
+
+  /** Return all entity IDs currently in the store (for testing). */
+  listEntityIds: () => Promise<string[]>
+}
+
+/**
+ * Stable deterministic ID for a fact. If the same fact is extracted again
+ * it hashes to the same ID, so the engine deduplicates it by updating in place.
+ */
+export const factId = (content: string): string =>
+  createHash("sha256").update(content.trim().toLowerCase()).digest("hex").slice(0, 16)
+
+/**
+ * Format retrieved memories as a system prompt section.
+ */
+const formatContext = (
+  memories: Array<{ id: string; content: string; score: number }>,
+): string => {
+  if (memories.length === 0) return ""
+
+  const lines = [
+    "## Long-term Memory",
+    "",
+    "The following facts have been remembered from previous conversations with this user.",
+    "Use them to inform your responses naturally, without mentioning memory IDs or scores.",
+    "",
+    ...memories.map((m) => `- ${m.content}`),
+    "",
+  ]
+
+  return lines.join("\n")
+}
+
+/**
+ * Create a MemoryBridge backed by the zosma-mem salience engine.
+ */
+export const createMemoryBridge = (config: BridgeConfig): MemoryBridge => {
+  const engine: MemoryEngine = createMemoryEngine({
+    memoryDir: config.memoryDir,
+    salienceThreshold: config.salienceThreshold,
+    // GC every 5 minutes in production. Tests override via config.
+    gcIntervalMs: 5 * 60 * 1000,
+    gcPruneCycles: 2,
+  })
+
+  const topK = config.topK ?? 8
+
+  const loadContext = async (userMessage: string): Promise<{ context: string; injectedIds: string[] }> => {
+    const results = await engine.retrieve({ taskDescription: userMessage }, topK)
+
+    if (results.length === 0) return { context: "", injectedIds: [] }
+
+    const memories = results.map((r) => ({
+      id: r.entity.id,
+      content: r.entity.content,
+      score: r.attentionScore,
+    }))
+
+    // Record ignored reads for entities that scored below threshold
+    // (returned in results but likely not relevant). The low score is the signal.
+    for (const r of results) {
+      if (r.attentionScore < 1) {
+        await engine.recordIgnoredRead(r.entity.id)
+      }
+    }
+
+    const injectedIds = memories.map(m => m.id)
+    return { context: formatContext(memories), injectedIds }
+  }
+
+  const ingestFacts = async (facts: ExtractedFact[]): Promise<void> => {
+    const now = Date.now()
+    for (const fact of facts) {
+      await engine.ingest({
+        id: factId(fact.content),
+        type: fact.type,
+        content: fact.content,
+        tags: fact.tags,
+        timestamp: now,
+      })
+    }
+  }
+
+  const recordUsage = async (
+    entityId: string,
+    signal: "used" | "ignored" | "influenced_decision",
+  ): Promise<void> => {
+    if (signal === "used") {
+      await engine.recordRead(entityId)
+    } else if (signal === "ignored") {
+      await engine.recordIgnoredRead(entityId)
+    } else {
+      await engine.recordDecisionInfluence(entityId)
+    }
+  }
+
+  const gc = async (): Promise<void> => {
+    await engine.gc()
+  }
+
+  const shutdown = (): void => {
+    engine.shutdown()
+  }
+
+  const listEntityIds = async (): Promise<string[]> => engine.listEntities()
+
+  return { loadContext, ingestFacts, recordUsage, gc, shutdown, listEntityIds }
+}
diff --git a/packages/zosma-mem/src/engine/__tests__/factory.test.ts b/packages/zosma-mem/src/engine/__tests__/factory.test.ts
new file mode 100644
index 0000000..bf7c251
--- /dev/null
+++ b/packages/zosma-mem/src/engine/__tests__/factory.test.ts
@@ -0,0 +1,48 @@
+import { describe, it, expect } from 'vitest'
+import { mkdtempSync } from 'node:fs'
+import { tmpdir } from 'node:os'
+import { join } from 'node:path'
+import { createMemoryEngine } from '../factory.js'
+
+const NOW = 1_000_000_000_000
+
+const makeDir = () => mkdtempSync(join(tmpdir(), 'factory-test-'))
+
+describe('createMemoryEngine', () => {
+  it('ingest a decision event then retrieve it', async () => {
+    const memoryDir = makeDir()
+    const engine = createMemoryEngine({ memoryDir, gcIntervalMs: 0, now: () => NOW })
+    await engine.ingest({
+      id: 'ev1',
+      type: 'decision',
+      content: 'use typescript for everything',
+      tags: ['typescript', 'architecture'],
+      timestamp: NOW,
+    })
+    const results = await engine.retrieve({ taskDescription: 'typescript architecture' }, 5)
+    expect(results.some((r) => r.entity.id === 'ev1')).toBe(true)
+    engine.shutdown()
+  })
+
+  it('shutdown does not throw', () => {
+    const memoryDir = makeDir()
+    const engine = createMemoryEngine({ memoryDir, gcIntervalMs: 0 })
+    expect(() => engine.shutdown()).not.toThrow()
+  })
+
+  it('ingest + recordDecisionInfluence + retrieve: entity still appears', async () => {
+    const memoryDir = makeDir()
+    const engine = createMemoryEngine({ memoryDir, gcIntervalMs: 0, now: () => NOW })
+    await engine.ingest({
+      id: 'ev2',
+      type: 'decision',
+      content: 'auth strategy',
+      tags: ['auth'],
+      timestamp: NOW,
+    })
+    await engine.recordDecisionInfluence('ev2')
+    const results = await engine.retrieve({ taskDescription: 'auth strategy' }, 5)
+    expect(results.some((r) => r.entity.id === 'ev2')).toBe(true)
+    engine.shutdown()
+  })
+})
diff --git a/packages/zosma-mem/src/engine/__tests__/reinforcement.test.ts b/packages/zosma-mem/src/engine/__tests__/reinforcement.test.ts
new file mode 100644
index 0000000..2b669c9
--- /dev/null
+++ b/packages/zosma-mem/src/engine/__tests__/reinforcement.test.ts
@@ -0,0 +1,71 @@
+import { describe, it, expect } from 'vitest'
+import { mkdtempSync } from 'node:fs'
+import { tmpdir } from 'node:os'
+import { join } from 'node:path'
+import { EntityStore } from '../../store/entity-store.js'
+import type { MemoryEntity } from '../../types.js'
+import { recordRead, recordIgnoredRead, recordDecisionInfluence } from '../reinforcement.js'
+
+const BASE_TS = 1_000_000_000_000
+
+const makeEntity = (id: string): MemoryEntity => ({
+  id,
+  source: { branch: 'main', commitRef: '0' },
+  score: {
+    reuseCount: 0,
+    decisionInfluence: 0,
+    ignoredReads: 0,
+    lastAccessed: BASE_TS,
+    attentionWeight: 0,
+    belowThresholdCycles: 0,
+  },
+  tags: [],
+  content: 'test',
+})
+
+const makeStore = (entity: MemoryEntity): EntityStore => {
+  const dir = mkdtempSync(join(tmpdir(), 'reinforcement-test-'))
+  const store = new EntityStore(dir)
+  store.ensureDir()
+  store.write(entity)
+  return store
+}
+
+describe('reinforcement', () => {
+  it('recordRead increments reuseCount and updates lastAccessed', () => {
+    const entity = makeEntity('e1')
+    const store = makeStore(entity)
+    const later = BASE_TS + 5000
+    recordRead('e1', store, () => later)
+    const updated = store.read('e1')!
+    expect(updated.score.reuseCount).toBe(1)
+    expect(updated.score.lastAccessed).toBe(later)
+  })
+
+  it('recordIgnoredRead increments ignoredReads and does NOT update lastAccessed', () => {
+    const entity = makeEntity('e2')
+    const store = makeStore(entity)
+    recordIgnoredRead('e2', store)
+    const updated = store.read('e2')!
+    expect(updated.score.ignoredReads).toBe(1)
+    expect(updated.score.lastAccessed).toBe(BASE_TS)
+  })
+
+  it('recordDecisionInfluence increments decisionInfluence and updates lastAccessed', () => {
+    const entity = makeEntity('e3')
+    const store = makeStore(entity)
+    const later = BASE_TS + 9000
+    recordDecisionInfluence('e3', store, () => later)
+    const updated = store.read('e3')!
+    expect(updated.score.decisionInfluence).toBe(1)
+    expect(updated.score.lastAccessed).toBe(later)
+  })
+
+  it('missing entity ID is a no-op', () => {
+    const entity = makeEntity('e4')
+    const store = makeStore(entity)
+    expect(() => recordRead('nonexistent', store)).not.toThrow()
+    expect(() => recordIgnoredRead('nonexistent', store)).not.toThrow()
+    expect(() => recordDecisionInfluence('nonexistent', store)).not.toThrow()
+  })
+})
diff --git a/packages/zosma-mem/src/engine/factory.ts b/packages/zosma-mem/src/engine/factory.ts
new file mode 100644
index 0000000..f5d5826
--- /dev/null
+++ b/packages/zosma-mem/src/engine/factory.ts
@@ -0,0 +1,74 @@
+import { runGc } from "../gc/index.js"
+import { ingest as doIngest } from "../ingestion/ingest.js"
+import { retrieve as doRetrieve } from "../retrieval/retrieve.js"
+import { loadCoAccess, saveCoAccess } from "../store/co-access.js"
+import { EntityStore } from "../store/entity-store.js"
+import type { AttentionQuery, MemoryConfig, MemoryEngine, MemoryEvent } from "../types.js"
+import { recordDecisionInfluence, recordIgnoredRead, recordRead } from "./reinforcement.js"
+
+/**
+ * Create a fully wired MemoryEngine instance.
+ * This is the primary entry point for all memory operations.
+ */
+export const createMemoryEngine = (config: MemoryConfig): MemoryEngine => {
+	const resolved = {
+		memoryDir: config.memoryDir,
+		salienceThreshold: config.salienceThreshold ?? 0.4,
+		gcIntervalMs: config.gcIntervalMs ?? 3_600_000,
+		gcPruneCycles: config.gcPruneCycles ?? 1,
+		summarizer: config.summarizer,
+		now: config.now,
+	}
+	const store = new EntityStore(resolved.memoryDir)
+	store.ensureDir()
+
+	const getNow = resolved.now ?? Date.now
+
+	const coAccess = loadCoAccess(resolved.memoryDir)
+
+	let gcTimer: ReturnType<typeof setInterval> | undefined
+	if (resolved.gcIntervalMs > 0) {
+		gcTimer = setInterval(() => {
+			void engine.gc()
+		}, resolved.gcIntervalMs)
+		gcTimer.unref?.()
+	}
+
+	const engine: MemoryEngine = {
+		ingest: async (event: MemoryEvent) => {
+			doIngest(event, store, { salienceThreshold: resolved.salienceThreshold, now: getNow })
+		},
+
+		retrieve: async (query: AttentionQuery, topK = 5) => {
+			const results = doRetrieve(query, store, coAccess, { now: getNow }, topK)
+			saveCoAccess(resolved.memoryDir, coAccess)
+			return results
+		},
+
+		recordRead: async (entityId: string) => {
+			recordRead(entityId, store, getNow)
+		},
+
+		recordIgnoredRead: async (entityId: string) => {
+			recordIgnoredRead(entityId, store)
+		},
+
+		recordDecisionInfluence: async (entityId: string) => {
+			recordDecisionInfluence(entityId, store, getNow)
+		},
+
+		gc: async () => {
+			const report = runGc(store, coAccess, resolved, getNow)
+			saveCoAccess(resolved.memoryDir, coAccess)
+			return report
+		},
+
+		listEntities: async () => store.list(),
+
+		shutdown: () => {
+			if (gcTimer) clearInterval(gcTimer)
+		},
+	}
+
+	return engine
+}
diff --git a/packages/zosma-mem/src/engine/index.ts b/packages/zosma-mem/src/engine/index.ts
new file mode 100644
index 0000000..57d6054
--- /dev/null
+++ b/packages/zosma-mem/src/engine/index.ts
@@ -0,0 +1,3 @@
+export { computeSalience, meetsThreshold, initialScore } from "./salience.js"
+export { recordRead, recordIgnoredRead, recordDecisionInfluence } from "./reinforcement.js"
+export { createMemoryEngine } from "./factory.js"
diff --git a/packages/zosma-mem/src/engine/reinforcement.ts b/packages/zosma-mem/src/engine/reinforcement.ts
new file mode 100644
index 0000000..2efd97b
--- /dev/null
+++ b/packages/zosma-mem/src/engine/reinforcement.ts
@@ -0,0 +1,41 @@
+import type { EntityStore } from "../store/entity-store.js"
+
+/**
+ * Record that an entity was retrieved and acted upon by the agent.
+ * Increments reuseCount and updates lastAccessed.
+ */
+export const recordRead = (entityId: string, store: EntityStore, now: () => number = Date.now): void => {
+	const entity = store.read(entityId)
+	if (!entity) return
+	store.write({
+		...entity,
+		score: { ...entity.score, reuseCount: entity.score.reuseCount + 1, lastAccessed: now() },
+	})
+}
+
+/**
+ * Record that an entity was retrieved but the agent did not act on it.
+ * Increments ignoredReads.
+ */
+export const recordIgnoredRead = (entityId: string, store: EntityStore): void => {
+	const entity = store.read(entityId)
+	if (!entity) return
+	store.write({ ...entity, score: { ...entity.score, ignoredReads: entity.score.ignoredReads + 1 } })
+}
+
+/**
+ * Record that an entity directly influenced an agent decision or tool call.
+ * Strongest reinforcement signal: increments decisionInfluence and updates lastAccessed.
+ */
+export const recordDecisionInfluence = (entityId: string, store: EntityStore, now: () => number = Date.now): void => {
+	const entity = store.read(entityId)
+	if (!entity) return
+	store.write({
+		...entity,
+		score: {
+			...entity.score,
+			decisionInfluence: entity.score.decisionInfluence + 1,
+			lastAccessed: now(),
+		},
+	})
+}
diff --git a/packages/zosma-mem/src/engine/salience.ts b/packages/zosma-mem/src/engine/salience.ts
new file mode 100644
index 0000000..6de884c
--- /dev/null
+++ b/packages/zosma-mem/src/engine/salience.ts
@@ -0,0 +1,23 @@
+import type { MemoryScore } from '../types.js'
+
+/**
+ * Compute the salience score for a memory entity.
+ * S(e) = 2*reuseCount + 5*decisionInfluence - 2*ignoredReads - ln(1 + ageDays)
+ * ageDays is computed from lastAccessed using the injectable now().
+ */
+export const computeSalience = (score: MemoryScore, now: () => number = Date.now): number => {
+  const ageDays = (now() - score.lastAccessed) / 86_400_000
+  const decay = Math.log(1 + ageDays)
+  return 2 * score.reuseCount + 5 * score.decisionInfluence - 2 * score.ignoredReads - decay
+}
+
+export const meetsThreshold = (salience: number, threshold: number): boolean => salience >= threshold
+
+export const initialScore = (eventType: string, now: () => number = Date.now): MemoryScore => ({
+  reuseCount: 0,
+  decisionInfluence: eventType === 'decision' ? 1 : 0,
+  ignoredReads: 0,
+  lastAccessed: now(),
+  attentionWeight: eventType === 'decision' ? 1.0 : 0.0,
+  belowThresholdCycles: 0,
+})
diff --git a/packages/zosma-mem/src/evals/__tests__/metrics.test.ts b/packages/zosma-mem/src/evals/__tests__/metrics.test.ts
deleted file mode 100644
index f2f32c2..0000000
--- a/packages/zosma-mem/src/evals/__tests__/metrics.test.ts
+++ /dev/null
@@ -1,127 +0,0 @@
-import { describe, expect, it } from "vitest"
-import {
-	computeGcEffectiveness,
-	computeMRR,
-	computeNoiseRatio,
-	computePrecisionAtK,
-	computeRecallAtK,
-	computeSalienceDrift,
-} from "../metrics.js"
-
-describe("computePrecisionAtK", () => {
-	it("returns 1.0 when all top-K are relevant", () => {
-		expect(computePrecisionAtK(["a", "b", "c"], new Set(["a", "b", "c"]), 3)).toBe(1)
-	})
-
-	it("returns 0.0 when none of the top-K are relevant", () => {
-		expect(computePrecisionAtK(["x", "y", "z"], new Set(["a", "b", "c"]), 3)).toBe(0)
-	})
-
-	it("returns 0.6 when 3 of 5 are relevant", () => {
-		expect(computePrecisionAtK(["a", "b", "x", "c", "y"], new Set(["a", "b", "c"]), 5)).toBe(0.6)
-	})
-
-	it("returns 0 when k is 0", () => {
-		expect(computePrecisionAtK(["a"], new Set(["a"]), 0)).toBe(0)
-	})
-
-	it("only evaluates up to K positions even if list is longer", () => {
-		expect(computePrecisionAtK(["a", "b", "c", "d", "e"], new Set(["d", "e"]), 3)).toBe(0)
-	})
-})
-
-describe("computeRecallAtK", () => {
-	it("returns 1.0 when all relevant entities appear in top-K", () => {
-		expect(computeRecallAtK(["a", "b", "c"], new Set(["a", "b"]), 3)).toBe(1)
-	})
-
-	it("returns 0.5 when half of relevant entities appear in top-K", () => {
-		expect(computeRecallAtK(["a", "x", "y"], new Set(["a", "b"]), 3)).toBe(0.5)
-	})
-
-	it("returns 1.0 when relevant set is empty (vacuously true)", () => {
-		expect(computeRecallAtK(["a", "b"], new Set(), 5)).toBe(1)
-	})
-
-	it("returns 0 when no relevant entities in top-K", () => {
-		expect(computeRecallAtK(["x", "y", "z"], new Set(["a", "b"]), 3)).toBe(0)
-	})
-})
-
-describe("computeMRR", () => {
-	it("returns 1.0 when the first result is relevant", () => {
-		expect(computeMRR(["a", "b", "c"], new Set(["a"]))).toBe(1)
-	})
-
-	it("returns 0.5 when the second result is the first relevant", () => {
-		expect(computeMRR(["x", "a", "b"], new Set(["a"]))).toBe(0.5)
-	})
-
-	it("returns 0.333... when the third result is the first relevant", () => {
-		expect(computeMRR(["x", "y", "a"], new Set(["a"]))).toBeCloseTo(1 / 3)
-	})
-
-	it("returns 0 when no relevant entity is found", () => {
-		expect(computeMRR(["x", "y", "z"], new Set(["a"]))).toBe(0)
-	})
-
-	it("handles empty retrieved list", () => {
-		expect(computeMRR([], new Set(["a"]))).toBe(0)
-	})
-})
-
-describe("computeNoiseRatio", () => {
-	it("returns 0 when all entities were retrieved at least once", () => {
-		expect(computeNoiseRatio(["a", "b", "c"], new Set(["a", "b", "c"]))).toBe(0)
-	})
-
-	it("returns 1 when no entity was ever retrieved", () => {
-		expect(computeNoiseRatio(["a", "b", "c"], new Set())).toBe(1)
-	})
-
-	it("returns 0.5 when half were never retrieved", () => {
-		expect(computeNoiseRatio(["a", "b", "c", "d"], new Set(["a", "b"]))).toBe(0.5)
-	})
-
-	it("returns 0 when entity list is empty", () => {
-		expect(computeNoiseRatio([], new Set())).toBe(0)
-	})
-})
-
-describe("computeGcEffectiveness", () => {
-	it("returns -1 when no noise entities before GC", () => {
-		expect(computeGcEffectiveness([], ["a", "b"])).toBe(-1)
-	})
-
-	it("returns 1.0 when all noise entities were removed", () => {
-		expect(computeGcEffectiveness(["x", "y"], ["a", "b"])).toBe(1)
-	})
-
-	it("returns 0.5 when half of noise entities were removed", () => {
-		expect(computeGcEffectiveness(["x", "y"], ["x", "a", "b"])).toBe(0.5)
-	})
-
-	it("returns 0 when no noise entities were removed", () => {
-		expect(computeGcEffectiveness(["x", "y"], ["x", "y", "a"])).toBe(0)
-	})
-})
-
-describe("computeSalienceDrift", () => {
-	it("returns -1 with fewer than 2 snapshots", () => {
-		expect(computeSalienceDrift([[1, 2, 3]])).toBe(-1)
-		expect(computeSalienceDrift([])).toBe(-1)
-	})
-
-	it("returns 0 when all scores are identical across cycles", () => {
-		expect(computeSalienceDrift([[1, 1, 1], [1, 1, 1]])).toBe(0)
-	})
-
-	it("returns a positive value when scores vary", () => {
-		const drift = computeSalienceDrift([[0, 1, 2], [3, 4, 5]])
-		expect(drift).toBeGreaterThan(0)
-	})
-
-	it("returns -1 when snapshots exist but all are empty", () => {
-		expect(computeSalienceDrift([[], []])).toBe(-1)
-	})
-})
diff --git a/packages/zosma-mem/src/evals/__tests__/mock-adapter.ts b/packages/zosma-mem/src/evals/__tests__/mock-adapter.ts
deleted file mode 100644
index 7a60f15..0000000
--- a/packages/zosma-mem/src/evals/__tests__/mock-adapter.ts
+++ /dev/null
@@ -1,102 +0,0 @@
-/**
- * Trivial in-memory adapter used to test the eval framework itself.
- *
- * NOT for evaluating a real engine. This adapter implements the simplest
- * possible retrieval strategy (tag overlap count) to verify that the
- * framework's metric computation, runner lifecycle, and scenario logic
- * are all correct without needing a real engine.
- *
- * Behaviour:
- * - `ingest`: stores the event. If the same ID is ingested again, the latest
- *   version replaces the previous one (last-write-wins).
- * - `retrieve`: scores entities by the number of tag matches with the query.
- *   On tie, newer timestamps rank higher.
- * - `recordUsage`: no-op (no reinforcement learning).
- * - `gc`: removes entities whose tags contain "stale" (simulates simple decay).
- *   Also supports time-based removal: entities older than 7 days from clock.
- * - `advanceTime`: delegates to the injected DeterministicClock.
- * - `listEntities`: returns all stored IDs.
- * - `setup` / `teardown`: clears internal state.
- */
-
-import type {
-	AdapterSetupOpts,
-	DeterministicClock,
-	GcResult,
-	MemoryAdapter,
-	MemoryEvent,
-	RetrievedEntity,
-	RetrieveQuery,
-} from "../types.js"
-
-interface StoredEntity {
-	event: MemoryEvent
-	usageCount: number
-	ignored: number
-}
-
-const GC_MAX_AGE_MS = 7 * 24 * 60 * 60 * 1_000 // 7 days
-
-export const createMockAdapter = (): MemoryAdapter => {
-	const store = new Map<string, StoredEntity>()
-	let clock: DeterministicClock = { now: () => Date.now(), advance: () => undefined }
-
-	const setup = async (opts: AdapterSetupOpts): Promise<void> => {
-		store.clear()
-		clock = opts.clock
-	}
-
-	const ingest = async (event: MemoryEvent): Promise<void> => {
-		store.set(event.id, { event, usageCount: 0, ignored: 0 })
-	}
-
-	const retrieve = async (query: RetrieveQuery, topK: number): Promise<RetrievedEntity[]> => {
-		const queryTags = new Set([
-			...(query.tags ?? []).map((t) => t.toLowerCase()),
-			...query.text.toLowerCase().split(/\s+/),
-		])
-
-		const scored = Array.from(store.values()).map(({ event }) => {
-			const tagScore = event.tags.filter((t) => queryTags.has(t.toLowerCase())).length
-			return { id: event.id, content: event.content, score: tagScore, tags: event.tags, timestamp: event.timestamp }
-		})
-
-		// Sort by score desc, then timestamp desc (recency tiebreak).
-		scored.sort((a, b) => b.score - a.score || b.timestamp - a.timestamp)
-
-		return scored.slice(0, topK).map(({ id, content, score, tags }) => ({ id, content, score, tags }))
-	}
-
-	const recordUsage = async (entityId: string): Promise<void> => {
-		const entry = store.get(entityId)
-		if (entry) store.set(entityId, { ...entry, usageCount: entry.usageCount + 1 })
-	}
-
-	const gc = async (): Promise<GcResult> => {
-		const now = clock.now()
-		const toRemove: string[] = []
-
-		for (const [id, { event }] of store) {
-			const age = now - event.timestamp
-			if (age > GC_MAX_AGE_MS || event.tags.includes("stale")) {
-				toRemove.push(id)
-			}
-		}
-
-		for (const id of toRemove) store.delete(id)
-
-		return { removedCount: toRemove.length, archivedCount: 0, consolidatedCount: 0 }
-	}
-
-	const advanceTime = async (ms: number): Promise<void> => {
-		clock.advance(ms)
-	}
-
-	const listEntities = async (): Promise<string[]> => Array.from(store.keys())
-
-	const teardown = async (): Promise<void> => {
-		store.clear()
-	}
-
-	return { setup, ingest, retrieve, recordUsage, gc, advanceTime, listEntities, teardown }
-}
diff --git a/packages/zosma-mem/src/evals/__tests__/report.test.ts b/packages/zosma-mem/src/evals/__tests__/report.test.ts
deleted file mode 100644
index 152b608..0000000
--- a/packages/zosma-mem/src/evals/__tests__/report.test.ts
+++ /dev/null
@@ -1,78 +0,0 @@
-import { describe, expect, it } from "vitest"
-import { renderMarkdownReport } from "../report.js"
-import type { EvalReport } from "../types.js"
-
-const makeReport = (overrides?: Partial<EvalReport>): EvalReport => ({
-	timestamp: new Date("2026-04-07T12:00:00.000Z").getTime(),
-	results: [
-		{
-			scenario: "Cold start",
-			metrics: { precisionAtK: 1, recallAtK: 1, mrr: 1, noiseRatio: 0.1, gcEffectiveness: -1, salienceDrift: -1 },
-			passed: true,
-			details: "",
-		},
-		{
-			scenario: "Signal dilution",
-			metrics: { precisionAtK: 0.4, recallAtK: 0.8, mrr: 0.5, noiseRatio: 0.9, gcEffectiveness: -1, salienceDrift: -1 },
-			passed: false,
-			details: "precisionAtK: 0.400 < threshold 0.600",
-		},
-	],
-	summary: { total: 2, passed: 1, failed: 1, avgPrecision: 0.7, avgRecall: 0.9, avgMrr: 0.75 },
-	...overrides,
-})
-
-describe("renderMarkdownReport", () => {
-	it("includes a heading with the timestamp", () => {
-		const output = renderMarkdownReport(makeReport())
-		expect(output).toContain("## zosma-mem Eval Report -- 2026-04-07T12:00:00.000Z")
-	})
-
-	it("includes all scenario names", () => {
-		const output = renderMarkdownReport(makeReport())
-		expect(output).toContain("Cold start")
-		expect(output).toContain("Signal dilution")
-	})
-
-	it("marks passing scenarios with 'yes'", () => {
-		const output = renderMarkdownReport(makeReport())
-		expect(output).toContain("yes")
-	})
-
-	it("marks failing scenarios with 'NO'", () => {
-		const output = renderMarkdownReport(makeReport())
-		expect(output).toContain("NO")
-	})
-
-	it("includes the summary line", () => {
-		const output = renderMarkdownReport(makeReport())
-		expect(output).toContain("Summary: 1/2 passed")
-	})
-
-	it("includes a failures section when there are failures", () => {
-		const output = renderMarkdownReport(makeReport())
-		expect(output).toContain("### Failures")
-		expect(output).toContain("precisionAtK: 0.400 < threshold 0.600")
-	})
-
-	it("does not include failures section when all pass", () => {
-		const allPass = makeReport({
-			results: [
-				{
-					scenario: "Cold start",
-					metrics: { precisionAtK: 1, recallAtK: 1, mrr: 1, noiseRatio: 0, gcEffectiveness: -1, salienceDrift: -1 },
-					passed: true,
-					details: "",
-				},
-			],
-			summary: { total: 1, passed: 1, failed: 0, avgPrecision: 1, avgRecall: 1, avgMrr: 1 },
-		})
-		const output = renderMarkdownReport(allPass)
-		expect(output).not.toContain("### Failures")
-	})
-
-	it("renders N/A values as ' -- '", () => {
-		const output = renderMarkdownReport(makeReport())
-		expect(output).toContain(" -- ")
-	})
-})
diff --git a/packages/zosma-mem/src/evals/__tests__/runner.test.ts b/packages/zosma-mem/src/evals/__tests__/runner.test.ts
deleted file mode 100644
index 4877b05..0000000
--- a/packages/zosma-mem/src/evals/__tests__/runner.test.ts
+++ /dev/null
@@ -1,96 +0,0 @@
-import { describe, expect, it, vi } from "vitest"
-import { runEvals } from "../runner.js"
-import type { ScenarioDefinition } from "../types.js"
-import { createMockAdapter } from "./mock-adapter.js"
-
-const makePassingScenario = (name: string): ScenarioDefinition => ({
-	name,
-	description: `Always-passing scenario: ${name}`,
-	run: async (_adapter, _clock) => ({
-		metrics: { precisionAtK: 1, recallAtK: 1, mrr: 1, noiseRatio: 0, gcEffectiveness: -1, salienceDrift: -1 },
-		passed: true,
-		details: "",
-	}),
-})
-
-const makeFailingScenario = (name: string): ScenarioDefinition => ({
-	name,
-	description: `Always-failing scenario: ${name}`,
-	run: async (_adapter, _clock) => ({
-		metrics: { precisionAtK: 0, recallAtK: 0, mrr: 0, noiseRatio: 1, gcEffectiveness: -1, salienceDrift: -1 },
-		passed: false,
-		details: "always fails",
-	}),
-})
-
-describe("runEvals", () => {
-	it("returns a report with the correct scenario count", async () => {
-		const adapter = createMockAdapter()
-		const report = await runEvals({
-			adapter,
-			scenarios: [makePassingScenario("A"), makePassingScenario("B")],
-		})
-		expect(report.summary.total).toBe(2)
-	})
-
-	it("counts passed scenarios correctly", async () => {
-		const adapter = createMockAdapter()
-		const report = await runEvals({
-			adapter,
-			scenarios: [makePassingScenario("A"), makeFailingScenario("B"), makePassingScenario("C")],
-		})
-		expect(report.summary.passed).toBe(2)
-		expect(report.summary.failed).toBe(1)
-	})
-
-	it("calls onScenarioStart and onScenarioEnd for each scenario", async () => {
-		const adapter = createMockAdapter()
-		const started: string[] = []
-		const ended: string[] = []
-
-		await runEvals({
-			adapter,
-			scenarios: [makePassingScenario("X"), makePassingScenario("Y")],
-			onScenarioStart: (name) => started.push(name),
-			onScenarioEnd: (name) => ended.push(name),
-		})
-
-		expect(started).toEqual(["X", "Y"])
-		expect(ended).toEqual(["X", "Y"])
-	})
-
-	it("calls teardown even when the scenario throws", async () => {
-		const adapter = createMockAdapter()
-		const teardownSpy = vi.spyOn(adapter, "teardown")
-
-		const throwingScenario: ScenarioDefinition = {
-			name: "Thrower",
-			description: "Throws during run",
-			run: async () => {
-				throw new Error("intentional scenario error")
-			},
-		}
-
-		const report = await runEvals({ adapter, scenarios: [throwingScenario] })
-
-		expect(teardownSpy).toHaveBeenCalledTimes(1)
-		expect(report.summary.failed).toBe(1)
-		expect(report.results[0].details).toContain("intentional scenario error")
-	})
-
-	it("computes correct averages in summary", async () => {
-		const adapter = createMockAdapter()
-		const report = await runEvals({
-			adapter,
-			scenarios: [makePassingScenario("A"), makeFailingScenario("B")],
-		})
-		expect(report.summary.avgPrecision).toBe(0.5)
-		expect(report.summary.avgMrr).toBe(0.5)
-	})
-
-	it("includes a unix timestamp in the report", async () => {
-		const adapter = createMockAdapter()
-		const report = await runEvals({ adapter, scenarios: [makePassingScenario("A")] })
-		expect(report.timestamp).toBeGreaterThan(0)
-	})
-})
diff --git a/packages/zosma-mem/src/evals/__tests__/scenarios.test.ts b/packages/zosma-mem/src/evals/__tests__/scenarios.test.ts
deleted file mode 100644
index cac64bf..0000000
--- a/packages/zosma-mem/src/evals/__tests__/scenarios.test.ts
+++ /dev/null
@@ -1,121 +0,0 @@
-/**
- * Integration tests: run all 7 built-in scenarios against the mock adapter.
- *
- * The mock adapter uses simple tag-overlap scoring. Not all scenarios can pass
- * at the highest possible threshold with a naive engine -- but all 7 must at
- * minimum complete without errors, produce valid metrics, and the scenarios
- * that the mock adapter is capable of passing must pass.
- *
- * Scenarios that require reinforcement or co-access (which the mock does not
- * implement) are tested for structural correctness only (valid metrics, no throws).
- */
-
-import { describe, expect, it } from "vitest"
-import { createClock } from "../utils/time.js"
-import { createMockAdapter } from "./mock-adapter.js"
-import { coldStartScenario } from "../scenarios/cold-start.js"
-import { repeatedPatternScenario } from "../scenarios/repeated-pattern.js"
-import { signalDilutionScenario } from "../scenarios/signal-dilution.js"
-import { staleMemoryScenario } from "../scenarios/stale-memory.js"
-import { conflictingUpdatesScenario } from "../scenarios/conflicting-updates.js"
-import { coAccessClusterScenario } from "../scenarios/co-access-cluster.js"
-import { crossContextScenario } from "../scenarios/cross-context.js"
-import type { ScenarioResult } from "../types.js"
-import { tmpdir } from "node:os"
-import { mkdtemp, rm } from "node:fs/promises"
-import { join } from "node:path"
-
-const runScenario = async (
-	scenario: { run: (adapter: ReturnType<typeof createMockAdapter>, clock: ReturnType<typeof createClock>) => Promise<ScenarioResult> },
-): Promise<ScenarioResult> => {
-	const adapter = createMockAdapter()
-	const clock = createClock()
-	const workDir = await mkdtemp(join(tmpdir(), "zosma-mem-test-"))
-	try {
-		await adapter.setup({ workDir, clock })
-		return await scenario.run(adapter, clock)
-	} finally {
-		await adapter.teardown()
-		await rm(workDir, { recursive: true, force: true })
-	}
-}
-
-const assertValidMetrics = (result: ScenarioResult) => {
-	const { metrics } = result
-	expect(metrics.precisionAtK).toBeGreaterThanOrEqual(0)
-	expect(metrics.precisionAtK).toBeLessThanOrEqual(1)
-	expect(metrics.recallAtK).toBeGreaterThanOrEqual(0)
-	expect(metrics.recallAtK).toBeLessThanOrEqual(1)
-	expect(metrics.mrr).toBeGreaterThanOrEqual(0)
-	expect(metrics.mrr).toBeLessThanOrEqual(1)
-	expect(metrics.noiseRatio).toBeGreaterThanOrEqual(0)
-	expect(metrics.noiseRatio).toBeLessThanOrEqual(1)
-	// gcEffectiveness and salienceDrift may be -1 (N/A)
-	expect(metrics.gcEffectiveness).toBeGreaterThanOrEqual(-1)
-	expect(metrics.salienceDrift).toBeGreaterThanOrEqual(-1)
-}
-
-describe("Scenario 1: Cold start", () => {
-	it("produces valid metrics and passes with mock adapter", async () => {
-		const result = await runScenario(coldStartScenario)
-		assertValidMetrics(result)
-		// Mock adapter tag scoring is sufficient for cold-start (clear tag match).
-		expect(result.passed).toBe(true)
-	})
-})
-
-describe("Scenario 2: Repeated pattern", () => {
-	it("produces valid metrics (mock does not reinforce, pass is not required)", async () => {
-		const result = await runScenario(repeatedPatternScenario)
-		assertValidMetrics(result)
-		// The recurring entity has the most matching tags so it should still rank first.
-		expect(result.metrics.mrr).toBeGreaterThan(0)
-	})
-})
-
-describe("Scenario 3: Signal dilution", () => {
-	it("produces valid metrics and passes with mock adapter", async () => {
-		const result = await runScenario(signalDilutionScenario)
-		assertValidMetrics(result)
-		// Mock uses tag overlap -- high-value events have exact tag matches.
-		expect(result.passed).toBe(true)
-	})
-})
-
-describe("Scenario 4: Stale memory", () => {
-	it("produces valid metrics and the fresh entity ranks first", async () => {
-		const result = await runScenario(staleMemoryScenario)
-		assertValidMetrics(result)
-		// Mock GC removes entities older than 7 days; fresh entity survives.
-		expect(result.metrics.mrr).toBe(1)
-	})
-})
-
-describe("Scenario 5: Conflicting updates", () => {
-	it("produces valid metrics with most recent content surfaced", async () => {
-		const result = await runScenario(conflictingUpdatesScenario)
-		assertValidMetrics(result)
-		// Mock last-write-wins: entity is replaced on re-ingest, latest content wins.
-		expect(result.metrics.mrr).toBe(1)
-	})
-})
-
-describe("Scenario 6: Co-access cluster", () => {
-	it("produces valid metrics (co-access boost not implemented in mock, partial pass)", async () => {
-		const result = await runScenario(coAccessClusterScenario)
-		assertValidMetrics(result)
-		// auth-flow has direct tag overlap and will rank 1st.
-		// retry-logic and timeout-handling share some auth tags so may appear.
-		expect(result.metrics.mrr).toBe(1)
-	})
-})
-
-describe("Scenario 7: Cross-context", () => {
-	it("produces valid metrics", async () => {
-		const result = await runScenario(crossContextScenario)
-		assertValidMetrics(result)
-		// Mock adapter ranks by tag overlap, so the auth entity should rank high
-		// for auth query and low for styling query.
-		expect(result.metrics.mrr).toBeGreaterThan(0)
-	})
-})
diff --git a/packages/zosma-mem/src/evals/cli/bin.ts b/packages/zosma-mem/src/evals/cli/bin.ts
deleted file mode 100644
index 4c8ab1d..0000000
--- a/packages/zosma-mem/src/evals/cli/bin.ts
+++ /dev/null
@@ -1,133 +0,0 @@
-#!/usr/bin/env node
-/**
- * zosma-mem-eval CLI entry point.
- *
- * Usage:
- *   zosma-mem-eval --adapter ./my-adapter.js [options]
- *
- * The adapter module must export a default or named `adapter` that satisfies
- * the MemoryAdapter interface.
- */
-
-import { writeFile } from "node:fs/promises"
-import { resolve } from "node:path"
-import { render } from "ink"
-import { Command } from "commander"
-import chalk from "chalk"
-import { createElement } from "react"
-import { builtInScenarios } from "../scenarios/index.js"
-import { renderMarkdownReport } from "../report.js"
-import { runEvals } from "../runner.js"
-import type { EvalReport, MemoryAdapter } from "../types.js"
-import { App } from "./components/App.js"
-
-const program = new Command()
-
-program
-	.name("zosma-mem-eval")
-	.description("Run the zosma-mem evaluation suite against a memory engine adapter.")
-	.requiredOption("--adapter <path>", "Path to a JS/TS module exporting a MemoryAdapter")
-	.option("--scenarios <names>", "Comma-separated scenario names to run (default: all)")
-	.option("--k <number>", "Top-K for precision/recall (default: 5)", "5")
-	.option("--ci", "Disable interactive Ink UI, output plain markdown to stdout")
-	.option("--json", "Output raw JSON report to stdout")
-	.option("--out <path>", "Write markdown report to a file")
-	.parse(process.argv)
-
-const opts = program.opts<{
-	adapter: string
-	scenarios?: string
-	k: string
-	ci?: boolean
-	json?: boolean
-	out?: string
-}>()
-
-const loadAdapter = async (adapterPath: string): Promise<MemoryAdapter> => {
-	const absolutePath = resolve(adapterPath)
-	const mod = await import(absolutePath) as Record<string, unknown>
-	const adapter = (mod.default ?? mod.adapter) as MemoryAdapter | undefined
-
-	if (!adapter || typeof adapter.setup !== "function") {
-		console.error(
-			chalk.red(
-				`Error: adapter module at "${adapterPath}" must export a default or named "adapter" that satisfies the MemoryAdapter interface.`,
-			),
-		)
-		process.exit(1)
-	}
-
-	return adapter
-}
-
-const filterScenarios = (names?: string) => {
-	if (!names) return builtInScenarios
-	const requested = names.split(",").map((n) => n.trim().toLowerCase())
-	return builtInScenarios.filter((s) => requested.includes(s.name.toLowerCase()))
-}
-
-const writeReport = async (report: EvalReport, outPath: string) => {
-	const markdown = renderMarkdownReport(report)
-	await writeFile(outPath, markdown, "utf8")
-	console.log(chalk.green(`Report written to ${outPath}`))
-}
-
-const main = async () => {
-	const adapter = await loadAdapter(opts.adapter)
-	const scenarios = filterScenarios(opts.scenarios)
-	const k = Number.parseInt(opts.k, 10)
-	const isCi = Boolean(opts.ci) || !process.stdout.isTTY
-
-	if (isCi || opts.json) {
-		// Plain mode: no Ink, just run and print.
-		const report = await runEvals({
-			adapter,
-			scenarios,
-			k,
-			onScenarioStart: (name) => {
-				if (!opts.json) process.stdout.write(`  running: ${name}\n`)
-			},
-			onScenarioEnd: (name, result) => {
-				if (!opts.json) {
-					const icon = result.passed ? chalk.green("✓") : chalk.red("✗")
-					process.stdout.write(`  ${icon} ${name}\n`)
-				}
-			},
-		})
-
-		if (opts.json) {
-			process.stdout.write(`${JSON.stringify(report, null, 2)}\n`)
-		} else {
-			process.stdout.write(`\n${renderMarkdownReport(report)}\n`)
-		}
-
-		if (opts.out) await writeReport(report, opts.out)
-
-		process.exit(report.summary.failed > 0 ? 1 : 0)
-	} else {
-		// Interactive Ink mode.
-		let finalReport: EvalReport | null = null
-
-		const { waitUntilExit } = render(
-			createElement(App, {
-				adapter,
-				scenarios,
-				k,
-				onComplete: (r: EvalReport) => {
-					finalReport = r
-				},
-			}),
-		)
-
-		await waitUntilExit()
-
-		if (opts.out && finalReport) await writeReport(finalReport, opts.out)
-
-		process.exit(finalReport && (finalReport as EvalReport).summary.failed > 0 ? 1 : 0)
-	}
-}
-
-main().catch((err) => {
-	console.error(chalk.red("Fatal:"), err instanceof Error ? err.message : err)
-	process.exit(1)
-})
diff --git a/packages/zosma-mem/src/evals/cli/components/App.tsx b/packages/zosma-mem/src/evals/cli/components/App.tsx
deleted file mode 100644
index 6d95423..0000000
--- a/packages/zosma-mem/src/evals/cli/components/App.tsx
+++ /dev/null
@@ -1,98 +0,0 @@
-import { Box, Text, useApp } from "ink"
-import type React from "react"
-import { useEffect, useRef, useState } from "react"
-import { runEvals } from "../../runner.js"
-import type { EvalReport, MemoryAdapter, ScenarioDefinition, ScenarioResult } from "../../types.js"
-import { ErrorDisplay } from "./ErrorDisplay.js"
-import { ScenarioRow } from "./ScenarioRow.js"
-import { SummaryTable } from "./SummaryTable.js"
-
-type ScenarioStatus = "pending" | "running" | "done"
-
-interface ScenarioState {
-	name: string
-	status: ScenarioStatus
-	result?: ScenarioResult
-}
-
-interface Props {
-	adapter: MemoryAdapter
-	scenarios?: ScenarioDefinition[]
-	k?: number
-	onComplete: (report: EvalReport) => void
-}
-
-export const App: React.FC<Props> = ({ adapter, scenarios, k, onComplete }) => {
-	const { exit } = useApp()
-	const [states, setStates] = useState<ScenarioState[]>([])
-	const [report, setReport] = useState<EvalReport | null>(null)
-	const [error, setError] = useState<string | null>(null)
-
-	// Capture props in a ref so the effect dependency array stays stable.
-	// The CLI renders once and never re-renders with different props.
-	const optsRef = useRef({ adapter, scenarios, k, onComplete, exit })
-
-	useEffect(() => {
-		const { adapter: a, scenarios: sc, k: topK, onComplete: done, exit: quit } = optsRef.current
-
-		const run = async () => {
-			try {
-				const result = await runEvals({
-					adapter: a,
-					scenarios: sc,
-					k: topK,
-					onScenarioStart: (name) => {
-						setStates((prev) => {
-							const next = [...prev]
-							const idx = next.findIndex((s) => s.name === name)
-							if (idx >= 0) {
-								next[idx] = { ...next[idx], status: "running" }
-							} else {
-								next.push({ name, status: "running" })
-							}
-							return next
-						})
-					},
-					onScenarioEnd: (name, scenarioResult) => {
-						setStates((prev) => {
-							const next = [...prev]
-							const idx = next.findIndex((s) => s.name === name)
-							if (idx >= 0) {
-								next[idx] = { name, status: "done", result: scenarioResult }
-							}
-							return next
-						})
-					},
-				})
-
-				setReport(result)
-				done(result)
-			} catch (err) {
-				setError(err instanceof Error ? err.message : String(err))
-			} finally {
-				quit()
-			}
-		}
-
-		// Initialise state with pending entries before running.
-		const scenarioList = sc ?? []
-		setStates(scenarioList.map((s) => ({ name: s.name, status: "pending" })))
-		run()
-	}, [])
-
-	if (error) {
-		return <ErrorDisplay message={error} />
-	}
-
-	return (
-		<Box flexDirection="column" padding={1}>
-			<Text bold>zosma-mem eval</Text>
-			<Box flexDirection="column" marginTop={1}>
-				{states.map((s) => (
-					<ScenarioRow key={s.name} name={s.name} status={s.status} result={s.result} />
-				))}
-			</Box>
-			{report ? <SummaryTable report={report} /> : null}
-		</Box>
-	)
-}
diff --git a/packages/zosma-mem/src/evals/cli/components/ErrorDisplay.tsx b/packages/zosma-mem/src/evals/cli/components/ErrorDisplay.tsx
deleted file mode 100644
index 25d385b..0000000
--- a/packages/zosma-mem/src/evals/cli/components/ErrorDisplay.tsx
+++ /dev/null
@@ -1,15 +0,0 @@
-import { Box, Text } from "ink"
-import type React from "react"
-
-interface Props {
-	message: string
-}
-
-export const ErrorDisplay: React.FC<Props> = ({ message }) => (
-	<Box flexDirection="column" marginTop={1} borderStyle="round" borderColor="red" paddingX={1}>
-		<Text color="red" bold>
-			Error
-		</Text>
-		<Text>{message}</Text>
-	</Box>
-)
diff --git a/packages/zosma-mem/src/evals/cli/components/ScenarioRow.tsx b/packages/zosma-mem/src/evals/cli/components/ScenarioRow.tsx
deleted file mode 100644
index 460adc2..0000000
--- a/packages/zosma-mem/src/evals/cli/components/ScenarioRow.tsx
+++ /dev/null
@@ -1,51 +0,0 @@
-import { Text } from "ink"
-import Spinner from "ink-spinner"
-import type React from "react"
-import type { ScenarioResult } from "../../types.js"
-
-interface Props {
-	name: string
-	status: "pending" | "running" | "done"
-	result?: ScenarioResult
-}
-
-export const ScenarioRow: React.FC<Props> = ({ name, status, result }) => {
-	if (status === "pending") {
-		return (
-			<Text>
-				<Text color="gray">{"  "}</Text>
-				<Text dimColor>{name}</Text>
-			</Text>
-		)
-	}
-
-	if (status === "running") {
-		return (
-			<Text>
-				<Text color="cyan">
-					<Spinner type="dots" />
-				</Text>
-				<Text>{" "}</Text>
-				<Text>{name}</Text>
-			</Text>
-		)
-	}
-
-	const icon = result?.passed ? "✓" : "✗"
-	const color = result?.passed ? "green" : "red"
-	const p = result?.metrics.precisionAtK.toFixed(3) ?? "-"
-	const r = result?.metrics.recallAtK.toFixed(3) ?? "-"
-	const m = result?.metrics.mrr.toFixed(3) ?? "-"
-
-	return (
-		<Text>
-			<Text color={color}>{icon}</Text>
-			<Text>{" "}</Text>
-			<Text>{name.padEnd(30)}</Text>
-			<Text dimColor>{`P@K:${p}  R@K:${r}  MRR:${m}`}</Text>
-			{!result?.passed && result?.details ? (
-				<Text color="red">{`  -- ${result.details}`}</Text>
-			) : null}
-		</Text>
-	)
-}
diff --git a/packages/zosma-mem/src/evals/cli/components/SummaryTable.tsx b/packages/zosma-mem/src/evals/cli/components/SummaryTable.tsx
deleted file mode 100644
index dd9c3fe..0000000
--- a/packages/zosma-mem/src/evals/cli/components/SummaryTable.tsx
+++ /dev/null
@@ -1,32 +0,0 @@
-import { Box, Text } from "ink"
-import type React from "react"
-import type { EvalReport } from "../../types.js"
-
-interface Props {
-	report: EvalReport
-}
-
-export const SummaryTable: React.FC<Props> = ({ report }) => {
-	const { summary } = report
-	const allPassed = summary.failed === 0
-
-	return (
-		<Box flexDirection="column" marginTop={1}>
-			<Text bold>Summary</Text>
-			<Text>
-				{"  Scenarios: "}
-				<Text color={allPassed ? "green" : "red"} bold>
-					{`${summary.passed}/${summary.total} passed`}
-				</Text>
-			</Text>
-			<Text>
-				{"  Avg P@K: "}
-				<Text bold>{summary.avgPrecision.toFixed(3)}</Text>
-				{"  Avg R@K: "}
-				<Text bold>{summary.avgRecall.toFixed(3)}</Text>
-				{"  Avg MRR: "}
-				<Text bold>{summary.avgMrr.toFixed(3)}</Text>
-			</Text>
-		</Box>
-	)
-}
diff --git a/packages/zosma-mem/src/evals/cli/simple-eval.ts b/packages/zosma-mem/src/evals/cli/simple-eval.ts
deleted file mode 100644
index 36d3b67..0000000
--- a/packages/zosma-mem/src/evals/cli/simple-eval.ts
+++ /dev/null
@@ -1,201 +0,0 @@
-#!/usr/bin/env node
-
-/**
- * zosma-mem - Zero-config memory evaluation
- *
- * Just run it - it'll find and evaluate your memory system automatically.
- */
-
-import { existsSync, readFileSync } from "node:fs"
-import { join } from "node:path"
-import { builtInScenarios } from "../scenarios/index.js"
-import { runEvals } from "../runner.js"
-import { renderMarkdownReport } from "../report.js"
-import { MemoryAdapter, MemoryEvent, DeterministicClock } from "../types.js"
-
-interface MemoryInfo {
-  type: "openzosma" | "file"
-  path: string
-}
-
-interface StoredMemoryEvent extends MemoryEvent {
-  usageCount: number
-  lastRetrieved: number
-}
-
-const detectMemory = (): MemoryInfo | null => {
-  const cwd = process.cwd()
-
-  // Check for OpenZosma memory
-  const openzosmaPath = join(cwd, "packages/gateway/workspace/agents/default/memory/MEMORY.md")
-  if (existsSync(openzosmaPath)) {
-    return { type: "openzosma", path: openzosmaPath }
-  }
-
-  // Check for generic memory files
-  const memoryFiles = ["MEMORY.md", "memory.md", ".memory.md"]
-  for (const file of memoryFiles) {
-    const path = join(cwd, file)
-    if (existsSync(path)) {
-      return { type: "file", path }
-    }
-  }
-
-  return null
-}
-
-const createMemoryAdapter = (memoryInfo: MemoryInfo): MemoryAdapter => {
-  const events = new Map<string, StoredMemoryEvent>()
-  let clock: DeterministicClock = { now: () => Date.now(), advance: () => {} }
-
-  const loadMemory = () => {
-    if (memoryInfo.type === "openzosma") {
-      // Parse OpenZosma format: <!-- timestamp [hash] -->\ncontent
-      const content = readFileSync(memoryInfo.path, "utf-8")
-      const lines = content.split("\n")
-      let currentEvent: Partial<MemoryEvent> | null = null
-
-      for (const line of lines) {
-        const match = line.match(/^<!-- (\d+) \[([a-f0-9]+)\] -->$/)
-        if (match) {
-          if (currentEvent && currentEvent.id) {
-            events.set(currentEvent.id, { ...currentEvent, usageCount: 0, lastRetrieved: 0 } as StoredMemoryEvent)
-          }
-          const [, ts, id] = match
-          currentEvent = {
-            id,
-            type: "preference",
-            content: "",
-            tags: ["user", "memory"],
-            timestamp: parseInt(ts)
-          }
-        } else if (currentEvent && line.trim()) {
-          currentEvent.content += line + "\n"
-        }
-      }
-      if (currentEvent && currentEvent.id) {
-        events.set(currentEvent.id, { ...currentEvent, usageCount: 0, lastRetrieved: 0 } as StoredMemoryEvent)
-      }
-    } else {
-      // Simple file format
-      const content = readFileSync(memoryInfo.path, "utf-8")
-      content.split("\n").forEach((line, i) => {
-        if (line.trim()) {
-          events.set(`entry-${i}`, {
-            id: `entry-${i}`,
-            type: "note",
-            content: line.trim(),
-            tags: [],
-            timestamp: Date.now() - (i * 1000),
-            usageCount: 0,
-            lastRetrieved: 0
-          })
-        }
-      })
-    }
-  }
-
-  return {
-    setup: async (opts) => {
-      clock = opts.clock
-      loadMemory()
-    },
-
-    ingest: async (event: MemoryEvent) => {
-      events.set(event.id, { ...event, usageCount: 0, lastRetrieved: 0 })
-    },
-
-    retrieve: async (query, topK) => {
-      const queryWords = new Set(query.text.toLowerCase().split(/\s+/))
-      const queryTags = new Set(query.tags || [])
-
-      const scored = Array.from(events.values()).map((stored) => {
-        let score = 0
-
-        // Tag matching
-        const tagMatches = stored.tags.filter(tag => queryTags.has(tag.toLowerCase())).length
-        score += tagMatches * 2
-
-        // Content matching
-        const contentWords = new Set(stored.content.toLowerCase().split(/\s+/))
-        const wordMatches = Array.from(queryWords).filter(word => contentWords.has(word)).length
-        score += wordMatches
-
-        // Recency boost
-        const ageHours = (clock.now() - stored.timestamp) / (1000 * 60 * 60)
-        score += Math.max(0, 1 - ageHours / 24) * 0.5
-
-        // Usage boost
-        score += stored.usageCount * 0.1
-
-        return {
-          id: stored.id,
-          content: stored.content.trim(),
-          score: Math.max(0, score),
-          tags: stored.tags
-        }
-      })
-
-      scored.sort((a, b) => b.score - a.score)
-      const top = scored.slice(0, topK)
-
-      // Mark as retrieved
-      for (const item of top) {
-        const stored = events.get(item.id)
-        if (stored) stored.lastRetrieved = clock.now()
-      }
-
-      return top
-    },
-
-    recordUsage: async (entityId: string, signal) => {
-      const stored = events.get(entityId)
-      if (stored && signal === "used") {
-        stored.usageCount++
-      }
-    },
-
-    gc: async () => ({ removedCount: 0, archivedCount: 0, consolidatedCount: 0 }),
-
-    advanceTime: async (ms: number) => {
-      clock.advance(ms)
-    },
-
-    listEntities: async () => Array.from(events.keys()),
-
-    teardown: async () => {
-      events.clear()
-    }
-  }
-}
-
-const main = async (): Promise<void> => {
-  const memory = detectMemory()
-
-  if (!memory) {
-    console.log("❌ No memory system found!")
-    console.log("")
-    console.log("To use zosma-mem, create one of:")
-    console.log("• MEMORY.md (generic format)")
-    console.log("• packages/gateway/workspace/agents/default/memory/MEMORY.md (OpenZosma)")
-    console.log("")
-    console.log("Run from your project root.")
-    process.exit(1)
-  }
-
-  console.log(`✅ Found ${memory.type} memory at ${memory.path}`)
-
-  const adapter = createMemoryAdapter(memory)
-  const report = await runEvals({ adapter, scenarios: builtInScenarios, k: 5 })
-
-  console.log("")
-  console.log(renderMarkdownReport(report))
-
-  if (report.summary.passed === report.summary.total) {
-    console.log("🎉 All tests passed!")
-  } else {
-    console.log(`❌ ${report.summary.failed} tests failed`)
-  }
-}
-
-main().catch(console.error)
\ No newline at end of file
diff --git a/packages/zosma-mem/src/evals/index.ts b/packages/zosma-mem/src/evals/index.ts
deleted file mode 100644
index 7e55de8..0000000
--- a/packages/zosma-mem/src/evals/index.ts
+++ /dev/null
@@ -1,56 +0,0 @@
-/**
- * Public API surface for zosma-mem/evals.
- *
- * Import via:
- *   import { runEvals, builtInScenarios } from "zosma-mem/evals"
- */
-
-// Runner
-export { runEvals } from "./runner.js"
-
-// Report
-export { renderMarkdownReport } from "./report.js"
-
-// Scenarios
-export {
-	builtInScenarios,
-	coldStartScenario,
-	repeatedPatternScenario,
-	signalDilutionScenario,
-	staleMemoryScenario,
-	conflictingUpdatesScenario,
-	coAccessClusterScenario,
-	crossContextScenario,
-} from "./scenarios/index.js"
-
-// Metrics (for custom scenario authors)
-export {
-	computePrecisionAtK,
-	computeRecallAtK,
-	computeMRR,
-	computeNoiseRatio,
-	computeGcEffectiveness,
-	computeSalienceDrift,
-} from "./metrics.js"
-
-// Fixtures and utilities (for custom scenario authors)
-export { createEvent, createQuery, createLowValueEvents, createHighValueEvents } from "./utils/fixtures.js"
-export { createClock, ONE_HOUR_MS, ONE_DAY_MS, ONE_WEEK_MS, THIRTY_DAYS_MS } from "./utils/time.js"
-export { checkMetric, checkAllMetrics, DEFAULT_THRESHOLDS } from "./utils/assertions.js"
-
-// Types
-export type {
-	MemoryAdapter,
-	MemoryEvent,
-	RetrieveQuery,
-	RetrievedEntity,
-	UsageSignal,
-	GcResult,
-	AdapterSetupOpts,
-	DeterministicClock,
-	EvalMetrics,
-	EvalReport,
-	ScenarioDefinition,
-	ScenarioResult,
-	RunnerOpts,
-} from "./types.js"
diff --git a/packages/zosma-mem/src/evals/metrics.ts b/packages/zosma-mem/src/evals/metrics.ts
deleted file mode 100644
index 63d36fd..0000000
--- a/packages/zosma-mem/src/evals/metrics.ts
+++ /dev/null
@@ -1,121 +0,0 @@
-/**
- * Pure metric computation functions for zosma-mem/evals.
- *
- * All functions are stateless and side-effect-free. They accept raw arrays/sets
- * of entity IDs and return a single numeric value. No engine types are imported.
- */
-
-// ---------------------------------------------------------------------------
-// Standard information retrieval metrics
-// ---------------------------------------------------------------------------
-
-/**
- * Precision@K: of the first K retrieved entities, what fraction is relevant?
- *
- * @param retrieved - Ordered list of retrieved entity IDs (most relevant first).
- * @param relevant  - Set of all entity IDs that are considered relevant.
- * @param k         - Cutoff rank.
- * @returns Value in [0, 1]. Returns 0 when k === 0.
- */
-export const computePrecisionAtK = (retrieved: readonly string[], relevant: ReadonlySet<string>, k: number): number => {
-	if (k === 0) return 0
-	const topK = retrieved.slice(0, k)
-	const hits = topK.filter((id) => relevant.has(id)).length
-	return hits / k
-}
-
-/**
- * Recall@K: of all relevant entities, what fraction appeared in the top K?
- *
- * @param retrieved - Ordered list of retrieved entity IDs (most relevant first).
- * @param relevant  - Set of all entity IDs that are considered relevant.
- * @param k         - Cutoff rank.
- * @returns Value in [0, 1]. Returns 1 when `relevant` is empty (vacuously true).
- */
-export const computeRecallAtK = (retrieved: readonly string[], relevant: ReadonlySet<string>, k: number): number => {
-	if (relevant.size === 0) return 1
-	const topK = retrieved.slice(0, k)
-	const hits = topK.filter((id) => relevant.has(id)).length
-	return hits / relevant.size
-}
-
-/**
- * Mean Reciprocal Rank: reciprocal of the rank of the first relevant result.
- *
- * Called "MRR" even though it is computed for a single query here; callers
- * average across queries to get the true MRR.
- *
- * @param retrieved - Ordered list of retrieved entity IDs (most relevant first).
- * @param relevant  - Set of all entity IDs that are considered relevant.
- * @returns Value in (0, 1]. Returns 0 if no relevant entity appears in the list.
- */
-export const computeMRR = (retrieved: readonly string[], relevant: ReadonlySet<string>): number => {
-	for (let i = 0; i < retrieved.length; i++) {
-		if (relevant.has(retrieved[i])) {
-			return 1 / (i + 1)
-		}
-	}
-	return 0
-}
-
-// ---------------------------------------------------------------------------
-// Memory-specific metrics
-// ---------------------------------------------------------------------------
-
-/**
- * Noise ratio: fraction of stored entities never retrieved after ingestion.
- *
- * A high noise ratio means the engine is persisting lots of low-value entities
- * that never surface. Useful for assessing ingestion threshold quality.
- *
- * @param allEntities   - All entity IDs currently persisted by the engine.
- * @param everRetrieved - Set of entity IDs that appeared in at least one result set.
- * @returns Value in [0, 1]. Returns 0 when `allEntities` is empty.
- */
-export const computeNoiseRatio = (
-	allEntities: readonly string[],
-	everRetrieved: ReadonlySet<string>,
-): number => {
-	if (allEntities.length === 0) return 0
-	const noiseCount = allEntities.filter((id) => !everRetrieved.has(id)).length
-	return noiseCount / allEntities.length
-}
-
-/**
- * GC effectiveness: fraction of noise entities removed after GC.
- *
- * @param noiseBeforeGc - Entity IDs that were noise (never retrieved) before GC.
- * @param entitiesAfterGc - All entity IDs persisted after GC runs.
- * @returns Value in [0, 1]. Returns -1 when `noiseBeforeGc` is empty (N/A).
- */
-export const computeGcEffectiveness = (
-	noiseBeforeGc: readonly string[],
-	entitiesAfterGc: readonly string[],
-): number => {
-	if (noiseBeforeGc.length === 0) return -1
-	const afterSet = new Set(entitiesAfterGc)
-	const removed = noiseBeforeGc.filter((id) => !afterSet.has(id)).length
-	return removed / noiseBeforeGc.length
-}
-
-/**
- * Salience drift: standard deviation of entity scores across GC cycles.
- *
- * A high drift value indicates the scoring function is unstable -- entities
- * oscillate in relevance across cycles rather than converging.
- *
- * @param scoreSnapshots - Array of score arrays, one per GC cycle.
- *                         Each inner array contains one score per entity.
- * @returns Standard deviation across all scores. Returns -1 when fewer than
- *          two cycles are provided (not enough data).
- */
-export const computeSalienceDrift = (scoreSnapshots: ReadonlyArray<readonly number[]>): number => {
-	if (scoreSnapshots.length < 2) return -1
-
-	const allScores: number[] = scoreSnapshots.flat()
-	if (allScores.length === 0) return -1
-
-	const mean = allScores.reduce((sum, s) => sum + s, 0) / allScores.length
-	const variance = allScores.reduce((sum, s) => sum + (s - mean) ** 2, 0) / allScores.length
-	return Math.sqrt(variance)
-}
diff --git a/packages/zosma-mem/src/evals/report.ts b/packages/zosma-mem/src/evals/report.ts
deleted file mode 100644
index 71241e3..0000000
--- a/packages/zosma-mem/src/evals/report.ts
+++ /dev/null
@@ -1,70 +0,0 @@
-/**
- * Markdown report renderer for zosma-mem/evals.
- *
- * Produces a CI-friendly markdown table from an EvalReport.
- * No external dependencies -- pure string manipulation.
- */
-
-import type { EvalReport } from "./types.js"
-
-const fmt = (n: number): string => {
-	if (n === -1) return " -- "
-	return n.toFixed(3)
-}
-
-const pad = (s: string, width: number): string => s.padEnd(width)
-
-/**
- * Render an EvalReport as a markdown string suitable for CI logs, PR comments,
- * or writing to a file with --out.
- */
-export const renderMarkdownReport = (report: EvalReport): string => {
-	const date = new Date(report.timestamp).toISOString()
-
-	const headers = ["Scenario", "P@K", "R@K", "MRR", "Noise", "GC Eff", "Drift", "Pass"]
-	const rows = report.results.map((r) => [
-		r.scenario,
-		fmt(r.metrics.precisionAtK),
-		fmt(r.metrics.recallAtK),
-		fmt(r.metrics.mrr),
-		fmt(r.metrics.noiseRatio),
-		fmt(r.metrics.gcEffectiveness),
-		fmt(r.metrics.salienceDrift),
-		r.passed ? "yes" : "NO",
-	])
-
-	// Compute column widths.
-	const colWidths = headers.map((h, i) =>
-		Math.max(h.length, ...rows.map((r) => r[i].length)),
-	)
-
-	const header = `| ${headers.map((h, i) => pad(h, colWidths[i])).join(" | ")} |`
-	const divider = `| ${colWidths.map((w) => "-".repeat(w)).join(" | ")} |`
-	const body = rows
-		.map((row) => `| ${row.map((cell, i) => pad(cell, colWidths[i])).join(" | ")} |`)
-		.join("\n")
-
-	const failureDetails = report.results
-		.filter((r) => !r.passed && r.details)
-		.map((r) => `**${r.scenario}**: ${r.details}`)
-		.join("\n")
-
-	const lines: string[] = [
-		`## zosma-mem Eval Report -- ${date}`,
-		"",
-		header,
-		divider,
-		body,
-		"",
-		`Summary: ${report.summary.passed}/${report.summary.total} passed.` +
-			` Avg P@K: ${report.summary.avgPrecision.toFixed(3)},` +
-			` Avg R@K: ${report.summary.avgRecall.toFixed(3)},` +
-			` Avg MRR: ${report.summary.avgMrr.toFixed(3)}`,
-	]
-
-	if (failureDetails) {
-		lines.push("", "### Failures", "", failureDetails)
-	}
-
-	return lines.join("\n")
-}
diff --git a/packages/zosma-mem/src/evals/runner.ts b/packages/zosma-mem/src/evals/runner.ts
deleted file mode 100644
index 232c341..0000000
--- a/packages/zosma-mem/src/evals/runner.ts
+++ /dev/null
@@ -1,128 +0,0 @@
-/**
- * Scenario runner for zosma-mem/evals.
- *
- * Orchestrates the full lifecycle for each scenario:
- *   1. Create an isolated temp directory.
- *   2. Instantiate a deterministic clock.
- *   3. Call adapter.setup().
- *   4. Execute the scenario.
- *   5. Call adapter.teardown() (always, even on failure).
- *   6. Remove the temp directory.
- *   7. Aggregate results into an EvalReport.
- */
-
-import { mkdtemp, rm } from "node:fs/promises"
-import { tmpdir } from "node:os"
-import { join } from "node:path"
-import { createClock } from "./utils/time.js"
-import { builtInScenarios } from "./scenarios/index.js"
-import type { EvalReport, RunnerOpts, ScenarioResult } from "./types.js"
-
-const DEFAULT_K = 5
-const DEFAULT_CONCURRENCY = 1
-
-/**
- * Run the eval suite against the provided adapter.
- *
- * @param opts - Runner options. Only `adapter` is required.
- * @returns A structured EvalReport with per-scenario metrics and a summary.
- */
-export const runEvals = async (opts: RunnerOpts): Promise<EvalReport> => {
-	const { adapter, k = DEFAULT_K, thresholds = {}, concurrency = DEFAULT_CONCURRENCY } = opts
-	const scenarios = opts.scenarios ?? builtInScenarios
-
-	// Run with controlled concurrency.
-	const results: Array<{ scenario: string; metrics: ScenarioResult["metrics"]; passed: boolean; details: string }> = []
-	const queue = [...scenarios]
-
-	const runNext = async (): Promise<void> => {
-		const scenario = queue.shift()
-		if (!scenario) return
-
-		opts.onScenarioStart?.(scenario.name)
-
-		let result: ScenarioResult
-		const workDir = await mkdtemp(join(tmpdir(), `zosma-mem-eval-${scenario.name.replace(/\s+/g, "-")}-`))
-		const clock = createClock()
-
-		try {
-			await adapter.setup({ workDir, clock })
-			result = await scenario.run(adapter, clock)
-		} catch (err) {
-			result = {
-				metrics: {
-					precisionAtK: 0,
-					recallAtK: 0,
-					mrr: 0,
-					noiseRatio: 0,
-					gcEffectiveness: -1,
-					salienceDrift: -1,
-				},
-				passed: false,
-				details: err instanceof Error ? err.message : String(err),
-			}
-		} finally {
-			try {
-				await adapter.teardown()
-			} catch {
-				// teardown failures are non-fatal -- the scenario result stands
-			}
-			await rm(workDir, { recursive: true, force: true })
-		}
-
-		// Apply runner-level threshold overrides on top of scenario defaults.
-		if (Object.keys(thresholds).length > 0 && result.passed) {
-			const { checkAllMetrics } = await import("./utils/assertions.js")
-			const failures = checkAllMetrics(result.metrics, thresholds)
-			if (failures.length > 0) {
-				result = { ...result, passed: false, details: failures.join("; ") }
-			}
-		}
-
-		// Attach K to metrics context (not stored on the type, used by scenarios internally).
-		void k // k is passed to scenarios via RunnerOpts; they reference it through the closure
-
-		results.push({
-			scenario: scenario.name,
-			metrics: result.metrics,
-			passed: result.passed,
-			details: result.details,
-		})
-
-		opts.onScenarioEnd?.(scenario.name, result)
-	}
-
-	// Build a pool of `concurrency` runners.
-	const workers = Array.from({ length: Math.max(1, concurrency) }, () => {
-		const drain = async (): Promise<void> => {
-			while (queue.length > 0) {
-				await runNext()
-			}
-		}
-		return drain()
-	})
-	await Promise.all(workers)
-
-	const passed = results.filter((r) => r.passed).length
-	const failed = results.length - passed
-
-	const avgPrecision =
-		results.length > 0 ? results.reduce((s, r) => s + r.metrics.precisionAtK, 0) / results.length : 0
-	const avgRecall =
-		results.length > 0 ? results.reduce((s, r) => s + r.metrics.recallAtK, 0) / results.length : 0
-	const avgMrr =
-		results.length > 0 ? results.reduce((s, r) => s + r.metrics.mrr, 0) / results.length : 0
-
-	return {
-		timestamp: Date.now(),
-		results,
-		summary: {
-			total: results.length,
-			passed,
-			failed,
-			avgPrecision,
-			avgRecall,
-			avgMrr,
-		},
-	}
-}
diff --git a/packages/zosma-mem/src/evals/scenarios/co-access-cluster.ts b/packages/zosma-mem/src/evals/scenarios/co-access-cluster.ts
deleted file mode 100644
index 77f3ea4..0000000
--- a/packages/zosma-mem/src/evals/scenarios/co-access-cluster.ts
+++ /dev/null
@@ -1,70 +0,0 @@
-/**
- * Scenario 6: Co-access cluster
- *
- * Three entities (A, B, C) are always retrieved together during a series of
- * usage sessions. Each time A is retrieved and used, B and C are also
- * retrieved and used. Later, a query is issued that directly matches only A.
- * All three must appear in the top K -- demonstrating that the engine surfaces
- * contextually related entities (co-access boost).
- *
- * Tests: co-access / relational memory clustering.
- */
-
-import { computeMRR, computePrecisionAtK, computeRecallAtK, computeNoiseRatio } from "../metrics.js"
-import { checkAllMetrics } from "../utils/assertions.js"
-import { createEvent, createQuery } from "../utils/fixtures.js"
-import type { DeterministicClock, MemoryAdapter, ScenarioDefinition, ScenarioResult } from "../types.js"
-
-const K = 5
-// All 3 cluster members must appear in top-5.
-const THRESHOLDS = { recallAtK: 1.0, precisionAtK: 0.6 }
-
-const run = async (adapter: MemoryAdapter, clock: DeterministicClock): Promise<ScenarioResult> => {
-	let t = clock.now()
-
-	// Ingest the three cluster entities.
-	await adapter.ingest(createEvent({ id: "auth-flow", type: "decision", content: "OAuth2 flow: redirect to /authorize, exchange code for token.", tags: ["auth", "oauth", "flow"], timestamp: t }))
-	await adapter.ingest(createEvent({ id: "retry-logic", type: "pattern", content: "Retry token refresh up to 3 times with exponential backoff.", tags: ["auth", "retry", "token"], timestamp: t + 1 }))
-	await adapter.ingest(createEvent({ id: "timeout-handling", type: "error", content: "If token refresh times out after 5s, force re-login.", tags: ["auth", "timeout", "session"], timestamp: t + 2 }))
-
-	// Ingest unrelated entities to pad the store.
-	await adapter.ingest(createEvent({ id: "ci-config", type: "pattern", content: "Run tests on every PR using GitHub Actions.", tags: ["ci", "testing"], timestamp: t + 3 }))
-	await adapter.ingest(createEvent({ id: "deploy-strategy", type: "decision", content: "Blue-green deployment via Kubernetes rolling updates.", tags: ["deploy", "k8s"], timestamp: t + 4 }))
-
-	// Simulate 3 sessions where A, B, C are always retrieved together.
-	for (let session = 0; session < 3; session++) {
-		clock.advance(60_000)
-		t = clock.now()
-
-		await adapter.recordUsage("auth-flow", "influenced_decision")
-		await adapter.recordUsage("retry-logic", "used")
-		await adapter.recordUsage("timeout-handling", "used")
-	}
-
-	// Query that directly matches only auth-flow.
-	const query = createQuery({ text: "How does the OAuth2 authentication flow work?", tags: ["auth", "oauth"] })
-	const results = await adapter.retrieve(query, K)
-	const retrieved = results.map((r) => r.id)
-	const clusterIds = ["auth-flow", "retry-logic", "timeout-handling"]
-	const relevantSet = new Set(clusterIds)
-	const everRetrieved = new Set(retrieved)
-	const allEntities = await adapter.listEntities()
-
-	const metrics = {
-		precisionAtK: computePrecisionAtK(retrieved, relevantSet, K),
-		recallAtK: computeRecallAtK(retrieved, relevantSet, K),
-		mrr: computeMRR(retrieved, relevantSet),
-		noiseRatio: computeNoiseRatio(allEntities, everRetrieved),
-		gcEffectiveness: -1,
-		salienceDrift: -1,
-	}
-
-	const failures = checkAllMetrics(metrics, THRESHOLDS)
-	return { metrics, passed: failures.length === 0, details: failures.join("; ") }
-}
-
-export const coAccessClusterScenario: ScenarioDefinition = {
-	name: "Co-access cluster",
-	description: "Three entities always used together; querying one must surface all three in top K.",
-	run,
-}
diff --git a/packages/zosma-mem/src/evals/scenarios/cold-start.ts b/packages/zosma-mem/src/evals/scenarios/cold-start.ts
deleted file mode 100644
index aa7ebd4..0000000
--- a/packages/zosma-mem/src/evals/scenarios/cold-start.ts
+++ /dev/null
@@ -1,59 +0,0 @@
-/**
- * Scenario 1: Cold start
- *
- * An empty engine ingests a mixed set of events (decisions, errors, patterns,
- * preferences). A targeted query is issued. The engine must surface the
- * semantically relevant events in the top K.
- *
- * Tests: basic ingestion and retrieval with no prior state.
- */
-
-import { computeMRR, computePrecisionAtK, computeRecallAtK, computeNoiseRatio } from "../metrics.js"
-import { checkAllMetrics } from "../utils/assertions.js"
-import { createEvent, createQuery } from "../utils/fixtures.js"
-import type { DeterministicClock, MemoryAdapter, ScenarioDefinition, ScenarioResult } from "../types.js"
-
-const K = 5
-
-const THRESHOLDS = { precisionAtK: 0.6, recallAtK: 0.8, mrr: 0.5 }
-
-const run = async (adapter: MemoryAdapter, clock: DeterministicClock): Promise<ScenarioResult> => {
-	const t = clock.now()
-
-	// Ingest 10 events -- 3 relevant (tagged "auth"), 7 irrelevant noise.
-	const relevant = ["auth-decision", "auth-error", "auth-pattern"]
-
-	await adapter.ingest(createEvent({ id: "auth-decision", type: "decision", content: "Use short-lived JWTs with refresh token rotation.", tags: ["auth", "security"], timestamp: t }))
-	await adapter.ingest(createEvent({ id: "auth-error", type: "error", content: "Session invalidated on password reset -- must revoke all tokens.", tags: ["auth", "session"], timestamp: t + 1 }))
-	await adapter.ingest(createEvent({ id: "auth-pattern", type: "pattern", content: "Always validate token expiry before issuing a new one.", tags: ["auth", "token"], timestamp: t + 2 }))
-
-	// Noise events -- different domain.
-	for (let i = 0; i < 7; i++) {
-		await adapter.ingest(createEvent({ id: `noise-${i}`, type: "pattern", content: `Styling preference ${i}: use 4-space indentation.`, tags: ["style"], timestamp: t + 3 + i }))
-	}
-
-	const query = createQuery({ text: "How should authentication tokens be managed?", tags: ["auth"] })
-	const results = await adapter.retrieve(query, K)
-	const retrieved = results.map((r) => r.id)
-	const relevantSet = new Set(relevant)
-	const everRetrieved = new Set(retrieved)
-	const allEntities = await adapter.listEntities()
-
-	const metrics = {
-		precisionAtK: computePrecisionAtK(retrieved, relevantSet, K),
-		recallAtK: computeRecallAtK(retrieved, relevantSet, K),
-		mrr: computeMRR(retrieved, relevantSet),
-		noiseRatio: computeNoiseRatio(allEntities, everRetrieved),
-		gcEffectiveness: -1,
-		salienceDrift: -1,
-	}
-
-	const failures = checkAllMetrics(metrics, THRESHOLDS)
-	return { metrics, passed: failures.length === 0, details: failures.join("; ") }
-}
-
-export const coldStartScenario: ScenarioDefinition = {
-	name: "Cold start",
-	description: "Empty engine ingests 10 events (3 relevant) and retrieves for an auth query.",
-	run,
-}
diff --git a/packages/zosma-mem/src/evals/scenarios/conflicting-updates.ts b/packages/zosma-mem/src/evals/scenarios/conflicting-updates.ts
deleted file mode 100644
index 2ce3358..0000000
--- a/packages/zosma-mem/src/evals/scenarios/conflicting-updates.ts
+++ /dev/null
@@ -1,83 +0,0 @@
-/**
- * Scenario 5: Conflicting updates
- *
- * The same logical entity is ingested 4 times with progressively updated
- * content (simulating a fact that evolved over sessions). The most recent
- * version must appear first in retrieval results.
- *
- * Tests: last-write-wins / recency preference for updated entities.
- */
-
-import { computeMRR, computePrecisionAtK, computeRecallAtK, computeNoiseRatio } from "../metrics.js"
-import { checkAllMetrics } from "../utils/assertions.js"
-import { createEvent, createQuery } from "../utils/fixtures.js"
-import type { DeterministicClock, MemoryAdapter, ScenarioDefinition, ScenarioResult } from "../types.js"
-
-const K = 5
-const THRESHOLDS = { mrr: 1.0 }
-
-const run = async (adapter: MemoryAdapter, clock: DeterministicClock): Promise<ScenarioResult> => {
-	let t = clock.now()
-
-	const entityId = "db-schema-decision"
-	const versions = [
-		"Initial: use a single users table with a role column.",
-		"Update: split roles into a separate roles table for normalisation.",
-		"Update: add an audit_log table for compliance tracking.",
-		"Final: add soft-delete (deleted_at) to users; audit_log is append-only.",
-	]
-
-	// Ingest all 4 versions of the same entity.
-	for (const content of versions) {
-		await adapter.ingest(
-			createEvent({
-				id: entityId,
-				type: "decision",
-				content,
-				tags: ["database", "schema", "users"],
-				timestamp: t,
-			}),
-		)
-		clock.advance(60_000) // 1 minute between updates
-		t = clock.now()
-	}
-
-	// Add an unrelated entity to ensure ranking is non-trivial.
-	await adapter.ingest(
-		createEvent({ id: "cache-strategy", type: "pattern", content: "Use Redis for session caching.", tags: ["cache", "redis"], timestamp: t }),
-	)
-
-	const query = createQuery({ text: "What is the current database schema for users?", tags: ["database", "schema"] })
-	const results = await adapter.retrieve(query, K)
-	const retrieved = results.map((r) => r.id)
-	const relevantSet = new Set([entityId])
-	const everRetrieved = new Set(retrieved)
-	const allEntities = await adapter.listEntities()
-
-	// Additionally verify that the content of the top result reflects the latest version.
-	const topResult = results[0]
-	const contentIsLatest = topResult?.id === entityId && topResult.content.includes("soft-delete")
-	const contentDetails = topResult?.id === entityId && !contentIsLatest
-		? `top result content does not reflect latest version (got: "${topResult.content?.slice(0, 60)}")`
-		: ""
-
-	const metrics = {
-		precisionAtK: computePrecisionAtK(retrieved, relevantSet, K),
-		recallAtK: computeRecallAtK(retrieved, relevantSet, K),
-		mrr: computeMRR(retrieved, relevantSet),
-		noiseRatio: computeNoiseRatio(allEntities, everRetrieved),
-		gcEffectiveness: -1,
-		salienceDrift: -1,
-	}
-
-	const failures = checkAllMetrics(metrics, THRESHOLDS)
-	if (contentDetails) failures.push(contentDetails)
-
-	return { metrics, passed: failures.length === 0, details: failures.join("; ") }
-}
-
-export const conflictingUpdatesScenario: ScenarioDefinition = {
-	name: "Conflicting updates",
-	description: "Entity ingested 4 times with evolving content; most recent version must rank first.",
-	run,
-}
diff --git a/packages/zosma-mem/src/evals/scenarios/cross-context.ts b/packages/zosma-mem/src/evals/scenarios/cross-context.ts
deleted file mode 100644
index d52770c..0000000
--- a/packages/zosma-mem/src/evals/scenarios/cross-context.ts
+++ /dev/null
@@ -1,98 +0,0 @@
-/**
- * Scenario 7: Cross-context
- *
- * An entity tagged ["auth", "security"] is relevant when the agent is working
- * on authentication but irrelevant when working on UI styling. Two queries are
- * issued -- one on-topic, one off-topic. The entity must rank in top-3 for the
- * auth query and outside top-5 for the styling query.
- *
- * Tests: context-sensitive retrieval -- the same entity should surface only
- * when contextually appropriate.
- */
-
-import { computeMRR, computePrecisionAtK, computeRecallAtK, computeNoiseRatio } from "../metrics.js"
-import { checkAllMetrics } from "../utils/assertions.js"
-import { createEvent, createQuery } from "../utils/fixtures.js"
-import type { DeterministicClock, MemoryAdapter, ScenarioDefinition, ScenarioResult } from "../types.js"
-
-const K = 5
-const THRESHOLDS = { mrr: 1.0 }
-
-const run = async (adapter: MemoryAdapter, clock: DeterministicClock): Promise<ScenarioResult> => {
-	const t = clock.now()
-
-	// The entity we care about -- highly relevant to auth, irrelevant to styling.
-	const targetId = "session-expiry-policy"
-	await adapter.ingest(
-		createEvent({
-			id: targetId,
-			type: "decision",
-			content: "Sessions expire after 30 minutes of inactivity. Refresh tokens are valid for 7 days.",
-			tags: ["auth", "security", "session"],
-			timestamp: t,
-		}),
-	)
-
-	// Add styling-domain entities that should dominate the off-topic query.
-	for (let i = 0; i < 5; i++) {
-		await adapter.ingest(
-			createEvent({
-				id: `style-rule-${i}`,
-				type: "preference",
-				content: `UI guideline ${i}: use Tailwind utility classes, avoid inline styles.`,
-				tags: ["ui", "styling", "tailwind"],
-				timestamp: t + 1 + i,
-			}),
-		)
-	}
-
-	// Add more auth entities to confirm the target is retrieved in the right context.
-	await adapter.ingest(createEvent({ id: "mfa-requirement", type: "decision", content: "MFA required for all accounts with admin privileges.", tags: ["auth", "mfa", "security"], timestamp: t + 6 }))
-	await adapter.ingest(createEvent({ id: "password-policy", type: "decision", content: "Passwords must be at least 12 characters with mixed case and symbols.", tags: ["auth", "password", "security"], timestamp: t + 7 }))
-
-	// --- Query 1: on-topic (auth) ---
-	const authQuery = createQuery({ text: "How long before a user session expires?", tags: ["auth", "session"] })
-	const authResults = await adapter.retrieve(authQuery, K)
-	const authRetrieved = authResults.map((r) => r.id)
-	const authRelevant = new Set([targetId])
-
-	const authMrr = computeMRR(authRetrieved, authRelevant)
-	const authRank = authRetrieved.indexOf(targetId) // 0-based; -1 = not found
-
-	// --- Query 2: off-topic (styling) ---
-	const styleQuery = createQuery({ text: "What CSS conventions should I use for the UI components?", tags: ["ui", "styling"] })
-	const styleResults = await adapter.retrieve(styleQuery, K)
-	const styleRetrieved = styleResults.map((r) => r.id)
-
-	// Target must NOT appear in top-5 of the styling query.
-	const targetInStyleTop5 = styleRetrieved.includes(targetId)
-
-	const everRetrieved = new Set([...authRetrieved, ...styleRetrieved])
-	const allEntities = await adapter.listEntities()
-
-	const metrics = {
-		precisionAtK: computePrecisionAtK(authRetrieved, authRelevant, K),
-		recallAtK: computeRecallAtK(authRetrieved, authRelevant, K),
-		mrr: authMrr,
-		noiseRatio: computeNoiseRatio(allEntities, everRetrieved),
-		gcEffectiveness: -1,
-		salienceDrift: -1,
-	}
-
-	const failures = checkAllMetrics(metrics, THRESHOLDS)
-
-	if (authRank > 2) {
-		failures.push(`target ranked ${authRank + 1} in auth query (expected top-3)`)
-	}
-	if (targetInStyleTop5) {
-		failures.push("target appeared in top-5 of off-topic styling query (should be absent)")
-	}
-
-	return { metrics, passed: failures.length === 0, details: failures.join("; ") }
-}
-
-export const crossContextScenario: ScenarioDefinition = {
-	name: "Cross-context",
-	description: "Entity relevant to auth must rank top-3 for auth query but not appear in styling query top-5.",
-	run,
-}
diff --git a/packages/zosma-mem/src/evals/scenarios/index.ts b/packages/zosma-mem/src/evals/scenarios/index.ts
deleted file mode 100644
index 5584509..0000000
--- a/packages/zosma-mem/src/evals/scenarios/index.ts
+++ /dev/null
@@ -1,35 +0,0 @@
-/**
- * Built-in scenario registry.
- *
- * Import `builtInScenarios` to run the full default suite.
- * Scenarios are listed in the order they will run when no override is provided.
- */
-
-import { coldStartScenario } from "./cold-start.js"
-import { coAccessClusterScenario } from "./co-access-cluster.js"
-import { conflictingUpdatesScenario } from "./conflicting-updates.js"
-import { crossContextScenario } from "./cross-context.js"
-import { repeatedPatternScenario } from "./repeated-pattern.js"
-import { signalDilutionScenario } from "./signal-dilution.js"
-import { staleMemoryScenario } from "./stale-memory.js"
-import type { ScenarioDefinition } from "../types.js"
-
-export const builtInScenarios: ScenarioDefinition[] = [
-	coldStartScenario,
-	repeatedPatternScenario,
-	signalDilutionScenario,
-	staleMemoryScenario,
-	conflictingUpdatesScenario,
-	coAccessClusterScenario,
-	crossContextScenario,
-]
-
-export {
-	coldStartScenario,
-	repeatedPatternScenario,
-	signalDilutionScenario,
-	staleMemoryScenario,
-	conflictingUpdatesScenario,
-	coAccessClusterScenario,
-	crossContextScenario,
-}
diff --git a/packages/zosma-mem/src/evals/scenarios/repeated-pattern.ts b/packages/zosma-mem/src/evals/scenarios/repeated-pattern.ts
deleted file mode 100644
index 390bddc..0000000
--- a/packages/zosma-mem/src/evals/scenarios/repeated-pattern.ts
+++ /dev/null
@@ -1,70 +0,0 @@
-/**
- * Scenario 2: Repeated pattern
- *
- * The same error event is ingested 5 times (same ID, same tags, evolving
- * content). Between ingestions the adapter receives reinforcement signals
- * indicating the entity was used. After reinforcement, the entity must rank
- * first in a retrieval.
- *
- * Tests: reinforcement loop -- entities that get usage signals rise in rank.
- */
-
-import { computeMRR, computePrecisionAtK, computeRecallAtK, computeNoiseRatio } from "../metrics.js"
-import { checkAllMetrics } from "../utils/assertions.js"
-import { createEvent, createQuery } from "../utils/fixtures.js"
-import type { DeterministicClock, MemoryAdapter, ScenarioDefinition, ScenarioResult } from "../types.js"
-
-const K = 5
-const THRESHOLDS = { mrr: 1.0 }
-
-const run = async (adapter: MemoryAdapter, clock: DeterministicClock): Promise<ScenarioResult> => {
-	let t = clock.now()
-
-	const recurringId = "retry-timeout"
-
-	// Ingest the recurring entity 5 times with progressively refined content.
-	for (let i = 0; i < 5; i++) {
-		await adapter.ingest(
-			createEvent({
-				id: recurringId,
-				type: "error",
-				content: `Network timeout on retry attempt ${i + 1}. Increase backoff to ${(i + 1) * 200}ms.`,
-				tags: ["network", "retry", "timeout"],
-				timestamp: t,
-			}),
-		)
-		// Signal that the agent used this entity after each ingestion.
-		await adapter.recordUsage(recurringId, "influenced_decision")
-		clock.advance(1_000)
-		t = clock.now()
-	}
-
-	// Add some competing entities so the ranking is non-trivial.
-	await adapter.ingest(createEvent({ id: "db-connection", type: "error", content: "DB connection pool exhausted.", tags: ["database", "pool"], timestamp: t + 1 }))
-	await adapter.ingest(createEvent({ id: "cache-miss", type: "pattern", content: "Cache miss rate above 80% -- review TTL settings.", tags: ["cache", "performance"], timestamp: t + 2 }))
-
-	const query = createQuery({ text: "What should I do when a network request times out?", tags: ["network", "retry"] })
-	const results = await adapter.retrieve(query, K)
-	const retrieved = results.map((r) => r.id)
-	const relevantSet = new Set([recurringId])
-	const everRetrieved = new Set(retrieved)
-	const allEntities = await adapter.listEntities()
-
-	const metrics = {
-		precisionAtK: computePrecisionAtK(retrieved, relevantSet, K),
-		recallAtK: computeRecallAtK(retrieved, relevantSet, K),
-		mrr: computeMRR(retrieved, relevantSet),
-		noiseRatio: computeNoiseRatio(allEntities, everRetrieved),
-		gcEffectiveness: -1,
-		salienceDrift: -1,
-	}
-
-	const failures = checkAllMetrics(metrics, THRESHOLDS)
-	return { metrics, passed: failures.length === 0, details: failures.join("; ") }
-}
-
-export const repeatedPatternScenario: ScenarioDefinition = {
-	name: "Repeated pattern",
-	description: "Recurring entity ingested 5 times with reinforcement signals; must rank first.",
-	run,
-}
diff --git a/packages/zosma-mem/src/evals/scenarios/signal-dilution.ts b/packages/zosma-mem/src/evals/scenarios/signal-dilution.ts
deleted file mode 100644
index d4d7210..0000000
--- a/packages/zosma-mem/src/evals/scenarios/signal-dilution.ts
+++ /dev/null
@@ -1,64 +0,0 @@
-/**
- * Scenario 3: Signal dilution
- *
- * 100 low-value events are ingested alongside 3 high-value events. A targeted
- * query is issued that matches only the high-value events. The engine must
- * surface at least 3 of the 5 top results from the high-value set, proving
- * that the pool size does not dilute retrieval quality.
- *
- * Tests: attention gating / relevance ranking at scale.
- */
-
-import { computeMRR, computePrecisionAtK, computeRecallAtK, computeNoiseRatio } from "../metrics.js"
-import { checkAllMetrics } from "../utils/assertions.js"
-import { createHighValueEvents, createLowValueEvents, createQuery } from "../utils/fixtures.js"
-import type { DeterministicClock, MemoryAdapter, ScenarioDefinition, ScenarioResult } from "../types.js"
-
-const K = 5
-const THRESHOLDS = { precisionAtK: 0.6, recallAtK: 1.0, mrr: 1.0 }
-
-const run = async (adapter: MemoryAdapter, clock: DeterministicClock): Promise<ScenarioResult> => {
-	const t = clock.now()
-
-	const highValueIds = ["perf-critical-1", "perf-critical-2", "perf-critical-3"]
-	const highValueTags = ["performance", "critical", "database"]
-
-	// Ingest 100 low-value events first (noise).
-	for (const event of createLowValueEvents(100, t)) {
-		await adapter.ingest(event)
-	}
-
-	// Ingest the 3 high-value events.
-	for (const event of createHighValueEvents(highValueIds, highValueTags, t + 100)) {
-		await adapter.ingest(event)
-	}
-
-	const query = createQuery({
-		text: "Critical database performance issues that need immediate attention",
-		tags: ["performance", "database", "critical"],
-	})
-
-	const results = await adapter.retrieve(query, K)
-	const retrieved = results.map((r) => r.id)
-	const relevantSet = new Set(highValueIds)
-	const everRetrieved = new Set(retrieved)
-	const allEntities = await adapter.listEntities()
-
-	const metrics = {
-		precisionAtK: computePrecisionAtK(retrieved, relevantSet, K),
-		recallAtK: computeRecallAtK(retrieved, relevantSet, K),
-		mrr: computeMRR(retrieved, relevantSet),
-		noiseRatio: computeNoiseRatio(allEntities, everRetrieved),
-		gcEffectiveness: -1,
-		salienceDrift: -1,
-	}
-
-	const failures = checkAllMetrics(metrics, THRESHOLDS)
-	return { metrics, passed: failures.length === 0, details: failures.join("; ") }
-}
-
-export const signalDilutionScenario: ScenarioDefinition = {
-	name: "Signal dilution",
-	description: "100 low-value + 3 high-value events; engine must surface high-value despite pool size.",
-	run,
-}
diff --git a/packages/zosma-mem/src/evals/scenarios/stale-memory.ts b/packages/zosma-mem/src/evals/scenarios/stale-memory.ts
deleted file mode 100644
index 117ad15..0000000
--- a/packages/zosma-mem/src/evals/scenarios/stale-memory.ts
+++ /dev/null
@@ -1,89 +0,0 @@
-/**
- * Scenario 4: Stale memory
- *
- * Events are ingested, then the clock is advanced 30 days without any access.
- * GC is run. A fresh event is ingested. Retrieval must prefer the fresh entity
- * over the stale ones. GC effectiveness is measured by checking how many of
- * the stale, never-retrieved events were removed.
- *
- * Tests: time-based decay + GC pruning of unused entities.
- */
-
-import { computeGcEffectiveness, computeMRR, computeNoiseRatio, computePrecisionAtK, computeRecallAtK } from "../metrics.js"
-import { checkAllMetrics } from "../utils/assertions.js"
-import { createEvent, createQuery } from "../utils/fixtures.js"
-import { THIRTY_DAYS_MS } from "../utils/time.js"
-import type { DeterministicClock, MemoryAdapter, ScenarioDefinition, ScenarioResult } from "../types.js"
-
-const K = 5
-// GC effectiveness is advisory here -- not all engines support decay.
-const THRESHOLDS = { mrr: 1.0 }
-
-const run = async (adapter: MemoryAdapter, clock: DeterministicClock): Promise<ScenarioResult> => {
-	const t = clock.now()
-
-	// Ingest stale events -- none of them will be retrieved after the time jump.
-	const staleIds = ["stale-a", "stale-b", "stale-c", "stale-d", "stale-e"]
-	for (const id of staleIds) {
-		await adapter.ingest(
-			createEvent({
-				id,
-				type: "pattern",
-				content: `Old preference: ${id}. No longer relevant.`,
-				tags: ["legacy", "stale"],
-				timestamp: t,
-			}),
-		)
-	}
-
-	// Record the entity list before GC.
-	const entitiesBeforeGc = await adapter.listEntities()
-
-	// Advance the clock 30 days -- simulates no activity.
-	await adapter.advanceTime(THIRTY_DAYS_MS)
-	clock.advance(THIRTY_DAYS_MS)
-
-	// Run GC.
-	await adapter.gc()
-
-	// Ingest a fresh, highly relevant event after the time jump.
-	const freshId = "fresh-auth-decision"
-	await adapter.ingest(
-		createEvent({
-			id: freshId,
-			type: "decision",
-			content: "New auth policy: enforce MFA for all admin accounts.",
-			tags: ["auth", "security", "policy"],
-			timestamp: clock.now(),
-		}),
-	)
-
-	const entitiesAfterGc = await adapter.listEntities()
-
-	// Identify noise (stale entities never retrieved).
-	const noiseBeforeGc = entitiesBeforeGc.filter((id) => staleIds.includes(id))
-
-	const query = createQuery({ text: "What is the current auth policy for admin accounts?", tags: ["auth", "policy"] })
-	const results = await adapter.retrieve(query, K)
-	const retrieved = results.map((r) => r.id)
-	const relevantSet = new Set([freshId])
-	const everRetrieved = new Set(retrieved)
-
-	const metrics = {
-		precisionAtK: computePrecisionAtK(retrieved, relevantSet, K),
-		recallAtK: computeRecallAtK(retrieved, relevantSet, K),
-		mrr: computeMRR(retrieved, relevantSet),
-		noiseRatio: computeNoiseRatio(entitiesAfterGc, everRetrieved),
-		gcEffectiveness: computeGcEffectiveness(noiseBeforeGc, entitiesAfterGc),
-		salienceDrift: -1,
-	}
-
-	const failures = checkAllMetrics(metrics, THRESHOLDS)
-	return { metrics, passed: failures.length === 0, details: failures.join("; ") }
-}
-
-export const staleMemoryScenario: ScenarioDefinition = {
-	name: "Stale memory",
-	description: "Events ingested, clock advanced 30 days, GC run. Fresh entity must rank first.",
-	run,
-}
diff --git a/packages/zosma-mem/src/evals/types.ts b/packages/zosma-mem/src/evals/types.ts
deleted file mode 100644
index a37f8e2..0000000
--- a/packages/zosma-mem/src/evals/types.ts
+++ /dev/null
@@ -1,270 +0,0 @@
-/**
- * Engine-agnostic types for zosma-mem/evals.
- *
- * These types define the contract between the eval framework and any memory
- * engine under test. No implementation details leak through here -- engines
- * are black boxes that accept events and answer queries.
- */
-
-// ---------------------------------------------------------------------------
-// Deterministic clock
-// ---------------------------------------------------------------------------
-
-/**
- * A synthetic clock injected into the adapter at setup time.
- * Scenarios that test time-sensitive behaviour (decay, stale memory) advance
- * this clock instead of using wall-clock time, making tests deterministic.
- */
-export interface DeterministicClock {
-	/** Return the current synthetic timestamp (ms since epoch). */
-	now: () => number
-	/** Move the clock forward by the given number of milliseconds. */
-	advance: (ms: number) => void
-}
-
-// ---------------------------------------------------------------------------
-// Adapter setup
-// ---------------------------------------------------------------------------
-
-export interface AdapterSetupOpts {
-	/**
-	 * Temporary directory created by the runner for this scenario.
-	 * The engine may use it for any persistent state.
-	 * The runner cleans it up after teardown.
-	 */
-	workDir: string
-	/** Deterministic clock. The engine must use this instead of Date.now(). */
-	clock: DeterministicClock
-}
-
-// ---------------------------------------------------------------------------
-// Memory events
-// ---------------------------------------------------------------------------
-
-/**
- * A memory event as seen by the eval framework.
- * Deliberately minimal -- engines may treat `type` and `metadata` as they see fit.
- */
-export interface MemoryEvent {
-	id: string
-	/**
-	 * Semantic category. Common values: "decision" | "error" | "pattern" | "preference".
-	 * Not constrained to an enum -- each engine defines its own taxonomy.
-	 */
-	type: string
-	/** Human-readable content to be stored. */
-	content: string
-	/** Tags used for retrieval matching. */
-	tags: string[]
-	/** Synthetic timestamp produced by the deterministic clock. */
-	timestamp: number
-	/** Engine-specific passthrough. The eval framework never reads this. */
-	metadata?: Record<string, unknown>
-}
-
-// ---------------------------------------------------------------------------
-// Retrieval
-// ---------------------------------------------------------------------------
-
-export interface RetrieveQuery {
-	/** Natural language task description. */
-	text: string
-	/** Optional hint tags to narrow the search. */
-	tags?: string[]
-	/** Engine-specific context passthrough. The eval framework never reads this. */
-	context?: Record<string, unknown>
-}
-
-export interface RetrievedEntity {
-	id: string
-	content: string
-	/**
-	 * Engine-assigned relevance score. The eval framework only uses this for
-	 * ordering -- it does not interpret the magnitude.
-	 */
-	score: number
-	tags: string[]
-}
-
-// ---------------------------------------------------------------------------
-// Usage signals
-// ---------------------------------------------------------------------------
-
-/**
- * Signal sent back to the engine after a retrieval to model agent behaviour.
- * - `used`               -- the agent acted on this entity (reinforces it)
- * - `ignored`            -- the agent did not act on it (demotes it)
- * - `influenced_decision` -- the entity directly shaped a tool call or decision (strongest signal)
- */
-export type UsageSignal = "used" | "ignored" | "influenced_decision"
-
-// ---------------------------------------------------------------------------
-// GC
-// ---------------------------------------------------------------------------
-
-export interface GcResult {
-	/** Entities fully removed from the store. */
-	removedCount: number
-	/** Entities moved to an archive / cold tier. */
-	archivedCount: number
-	/** Groups of entities merged into a single summary entity. */
-	consolidatedCount: number
-}
-
-// ---------------------------------------------------------------------------
-// Adapter interface
-// ---------------------------------------------------------------------------
-
-/**
- * Engine-agnostic adapter that the eval framework programs against.
- *
- * Engine authors implement this interface to make their engine evaluable.
- * The adapter is the only coupling point between the eval module and any
- * specific engine -- nothing else in this package imports engine code.
- */
-export interface MemoryAdapter {
-	/**
-	 * Initialise the engine with a clean, isolated state.
-	 * Called once before each scenario.
-	 */
-	setup: (opts: AdapterSetupOpts) => Promise<void>
-
-	/** Ingest a memory event into the engine. */
-	ingest: (event: MemoryEvent) => Promise<void>
-
-	/**
-	 * Retrieve the top-K most relevant entities for the given query.
-	 * Results must be ordered by descending relevance (most relevant first).
-	 */
-	retrieve: (query: RetrieveQuery, topK: number) => Promise<RetrievedEntity[]>
-
-	/**
-	 * Report how the agent used a previously retrieved entity.
-	 * Engines that support reinforcement learning update internal state here.
-	 * Engines that do not may no-op.
-	 */
-	recordUsage: (entityId: string, signal: UsageSignal) => Promise<void>
-
-	/**
-	 * Trigger garbage collection / decay / pruning.
-	 * Engines that do not support GC may no-op and return a zero GcResult.
-	 */
-	gc: () => Promise<GcResult>
-
-	/**
-	 * Advance the engine's internal clock by the given duration.
-	 * Must delegate to the `DeterministicClock` provided in `setup`.
-	 * Engines that use wall-clock time must accept a synthetic clock override.
-	 */
-	advanceTime: (ms: number) => Promise<void>
-
-	/**
-	 * Return all currently persisted entity IDs (including low-score ones).
-	 * Used to compute noise ratio and GC effectiveness.
-	 */
-	listEntities: () => Promise<string[]>
-
-	/**
-	 * Tear down the engine and release any held resources.
-	 * Called once after each scenario, regardless of pass/fail.
-	 */
-	teardown: () => Promise<void>
-}
-
-// ---------------------------------------------------------------------------
-// Metrics
-// ---------------------------------------------------------------------------
-
-export interface EvalMetrics {
-	/** Of the top-K retrieved entities, what fraction was relevant? */
-	precisionAtK: number
-	/** Of all relevant entities, what fraction appeared in top-K? */
-	recallAtK: number
-	/** Mean reciprocal rank of the first relevant result (0 if none in top-K). */
-	mrr: number
-	/**
-	 * Fraction of persisted entities never retrieved after ingestion.
-	 * Measures ingestion threshold quality (high = lots of junk stored).
-	 */
-	noiseRatio: number
-	/**
-	 * Fraction of noise entities successfully removed by GC.
-	 * Only meaningful in scenarios that exercise GC. -1 when not applicable.
-	 */
-	gcEffectiveness: number
-	/**
-	 * Standard deviation of entity scores across GC cycles.
-	 * High drift = unstable scoring. -1 when not applicable.
-	 */
-	salienceDrift: number
-}
-
-// ---------------------------------------------------------------------------
-// Scenarios
-// ---------------------------------------------------------------------------
-
-export interface ScenarioResult {
-	metrics: EvalMetrics
-	passed: boolean
-	/** Human-readable explanation on failure. Empty string when passing. */
-	details: string
-}
-
-export interface ScenarioDefinition {
-	name: string
-	description: string
-	/**
-	 * Execute the scenario against the provided adapter and return results.
-	 * The runner handles setup/teardown; the scenario only drives ingest/retrieve.
-	 */
-	run: (adapter: MemoryAdapter, clock: DeterministicClock) => Promise<ScenarioResult>
-}
-
-// ---------------------------------------------------------------------------
-// Runner
-// ---------------------------------------------------------------------------
-
-export interface RunnerOpts {
-	/** The adapter wrapping the engine under test. */
-	adapter: MemoryAdapter
-	/**
-	 * Scenarios to run. Defaults to all built-in scenarios when omitted.
-	 */
-	scenarios?: ScenarioDefinition[]
-	/** Top-K for precision/recall computation. Default: 5. */
-	k?: number
-	/** Override default pass/fail thresholds per metric. */
-	thresholds?: Partial<EvalMetrics>
-	/**
-	 * Max scenarios running concurrently. Default: 1 (sequential).
-	 * Parallel execution is only safe if the adapter supports isolated instances.
-	 */
-	concurrency?: number
-	/** Called immediately before each scenario starts. */
-	onScenarioStart?: (name: string) => void
-	/** Called immediately after each scenario completes. */
-	onScenarioEnd?: (name: string, result: ScenarioResult) => void
-}
-
-// ---------------------------------------------------------------------------
-// Report
-// ---------------------------------------------------------------------------
-
-export interface EvalReport {
-	/** Unix ms timestamp of when the run completed. */
-	timestamp: number
-	results: Array<{
-		scenario: string
-		metrics: EvalMetrics
-		passed: boolean
-		details: string
-	}>
-	summary: {
-		total: number
-		passed: number
-		failed: number
-		avgPrecision: number
-		avgRecall: number
-		avgMrr: number
-	}
-}
diff --git a/packages/zosma-mem/src/evals/utils/assertions.ts b/packages/zosma-mem/src/evals/utils/assertions.ts
deleted file mode 100644
index 45de7fb..0000000
--- a/packages/zosma-mem/src/evals/utils/assertions.ts
+++ /dev/null
@@ -1,54 +0,0 @@
-/**
- * Threshold helpers for scenario pass/fail decisions.
- *
- * Each function returns a human-readable failure message, or an empty string
- * when the check passes. Scenarios collect these messages and join them to
- * produce the `details` field of ScenarioResult.
- */
-
-import type { EvalMetrics } from "../types.js"
-
-/** Default pass thresholds used when the runner does not provide overrides. */
-export const DEFAULT_THRESHOLDS: Readonly<EvalMetrics> = {
-	precisionAtK: 0.6,
-	recallAtK: 0.6,
-	mrr: 0.5,
-	noiseRatio: -1,    // no hard limit by default -- informational only
-	gcEffectiveness: -1, // -1 = N/A, skip check
-	salienceDrift: -1,   // -1 = N/A, skip check
-}
-
-/**
- * Check a single metric against a threshold.
- * Returns an empty string on pass, a descriptive message on fail.
- *
- * For `gcEffectiveness` and `salienceDrift`, a threshold of -1 means "skip".
- */
-export const checkMetric = (
-	name: keyof EvalMetrics,
-	actual: number,
-	threshold: number,
-): string => {
-	if (threshold === -1) return "" // N/A
-	if (actual >= threshold) return ""
-	return `${name}: ${actual.toFixed(3)} < threshold ${threshold.toFixed(3)}`
-}
-
-/**
- * Check all metrics against a threshold object.
- * Returns an array of failure messages (empty array = all passed).
- */
-export const checkAllMetrics = (
-	metrics: EvalMetrics,
-	thresholds: Readonly<Partial<EvalMetrics>>,
-): string[] => {
-	const merged: EvalMetrics = { ...DEFAULT_THRESHOLDS, ...thresholds }
-	const failures: string[] = []
-
-	for (const key of Object.keys(merged) as Array<keyof EvalMetrics>) {
-		const msg = checkMetric(key, metrics[key], merged[key])
-		if (msg) failures.push(msg)
-	}
-
-	return failures
-}
diff --git a/packages/zosma-mem/src/evals/utils/fixtures.ts b/packages/zosma-mem/src/evals/utils/fixtures.ts
deleted file mode 100644
index b5c6023..0000000
--- a/packages/zosma-mem/src/evals/utils/fixtures.ts
+++ /dev/null
@@ -1,67 +0,0 @@
-/**
- * Synthetic data builders for eval scenarios.
- *
- * All builders produce deterministic output given the same inputs.
- * No randomness, no network calls, no engine types.
- */
-
-import type { MemoryEvent, RetrieveQuery } from "../types.js"
-
-// ---------------------------------------------------------------------------
-// Event builders
-// ---------------------------------------------------------------------------
-
-/**
- * Create a MemoryEvent with sensible defaults.
- * Any field can be overridden by passing a partial.
- */
-export const createEvent = (overrides: Partial<MemoryEvent> & Pick<MemoryEvent, "id" | "content">): MemoryEvent => ({
-	type: "pattern",
-	tags: [],
-	timestamp: 0,
-	metadata: {},
-	...overrides,
-})
-
-/**
- * Build a batch of N low-value events (no tags, generic content).
- * Used in signal-dilution scenarios to pad the memory store.
- */
-export const createLowValueEvents = (count: number, startTimestamp: number): MemoryEvent[] =>
-	Array.from({ length: count }, (_, i) => ({
-		id: `low-value-${i}`,
-		type: "pattern",
-		content: `Routine observation ${i}: nothing notable happened.`,
-		tags: [],
-		timestamp: startTimestamp + i,
-		metadata: {},
-	}))
-
-/**
- * Build a batch of high-value events with explicit tags.
- */
-export const createHighValueEvents = (
-	ids: string[],
-	tags: string[],
-	startTimestamp: number,
-): MemoryEvent[] =>
-	ids.map((id, i) => ({
-		id,
-		type: "decision",
-		content: `Critical decision recorded: ${id}. Tags: ${tags.join(", ")}.`,
-		tags,
-		timestamp: startTimestamp + i,
-		metadata: {},
-	}))
-
-// ---------------------------------------------------------------------------
-// Query builders
-// ---------------------------------------------------------------------------
-
-/**
- * Create a RetrieveQuery with sensible defaults.
- */
-export const createQuery = (overrides: Partial<RetrieveQuery> & Pick<RetrieveQuery, "text">): RetrieveQuery => ({
-	tags: [],
-	...overrides,
-})
diff --git a/packages/zosma-mem/src/evals/utils/time.ts b/packages/zosma-mem/src/evals/utils/time.ts
deleted file mode 100644
index dadaf91..0000000
--- a/packages/zosma-mem/src/evals/utils/time.ts
+++ /dev/null
@@ -1,32 +0,0 @@
-/**
- * Deterministic clock implementation for use in eval scenarios.
- *
- * Scenarios advance this clock explicitly rather than relying on wall-clock
- * time, making time-sensitive tests (decay, stale memory) fully reproducible.
- */
-
-import type { DeterministicClock } from "../types.js"
-
-/**
- * Create a new deterministic clock starting at the given epoch timestamp.
- *
- * @param startMs - Initial timestamp in milliseconds. Defaults to a fixed
- *                  reference point (2026-01-01T00:00:00.000Z) so tests are
- *                  not sensitive to when they run.
- */
-export const createClock = (startMs = 1_735_689_600_000): DeterministicClock => {
-	let current = startMs
-
-	return {
-		now: () => current,
-		advance: (ms: number) => {
-			current += ms
-		},
-	}
-}
-
-// Convenience constants for advancing time in scenarios.
-export const ONE_HOUR_MS = 60 * 60 * 1_000
-export const ONE_DAY_MS = 24 * ONE_HOUR_MS
-export const ONE_WEEK_MS = 7 * ONE_DAY_MS
-export const THIRTY_DAYS_MS = 30 * ONE_DAY_MS
diff --git a/packages/zosma-mem/src/gc/__tests__/gc.test.ts b/packages/zosma-mem/src/gc/__tests__/gc.test.ts
new file mode 100644
index 0000000..0f7e528
--- /dev/null
+++ b/packages/zosma-mem/src/gc/__tests__/gc.test.ts
@@ -0,0 +1,96 @@
+import { mkdtempSync } from "node:fs"
+import { tmpdir } from "node:os"
+import { join } from "node:path"
+import { describe, expect, it } from "vitest"
+import { EntityStore } from "../../store/entity-store.js"
+import type { MemoryEntity } from "../../types.js"
+import { decayAll } from "../decay.js"
+import { runGc } from "../index.js"
+import { pruneBelow } from "../prune.js"
+
+const NOW = 1_000_000_000_000
+const DAY_MS = 86_400_000
+
+const makeEntity = (
+	id: string,
+	lastAccessedOffset = 0,
+	reuseCount = 0,
+	decisionInfluence = 0,
+	belowThresholdCycles = 0,
+): MemoryEntity => ({
+	id,
+	source: { branch: "main", commitRef: "0" },
+	score: {
+		reuseCount,
+		decisionInfluence,
+		ignoredReads: 0,
+		lastAccessed: NOW - lastAccessedOffset,
+		attentionWeight: 0,
+		belowThresholdCycles,
+	},
+	tags: [],
+	content: `content ${id}`,
+})
+
+const makeStore = (...entities: MemoryEntity[]): EntityStore => {
+	const dir = mkdtempSync(join(tmpdir(), "gc-test-"))
+	const store = new EntityStore(dir)
+	store.ensureDir()
+	for (const e of entities) store.write(e)
+	return store
+}
+
+describe("decayAll", () => {
+	it("entity with 30-day-old lastAccessed gets lower attentionWeight than fresh entity", () => {
+		const fresh = makeEntity("fresh", 0)
+		const stale = makeEntity("stale", 30 * DAY_MS)
+		const store = makeStore(fresh, stale)
+		decayAll(store, () => NOW)
+		const freshUpdated = store.read("fresh")!
+		const staleUpdated = store.read("stale")!
+		expect(freshUpdated.score.attentionWeight).toBeGreaterThanOrEqual(staleUpdated.score.attentionWeight)
+	})
+})
+
+describe("pruneBelow", () => {
+	it("entity below threshold for pruneCycles is archived", () => {
+		// salience: 2*0 + 5*0 - 2*0 - ln(1+100) ≈ -4.6 → below 0.4
+		const entity = makeEntity("old", 100 * DAY_MS, 0, 0, 2) // belowThresholdCycles=2, pruneCycles=3
+		const store = makeStore(entity)
+		const pruned = pruneBelow(store, 0.4, 3, () => NOW)
+		expect(pruned).toBe(1)
+		expect(store.read("old")).toBeUndefined()
+	})
+
+	it("entity below threshold for fewer than pruneCycles cycles is NOT archived", () => {
+		const entity = makeEntity("young-stale", 50 * DAY_MS, 0, 0, 0)
+		const store = makeStore(entity)
+		const pruned = pruneBelow(store, 0.4, 3, () => NOW)
+		expect(pruned).toBe(0)
+		const updated = store.read("young-stale")!
+		expect(updated.score.belowThresholdCycles).toBe(1)
+	})
+})
+
+describe("runGc", () => {
+	it("integrates decay and prune, returns correct report", () => {
+		// fresh: reuseCount=5, decisionInfluence=2 → salience = 10+10 - ln(1) = 20 → above threshold
+		const fresh = makeEntity("fresh", 0, 5, 2)
+		// stale: below threshold for 2 cycles already, third cycle archives it
+		const stale = makeEntity("stale", 100 * DAY_MS, 0, 0, 2)
+		const store = makeStore(fresh, stale)
+		const coAccess = {}
+		const config = {
+			memoryDir: "",
+			salienceThreshold: 0.4,
+			gcIntervalMs: 0,
+			gcPruneCycles: 3,
+			summarizer: undefined,
+			now: undefined,
+		}
+		const report = runGc(store, coAccess, config, () => NOW)
+		expect(report.decayed).toBe(2)
+		expect(report.pruned).toBe(1)
+		expect(report.consolidated).toBe(0)
+	})
+})
diff --git a/packages/zosma-mem/src/gc/consolidate.ts b/packages/zosma-mem/src/gc/consolidate.ts
new file mode 100644
index 0000000..9be7524
--- /dev/null
+++ b/packages/zosma-mem/src/gc/consolidate.ts
@@ -0,0 +1,12 @@
+import type { CoAccessGraph } from "../store/co-access.js"
+import type { EntityStore } from "../store/entity-store.js"
+import type { MemoryConfig } from "../types.js"
+
+/** Merge co-access clusters where all members are below threshold. MVP: no-op, returns 0. */
+export const consolidateClusters = async (
+	_store: EntityStore,
+	_coAccess: CoAccessGraph,
+	_config: Pick<MemoryConfig, "salienceThreshold" | "summarizer" | "now">,
+): Promise<number> => {
+	return 0
+}
diff --git a/packages/zosma-mem/src/gc/decay.ts b/packages/zosma-mem/src/gc/decay.ts
new file mode 100644
index 0000000..e5ea63a
--- /dev/null
+++ b/packages/zosma-mem/src/gc/decay.ts
@@ -0,0 +1,16 @@
+import { computeSalience } from "../engine/salience.js"
+import type { EntityStore } from "../store/entity-store.js"
+
+/** Recompute salience for all entities. Updates score.attentionWeight. Returns count of updated entities. */
+export const decayAll = (store: EntityStore, now: () => number): number => {
+	const ids = store.list()
+	let count = 0
+	for (const id of ids) {
+		const entity = store.read(id)
+		if (!entity) continue
+		const newSalience = computeSalience(entity.score, now)
+		store.write({ ...entity, score: { ...entity.score, attentionWeight: Math.max(0, newSalience) } })
+		count++
+	}
+	return count
+}
diff --git a/packages/zosma-mem/src/gc/index.ts b/packages/zosma-mem/src/gc/index.ts
new file mode 100644
index 0000000..e9699da
--- /dev/null
+++ b/packages/zosma-mem/src/gc/index.ts
@@ -0,0 +1,22 @@
+import type { CoAccessGraph } from "../store/co-access.js"
+import type { EntityStore } from "../store/entity-store.js"
+import type { GcReport, MemoryConfig } from "../types.js"
+import { consolidateClusters } from "./consolidate.js"
+import { decayAll } from "./decay.js"
+import { pruneBelow } from "./prune.js"
+
+export const runGc = (
+	store: EntityStore,
+	coAccess: CoAccessGraph,
+	config: Required<Omit<MemoryConfig, "summarizer" | "now">> & Pick<MemoryConfig, "summarizer" | "now">,
+	now: () => number,
+): GcReport => {
+	const decayed = decayAll(store, now)
+	const pruned = pruneBelow(store, config.salienceThreshold, config.gcPruneCycles, now)
+	void consolidateClusters(store, coAccess, {
+		salienceThreshold: config.salienceThreshold,
+		summarizer: config.summarizer,
+		now: config.now,
+	})
+	return { decayed, pruned, consolidated: 0 }
+}
diff --git a/packages/zosma-mem/src/gc/prune.ts b/packages/zosma-mem/src/gc/prune.ts
new file mode 100644
index 0000000..f63b227
--- /dev/null
+++ b/packages/zosma-mem/src/gc/prune.ts
@@ -0,0 +1,27 @@
+import { computeSalience } from "../engine/salience.js"
+import type { EntityStore } from "../store/entity-store.js"
+
+/** Archive entities that have been below threshold for gcPruneCycles consecutive cycles. */
+export const pruneBelow = (store: EntityStore, threshold: number, pruneCycles: number, now: () => number): number => {
+	const ids = store.list()
+	let pruned = 0
+	for (const id of ids) {
+		const entity = store.read(id)
+		if (!entity) continue
+		const salience = computeSalience(entity.score, now)
+		if (salience < threshold) {
+			const cycles = entity.score.belowThresholdCycles + 1
+			if (cycles >= pruneCycles) {
+				store.archive(id)
+				pruned++
+			} else {
+				store.write({ ...entity, score: { ...entity.score, belowThresholdCycles: cycles } })
+			}
+		} else {
+			if (entity.score.belowThresholdCycles > 0) {
+				store.write({ ...entity, score: { ...entity.score, belowThresholdCycles: 0 } })
+			}
+		}
+	}
+	return pruned
+}
diff --git a/packages/zosma-mem/src/index.ts b/packages/zosma-mem/src/index.ts
index 73ab09b..87a4f2b 100644
--- a/packages/zosma-mem/src/index.ts
+++ b/packages/zosma-mem/src/index.ts
@@ -1,4 +1,2 @@
-// zosma-mem package root
-// Re-exports the evals module as the primary surface for v0.0.1.
-// Future modules (engine, store, ingestion) will be added here.
-export * from "./evals/index.js"
+export * from "./engine/index.js"
+export * from "./types.js"
diff --git a/packages/zosma-mem/src/ingestion/__tests__/ingest.test.ts b/packages/zosma-mem/src/ingestion/__tests__/ingest.test.ts
index 7126756..a73491f 100644
--- a/packages/zosma-mem/src/ingestion/__tests__/ingest.test.ts
+++ b/packages/zosma-mem/src/ingestion/__tests__/ingest.test.ts
@@ -1,10 +1,9 @@
-import { mkdtempSync, rmSync, writeFileSync } from "node:fs"
+import { mkdtempSync, rmSync } from "node:fs"
 import { tmpdir } from "node:os"
 import { join } from "node:path"
 import { afterEach, beforeEach, describe, expect, it } from "vitest"
 import { EntityStore } from "../../store/entity-store.js"
 import type { MemoryEvent } from "../../types.js"
-import { reindex } from "../commit-indexer.js"
 import { ingest } from "../ingest.js"
 
 const makeEvent = (overrides: Partial<MemoryEvent> = {}): MemoryEvent => ({
@@ -49,55 +48,9 @@ describe("ingest", () => {
 	it("preserves existing score on upsert", () => {
 		ingest(makeEvent({ id: "score-preserve" }), store, {})
 		const first = store.read("score-preserve")!
-		// Manually bump reuseCount
 		store.write({ ...first, score: { ...first.score, reuseCount: 5 } })
 		ingest(makeEvent({ id: "score-preserve", content: "new content" }), store, {})
 		const second = store.read("score-preserve")!
 		expect(second.score.reuseCount).toBe(5)
 	})
 })
-
-describe("reindex", () => {
-	beforeEach(() => {
-		dir = mkdtempSync(join(tmpdir(), "reindex-test-"))
-		store = new EntityStore(dir)
-		store.ensureDir()
-	})
-
-	afterEach(() => {
-		rmSync(dir, { recursive: true, force: true })
-	})
-
-	it("returns 0 when commits.md does not exist", () => {
-		expect(reindex(dir, store, {})).toBe(0)
-	})
-
-	it("ingests commits from commits.md", () => {
-		const md = "## abc123\nFixed the auth bug.\ntags: auth, fix\n"
-		writeFileSync(join(dir, "commits.md"), md, "utf-8")
-		const count = reindex(dir, store, {})
-		expect(count).toBe(1)
-		expect(store.read("main-abc123")).toBeDefined()
-	})
-
-	it("is idempotent: second call returns 0 for already-indexed commits", () => {
-		const md = "## abc123\nFixed the auth bug.\ntags: auth, fix\n"
-		writeFileSync(join(dir, "commits.md"), md, "utf-8")
-		reindex(dir, store, {})
-		const count = reindex(dir, store, {})
-		expect(count).toBe(0)
-	})
-
-	it("ingests only new commits on second call", () => {
-		writeFileSync(join(dir, "commits.md"), "## ref1\nFirst commit.\ntags: a\n", "utf-8")
-		reindex(dir, store, {})
-		writeFileSync(
-			join(dir, "commits.md"),
-			"## ref1\nFirst commit.\ntags: a\n\n## ref2\nSecond commit.\ntags: b\n",
-			"utf-8",
-		)
-		const count = reindex(dir, store, {})
-		expect(count).toBe(1)
-		expect(store.read("main-ref2")).toBeDefined()
-	})
-})
diff --git a/packages/zosma-mem/src/ingestion/commit-indexer.ts b/packages/zosma-mem/src/ingestion/commit-indexer.ts
deleted file mode 100644
index 79d8eb1..0000000
--- a/packages/zosma-mem/src/ingestion/commit-indexer.ts
+++ /dev/null
@@ -1,46 +0,0 @@
-import { existsSync, readFileSync, writeFileSync } from "node:fs"
-import { join } from "node:path"
-import { parseCommitsMarkdown } from "../brain-adapter/parser.js"
-import type { EntityStore } from "../store/entity-store.js"
-import type { MemoryConfig } from "../types.js"
-import { ingest } from "./ingest.js"
-
-const INDEXED_FILE = ".indexed"
-
-/**
- * Parse commits.md and ingest new entities. Idempotent.
- * Returns number of new entities ingested.
- */
-export const reindex = (
-	memoryDir: string,
-	store: EntityStore,
-	config: Pick<MemoryConfig, "salienceThreshold" | "now">,
-): number => {
-	const commitsPath = join(memoryDir, "commits.md")
-	if (!existsSync(commitsPath)) return 0
-
-	const indexedPath = join(memoryDir, ".salience", INDEXED_FILE)
-	const indexed: string[] = existsSync(indexedPath) ? (JSON.parse(readFileSync(indexedPath, "utf-8")) as string[]) : []
-
-	const markdown = readFileSync(commitsPath, "utf-8")
-	const commits = parseCommitsMarkdown(markdown)
-	const newRefs = commits.filter((c) => !indexed.includes(c.ref))
-
-	let count = 0
-	for (const commit of newRefs) {
-		const event = {
-			id: `main-${commit.ref}`,
-			type: "pattern" as const,
-			content: commit.body,
-			tags: commit.tags,
-			metadata: { branch: "main", commitRef: commit.ref },
-			timestamp: config.now ? config.now() : Date.now(),
-		}
-		ingest(event, store, config)
-		indexed.push(commit.ref)
-		count++
-	}
-
-	writeFileSync(indexedPath, JSON.stringify(indexed), "utf-8")
-	return count
-}
diff --git a/packages/zosma-mem/src/ingestion/event-bus.ts b/packages/zosma-mem/src/ingestion/event-bus.ts
deleted file mode 100644
index 8c4f580..0000000
--- a/packages/zosma-mem/src/ingestion/event-bus.ts
+++ /dev/null
@@ -1,25 +0,0 @@
-import { EventEmitter } from "node:events"
-import type { MemoryEvent } from "../types.js"
-
-export type MemoryEventName = "ingested" | "discarded" | "scored"
-
-export interface EventBus {
-	on: (event: MemoryEventName, listener: (e: MemoryEvent) => void) => void
-	off: (event: MemoryEventName, listener: (e: MemoryEvent) => void) => void
-	emit: (event: MemoryEventName, e: MemoryEvent) => void
-}
-
-export const createEventBus = (): EventBus => {
-	const emitter = new EventEmitter()
-	return {
-		on: (event, listener) => {
-			emitter.on(event, listener)
-		},
-		off: (event, listener) => {
-			emitter.off(event, listener)
-		},
-		emit: (event, e) => {
-			emitter.emit(event, e)
-		},
-	}
-}
diff --git a/packages/zosma-mem/src/ingestion/index.ts b/packages/zosma-mem/src/ingestion/index.ts
index 345249b..d929915 100644
--- a/packages/zosma-mem/src/ingestion/index.ts
+++ b/packages/zosma-mem/src/ingestion/index.ts
@@ -1,4 +1 @@
-export { createEventBus } from "./event-bus.js"
 export { ingest } from "./ingest.js"
-export { reindex } from "./commit-indexer.js"
-export type { EventBus, MemoryEventName } from "./event-bus.js"
diff --git a/packages/zosma-mem/src/ingestion/ingest.ts b/packages/zosma-mem/src/ingestion/ingest.ts
index 4b32d71..c5ab961 100644
--- a/packages/zosma-mem/src/ingestion/ingest.ts
+++ b/packages/zosma-mem/src/ingestion/ingest.ts
@@ -5,6 +5,11 @@ import type { MemoryConfig, MemoryEntity, MemoryEvent } from "../types.js"
 /**
  * Ingest a MemoryEvent. Always persists (upsert). The threshold is enforced
  * during GC pruning, not at ingestion time — every event type is stored.
+ *
+ * Conflict resolution: when re-ingesting an existing entity with changed
+ * content, `lastAccessed` is refreshed so the updated version ranks above
+ * the stale version in time-sensitive queries.
+ *
  * Returns true always (kept for interface compatibility).
  */
 export const ingest = (
@@ -14,7 +19,14 @@ export const ingest = (
 ): boolean => {
 	const nowFn = config.now ?? Date.now
 	const existing = store.read(event.id)
-	const score = existing?.score ?? initialScore(event.type, nowFn)
+
+	let score = existing?.score ?? initialScore(event.type, nowFn)
+
+	// Conflict resolution: if content changed, treat the entity as freshly
+	// accessed so its time-decay resets and it outranks the stale version.
+	if (existing && existing.content !== event.content) {
+		score = { ...score, lastAccessed: nowFn(), belowThresholdCycles: 0 }
+	}
 
 	const entity: MemoryEntity = {
 		id: event.id,
diff --git a/packages/zosma-mem/src/retrieval/__tests__/retrieve.test.ts b/packages/zosma-mem/src/retrieval/__tests__/retrieve.test.ts
new file mode 100644
index 0000000..586b2de
--- /dev/null
+++ b/packages/zosma-mem/src/retrieval/__tests__/retrieve.test.ts
@@ -0,0 +1,87 @@
+import { mkdtempSync } from "node:fs"
+import { tmpdir } from "node:os"
+import { join } from "node:path"
+import { describe, expect, it } from "vitest"
+import type { CoAccessGraph } from "../../store/co-access.js"
+import { EntityStore } from "../../store/entity-store.js"
+import type { MemoryEntity } from "../../types.js"
+import { retrieve } from "../retrieve.js"
+
+const NOW = 1_000_000_000_000
+const nowFn = () => NOW
+
+const makeEntity = (
+	id: string,
+	tags: string[],
+	reuseCount = 0,
+	decisionInfluence = 0,
+	ignoredReads = 0,
+	lastAccessed = NOW,
+): MemoryEntity => ({
+	id,
+	source: { branch: "main", commitRef: "0" },
+	score: {
+		reuseCount,
+		decisionInfluence,
+		ignoredReads,
+		lastAccessed,
+		attentionWeight: 0,
+		belowThresholdCycles: 0,
+	},
+	tags,
+	content: `content of ${id}`,
+})
+
+const makeStore = (entities: MemoryEntity[]): EntityStore => {
+	const dir = mkdtempSync(join(tmpdir(), "retrieve-test-"))
+	const store = new EntityStore(dir)
+	store.ensureDir()
+	for (const e of entities) store.write(e)
+	return store
+}
+
+describe("retrieve", () => {
+	it("matching entities rank first", () => {
+		const entities = [
+			makeEntity("a", ["typescript", "auth"]),
+			makeEntity("b", ["database", "sql"]),
+			makeEntity("c", ["typescript", "config"]),
+			makeEntity("d", ["logging"]),
+			makeEntity("e", ["typescript", "auth", "config"]),
+		]
+		const store = makeStore(entities)
+		const coAccess: CoAccessGraph = {}
+		const results = retrieve({ taskDescription: "typescript auth config" }, store, coAccess, { now: nowFn }, 3)
+		const ids = results.map((r) => r.entity.id)
+		// e has 3 matching tags, a and c have 2 each; b and d have none
+		expect(ids).toContain("e")
+		expect(ids).not.toContain("b")
+		expect(ids).not.toContain("d")
+	})
+
+	it("high tag overlap beats high salience with no overlap", () => {
+		// High salience but NO tag overlap: reuseCount=1, decisionInfluence=0 → salience ≈ 2
+		const highSalience = makeEntity("salience", [], 1, 0)
+		// Two tag matches → tagOverlap score = 3*2 = 6, which exceeds salience entity's 2
+		const tagMatch = makeEntity("tagmatch", ["typescript", "auth"])
+		const store = makeStore([highSalience, tagMatch])
+		const coAccess: CoAccessGraph = {}
+		const results = retrieve({ taskDescription: "typescript auth" }, store, coAccess, { now: nowFn }, 1)
+		expect(results[0].entity.id).toBe("tagmatch")
+	})
+
+	it("co-access boost: after two entities retrieved together, querying one surfaces the other", () => {
+		const entities = [makeEntity("x", ["foo"]), makeEntity("y", ["bar"]), makeEntity("z", ["baz"])]
+		const store = makeStore(entities)
+		const coAccess: CoAccessGraph = {}
+
+		// First retrieval: x and y are co-retrieved
+		retrieve({ taskDescription: "foo bar" }, store, coAccess, { now: nowFn }, 2)
+
+		// Now query only for 'foo' — y should get co-access boost because it was retrieved with x
+		const secondResults = retrieve({ taskDescription: "foo" }, store, coAccess, { now: nowFn }, 3)
+		const ids = secondResults.map((r) => r.entity.id)
+		expect(ids).toContain("x")
+		expect(ids).toContain("y")
+	})
+})
diff --git a/packages/zosma-mem/src/retrieval/index.ts b/packages/zosma-mem/src/retrieval/index.ts
new file mode 100644
index 0000000..96ada25
--- /dev/null
+++ b/packages/zosma-mem/src/retrieval/index.ts
@@ -0,0 +1 @@
+export { retrieve } from "./retrieve.js"
diff --git a/packages/zosma-mem/src/retrieval/retrieve.ts b/packages/zosma-mem/src/retrieval/retrieve.ts
new file mode 100644
index 0000000..9c1be3a
--- /dev/null
+++ b/packages/zosma-mem/src/retrieval/retrieve.ts
@@ -0,0 +1,87 @@
+import { computeSalience } from "../engine/salience.js"
+import type { CoAccessGraph } from "../store/co-access.js"
+import { recordCoAccess } from "../store/co-access.js"
+import type { EntityStore } from "../store/entity-store.js"
+import type { AttentionQuery, MemoryConfig, ScoredEntity } from "../types.js"
+
+/**
+ * Attention score:
+ *   A(q, e) = 3*taskOverlap(q, e) + 5*intentOverlap(q, e) + S(e) + coAccessBoost(e)
+ *
+ * taskOverlap  — entity tags appearing in the query's task description text
+ * intentOverlap — entity tags matching explicit intent/hint tags (higher weight)
+ *
+ * Two-pass retrieval:
+ *   Pass 1: score all entities by tagOverlap + salience, take top 2K candidates
+ *   Pass 2: add coAccessBoost among candidates, re-sort, return top K
+ */
+export const retrieve = (
+	query: AttentionQuery,
+	store: EntityStore,
+	coAccess: CoAccessGraph,
+	config: Pick<MemoryConfig, "now">,
+	topK = 5,
+): ScoredEntity[] => {
+	const nowFn = config.now ?? Date.now
+	const taskTerms = new Set(query.taskDescription.toLowerCase().split(/\s+/))
+	// Intent tags (e.g. ["auth", "session"]) get a higher weight — they are
+	// explicit signals about what the agent is working on right now.
+	const intentTags: Set<string> = query.intent
+		? new Set(query.intent.toLowerCase().split(/\s+/).filter((t) => t.length > 0))
+		: new Set()
+
+	const ids = store.list()
+	if (ids.length === 0) return []
+
+	// Pass 1: base score
+	const candidates = ids
+		.map((id) => {
+			const entity = store.read(id)
+			if (!entity) return null
+			const taskOverlap = entity.tags.filter((t) => taskTerms.has(t.toLowerCase())).length
+			const intentOverlap = intentTags.size > 0
+				? entity.tags.filter((t) => intentTags.has(t.toLowerCase())).length
+				: 0
+			const salience = computeSalience(entity.score, nowFn)
+
+			// Context isolation: when intent tags are provided and the entity has
+			// zero overlap with both task terms AND intent tags, it is irrelevant to
+			// this query. Penalize it to prevent high-salience entities from leaking
+			// across context boundaries.
+			if (intentTags.size > 0 && taskOverlap === 0 && intentOverlap === 0) {
+				// Cap at a small negative value — ensures any entity with even one
+				// tag match outranks a high-salience but contextually irrelevant entity.
+				return { entity, baseScore: Math.min(salience * 0.05, -1) }
+			}
+
+			return { entity, baseScore: 3 * taskOverlap + 5 * intentOverlap + salience }
+		})
+		.filter(Boolean) as Array<{
+		entity: NonNullable<ReturnType<EntityStore["read"]>>
+		baseScore: number
+	}>
+
+	candidates.sort((a, b) => b.baseScore - a.baseScore)
+	const pool = candidates.slice(0, Math.max(topK * 2, 10))
+	const poolIds = new Set(pool.map((c) => c.entity.id))
+
+	// Pass 2: co-access boost
+	const scored: ScoredEntity[] = pool.map(({ entity, baseScore }) => {
+		const coBoost = (coAccess[entity.id] ?? []).some((coId) => poolIds.has(coId)) ? 1 : 0
+		return { entity, attentionScore: baseScore + coBoost }
+	})
+
+	scored.sort((a, b) => b.attentionScore - a.attentionScore)
+	const results = scored.slice(0, topK)
+
+	// Update co-access graph with this retrieval session
+	if (results.length > 1) {
+		const updatedGraph = recordCoAccess(
+			coAccess,
+			results.map((r) => r.entity.id),
+		)
+		Object.assign(coAccess, updatedGraph)
+	}
+
+	return results
+}
diff --git a/packages/zosma-mem/src/types.ts b/packages/zosma-mem/src/types.ts
new file mode 100644
index 0000000..221c268
--- /dev/null
+++ b/packages/zosma-mem/src/types.ts
@@ -0,0 +1,75 @@
+// Engine types
+export type MemoryEventType = 'decision' | 'error' | 'pattern' | 'preference'
+
+export interface MemoryEvent {
+  id: string
+  type: MemoryEventType
+  content: string
+  tags: string[]
+  attentionWeight?: number
+  metadata?: {
+    file?: string
+    module?: string
+    relatedMemories?: string[]
+    branch?: string
+    commitRef?: string
+  }
+  timestamp: number
+}
+
+export interface MemoryScore {
+  reuseCount: number
+  decisionInfluence: number
+  ignoredReads: number
+  lastAccessed: number
+  attentionWeight: number
+  belowThresholdCycles: number
+}
+
+export interface MemoryEntity {
+  id: string
+  source: { branch: string; commitRef: string }
+  score: MemoryScore
+  tags: string[]
+  content: string
+}
+
+export interface MemoryConfig {
+  memoryDir: string
+  salienceThreshold?: number
+  gcIntervalMs?: number
+  gcPruneCycles?: number
+  summarizer?: Summarizer
+  now?: () => number
+}
+
+export type Summarizer = (texts: string[]) => Promise<string>
+
+export interface AttentionQuery {
+  taskDescription: string
+  activeToolName?: string
+  intent?: string
+}
+
+export interface ScoredEntity {
+  entity: MemoryEntity
+  attentionScore: number
+}
+
+export interface GcReport {
+  decayed: number
+  pruned: number
+  consolidated: number
+}
+
+export interface MemoryEngine {
+  ingest: (event: MemoryEvent) => Promise<void>
+  retrieve: (query: AttentionQuery, topK?: number) => Promise<ScoredEntity[]>
+  recordRead: (entityId: string) => Promise<void>
+  recordIgnoredRead: (entityId: string) => Promise<void>
+  recordDecisionInfluence: (entityId: string) => Promise<void>
+  gc: () => Promise<GcReport>
+  shutdown: () => void
+  /** Return all persisted entity IDs (used by the eval adapter). */
+  listEntities: () => Promise<string[]>
+}
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index f409220..bcf97d4 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -369,12 +369,12 @@ importers:
       '@openzosma/logger':
         specifier: workspace:*
         version: link:../logger
-      '@openzosma/memory':
-        specifier: workspace:*
-        version: link:../memory
       '@openzosma/skill-reports':
         specifier: workspace:*
         version: link:../skills/reports
+      '@openzosma/zosma-mem':
+        specifier: workspace:*
+        version: link:../zosma-mem
       '@sinclair/typebox':
         specifier: ^0.34.48
         version: 0.34.48
@@ -593,21 +593,6 @@ importers:
         specifier: ^5.7.3
         version: 5.9.3
 
-  packages/memory:
-    devDependencies:
-      '@types/node':
-        specifier: ^22.15.2
-        version: 22.19.15
-      typescript:
-        specifier: ^5.7.3
-        version: 5.9.3
-      vitest:
-        specifier: ^3.0.0
-        version: 3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3)
-      zosma-mem:
-        specifier: link:../zosma-mem
-        version: link:../zosma-mem
-
   packages/orchestrator:
     dependencies:
       '@openzosma/agents':
@@ -681,10 +666,10 @@ importers:
     dependencies:
       '@mariozechner/pi-agent-core':
         specifier: ^0.61.0
-        version: 0.61.1(ws@8.19.0)(zod@4.3.6)
+        version: 0.61.1
       '@mariozechner/pi-coding-agent':
         specifier: ^0.61.0
-        version: 0.61.0(ws@8.19.0)(zod@4.3.6)
+        version: 0.61.0
       '@react-pdf/renderer':
         specifier: ^4.3.0
         version: 4.3.2(react@19.2.4)
@@ -734,6 +719,18 @@ importers:
       ink-spinner:
         specifier: ^5.0.0
         version: 5.0.0(ink@5.2.1(@types/react@18.3.28)(react@18.3.1))(react@18.3.1)
+      p-limit:
+        specifier: ^5.0.0
+        version: 5.0.0
+      pi-brain:
+        specifier: ^0.1.7
+        version: 0.1.7(@sinclair/typebox@0.34.48)
+      pi-dcp:
+        specifier: ^0.2.0
+        version: 0.2.0(@mariozechner/pi-agent-core@0.61.1(zod@3.25.76))(@mariozechner/pi-coding-agent@0.61.0(zod@3.25.76))
+      pino:
+        specifier: ^9.0.0
+        version: 9.14.0
       react:
         specifier: ^18.3.0
         version: 18.3.1
@@ -1683,6 +1680,9 @@ packages:
     resolution: {integrity: sha512-3giAOQvZiH5F9bMlMiv8+GSPMeqg0dbaeo58/0SlA9sxSqZhnUtxzX9/2FzyhS9sWQf5S0GJE0AKBrFqjpeYcg==}
     engines: {node: '>=8.0.0'}
 
+  '@pinojs/redact@0.4.0':
+    resolution: {integrity: sha512-k2ENnmBugE/rzQfEcdWHcCY+/FM3VLzH9cYEsbdsoqrvzAKRhUZeRNhAZvB8OitQJ1TBed3yqWtdjzS6wJKBwg==}
+
   '@protobuf-ts/grpc-transport@2.11.1':
     resolution: {integrity: sha512-l6wrcFffY+tuNnuyrNCkRM8hDIsAZVLA8Mn7PKdVyYxITosYh60qW663p9kL6TWXYuDCL3oxH8ih3vLKTDyhtg==}
     peerDependencies:
@@ -2954,6 +2954,14 @@ packages:
     resolution: {integrity: sha512-O/IEdcCUKkubz60tFbGA7ceITTAJsty+lBjNoorP4Z6XRqaFb/OjQjZODophEcuq68nKm6/0r+6/lLQ+XVpk8g==}
     engines: {node: '>=18.0.0'}
 
+  '@stacksjs/clapp@0.2.0':
+    resolution: {integrity: sha512-dSqnbeZjXnQLLvVxC5NU7D9Vpjxc6cC9Bo2ZwaqjgruK7pbVoFCI0goc9Mtf/lfSTbTx6Uvv/mbY7+cOW/j3Og==}
+    hasBin: true
+
+  '@stacksjs/clarity@0.3.24':
+    resolution: {integrity: sha512-QN21fT/9dovcuFTkni9LFHDzBpiBZ4Q//0a3vFJsckPiblNIu1RhwwePkkTK4j6Xu2DtVYGR60/9Scdrp6wRfw==}
+    hasBin: true
+
   '@standard-schema/spec@1.1.0':
     resolution: {integrity: sha512-l2aFy5jALhniG5HgqrD6jXLi/rUWrKvqN/qJx6yoJsgKhblVd+iqqU4RCXavm/jPityDo5TCvKMnpjKnOriy0w==}
 
@@ -3728,6 +3736,10 @@ packages:
   asynckit@0.4.0:
     resolution: {integrity: sha512-Oei9OH4tRh0YqU3GxhX79dM/mwVgvbZJaSNaRk+bshkj0S5cfHcgYakreBjrHwatXKbz+IoIdYLxrKim2MjW0Q==}
 
+  atomic-sleep@1.0.0:
+    resolution: {integrity: sha512-kNOjDqAh7px0XWNI+4QbzoiR/nTkHAWNud2uvnJquD1/x5a7EQZMJT0AczqK0Qn67oY/TTQ1LbUKajZpp3I9tQ==}
+    engines: {node: '>=8.0.0'}
+
   auto-bind@5.0.1:
     resolution: {integrity: sha512-ooviqdwwgfIfNmDwo94wlshcdzfO64XV0Cg6oDsDYBJfITDz1EngD2z7DkbvCWn+XIMsIqW27sEVF6qcpJrRcg==}
     engines: {node: ^12.20.0 || ^14.13.1 || >=16.0.0}
@@ -3907,6 +3919,10 @@ packages:
     resolution: {integrity: sha512-9q/rDEGSb/Qsvv2qvzIzdluL5k7AaJOTrw23z9reQthrbF7is4CtlT0DXyO1oei2DCp4uojjzQ7igaSHp1kAEQ==}
     engines: {node: '>=0.2.0'}
 
+  bunfig@0.15.6:
+    resolution: {integrity: sha512-7ynPmrn1dN5F+0DtUVY0Vo2MZOOnSdb6hpQePwABEYIJ+d/rSb3vaOVUs3MFxwxWuaVc1FEStVJG6+kCgbLuyg==}
+    hasBin: true
+
   bytes@3.1.2:
     resolution: {integrity: sha512-/Nf7TyzTx6S3yRJObOAV7956r8cr2+Oj8AC5dt8wSP3BQAoeX58NoHyCU8P8zGkNXStjTSi6fzO6F0pBdcYbEg==}
     engines: {node: '>= 0.8'}
@@ -5700,6 +5716,10 @@ packages:
       react-dom:
         optional: true
 
+  mri@1.2.0:
+    resolution: {integrity: sha512-tzzskb3bG8LvYGFF/mDTpq3jpI6Q9wc3LEmBaghu+DdCssd1FakN7Bc0hVNmEyGq1bq3RgfkCb3cmQLpNPOroA==}
+    engines: {node: '>=4'}
+
   ms@2.0.0:
     resolution: {integrity: sha512-Tpp60P6IUJDTuOq/5Z8cdskzJujfwqfOTkrwIwj7IRISpnkJnT6SyJ4PCPnGMoFjC9ddhal5KVIYtAt97ix05A==}
 
@@ -5825,6 +5845,10 @@ packages:
     resolution: {integrity: sha512-W67iLl4J2EXEGTbfeHCffrjDfitvLANg0UlX3wFUUSTx92KXRFegMHUVgSqE+wvhAbi4WqjGg9czysTV2Epbew==}
     engines: {node: '>= 0.4'}
 
+  on-exit-leak-free@2.1.2:
+    resolution: {integrity: sha512-0eJJY6hXLGf1udHwfNftBqH+g73EU4B504nZeKpz1sYRKafAghwxEJunB2O7rDZkL4PGfsMVnTXZ2EjibbqcsA==}
+    engines: {node: '>=14.0.0'}
+
   on-finished@2.4.1:
     resolution: {integrity: sha512-oVlzkg3ENAhCk2zdv7IJwd/QUD4z2RxRwpkcGY8psCVcCYZNq4wYnVWALHM+brtuJjePWiYF/ClmuDr8Ch5+kg==}
     engines: {node: '>= 0.8'}
@@ -5865,6 +5889,10 @@ packages:
     resolution: {integrity: sha512-//88mFWSJx8lxCzwdAABTJL2MyWB12+eIY7MDL2SqLmAkeKU9qxRvWuSyTjm3FUmpBEMuFfckAIqEaVGUDxb6w==}
     engines: {node: '>=6'}
 
+  p-limit@5.0.0:
+    resolution: {integrity: sha512-/Eaoq+QyLSiXQ4lyYV23f14mZRQcXnxfHrN0vCai+ak9G0pp9iEQukIIZq5NccEvwRB8PUnZT0KsOoDCINS1qQ==}
+    engines: {node: '>=18'}
+
   p-locate@4.1.0:
     resolution: {integrity: sha512-R79ZZ/0wAxKGu3oYMlz8jy/kbhsNrS7SKZ7PxEHBgJ5+F2mtFW2fK2cOtBh1cHYkQsbzFV7I+EoRKe6Yt0oK7A==}
     engines: {node: '>=8'}
@@ -6016,6 +6044,17 @@ packages:
   pgpass@1.0.5:
     resolution: {integrity: sha512-FdW9r/jQZhSeohs1Z3sI1yxFQNFvMcnmfuj4WBMUTxOrAyLMaTcE1aAMBiTlbMNaXvBCQuVi0R7hd8udDSP7ug==}
 
+  pi-brain@0.1.7:
+    resolution: {integrity: sha512-JhSbMX3xoeTB60QcYx45ukCp+3lInYufGr/0jMJAOq501fs798Ei9ez8BGOdQuKw5PTIv+/yeuOc3NZ0M8es7Q==}
+    peerDependencies:
+      '@sinclair/typebox': '*'
+
+  pi-dcp@0.2.0:
+    resolution: {integrity: sha512-VDXIVfdVrcXpwBe6bGGYXegrzKKm8ddBiDcGVZbLf2sJbGZKnM6VWPodT8Yly4vRmzeqEb6ANpCFl7YrQStXBA==}
+    peerDependencies:
+      '@mariozechner/pi-agent-core': '*'
+      '@mariozechner/pi-coding-agent': '*'
+
   picocolors@1.1.1:
     resolution: {integrity: sha512-xceH2snhtb5M9liqDsmEw56le376mTZkEX/jEb/RxNFyegNul7eNslCXP9FDj/Lcu0X8KEyMceP2ntpaHrDEVA==}
 
@@ -6023,6 +6062,16 @@ packages:
     resolution: {integrity: sha512-5gTmgEY/sqK6gFXLIsQNH19lWb4ebPDLA4SdLP7dsWkIXHWlG66oPuVvXSGFPppYZz8ZDZq0dYYrbHfBCVUb1Q==}
     engines: {node: '>=12'}
 
+  pino-abstract-transport@2.0.0:
+    resolution: {integrity: sha512-F63x5tizV6WCh4R6RHyi2Ml+M70DNRXt/+HANowMflpgGFMAym/VKm6G7ZOQRjqN7XbGxK1Lg9t6ZrtzOaivMw==}
+
+  pino-std-serializers@7.1.0:
+    resolution: {integrity: sha512-BndPH67/JxGExRgiX1dX0w1FvZck5Wa4aal9198SrRhZjH3GxKQUKIBnYJTdj2HDN3UQAS06HlfcSbQj2OHmaw==}
+
+  pino@9.14.0:
+    resolution: {integrity: sha512-8OEwKp5juEvb/MjpIc4hjqfgCNysrS94RIOMXYvpYCdm/jglrKEiAYmiumbmGhCvs+IcInsphYDFwqrjr7398w==}
+    hasBin: true
+
   pkg-types@1.3.1:
     resolution: {integrity: sha512-/Jm5M4RvtBFVkKWRu2BLUTNP8/M2a+UwuAX+ae4770q1qVGtfjG+WTCupoZixokjmHiry8uI+dlY8KXYV5HVVQ==}
 
@@ -6069,6 +6118,9 @@ packages:
   process-nextick-args@2.0.1:
     resolution: {integrity: sha512-3ouUOpQhtgrbOa17J7+uxOTpITYWaGP7/AhoR3+A+/1e9skrzelGi/dXzEYyvbxubEF6Wn2ypscTKiKJFFn1ag==}
 
+  process-warning@5.0.0:
+    resolution: {integrity: sha512-a39t9ApHNx2L4+HBnQKqxxHNs1r7KF+Intd8Q/g1bUh6q0WIp9voPXJ/x0j+ZL45KF1pJd9+q2jLIRMfvEshkA==}
+
   prompt@1.3.0:
     resolution: {integrity: sha512-ZkaRWtaLBZl7KKAKndKYUL8WqNT+cQHKRZnT4RYYms48jQkFw3rrBL+/N5K/KtdEveHkxs982MX2BkDKub2ZMg==}
     engines: {node: '>= 6.0.0'}
@@ -6173,6 +6225,9 @@ packages:
   queue@6.0.2:
     resolution: {integrity: sha512-iHZWu+q3IdFZFX36ro/lKBkSvfkztY5Y7HMiPlOUjhupPcG2JMfst2KKEpu5XndviX/3UhFbRngUPNKtgvtZiA==}
 
+  quick-format-unescaped@4.0.4:
+    resolution: {integrity: sha512-tYC1Q1hgyRuHgloV/YXs2w15unPVh8qfu/qCTfhTYamaw7fyhumKa2yGpdSo87vY32rIclj+4fWYQXUMs9EHvg==}
+
   radix-ui@1.4.3:
     resolution: {integrity: sha512-aWizCQiyeAenIdUbqEpXgRA1ya65P13NKn/W8rWkcN0OPkRDxdBVLWnIEDsS2RpwCK2nobI7oMUSmexzTDyAmA==}
     peerDependencies:
@@ -6297,6 +6352,10 @@ packages:
   readdir-glob@1.1.3:
     resolution: {integrity: sha512-v05I2k7xN8zXvPD9N+z/uhXPaj0sUFCe2rcWZIpBsqxfP7xXFQ0tipAd/wjj1YxWyWtUS5IDJpOG82JKt2EAVA==}
 
+  real-require@0.2.0:
+    resolution: {integrity: sha512-57frrGM/OCTLqLOAh0mhVA9VBMHd+9U7Zb2THMGdBUoZVOtGbJzjxsYGDJ3A9AYYCP4hn6y1TVbaOfzWtm5GFg==}
+    engines: {node: '>= 12.13.0'}
+
   recharts-scale@0.4.5:
     resolution: {integrity: sha512-kivNFO+0OcUNu7jQquLXAxz1FIwZj8nrj+YkOKc5694NbjCvcT6aSZiIzNzd2Kul4o4rTto8QVR9lMNtxD4G1w==}
 
@@ -6444,6 +6503,10 @@ packages:
   safe-buffer@5.2.1:
     resolution: {integrity: sha512-rp3So07KcdmmKbGvgaNxQSJr7bGVSVk5S9Eq1F+ppbRo70+YeaDxkw5Dd8NPN+GD6bjnYm2VuPuCXmpuYvmCXQ==}
 
+  safe-stable-stringify@2.5.0:
+    resolution: {integrity: sha512-b3rppTKm9T+PsVCBEOUR46GWI7fdOs00VKZ1+9c1EWDaDMvjQc6tUwuFyIprgGgTcWoVHSKrU8H31ZHA2e0RHA==}
+    engines: {node: '>=10'}
+
   safer-buffer@2.1.2:
     resolution: {integrity: sha512-YZo3K82SD7Riyi0E1EQPojLz7kpepnSQI9IyPbHHg1XXXevb5dJI7tpyN2ADxGcQbHG7vcyRHk0cbwqcQriUtg==}
 
@@ -6566,6 +6629,9 @@ packages:
     resolution: {integrity: sha512-HLpt+uLy/pxB+bum/9DzAgiKS8CX1EvbWxI4zlmgGCExImLdiad2iCwXT5Z4c9c3Eq8rP2318mPW2c+QbtjK8A==}
     engines: {node: '>= 10.0.0', npm: '>= 3.0.0'}
 
+  sonic-boom@4.2.1:
+    resolution: {integrity: sha512-w6AxtubXa2wTXAUsZMMWERrsIRAdrK0Sc+FUytWvYAhBJLyuI4llrMIC1DtlNSdI99EI86KZum2MMq3EAZlF9Q==}
+
   sonner@2.0.7:
     resolution: {integrity: sha512-W6ZN4p58k8aDKA4XPcx2hpIQXBRAgyiWVkYhT7CvK6D3iAu7xjvVyhQHg2/iaKJZ1XVJ4r7XuwGL+WGEK37i9w==}
     peerDependencies:
@@ -6722,6 +6788,9 @@ packages:
   thenify@3.3.1:
     resolution: {integrity: sha512-RVZSIV5IG10Hk3enotrhvz0T9em6cyHBLkH/YAZuKqd8hRkKhSfCGIcP2KUY0EPxndzANBmNllzWPwak+bheSw==}
 
+  thread-stream@3.1.0:
+    resolution: {integrity: sha512-OqyPZ9u96VohAyMfJykzmivOrY2wfMSf3C5TtFJVgN+Hm6aj+voFhlK+kZEIv2FBh1X6Xp3DlnCOfEQ3B2J86A==}
+
   tiny-inflate@1.0.3:
     resolution: {integrity: sha512-pkY1fj1cKHb2seWDy0B16HeWyczlJA9/WW3u3c4z/NiWDsO3DOU5D7nhTLE9CF0yXv/QZFY7sEJmj24dK+Rrqw==}
 
@@ -7203,6 +7272,10 @@ packages:
   yauzl@2.10.0:
     resolution: {integrity: sha512-p4a9I6X6nu6IhoGmBqAcbJy1mlC4j27vEPZX9F4L4/vZT3Lyq1VkFHw/V/PUcB9Buo+DG3iHkT0x3Qya58zc3g==}
 
+  yocto-queue@1.2.2:
+    resolution: {integrity: sha512-4LCcse/U2MHZ63HAJVE+v71o7yOdIe4cZ70Wpf8D/IyjDKYQLV5GD46B+hSTjJsvV5PztjvHoU580EftxjDZFQ==}
+    engines: {node: '>=12.20'}
+
   yoctocolors@2.1.2:
     resolution: {integrity: sha512-CzhO+pFNo8ajLM2d2IW/R93ipy99LWjtwblvC1RsoSUMZgyLbYFr221TnSNT7GjGdYui6P459mw9JH/g/zW2ug==}
     engines: {node: '>=18'}
@@ -7293,6 +7366,16 @@ snapshots:
       package-manager-detector: 1.6.0
       tinyexec: 1.0.4
 
+  '@anthropic-ai/sdk@0.73.0':
+    dependencies:
+      json-schema-to-ts: 3.1.1
+
+  '@anthropic-ai/sdk@0.73.0(zod@3.25.76)':
+    dependencies:
+      json-schema-to-ts: 3.1.1
+    optionalDependencies:
+      zod: 3.25.76
+
   '@anthropic-ai/sdk@0.73.0(zod@4.3.6)':
     dependencies:
       json-schema-to-ts: 3.1.1
@@ -8183,6 +8266,18 @@ snapshots:
       std-env: 3.10.0
       yoctocolors: 2.1.2
 
+  '@mariozechner/pi-agent-core@0.61.1':
+    dependencies:
+      '@mariozechner/pi-ai': 0.61.1
+    transitivePeerDependencies:
+      - '@modelcontextprotocol/sdk'
+      - aws-crt
+      - bufferutil
+      - supports-color
+      - utf-8-validate
+      - ws
+      - zod
+
   '@mariozechner/pi-agent-core@0.61.1(ws@8.19.0)(zod@4.3.6)':
     dependencies:
       '@mariozechner/pi-ai': 0.61.1(ws@8.19.0)(zod@4.3.6)
@@ -8195,6 +8290,42 @@ snapshots:
       - ws
       - zod
 
+  '@mariozechner/pi-agent-core@0.61.1(zod@3.25.76)':
+    dependencies:
+      '@mariozechner/pi-ai': 0.61.1(zod@3.25.76)
+    transitivePeerDependencies:
+      - '@modelcontextprotocol/sdk'
+      - aws-crt
+      - bufferutil
+      - supports-color
+      - utf-8-validate
+      - ws
+      - zod
+
+  '@mariozechner/pi-ai@0.61.1':
+    dependencies:
+      '@anthropic-ai/sdk': 0.73.0
+      '@aws-sdk/client-bedrock-runtime': 3.1012.0
+      '@google/genai': 1.46.0
+      '@mistralai/mistralai': 1.14.1
+      '@sinclair/typebox': 0.34.48
+      ajv: 8.18.0
+      ajv-formats: 3.0.1(ajv@8.18.0)
+      chalk: 5.6.2
+      openai: 6.26.0
+      partial-json: 0.1.7
+      proxy-agent: 6.5.0
+      undici: 7.24.4
+      zod-to-json-schema: 3.25.1
+    transitivePeerDependencies:
+      - '@modelcontextprotocol/sdk'
+      - aws-crt
+      - bufferutil
+      - supports-color
+      - utf-8-validate
+      - ws
+      - zod
+
   '@mariozechner/pi-ai@0.61.1(ws@8.19.0)(zod@4.3.6)':
     dependencies:
       '@anthropic-ai/sdk': 0.73.0(zod@4.3.6)
@@ -8219,6 +8350,62 @@ snapshots:
       - ws
       - zod
 
+  '@mariozechner/pi-ai@0.61.1(zod@3.25.76)':
+    dependencies:
+      '@anthropic-ai/sdk': 0.73.0(zod@3.25.76)
+      '@aws-sdk/client-bedrock-runtime': 3.1012.0
+      '@google/genai': 1.46.0
+      '@mistralai/mistralai': 1.14.1
+      '@sinclair/typebox': 0.34.48
+      ajv: 8.18.0
+      ajv-formats: 3.0.1(ajv@8.18.0)
+      chalk: 5.6.2
+      openai: 6.26.0(zod@3.25.76)
+      partial-json: 0.1.7
+      proxy-agent: 6.5.0
+      undici: 7.24.4
+      zod-to-json-schema: 3.25.1(zod@3.25.76)
+    transitivePeerDependencies:
+      - '@modelcontextprotocol/sdk'
+      - aws-crt
+      - bufferutil
+      - supports-color
+      - utf-8-validate
+      - ws
+      - zod
+
+  '@mariozechner/pi-coding-agent@0.61.0':
+    dependencies:
+      '@mariozechner/jiti': 2.6.5
+      '@mariozechner/pi-agent-core': 0.61.1
+      '@mariozechner/pi-ai': 0.61.1
+      '@mariozechner/pi-tui': 0.61.1
+      '@silvia-odwyer/photon-node': 0.3.4
+      chalk: 5.6.2
+      cli-highlight: 2.1.11
+      diff: 8.0.3
+      extract-zip: 2.0.1
+      file-type: 21.3.3
+      glob: 13.0.6
+      hosted-git-info: 9.0.2
+      ignore: 7.0.5
+      marked: 15.0.12
+      minimatch: 10.2.4
+      proper-lockfile: 4.1.2
+      strip-ansi: 7.2.0
+      undici: 7.24.4
+      yaml: 2.8.2
+    optionalDependencies:
+      '@mariozechner/clipboard': 0.3.2
+    transitivePeerDependencies:
+      - '@modelcontextprotocol/sdk'
+      - aws-crt
+      - bufferutil
+      - supports-color
+      - utf-8-validate
+      - ws
+      - zod
+
   '@mariozechner/pi-coding-agent@0.61.0(ws@8.19.0)(zod@4.3.6)':
     dependencies:
       '@mariozechner/jiti': 2.6.5
@@ -8251,6 +8438,38 @@ snapshots:
       - ws
       - zod
 
+  '@mariozechner/pi-coding-agent@0.61.0(zod@3.25.76)':
+    dependencies:
+      '@mariozechner/jiti': 2.6.5
+      '@mariozechner/pi-agent-core': 0.61.1(zod@3.25.76)
+      '@mariozechner/pi-ai': 0.61.1(zod@3.25.76)
+      '@mariozechner/pi-tui': 0.61.1
+      '@silvia-odwyer/photon-node': 0.3.4
+      chalk: 5.6.2
+      cli-highlight: 2.1.11
+      diff: 8.0.3
+      extract-zip: 2.0.1
+      file-type: 21.3.3
+      glob: 13.0.6
+      hosted-git-info: 9.0.2
+      ignore: 7.0.5
+      marked: 15.0.12
+      minimatch: 10.2.4
+      proper-lockfile: 4.1.2
+      strip-ansi: 7.2.0
+      undici: 7.24.4
+      yaml: 2.8.2
+    optionalDependencies:
+      '@mariozechner/clipboard': 0.3.2
+    transitivePeerDependencies:
+      - '@modelcontextprotocol/sdk'
+      - aws-crt
+      - bufferutil
+      - supports-color
+      - utf-8-validate
+      - ws
+      - zod
+
   '@mariozechner/pi-tui@0.61.1':
     dependencies:
       '@types/mime-types': 2.1.4
@@ -8310,6 +8529,8 @@ snapshots:
 
   '@opentelemetry/api@1.9.0': {}
 
+  '@pinojs/redact@0.4.0': {}
+
   '@protobuf-ts/grpc-transport@2.11.1(@grpc/grpc-js@1.14.3)':
     dependencies:
       '@grpc/grpc-js': 1.14.3
@@ -9766,6 +9987,13 @@ snapshots:
     dependencies:
       tslib: 2.8.1
 
+  '@stacksjs/clapp@0.2.0':
+    dependencies:
+      mri: 1.2.0
+      wrap-ansi: 9.0.2
+
+  '@stacksjs/clarity@0.3.24': {}
+
   '@standard-schema/spec@1.1.0': {}
 
   '@standard-schema/utils@0.3.0': {}
@@ -10606,6 +10834,8 @@ snapshots:
 
   asynckit@0.4.0: {}
 
+  atomic-sleep@1.0.0: {}
+
   auto-bind@5.0.1: {}
 
   aws-ssl-profiles@1.1.2: {}
@@ -10754,6 +10984,11 @@ snapshots:
 
   buffers@0.1.1: {}
 
+  bunfig@0.15.6:
+    dependencies:
+      '@stacksjs/clapp': 0.2.0
+      '@stacksjs/clarity': 0.3.24
+
   bytes@3.1.2: {}
 
   cac@6.7.14: {}
@@ -12854,6 +13089,8 @@ snapshots:
       react: 19.2.4
       react-dom: 19.2.4(react@19.2.4)
 
+  mri@1.2.0: {}
+
   ms@2.0.0: {}
 
   ms@2.1.3: {}
@@ -12965,6 +13202,8 @@ snapshots:
 
   object-inspect@1.13.4: {}
 
+  on-exit-leak-free@2.1.2: {}
+
   on-finished@2.4.1:
     dependencies:
       ee-first: 1.1.1
@@ -12985,11 +13224,17 @@ snapshots:
       regex: 6.1.0
       regex-recursion: 6.0.2
 
+  openai@6.26.0: {}
+
   openai@6.26.0(ws@8.19.0)(zod@4.3.6):
     optionalDependencies:
       ws: 8.19.0
       zod: 4.3.6
 
+  openai@6.26.0(zod@3.25.76):
+    optionalDependencies:
+      zod: 3.25.76
+
   orderedmap@2.1.1: {}
 
   p-finally@1.0.0: {}
@@ -12998,6 +13243,10 @@ snapshots:
     dependencies:
       p-try: 2.2.0
 
+  p-limit@5.0.0:
+    dependencies:
+      yocto-queue: 1.2.2
+
   p-locate@4.1.0:
     dependencies:
       p-limit: 2.3.0
@@ -13140,10 +13389,41 @@ snapshots:
     dependencies:
       split2: 4.2.0
 
+  pi-brain@0.1.7(@sinclair/typebox@0.34.48):
+    dependencies:
+      '@sinclair/typebox': 0.34.48
+
+  pi-dcp@0.2.0(@mariozechner/pi-agent-core@0.61.1(zod@3.25.76))(@mariozechner/pi-coding-agent@0.61.0(zod@3.25.76)):
+    dependencies:
+      '@mariozechner/pi-agent-core': 0.61.1(zod@3.25.76)
+      '@mariozechner/pi-coding-agent': 0.61.0(zod@3.25.76)
+      '@sinclair/typebox': 0.34.48
+      bunfig: 0.15.6
+
   picocolors@1.1.1: {}
 
   picomatch@4.0.3: {}
 
+  pino-abstract-transport@2.0.0:
+    dependencies:
+      split2: 4.2.0
+
+  pino-std-serializers@7.1.0: {}
+
+  pino@9.14.0:
+    dependencies:
+      '@pinojs/redact': 0.4.0
+      atomic-sleep: 1.0.0
+      on-exit-leak-free: 2.1.2
+      pino-abstract-transport: 2.0.0
+      pino-std-serializers: 7.1.0
+      process-warning: 5.0.0
+      quick-format-unescaped: 4.0.4
+      real-require: 0.2.0
+      safe-stable-stringify: 2.5.0
+      sonic-boom: 4.2.1
+      thread-stream: 3.1.0
+
   pkg-types@1.3.1:
     dependencies:
       confbox: 0.1.8
@@ -13194,6 +13474,8 @@ snapshots:
 
   process-nextick-args@2.0.1: {}
 
+  process-warning@5.0.0: {}
+
   prompt@1.3.0:
     dependencies:
       '@colors/colors': 1.5.0
@@ -13371,6 +13653,8 @@ snapshots:
     dependencies:
       inherits: 2.0.4
 
+  quick-format-unescaped@4.0.4: {}
+
   radix-ui@1.4.3(@types/react-dom@19.2.3(@types/react@19.2.14))(@types/react@19.2.14)(react-dom@19.2.4(react@19.2.4))(react@19.2.4):
     dependencies:
       '@radix-ui/primitive': 1.1.3
@@ -13556,6 +13840,8 @@ snapshots:
     dependencies:
       minimatch: 5.1.9
 
+  real-require@0.2.0: {}
+
   recharts-scale@0.4.5:
     dependencies:
       decimal.js-light: 2.5.1
@@ -13768,6 +14054,8 @@ snapshots:
 
   safe-buffer@5.2.1: {}
 
+  safe-stable-stringify@2.5.0: {}
+
   safer-buffer@2.1.2: {}
 
   saxes@5.0.1:
@@ -13943,6 +14231,10 @@ snapshots:
       ip-address: 10.1.0
       smart-buffer: 4.2.0
 
+  sonic-boom@4.2.1:
+    dependencies:
+      atomic-sleep: 1.0.0
+
   sonner@2.0.7(react-dom@19.2.4(react@19.2.4))(react@19.2.4):
     dependencies:
       react: 19.2.4
@@ -14116,6 +14408,10 @@ snapshots:
     dependencies:
       any-promise: 1.3.0
 
+  thread-stream@3.1.0:
+    dependencies:
+      real-require: 0.2.0
+
   tiny-inflate@1.0.3: {}
 
   tiny-invariant@1.3.3: {}
@@ -14612,6 +14908,8 @@ snapshots:
       buffer-crc32: 0.2.13
       fd-slicer: 1.1.0
 
+  yocto-queue@1.2.2: {}
+
   yoctocolors@2.1.2: {}
 
   yoga-layout@3.2.1: {}
@@ -14622,6 +14920,12 @@ snapshots:
       compress-commons: 4.1.2
       readable-stream: 3.6.2
 
+  zod-to-json-schema@3.25.1: {}
+
+  zod-to-json-schema@3.25.1(zod@3.25.76):
+    dependencies:
+      zod: 3.25.76
+
   zod-to-json-schema@3.25.1(zod@4.3.6):
     dependencies:
       zod: 4.3.6

From c787ba11043a492e12db33a0ee7b733488ef319e Mon Sep 17 00:00:00 2001
From: shanvit <shanvit7@gmail.com>
Date: Fri, 10 Apr 2026 13:46:20 +0530
Subject: [PATCH 05/12] chore: mem integration wired up

---
 packages/agents/src/pi/memory.ts       | 64 +++++++++++++-------------
 packages/zosma-mem/src/bridge/index.ts |  2 +-
 2 files changed, 34 insertions(+), 32 deletions(-)

diff --git a/packages/agents/src/pi/memory.ts b/packages/agents/src/pi/memory.ts
index de01989..c1c9a4d 100644
--- a/packages/agents/src/pi/memory.ts
+++ b/packages/agents/src/pi/memory.ts
@@ -8,35 +8,30 @@
 
 import { completeSimple } from "@mariozechner/pi-ai"
 import type { Api, Model } from "@mariozechner/pi-ai"
-import { createLogger } from "@openzosma/logger"
 import type { ExtractedFact } from "@openzosma/zosma-mem/bridge"
 
-const log = createLogger({ component: "agents:memory" })
+const EXTRACTION_SYSTEM_PROMPT = `You are extracting user preferences and facts from conversations for long-term memory.
 
-const EXTRACTION_SYSTEM_PROMPT = `You are a memory extraction assistant. Your job is to identify facts worth
-remembering long-term from a conversation exchange.
+CRITICAL RULES:
+1. Extract EVERY user preference as a separate fact, even if they seem related
+2. "Favorite X" and "love/like Y" are ALWAYS separate facts, even if both are animals
+3. Personal statements like "I love X" or "My favorite is Y" become facts
+4. Each fact must be self-contained and specific
+5. Tags MUST include semantic action words like "like", "love", "hate", "favorite", "prefer"
+   so the fact can be retrieved by queries like "what do I like?" or "whom do I like?"
 
-Extract facts that are:
-- User preferences (favorite things, dislikes, habits)
-- Decisions made by the user
-- Constraints or rules the user has stated
-- Personal information the user shared
-- Repeating patterns or explicit instructions
+EXAMPLES:
+- User says "My favorite animal is elephant" → content: "User's favorite animal is elephant", tags: ["animal", "favorite", "elephant"]
+- User says "I love the lion" → content: "User loves lions", tags: ["animal", "love", "lion"]
+- User says "I hate snakes" → content: "User hates snakes", tags: ["animal", "hate", "snake"]
+- User says "I like Messi" → content: "User likes Messi", tags: ["messi", "like", "football", "person"]
 
-Do NOT extract:
-- Facts that are only relevant to the current task
-- Temporary states ("I'm tired today")
-- Questions without answers
-- Generic statements that apply to everyone
+Extract as JSON array with:
+- "content": third-person statement (e.g. "User's favorite animal is elephant")
+- "type": "preference"
+- "tags": array of lowercase keywords INCLUDING the relationship word (like/love/hate/favorite/prefer)
 
-Return a JSON array. Each element must be an object with:
-- "content": a self-contained, third-person statement of the fact (e.g. "User's favorite animal is elephant")
-- "type": one of "preference" | "decision" | "pattern" | "error"
-- "tags": array of 2-5 lowercase keywords
-
-If nothing is worth remembering, return an empty array: []
-
-Respond with ONLY the JSON array. No explanation, no markdown fences.`
+Return [] if nothing memorable. ONLY return the raw JSON array, no markdown formatting.`
 
 /**
  * Use the active LLM to extract memorable facts from a single conversation turn.
@@ -48,7 +43,9 @@ export const extractFacts = async (
   userMessage: string,
   assistantResponse: string,
 ): Promise<ExtractedFact[]> => {
-  if (!userMessage.trim() || !assistantResponse.trim()) return []
+  if (!userMessage.trim() || !assistantResponse.trim()) {
+    return []
+  }
 
   const prompt = `User: ${userMessage}\n\nAssistant: ${assistantResponse}`
 
@@ -68,13 +65,19 @@ export const extractFacts = async (
       .join("")
       .trim()
 
-    if (!text) return []
+    if (!text) {
+      return []
+    }
 
-    const parsed: unknown = JSON.parse(text)
+    // Strip markdown code fences that some models wrap around JSON output.
+    const stripped = text.replace(/^```(?:json)?\s*/i, "").replace(/\s*```$/, "").trim()
+    const parsed: unknown = JSON.parse(stripped)
 
-    if (!Array.isArray(parsed)) return []
+    if (!Array.isArray(parsed)) {
+      return []
+    }
 
-    return parsed.filter(
+    const validFacts = parsed.filter(
       (item): item is ExtractedFact =>
         typeof item === "object" &&
         item !== null &&
@@ -82,10 +85,9 @@ export const extractFacts = async (
         ["preference", "decision", "pattern", "error"].includes((item as Record<string, unknown>).type as string) &&
         Array.isArray((item as Record<string, unknown>).tags),
     )
+
+    return validFacts
   } catch (err) {
-    log.warn("Memory extraction failed (non-fatal)", {
-      error: err instanceof Error ? err.message : String(err),
-    })
     return []
   }
 }
diff --git a/packages/zosma-mem/src/bridge/index.ts b/packages/zosma-mem/src/bridge/index.ts
index 9111b4b..09f95bf 100644
--- a/packages/zosma-mem/src/bridge/index.ts
+++ b/packages/zosma-mem/src/bridge/index.ts
@@ -72,7 +72,7 @@ export interface MemoryBridge {
  * it hashes to the same ID, so the engine deduplicates it by updating in place.
  */
 export const factId = (content: string): string =>
-  createHash("sha256").update(content.trim().toLowerCase()).digest("hex").slice(0, 16)
+  createHash("sha256").update(content.trim().toLowerCase().replace(/\s+/g, ' ')).digest("hex").slice(0, 16)
 
 /**
  * Format retrieved memories as a system prompt section.

From 11437dd0af77f4b8acd61a424568ebb5fca1b5e7 Mon Sep 17 00:00:00 2001
From: shanvit <shanvit7@gmail.com>
Date: Fri, 10 Apr 2026 15:56:51 +0530
Subject: [PATCH 06/12] chore: memory evals for SquAD dataset

---
 packages/agents/src/pi.agent.ts               |  10 +-
 packages/agents/src/pi/memory.ts              |  89 ++--
 packages/zosma-mem/README.md                  |  66 +--
 packages/zosma-mem/package.json               |  14 +-
 packages/zosma-mem/src/bin/eval.ts            | 120 +++++
 .../src/bridge/__tests__/bridge.test.ts       | 479 ++++++++++--------
 packages/zosma-mem/src/bridge/extensions.ts   |  46 +-
 packages/zosma-mem/src/bridge/index.ts        | 249 +++++----
 .../src/engine/__tests__/factory.test.ts      |  82 +--
 .../engine/__tests__/reinforcement.test.ts    | 116 ++---
 packages/zosma-mem/src/engine/salience.ts     |  20 +-
 .../src/evals/__tests__/evals.test.ts         |  93 ++++
 packages/zosma-mem/src/evals/eval.ts          |  61 +++
 packages/zosma-mem/src/evals/index.ts         |   2 +
 packages/zosma-mem/src/evals/types.ts         |  66 +++
 packages/zosma-mem/src/retrieval/retrieve.ts  |  11 +-
 packages/zosma-mem/src/types.ts               |  96 ++--
 pnpm-lock.yaml                                |  42 +-
 18 files changed, 1032 insertions(+), 630 deletions(-)
 create mode 100644 packages/zosma-mem/src/bin/eval.ts
 create mode 100644 packages/zosma-mem/src/evals/__tests__/evals.test.ts
 create mode 100644 packages/zosma-mem/src/evals/eval.ts
 create mode 100644 packages/zosma-mem/src/evals/index.ts
 create mode 100644 packages/zosma-mem/src/evals/types.ts

diff --git a/packages/agents/src/pi.agent.ts b/packages/agents/src/pi.agent.ts
index 1be4549..07e9599 100644
--- a/packages/agents/src/pi.agent.ts
+++ b/packages/agents/src/pi.agent.ts
@@ -149,7 +149,7 @@ class PiAgentSession implements AgentSession {
 				await session.steer(memoryContext)
 				log.info("Memory context injected via steer()", {
 					length: memoryContext.length,
-					injectedIds: injectedMemoryIds.length
+					injectedIds: injectedMemoryIds.length,
 				})
 			}
 		} catch (err) {
@@ -519,7 +519,11 @@ class PiAgentSession implements AgentSession {
 						else ignoredCount++
 					}
 
-					log.info("Memory reinforcement recorded", { usedCount, ignoredCount, totalInjected: injectedMemoryIds.length })
+					log.info("Memory reinforcement recorded", {
+						usedCount,
+						ignoredCount,
+						totalInjected: injectedMemoryIds.length,
+					})
 				} catch (err) {
 					log.warn("Memory reinforcement failed (non-fatal)", {
 						error: err instanceof Error ? err.message : String(err),
@@ -578,4 +582,4 @@ export class PiAgentProvider implements AgentProvider {
 	createSession(opts: AgentSessionOpts): AgentSession {
 		return new PiAgentSession(opts)
 	}
-}
\ No newline at end of file
+}
diff --git a/packages/agents/src/pi/memory.ts b/packages/agents/src/pi/memory.ts
index c1c9a4d..9eff66d 100644
--- a/packages/agents/src/pi/memory.ts
+++ b/packages/agents/src/pi/memory.ts
@@ -38,56 +38,59 @@ Return [] if nothing memorable. ONLY return the raw JSON array, no markdown form
  * Returns an empty array on any error — this is a non-critical background path.
  */
 export const extractFacts = async (
-  model: Model<Api>,
-  apiKey: string,
-  userMessage: string,
-  assistantResponse: string,
+	model: Model<Api>,
+	apiKey: string,
+	userMessage: string,
+	assistantResponse: string,
 ): Promise<ExtractedFact[]> => {
-  if (!userMessage.trim() || !assistantResponse.trim()) {
-    return []
-  }
+	if (!userMessage.trim() || !assistantResponse.trim()) {
+		return []
+	}
 
-  const prompt = `User: ${userMessage}\n\nAssistant: ${assistantResponse}`
+	const prompt = `User: ${userMessage}\n\nAssistant: ${assistantResponse}`
 
-  try {
-    const result = await completeSimple(
-      model,
-      {
-        systemPrompt: EXTRACTION_SYSTEM_PROMPT,
-        messages: [{ role: "user", content: prompt, timestamp: Date.now() }],
-      },
-      { apiKey, maxTokens: 512 },
-    )
+	try {
+		const result = await completeSimple(
+			model,
+			{
+				systemPrompt: EXTRACTION_SYSTEM_PROMPT,
+				messages: [{ role: "user", content: prompt, timestamp: Date.now() }],
+			},
+			{ apiKey, maxTokens: 512 },
+		)
 
-    const text = result.content
-      .filter((c): c is { type: "text"; text: string } => c.type === "text")
-      .map((c) => c.text)
-      .join("")
-      .trim()
+		const text = result.content
+			.filter((c): c is { type: "text"; text: string } => c.type === "text")
+			.map((c) => c.text)
+			.join("")
+			.trim()
 
-    if (!text) {
-      return []
-    }
+		if (!text) {
+			return []
+		}
 
-    // Strip markdown code fences that some models wrap around JSON output.
-    const stripped = text.replace(/^```(?:json)?\s*/i, "").replace(/\s*```$/, "").trim()
-    const parsed: unknown = JSON.parse(stripped)
+		// Strip markdown code fences that some models wrap around JSON output.
+		const stripped = text
+			.replace(/^```(?:json)?\s*/i, "")
+			.replace(/\s*```$/, "")
+			.trim()
+		const parsed: unknown = JSON.parse(stripped)
 
-    if (!Array.isArray(parsed)) {
-      return []
-    }
+		if (!Array.isArray(parsed)) {
+			return []
+		}
 
-    const validFacts = parsed.filter(
-      (item): item is ExtractedFact =>
-        typeof item === "object" &&
-        item !== null &&
-        typeof (item as Record<string, unknown>).content === "string" &&
-        ["preference", "decision", "pattern", "error"].includes((item as Record<string, unknown>).type as string) &&
-        Array.isArray((item as Record<string, unknown>).tags),
-    )
+		const validFacts = parsed.filter(
+			(item): item is ExtractedFact =>
+				typeof item === "object" &&
+				item !== null &&
+				typeof (item as Record<string, unknown>).content === "string" &&
+				["preference", "decision", "pattern", "error"].includes((item as Record<string, unknown>).type as string) &&
+				Array.isArray((item as Record<string, unknown>).tags),
+		)
 
-    return validFacts
-  } catch (err) {
-    return []
-  }
+		return validFacts
+	} catch (err) {
+		return []
+	}
 }
diff --git a/packages/zosma-mem/README.md b/packages/zosma-mem/README.md
index 8199d2d..6cab544 100644
--- a/packages/zosma-mem/README.md
+++ b/packages/zosma-mem/README.md
@@ -6,10 +6,7 @@ A file-based memory system with salience scoring, tag-based retrieval, and reinf
 
 ## Installation
 
-```bash
-# In OpenZosma workspace
-pnpm add @openzosma/zosma-mem
-```
+This package is part of the OpenZosma workspace.
 
 ## Core Concepts
 
@@ -137,41 +134,37 @@ Automatic cleanup runs periodically:
 - **Prune** - Remove facts below salience threshold
 - **Consolidate** - Merge similar entities
 
-```typescript
-// Manual GC
-const report = await engine.gc()
-console.log(`${report.pruned} pruned, ${report.decayed} decayed`)
-```
+## Evaluation
 
-## Configuration
+For internal OpenZosma evaluation, use the CLI tool to assess memory retrieval effectiveness:
 
-```typescript
-interface MemoryConfig {
-  memoryDir: string                    // Required: where to store files
-  salienceThreshold?: number          // Default: 0.4
-  gcIntervalMs?: number               // Default: 3,600,000 (1 hour)
-  gcPruneCycles?: number              // Default: 1
-  summarizer?: (texts: string[]) => Promise<string>
-  now?: () => number                  // For testing
-}
+```bash
+# From project root, after building
+cd packages/zosma-mem
+node dist/bin/eval.js run
 ```
 
-## Architecture
-
-### Core Modules
+The CLI prompts for:
+- Memory directory path (e.g., `../../../workspace/agents/default/memory`)
+- Number of test cases
+- Query and expected content for each case
 
-- **engine/** - Salience scoring, reinforcement, GC
-- **store/** - File-based entity storage with co-access patterns
-- **ingestion/** - Fact ingestion and scoring
-- **retrieval/** - Tag-based search with attention ranking
-- **gc/** - Decay, pruning, consolidation
-- **bridge/** - Agent session integration
+It computes recall, precision, and F1 scores.
 
-### File Storage
-
-- **Entity files**: `.salience/*.yaml` - Individual facts with scores
-- **Archive**: `.salience/archive/` - Pruned entities
-- **Co-access**: `.salience/co-access` - Access pattern correlations
+Example output:
+```
+Evaluation Results:
+Average Recall: 85.00%
+Average Precision: 90.00%
+Average F1 Score: 87.50%
+
+Per Test Case:
+Case 1: "UI design"
+  Recall: 100.00%
+  Precision: 100.00%
+  F1: 100.00%
+  Retrieved: 2 memories
+```
 
 ## Development
 
@@ -186,11 +179,4 @@ pnpm run test
 pnpm run check
 ```
 
-## Publishing
-
-```bash
-pnpm run build && pnpm run test
-npm publish
-```
-
 Built for OpenZosma agents, works with any AI agent framework that needs persistent cross-conversation memory. 🚀
\ No newline at end of file
diff --git a/packages/zosma-mem/package.json b/packages/zosma-mem/package.json
index 1101a9f..6544a91 100644
--- a/packages/zosma-mem/package.json
+++ b/packages/zosma-mem/package.json
@@ -5,14 +5,7 @@
 	"type": "module",
 	"description": "Memory engine with bridge for agent integration",
 	"license": "Apache-2.0",
-	"keywords": [
-		"memory",
-		"evaluation",
-		"ai",
-		"agentic",
-		"cli",
-		"openzosma"
-	],
+	"keywords": ["memory", "evaluation", "ai", "agentic", "cli", "openzosma"],
 	"repository": {
 		"type": "git",
 		"url": "https://github.com/your-org/openzosma",
@@ -21,6 +14,9 @@
 	"homepage": "https://github.com/your-org/openzosma/tree/main/packages/zosma-mem",
 	"main": "dist/index.js",
 	"types": "dist/index.d.ts",
+	"bin": {
+		"zosma-mem-eval": "dist/bin/eval.js"
+	},
 	"exports": {
 		".": {
 			"types": "./dist/index.d.ts",
@@ -38,6 +34,8 @@
 		"prepublishOnly": "pnpm run build && pnpm run test"
 	},
 	"dependencies": {
+		"@clack/prompts": "^0.10.0",
+		"@openzosma/logger": "workspace:*",
 		"chalk": "^5.4.0",
 		"commander": "^13.0.0",
 		"ink": "^5.1.0",
diff --git a/packages/zosma-mem/src/bin/eval.ts b/packages/zosma-mem/src/bin/eval.ts
new file mode 100644
index 0000000..107e762
--- /dev/null
+++ b/packages/zosma-mem/src/bin/eval.ts
@@ -0,0 +1,120 @@
+import { intro, note, outro, spinner, text } from "@clack/prompts"
+import { createLogger } from "@openzosma/logger"
+import chalk from "chalk"
+import { Command } from "commander"
+import { createMemoryBridge, factId } from "../bridge/index.js"
+import { evaluateMemory } from "../evals/index.js"
+import type { MemoryEventType } from "../types.js"
+
+interface SQuADAnswer {
+	text: string
+	answer_start: number
+}
+
+interface SQuADQA {
+	question: string
+	answers: SQuADAnswer[]
+}
+
+interface SQuADParagraph {
+	context: string
+	qas: SQuADQA[]
+}
+
+interface SQuADArticle {
+	title: string
+	paragraphs: SQuADParagraph[]
+}
+
+interface SQuADData {
+	data: SQuADArticle[]
+}
+
+const logger = createLogger({ component: "zosma-mem-eval" })
+
+const program = new Command()
+
+program.name("zosma-mem-eval").description("CLI tool to evaluate memory retrieval effectiveness").version("0.0.1")
+
+program
+	.command("run")
+	.description("Run interactive memory evaluation")
+	.action(async () => {
+		try {
+			intro(chalk.blue("🧠 Zosma Memory Evaluation"))
+
+			// Prompt for number of test cases
+			const result = await text({ message: "How many test cases to run?", defaultValue: "10" })
+			if (typeof result === "symbol") process.exit(0)
+			const numCasesStr = result
+			const numCases = Number.parseInt(numCasesStr || "10")
+
+			// Use default memory dir for internal use
+			const memoryDir = "../../../workspace/agents/default/memory"
+			logger.info(`Using memory dir: ${memoryDir}`)
+
+			// Create bridge
+			const s = spinner()
+			s.start("Initializing memory bridge...")
+			const bridge = createMemoryBridge({ memoryDir })
+			s.stop("Memory bridge ready!")
+
+			// Fetch SQuAD validation dataset from Hugging Face
+			const url = "https://rajpurkar.github.io/SQuAD-explorer/dataset/dev-v1.1.json"
+			const response = await fetch(url)
+			const data = (await response.json()) as SQuADData
+
+			// Prepare facts and test cases
+			const facts: { content: string; type: MemoryEventType; tags: string[] }[] = []
+			const testCases = []
+			let totalCases = 0
+			for (const item of data.data) {
+				if (totalCases >= numCases) break
+				for (const para of item.paragraphs) {
+					if (totalCases >= numCases) break
+					const context = para.context
+					const contextId = factId(context)
+					facts.push({ content: context, type: "pattern" as MemoryEventType, tags: [] })
+					for (const qa of para.qas.slice(0, 1)) {
+						if (totalCases >= numCases) break
+						testCases.push({
+							query: qa.question,
+							expectedIds: [contextId],
+							expectedContent: qa.answers.map((a: SQuADAnswer) => a.text),
+						})
+						totalCases++
+					}
+				}
+			}
+
+			// Ingest facts into memory
+			await bridge.ingestFacts(facts)
+
+			logger.info(`Running ${testCases.length} real test cases from HF SQuAD...`)
+
+			// Run evaluation
+			const evalSpinner = spinner()
+			evalSpinner.start("Running evaluation...")
+			const results = await evaluateMemory(bridge, { testCases })
+			evalSpinner.stop("Evaluation complete!")
+
+			// Display results as table
+			const table = `
+| Metric              | Value                     |
+|---------------------|---------------------------|
+| Total Cases         | ${results.cases.length}   |
+| Average Recall      | ${(results.metrics.avgRecall * 100).toFixed(2)}% |
+| Average Precision   | ${(results.metrics.avgPrecision * 100).toFixed(2)}% |
+| Average F1 Score    | ${(results.metrics.avgF1 * 100).toFixed(2)}% |
+`
+
+			note(table, "Evaluation Results")
+
+			outro(chalk.green("Evaluation complete! 🎉"))
+		} catch (error) {
+			outro(chalk.red(`Error: ${(error as Error).message}`))
+			process.exit(1)
+		}
+	})
+
+program.parse()
diff --git a/packages/zosma-mem/src/bridge/__tests__/bridge.test.ts b/packages/zosma-mem/src/bridge/__tests__/bridge.test.ts
index 447e1be..f7ff79e 100644
--- a/packages/zosma-mem/src/bridge/__tests__/bridge.test.ts
+++ b/packages/zosma-mem/src/bridge/__tests__/bridge.test.ts
@@ -1,211 +1,276 @@
-import { describe, it, expect, beforeEach, afterEach } from "vitest"
+import { mkdirSync, rmSync } from "node:fs"
+import { tmpdir } from "node:os"
+import { join } from "node:path"
+import { afterEach, beforeEach, describe, expect, it } from "vitest"
 import { createMemoryBridge } from "../../bridge/index.js"
 import type { ExtractedFact } from "../../bridge/index.js"
-import { rmSync, mkdirSync } from "node:fs"
-import { join } from "node:path"
-import { tmpdir } from "node:os"
 
 describe("MemoryBridge", () => {
-  let tempDir: string
-
-  beforeEach(() => {
-    tempDir = join(tmpdir(), `zosma-mem-test-${Date.now()}`)
-    mkdirSync(tempDir, { recursive: true })
-  })
-
-  afterEach(() => {
-    rmSync(tempDir, { recursive: true, force: true })
-  })
-
-  describe("ingestFacts and loadContext round-trip", () => {
-    it("should ingest facts and retrieve them in context", async () => {
-      const bridge = createMemoryBridge({ memoryDir: tempDir })
-
-      const facts: ExtractedFact[] = [
-        {
-          content: "User prefers dark mode interfaces",
-          type: "preference",
-          tags: ["ui", "theme", "preference"]
-        }
-      ]
-
-      await bridge.ingestFacts(facts)
-
-      const { context, injectedIds } = await bridge.loadContext("design the UI")
-      expect(context).toContain("User prefers dark mode interfaces")
-      expect(injectedIds).toHaveLength(1)
-      expect(injectedIds[0]).toMatch(/^[a-f0-9]{16}$/)
-    })
-
-    it("should return empty context when no relevant memories", async () => {
-      const bridge = createMemoryBridge({ memoryDir: tempDir })
-
-      const { context, injectedIds } = await bridge.loadContext("unrelated query")
-      expect(context).toBe("")
-      expect(injectedIds).toEqual([])
-    })
-
-    it("should deduplicate identical facts", async () => {
-      const bridge = createMemoryBridge({ memoryDir: tempDir })
-
-      const facts: ExtractedFact[] = [
-        {
-          content: "User likes coffee",
-          type: "preference",
-          tags: ["drink", "preference"]
-        },
-        {
-          content: "User likes coffee", // Same content
-          type: "preference",
-          tags: ["drink", "preference"]
-        }
-      ]
-
-      await bridge.ingestFacts(facts)
-
-      const entityIds = await bridge.listEntityIds()
-      expect(entityIds).toHaveLength(1) // Should be deduplicated
-    })
-  })
-
-  describe("reinforcement tracking", () => {
-    it("should record usage signals", async () => {
-      const bridge = createMemoryBridge({ memoryDir: tempDir })
-
-      const facts: ExtractedFact[] = [
-        {
-          content: "User's favorite color is blue",
-          type: "preference",
-          tags: ["color", "preference"]
-        }
-      ]
-
-      await bridge.ingestFacts(facts)
-      const { injectedIds } = await bridge.loadContext("what color should I use")
-      expect(injectedIds).toHaveLength(1)
-
-      const entityId = injectedIds[0]
-
-      // Record different usage signals
-      await bridge.recordUsage(entityId, "used")
-      await bridge.recordUsage(entityId, "ignored")
-      await bridge.recordUsage(entityId, "influenced_decision")
-
-      // Should not throw
-      expect(true).toBe(true)
-    })
-  })
-
-  describe("garbage collection", () => {
-    it("should run GC without errors", async () => {
-      const bridge = createMemoryBridge({ memoryDir: tempDir })
-
-      const facts: ExtractedFact[] = [
-        {
-          content: "Old preference that should be garbage collected",
-          type: "preference",
-          tags: ["old"]
-        }
-      ]
-
-      await bridge.ingestFacts(facts)
-      await bridge.gc() // Should not throw
-
-      expect(true).toBe(true)
-    })
-  })
-
-  describe("shutdown", () => {
-    it("should shutdown without errors", async () => {
-      const bridge = createMemoryBridge({ memoryDir: tempDir })
-      bridge.shutdown() // Should not throw
-      expect(true).toBe(true)
-    })
-  })
-
-  describe("cross-session persistence", () => {
-    it("should persist facts across bridge instances", async () => {
-      // First bridge instance
-      const bridge1 = createMemoryBridge({ memoryDir: tempDir })
-      const facts: ExtractedFact[] = [
-        {
-          content: "Persistent memory across sessions",
-          type: "decision",
-          tags: ["persistent", "test"]
-        }
-      ]
-
-      await bridge1.ingestFacts(facts)
-      bridge1.shutdown()
-
-      // Second bridge instance with same directory
-      const bridge2 = createMemoryBridge({ memoryDir: tempDir })
-      const { context } = await bridge2.loadContext("test query")
-
-      expect(context).toContain("Persistent memory across sessions")
-    })
-  })
-
-  describe("salience filtering", () => {
-    it("should respect salience threshold", async () => {
-      const bridge = createMemoryBridge({ memoryDir: tempDir, salienceThreshold: 10 })
-
-      const facts: ExtractedFact[] = [
-        {
-          content: "High salience fact",
-          type: "decision",
-          tags: ["important"]
-        },
-        {
-          content: "Low salience fact",
-          type: "pattern",
-          tags: ["minor"]
-        }
-      ]
-
-      await bridge.ingestFacts(facts)
-
-      // Run GC to prune low-salience facts
-      await bridge.gc()
-
-      const { context } = await bridge.loadContext("important query")
-      expect(context).toBeTruthy() // At least some facts should remain
-    })
-  })
-
-  describe("context formatting", () => {
-    it("should format context with proper structure", async () => {
-      const bridge = createMemoryBridge({ memoryDir: tempDir })
-
-      const facts: ExtractedFact[] = [
-        {
-          content: "Test memory content",
-          type: "preference",
-          tags: ["test"]
-        }
-      ]
-
-      await bridge.ingestFacts(facts)
-      const { context } = await bridge.loadContext("test")
-
-      expect(context).toContain("## Long-term Memory")
-      expect(context).toContain("Test memory content")
-      expect(context).toContain("Use them to inform your responses naturally")
-    })
-
-    it("should limit retrieved memories to topK", async () => {
-      const bridge = createMemoryBridge({ memoryDir: tempDir, topK: 2 })
-
-      const facts: ExtractedFact[] = Array.from({ length: 5 }, (_, i) => ({
-        content: `Memory fact ${i}`,
-        type: "preference" as const,
-        tags: ["test"]
-      }))
-
-      await bridge.ingestFacts(facts)
-      const { injectedIds } = await bridge.loadContext("test")
-
-      expect(injectedIds).toHaveLength(2) // Limited by topK
-    })
-  })
-})
\ No newline at end of file
+	let tempDir: string
+
+	beforeEach(() => {
+		tempDir = join(tmpdir(), `zosma-mem-test-${Date.now()}`)
+		mkdirSync(tempDir, { recursive: true })
+	})
+
+	afterEach(() => {
+		rmSync(tempDir, { recursive: true, force: true })
+	})
+
+	describe("ingestFacts and loadContext round-trip", () => {
+		it("should ingest facts and retrieve them in context", async () => {
+			const bridge = createMemoryBridge({ memoryDir: tempDir })
+
+			const facts: ExtractedFact[] = [
+				{
+					content: "User prefers dark mode interfaces",
+					type: "preference",
+					tags: ["ui", "theme", "preference"],
+				},
+			]
+
+			await bridge.ingestFacts(facts)
+
+			const { context, ids } = await bridge.loadContext("design the UI")
+			expect(context).toContain("User prefers dark mode interfaces")
+			expect(ids).toHaveLength(1)
+			expect(ids[0]).toMatch(/^[a-f0-9]{16}$/)
+		})
+
+		it("should return empty context when no relevant memories", async () => {
+			const bridge = createMemoryBridge({ memoryDir: tempDir })
+
+			const { context, ids } = await bridge.loadContext("unrelated query")
+			expect(context).toBe("")
+			expect(ids).toEqual([])
+		})
+
+		it("should deduplicate identical facts", async () => {
+			const bridge = createMemoryBridge({ memoryDir: tempDir })
+
+			const facts: ExtractedFact[] = [
+				{
+					content: "User likes coffee",
+					type: "preference",
+					tags: ["drink", "preference"],
+				},
+				{
+					content: "User likes coffee", // Same content
+					type: "preference",
+					tags: ["drink", "preference"],
+				},
+			]
+
+			await bridge.ingestFacts(facts)
+
+			const entityIds = await bridge.listEntityIds()
+			expect(entityIds).toHaveLength(1) // Should be deduplicated
+		})
+	})
+
+	describe("reinforcement tracking", () => {
+		it("should record usage signals", async () => {
+			const bridge = createMemoryBridge({ memoryDir: tempDir })
+
+			const facts: ExtractedFact[] = [
+				{
+					content: "User's favorite color is blue",
+					type: "preference",
+					tags: ["color", "preference"],
+				},
+			]
+
+			await bridge.ingestFacts(facts)
+			const { ids } = await bridge.loadContext("what color should I use")
+			expect(ids).toHaveLength(1)
+
+			const entityId = ids[0]
+
+			// Record different usage signals
+			await bridge.recordUsage(entityId, "used")
+			await bridge.recordUsage(entityId, "ignored")
+			await bridge.recordUsage(entityId, "influenced_decision")
+
+			// Should not throw
+			expect(true).toBe(true)
+		})
+	})
+
+	describe("garbage collection", () => {
+		it("should run GC without errors", async () => {
+			const bridge = createMemoryBridge({ memoryDir: tempDir })
+
+			const facts: ExtractedFact[] = [
+				{
+					content: "Old preference that should be garbage collected",
+					type: "preference",
+					tags: ["old"],
+				},
+			]
+
+			await bridge.ingestFacts(facts)
+			await bridge.gc() // Should not throw
+
+			expect(true).toBe(true)
+		})
+	})
+
+	describe("shutdown", () => {
+		it("should shutdown without errors", async () => {
+			const bridge = createMemoryBridge({ memoryDir: tempDir })
+			bridge.shutdown() // Should not throw
+			expect(true).toBe(true)
+		})
+	})
+
+	describe("cross-session persistence", () => {
+		it("should persist facts across bridge instances", async () => {
+			// First bridge instance
+			const bridge1 = createMemoryBridge({ memoryDir: tempDir })
+			const facts: ExtractedFact[] = [
+				{
+					content: "Persistent memory across sessions",
+					type: "decision",
+					tags: ["persistent", "test"],
+				},
+			]
+
+			await bridge1.ingestFacts(facts)
+			bridge1.shutdown()
+
+			// Second bridge instance with same directory
+			const bridge2 = createMemoryBridge({ memoryDir: tempDir })
+			const { context } = await bridge2.loadContext("test query")
+
+			expect(context).toContain("Persistent memory across sessions")
+		})
+	})
+
+	describe("salience filtering", () => {
+		it("should respect salience threshold", async () => {
+			const bridge = createMemoryBridge({ memoryDir: tempDir, salienceThreshold: 10 })
+
+			const facts: ExtractedFact[] = [
+				{
+					content: "High salience fact",
+					type: "decision",
+					tags: ["important"],
+				},
+				{
+					content: "Low salience fact",
+					type: "pattern",
+					tags: ["minor"],
+				},
+			]
+
+			await bridge.ingestFacts(facts)
+
+			// Run GC to prune low-salience facts
+			await bridge.gc()
+
+			const { context } = await bridge.loadContext("important query")
+			expect(context).toBeTruthy() // At least some facts should remain
+		})
+	})
+
+	describe("context formatting", () => {
+		it("should format context with proper structure", async () => {
+			const bridge = createMemoryBridge({ memoryDir: tempDir })
+
+			const facts: ExtractedFact[] = [
+				{
+					content: "Test memory content",
+					type: "preference",
+					tags: ["test"],
+				},
+			]
+
+			await bridge.ingestFacts(facts)
+			const { context } = await bridge.loadContext("test")
+
+			expect(context).toContain("## Long-term Memory")
+			expect(context).toContain("Test memory content")
+			expect(context).toContain("Use them to inform your responses naturally")
+		})
+
+		it("should limit retrieved memories to topK", async () => {
+			const bridge = createMemoryBridge({ memoryDir: tempDir, topK: 2 })
+
+			const facts: ExtractedFact[] = Array.from({ length: 5 }, (_, i) => ({
+				content: `Memory fact ${i}`,
+				type: "preference" as const,
+				tags: ["test"],
+			}))
+
+			await bridge.ingestFacts(facts)
+			const { ids } = await bridge.loadContext("test")
+
+			expect(ids).toHaveLength(2) // Limited by topK
+		})
+	})
+
+	describe("evaluation integration", () => {
+		it("should evaluate retrieval effectiveness using the eval module", async () => {
+			const bridge = createMemoryBridge({ memoryDir: tempDir })
+
+			// Ingest test facts
+			const facts: ExtractedFact[] = [
+				{
+					content: "User prefers dark mode",
+					type: "preference",
+					tags: ["ui", "theme"],
+				},
+				{
+					content: "User likes coffee",
+					type: "preference",
+					tags: ["drink", "preference"],
+				},
+				{
+					content: "Agent should use bash for files",
+					type: "pattern",
+					tags: ["tool", "bash", "file"],
+				},
+			]
+
+			await bridge.ingestFacts(facts)
+
+			// Import eval dynamically to avoid circular deps
+			const { evaluateMemory } = await import("../../evals/index.js")
+
+			const testCases = [
+				{
+					query: "UI design",
+					expectedIds: [], // We don't know exact IDs, so test content instead
+					expectedContent: ["User prefers dark mode"],
+				},
+				{
+					query: "beverages",
+					expectedIds: [],
+					expectedContent: ["User likes coffee"],
+				},
+				{
+					query: "file handling",
+					expectedIds: [],
+					expectedContent: ["Agent should use bash for files"],
+				},
+			]
+
+			const results = await evaluateMemory(bridge, { testCases })
+
+			// Since we can't predict exact IDs, check that some retrieval happened
+			expect(results.metrics.avgRecall).toBeGreaterThanOrEqual(0)
+			expect(results.metrics.avgPrecision).toBeGreaterThanOrEqual(0)
+			expect(results.cases).toHaveLength(3)
+
+			// Check that relevant content was retrieved
+			for (const caseResult of results.cases) {
+				const hasExpected = testCases
+					.find((tc) => tc.query === caseResult.query)
+					?.expectedContent.some((ec) => caseResult.retrievedContext.includes(ec))
+				if (hasExpected) {
+					expect(caseResult.retrievedContext).toBeTruthy()
+				}
+			}
+		})
+	})
+})
diff --git a/packages/zosma-mem/src/bridge/extensions.ts b/packages/zosma-mem/src/bridge/extensions.ts
index 0fd2067..c82184a 100644
--- a/packages/zosma-mem/src/bridge/extensions.ts
+++ b/packages/zosma-mem/src/bridge/extensions.ts
@@ -19,14 +19,14 @@ const require = createRequire(import.meta.url)
  * then falls back to the package root.
  */
 const resolvePiExtension = (pkg: string): string | null => {
-  for (const entry of [`${pkg}/src/index.ts`, `${pkg}/index.ts`, pkg]) {
-    try {
-      return require.resolve(entry)
-    } catch {
-      // try next candidate
-    }
-  }
-  return null
+	for (const entry of [`${pkg}/src/index.ts`, `${pkg}/index.ts`, pkg]) {
+		try {
+			return require.resolve(entry)
+		} catch {
+			// try next candidate
+		}
+	}
+	return null
 }
 
 /**
@@ -39,22 +39,22 @@ const resolvePiExtension = (pkg: string): string | null => {
  * than expected.
  */
 export const resolveMemoryExtensionPaths = (): { paths: string[]; missing: string[] } => {
-  const extensions = [
-    { name: "pi-brain", label: "structured memory (pi-brain)" },
-    { name: "pi-dcp", label: "context pruning (pi-dcp)" },
-  ]
+	const extensions = [
+		{ name: "pi-brain", label: "structured memory (pi-brain)" },
+		{ name: "pi-dcp", label: "context pruning (pi-dcp)" },
+	]
 
-  const paths: string[] = []
-  const missing: string[] = []
+	const paths: string[] = []
+	const missing: string[] = []
 
-  for (const ext of extensions) {
-    const resolved = resolvePiExtension(ext.name)
-    if (resolved) {
-      paths.push(resolved)
-    } else {
-      missing.push(ext.label)
-    }
-  }
+	for (const ext of extensions) {
+		const resolved = resolvePiExtension(ext.name)
+		if (resolved) {
+			paths.push(resolved)
+		} else {
+			missing.push(ext.label)
+		}
+	}
 
-  return { paths, missing }
+	return { paths, missing }
 }
diff --git a/packages/zosma-mem/src/bridge/index.ts b/packages/zosma-mem/src/bridge/index.ts
index 09f95bf..2536b1a 100644
--- a/packages/zosma-mem/src/bridge/index.ts
+++ b/packages/zosma-mem/src/bridge/index.ts
@@ -19,52 +19,52 @@ import { createMemoryEngine } from "../engine/factory.js"
 import type { MemoryEngine, MemoryEventType } from "../types.js"
 
 export interface ExtractedFact {
-  /** Human-readable statement of the fact, e.g. "User's favorite animal is elephant" */
-  content: string
-  /** Semantic type of the fact */
-  type: MemoryEventType
-  /** Short lowercase keywords for retrieval matching */
-  tags: string[]
+	/** Human-readable statement of the fact, e.g. "User's favorite animal is elephant" */
+	content: string
+	/** Semantic type of the fact */
+	type: MemoryEventType
+	/** Short lowercase keywords for retrieval matching */
+	tags: string[]
 }
 
 export interface BridgeConfig {
-  /** Stable per-agent-config memory directory */
-  memoryDir: string
-  /** Minimum salience score to keep during GC. Default: engine default */
-  salienceThreshold?: number
-  /** How many memories to retrieve per turn. Default: 8 */
-  topK?: number
+	/** Stable per-agent-config memory directory */
+	memoryDir: string
+	/** Minimum salience score to keep during GC. Default: engine default */
+	salienceThreshold?: number
+	/** How many memories to retrieve per turn. Default: 8 */
+	topK?: number
 }
 
 export interface MemoryBridge {
-  /**
-   * Retrieve memories relevant to the current user message and format them
-   * as a system prompt section. Returns an empty string when no memories exist.
-   */
-  loadContext: (userMessage: string) => Promise<{ context: string; injectedIds: string[] }>
-
-  /**
-   * Ingest a batch of already-extracted facts into the salience engine.
-   * Called by the agent after each turn with facts extracted from the conversation.
-   */
-  ingestFacts: (facts: ExtractedFact[]) => Promise<void>
-
-  /**
-   * Record a reinforcement signal for a retrieved memory entity.
-   * Call with "used" when the agent references a memory in its response.
-   * Call with "ignored" when a retrieved memory had no visible effect.
-   * Call with "influenced_decision" when the memory directly shaped a tool call or decision.
-   */
-  recordUsage: (entityId: string, signal: "used" | "ignored" | "influenced_decision") => Promise<void>
-
-  /** Run garbage collection — decay + prune low-salience entities. */
-  gc: () => Promise<void>
-
-  /** Shutdown: clear GC timer. Call on session end. */
-  shutdown: () => void
-
-  /** Return all entity IDs currently in the store (for testing). */
-  listEntityIds: () => Promise<string[]>
+	/**
+	 * Retrieve memories relevant to the current user message and format them
+	 * as a system prompt section. Returns an empty string when no memories exist.
+	 */
+	loadContext: (userMessage: string) => Promise<{ context: string; ids: string[] }>
+
+	/**
+	 * Ingest a batch of already-extracted facts into the salience engine.
+	 * Called by the agent after each turn with facts extracted from the conversation.
+	 */
+	ingestFacts: (facts: ExtractedFact[]) => Promise<void>
+
+	/**
+	 * Record a reinforcement signal for a retrieved memory entity.
+	 * Call with "used" when the agent references a memory in its response.
+	 * Call with "ignored" when a retrieved memory had no visible effect.
+	 * Call with "influenced_decision" when the memory directly shaped a tool call or decision.
+	 */
+	recordUsage: (entityId: string, signal: "used" | "ignored" | "influenced_decision") => Promise<void>
+
+	/** Run garbage collection — decay + prune low-salience entities. */
+	gc: () => Promise<void>
+
+	/** Shutdown: clear GC timer. Call on session end. */
+	shutdown: () => void
+
+	/** Return all entity IDs currently in the store (for testing). */
+	listEntityIds: () => Promise<string[]>
 }
 
 /**
@@ -72,101 +72,96 @@ export interface MemoryBridge {
  * it hashes to the same ID, so the engine deduplicates it by updating in place.
  */
 export const factId = (content: string): string =>
-  createHash("sha256").update(content.trim().toLowerCase().replace(/\s+/g, ' ')).digest("hex").slice(0, 16)
+	createHash("sha256").update(content.trim().toLowerCase().replace(/\s+/g, " ")).digest("hex").slice(0, 16)
 
 /**
  * Format retrieved memories as a system prompt section.
  */
-const formatContext = (
-  memories: Array<{ id: string; content: string; score: number }>,
-): string => {
-  if (memories.length === 0) return ""
-
-  const lines = [
-    "## Long-term Memory",
-    "",
-    "The following facts have been remembered from previous conversations with this user.",
-    "Use them to inform your responses naturally, without mentioning memory IDs or scores.",
-    "",
-    ...memories.map((m) => `- ${m.content}`),
-    "",
-  ]
-
-  return lines.join("\n")
+const formatContext = (memories: Array<{ id: string; content: string; score: number }>): string => {
+	if (memories.length === 0) return ""
+
+	const lines = [
+		"## Long-term Memory",
+		"",
+		"The following facts have been remembered from previous conversations with this user.",
+		"Use them to inform your responses naturally, without mentioning memory IDs or scores.",
+		"",
+		...memories.map((m) => `- ${m.content}`),
+		"",
+	]
+
+	return lines.join("\n")
 }
 
 /**
  * Create a MemoryBridge backed by the zosma-mem salience engine.
  */
 export const createMemoryBridge = (config: BridgeConfig): MemoryBridge => {
-  const engine: MemoryEngine = createMemoryEngine({
-    memoryDir: config.memoryDir,
-    salienceThreshold: config.salienceThreshold,
-    // GC every 5 minutes in production. Tests override via config.
-    gcIntervalMs: 5 * 60 * 1000,
-    gcPruneCycles: 2,
-  })
-
-  const topK = config.topK ?? 8
-
-  const loadContext = async (userMessage: string): Promise<{ context: string; injectedIds: string[] }> => {
-    const results = await engine.retrieve({ taskDescription: userMessage }, topK)
-
-    if (results.length === 0) return { context: "", injectedIds: [] }
-
-    const memories = results.map((r) => ({
-      id: r.entity.id,
-      content: r.entity.content,
-      score: r.attentionScore,
-    }))
-
-    // Record ignored reads for entities that scored below threshold
-    // (returned in results but likely not relevant). The low score is the signal.
-    for (const r of results) {
-      if (r.attentionScore < 1) {
-        await engine.recordIgnoredRead(r.entity.id)
-      }
-    }
-
-    const injectedIds = memories.map(m => m.id)
-    return { context: formatContext(memories), injectedIds }
-  }
-
-  const ingestFacts = async (facts: ExtractedFact[]): Promise<void> => {
-    const now = Date.now()
-    for (const fact of facts) {
-      await engine.ingest({
-        id: factId(fact.content),
-        type: fact.type,
-        content: fact.content,
-        tags: fact.tags,
-        timestamp: now,
-      })
-    }
-  }
-
-  const recordUsage = async (
-    entityId: string,
-    signal: "used" | "ignored" | "influenced_decision",
-  ): Promise<void> => {
-    if (signal === "used") {
-      await engine.recordRead(entityId)
-    } else if (signal === "ignored") {
-      await engine.recordIgnoredRead(entityId)
-    } else {
-      await engine.recordDecisionInfluence(entityId)
-    }
-  }
-
-  const gc = async (): Promise<void> => {
-    await engine.gc()
-  }
-
-  const shutdown = (): void => {
-    engine.shutdown()
-  }
-
-  const listEntityIds = async (): Promise<string[]> => engine.listEntities()
-
-  return { loadContext, ingestFacts, recordUsage, gc, shutdown, listEntityIds }
+	const engine: MemoryEngine = createMemoryEngine({
+		memoryDir: config.memoryDir,
+		salienceThreshold: config.salienceThreshold,
+		// GC every 5 minutes in production. Tests override via config.
+		gcIntervalMs: 5 * 60 * 1000,
+		gcPruneCycles: 2,
+	})
+
+	const topK = config.topK ?? 8
+
+	const loadContext = async (userMessage: string): Promise<{ context: string; ids: string[] }> => {
+		const results = await engine.retrieve({ taskDescription: userMessage }, topK)
+
+		if (results.length === 0) return { context: "", ids: [] }
+
+		const memories = results.map((r) => ({
+			id: r.entity.id,
+			content: r.entity.content,
+			score: r.attentionScore,
+		}))
+
+		// Record ignored reads for entities that scored below threshold
+		// (returned in results but likely not relevant). The low score is the signal.
+		for (const r of results) {
+			if (r.attentionScore < 1) {
+				await engine.recordIgnoredRead(r.entity.id)
+			}
+		}
+
+		const ids = memories.map((m) => m.id)
+		return { context: formatContext(memories), ids }
+	}
+
+	const ingestFacts = async (facts: ExtractedFact[]): Promise<void> => {
+		const now = Date.now()
+		for (const fact of facts) {
+			await engine.ingest({
+				id: factId(fact.content),
+				type: fact.type,
+				content: fact.content,
+				tags: fact.tags,
+				timestamp: now,
+			})
+		}
+	}
+
+	const recordUsage = async (entityId: string, signal: "used" | "ignored" | "influenced_decision"): Promise<void> => {
+		if (signal === "used") {
+			await engine.recordRead(entityId)
+		} else if (signal === "ignored") {
+			await engine.recordIgnoredRead(entityId)
+		} else {
+			await engine.recordDecisionInfluence(entityId)
+		}
+	}
+
+	const gc = async (): Promise<void> => {
+		await engine.gc()
+	}
+
+	const shutdown = (): void => {
+		engine.shutdown()
+	}
+
+	const listEntityIds = async (): Promise<string[]> => engine.listEntities()
+
+	return { loadContext, ingestFacts, recordUsage, gc, shutdown, listEntityIds }
 }
diff --git a/packages/zosma-mem/src/engine/__tests__/factory.test.ts b/packages/zosma-mem/src/engine/__tests__/factory.test.ts
index bf7c251..0f41d97 100644
--- a/packages/zosma-mem/src/engine/__tests__/factory.test.ts
+++ b/packages/zosma-mem/src/engine/__tests__/factory.test.ts
@@ -1,48 +1,48 @@
-import { describe, it, expect } from 'vitest'
-import { mkdtempSync } from 'node:fs'
-import { tmpdir } from 'node:os'
-import { join } from 'node:path'
-import { createMemoryEngine } from '../factory.js'
+import { mkdtempSync } from "node:fs"
+import { tmpdir } from "node:os"
+import { join } from "node:path"
+import { describe, expect, it } from "vitest"
+import { createMemoryEngine } from "../factory.js"
 
 const NOW = 1_000_000_000_000
 
-const makeDir = () => mkdtempSync(join(tmpdir(), 'factory-test-'))
+const makeDir = () => mkdtempSync(join(tmpdir(), "factory-test-"))
 
-describe('createMemoryEngine', () => {
-  it('ingest a decision event then retrieve it', async () => {
-    const memoryDir = makeDir()
-    const engine = createMemoryEngine({ memoryDir, gcIntervalMs: 0, now: () => NOW })
-    await engine.ingest({
-      id: 'ev1',
-      type: 'decision',
-      content: 'use typescript for everything',
-      tags: ['typescript', 'architecture'],
-      timestamp: NOW,
-    })
-    const results = await engine.retrieve({ taskDescription: 'typescript architecture' }, 5)
-    expect(results.some((r) => r.entity.id === 'ev1')).toBe(true)
-    engine.shutdown()
-  })
+describe("createMemoryEngine", () => {
+	it("ingest a decision event then retrieve it", async () => {
+		const memoryDir = makeDir()
+		const engine = createMemoryEngine({ memoryDir, gcIntervalMs: 0, now: () => NOW })
+		await engine.ingest({
+			id: "ev1",
+			type: "decision",
+			content: "use typescript for everything",
+			tags: ["typescript", "architecture"],
+			timestamp: NOW,
+		})
+		const results = await engine.retrieve({ taskDescription: "typescript architecture" }, 5)
+		expect(results.some((r) => r.entity.id === "ev1")).toBe(true)
+		engine.shutdown()
+	})
 
-  it('shutdown does not throw', () => {
-    const memoryDir = makeDir()
-    const engine = createMemoryEngine({ memoryDir, gcIntervalMs: 0 })
-    expect(() => engine.shutdown()).not.toThrow()
-  })
+	it("shutdown does not throw", () => {
+		const memoryDir = makeDir()
+		const engine = createMemoryEngine({ memoryDir, gcIntervalMs: 0 })
+		expect(() => engine.shutdown()).not.toThrow()
+	})
 
-  it('ingest + recordDecisionInfluence + retrieve: entity still appears', async () => {
-    const memoryDir = makeDir()
-    const engine = createMemoryEngine({ memoryDir, gcIntervalMs: 0, now: () => NOW })
-    await engine.ingest({
-      id: 'ev2',
-      type: 'decision',
-      content: 'auth strategy',
-      tags: ['auth'],
-      timestamp: NOW,
-    })
-    await engine.recordDecisionInfluence('ev2')
-    const results = await engine.retrieve({ taskDescription: 'auth strategy' }, 5)
-    expect(results.some((r) => r.entity.id === 'ev2')).toBe(true)
-    engine.shutdown()
-  })
+	it("ingest + recordDecisionInfluence + retrieve: entity still appears", async () => {
+		const memoryDir = makeDir()
+		const engine = createMemoryEngine({ memoryDir, gcIntervalMs: 0, now: () => NOW })
+		await engine.ingest({
+			id: "ev2",
+			type: "decision",
+			content: "auth strategy",
+			tags: ["auth"],
+			timestamp: NOW,
+		})
+		await engine.recordDecisionInfluence("ev2")
+		const results = await engine.retrieve({ taskDescription: "auth strategy" }, 5)
+		expect(results.some((r) => r.entity.id === "ev2")).toBe(true)
+		engine.shutdown()
+	})
 })
diff --git a/packages/zosma-mem/src/engine/__tests__/reinforcement.test.ts b/packages/zosma-mem/src/engine/__tests__/reinforcement.test.ts
index 2b669c9..08c220b 100644
--- a/packages/zosma-mem/src/engine/__tests__/reinforcement.test.ts
+++ b/packages/zosma-mem/src/engine/__tests__/reinforcement.test.ts
@@ -1,71 +1,71 @@
-import { describe, it, expect } from 'vitest'
-import { mkdtempSync } from 'node:fs'
-import { tmpdir } from 'node:os'
-import { join } from 'node:path'
-import { EntityStore } from '../../store/entity-store.js'
-import type { MemoryEntity } from '../../types.js'
-import { recordRead, recordIgnoredRead, recordDecisionInfluence } from '../reinforcement.js'
+import { mkdtempSync } from "node:fs"
+import { tmpdir } from "node:os"
+import { join } from "node:path"
+import { describe, expect, it } from "vitest"
+import { EntityStore } from "../../store/entity-store.js"
+import type { MemoryEntity } from "../../types.js"
+import { recordDecisionInfluence, recordIgnoredRead, recordRead } from "../reinforcement.js"
 
 const BASE_TS = 1_000_000_000_000
 
 const makeEntity = (id: string): MemoryEntity => ({
-  id,
-  source: { branch: 'main', commitRef: '0' },
-  score: {
-    reuseCount: 0,
-    decisionInfluence: 0,
-    ignoredReads: 0,
-    lastAccessed: BASE_TS,
-    attentionWeight: 0,
-    belowThresholdCycles: 0,
-  },
-  tags: [],
-  content: 'test',
+	id,
+	source: { branch: "main", commitRef: "0" },
+	score: {
+		reuseCount: 0,
+		decisionInfluence: 0,
+		ignoredReads: 0,
+		lastAccessed: BASE_TS,
+		attentionWeight: 0,
+		belowThresholdCycles: 0,
+	},
+	tags: [],
+	content: "test",
 })
 
 const makeStore = (entity: MemoryEntity): EntityStore => {
-  const dir = mkdtempSync(join(tmpdir(), 'reinforcement-test-'))
-  const store = new EntityStore(dir)
-  store.ensureDir()
-  store.write(entity)
-  return store
+	const dir = mkdtempSync(join(tmpdir(), "reinforcement-test-"))
+	const store = new EntityStore(dir)
+	store.ensureDir()
+	store.write(entity)
+	return store
 }
 
-describe('reinforcement', () => {
-  it('recordRead increments reuseCount and updates lastAccessed', () => {
-    const entity = makeEntity('e1')
-    const store = makeStore(entity)
-    const later = BASE_TS + 5000
-    recordRead('e1', store, () => later)
-    const updated = store.read('e1')!
-    expect(updated.score.reuseCount).toBe(1)
-    expect(updated.score.lastAccessed).toBe(later)
-  })
+describe("reinforcement", () => {
+	it("recordRead increments reuseCount and updates lastAccessed", () => {
+		const entity = makeEntity("e1")
+		const store = makeStore(entity)
+		const later = BASE_TS + 5000
+		recordRead("e1", store, () => later)
+		const updated = store.read("e1")!
+		expect(updated.score.reuseCount).toBe(1)
+		expect(updated.score.lastAccessed).toBe(later)
+	})
 
-  it('recordIgnoredRead increments ignoredReads and does NOT update lastAccessed', () => {
-    const entity = makeEntity('e2')
-    const store = makeStore(entity)
-    recordIgnoredRead('e2', store)
-    const updated = store.read('e2')!
-    expect(updated.score.ignoredReads).toBe(1)
-    expect(updated.score.lastAccessed).toBe(BASE_TS)
-  })
+	it("recordIgnoredRead increments ignoredReads and does NOT update lastAccessed", () => {
+		const entity = makeEntity("e2")
+		const store = makeStore(entity)
+		recordIgnoredRead("e2", store)
+		const updated = store.read("e2")!
+		expect(updated.score.ignoredReads).toBe(1)
+		expect(updated.score.lastAccessed).toBe(BASE_TS)
+	})
 
-  it('recordDecisionInfluence increments decisionInfluence and updates lastAccessed', () => {
-    const entity = makeEntity('e3')
-    const store = makeStore(entity)
-    const later = BASE_TS + 9000
-    recordDecisionInfluence('e3', store, () => later)
-    const updated = store.read('e3')!
-    expect(updated.score.decisionInfluence).toBe(1)
-    expect(updated.score.lastAccessed).toBe(later)
-  })
+	it("recordDecisionInfluence increments decisionInfluence and updates lastAccessed", () => {
+		const entity = makeEntity("e3")
+		const store = makeStore(entity)
+		const later = BASE_TS + 9000
+		recordDecisionInfluence("e3", store, () => later)
+		const updated = store.read("e3")!
+		expect(updated.score.decisionInfluence).toBe(1)
+		expect(updated.score.lastAccessed).toBe(later)
+	})
 
-  it('missing entity ID is a no-op', () => {
-    const entity = makeEntity('e4')
-    const store = makeStore(entity)
-    expect(() => recordRead('nonexistent', store)).not.toThrow()
-    expect(() => recordIgnoredRead('nonexistent', store)).not.toThrow()
-    expect(() => recordDecisionInfluence('nonexistent', store)).not.toThrow()
-  })
+	it("missing entity ID is a no-op", () => {
+		const entity = makeEntity("e4")
+		const store = makeStore(entity)
+		expect(() => recordRead("nonexistent", store)).not.toThrow()
+		expect(() => recordIgnoredRead("nonexistent", store)).not.toThrow()
+		expect(() => recordDecisionInfluence("nonexistent", store)).not.toThrow()
+	})
 })
diff --git a/packages/zosma-mem/src/engine/salience.ts b/packages/zosma-mem/src/engine/salience.ts
index 6de884c..9331abe 100644
--- a/packages/zosma-mem/src/engine/salience.ts
+++ b/packages/zosma-mem/src/engine/salience.ts
@@ -1,4 +1,4 @@
-import type { MemoryScore } from '../types.js'
+import type { MemoryScore } from "../types.js"
 
 /**
  * Compute the salience score for a memory entity.
@@ -6,18 +6,18 @@ import type { MemoryScore } from '../types.js'
  * ageDays is computed from lastAccessed using the injectable now().
  */
 export const computeSalience = (score: MemoryScore, now: () => number = Date.now): number => {
-  const ageDays = (now() - score.lastAccessed) / 86_400_000
-  const decay = Math.log(1 + ageDays)
-  return 2 * score.reuseCount + 5 * score.decisionInfluence - 2 * score.ignoredReads - decay
+	const ageDays = (now() - score.lastAccessed) / 86_400_000
+	const decay = Math.log(1 + ageDays)
+	return 2 * score.reuseCount + 5 * score.decisionInfluence - 2 * score.ignoredReads - decay
 }
 
 export const meetsThreshold = (salience: number, threshold: number): boolean => salience >= threshold
 
 export const initialScore = (eventType: string, now: () => number = Date.now): MemoryScore => ({
-  reuseCount: 0,
-  decisionInfluence: eventType === 'decision' ? 1 : 0,
-  ignoredReads: 0,
-  lastAccessed: now(),
-  attentionWeight: eventType === 'decision' ? 1.0 : 0.0,
-  belowThresholdCycles: 0,
+	reuseCount: 0,
+	decisionInfluence: eventType === "decision" ? 1 : 0,
+	ignoredReads: 0,
+	lastAccessed: now(),
+	attentionWeight: eventType === "decision" ? 1.0 : 0.0,
+	belowThresholdCycles: 0,
 })
diff --git a/packages/zosma-mem/src/evals/__tests__/evals.test.ts b/packages/zosma-mem/src/evals/__tests__/evals.test.ts
new file mode 100644
index 0000000..1d98238
--- /dev/null
+++ b/packages/zosma-mem/src/evals/__tests__/evals.test.ts
@@ -0,0 +1,93 @@
+import { describe, expect, it, vi } from "vitest"
+import { computeMetrics, evaluateMemory } from "../eval.js"
+import type { EvalTestCase, MemoryInterface } from "../types.js"
+
+describe("Memory Evaluation", () => {
+	it("should compute perfect recall and precision", () => {
+		const expected = ["id1", "id2"]
+		const retrieved = ["id1", "id2"]
+		const result = computeMetrics(expected, retrieved)
+		expect(result.recall).toBe(1)
+		expect(result.precision).toBe(1)
+		expect(result.f1).toBe(1)
+		expect(result.truePositives).toBe(2)
+	})
+
+	it("should compute zero recall for no matches", () => {
+		const expected = ["id1", "id2"]
+		const retrieved = ["id3", "id4"]
+		const result = computeMetrics(expected, retrieved)
+		expect(result.recall).toBe(0)
+		expect(result.precision).toBe(0)
+		expect(result.f1).toBe(0)
+		expect(result.truePositives).toBe(0)
+	})
+
+	it("should handle empty expected", () => {
+		const expected: string[] = []
+		const retrieved = ["id1"]
+		const result = computeMetrics(expected, retrieved)
+		expect(result.recall).toBe(0)
+		expect(result.precision).toBe(0)
+		expect(result.f1).toBe(0)
+	})
+
+	it("should handle empty retrieved", () => {
+		const expected = ["id1"]
+		const retrieved: string[] = []
+		const result = computeMetrics(expected, retrieved)
+		expect(result.recall).toBe(0)
+		expect(result.precision).toBe(0) // No retrieved, so precision is 0 (no true positives out of nothing)
+		expect(result.f1).toBe(0)
+	})
+
+	const mockLoadContext = vi.fn()
+	const mockMemory: MemoryInterface = {
+		loadContext: mockLoadContext,
+	}
+
+	it("should evaluate multiple test cases", async () => {
+		const testCases: EvalTestCase[] = [
+			{
+				query: "query1",
+				expectedIds: ["id1"],
+				expectedContent: [],
+			},
+			{
+				query: "query2",
+				expectedIds: ["id2", "id3"],
+				expectedContent: [],
+			},
+		]
+
+		// Mock responses
+		mockLoadContext.mockImplementation(async (query: string) => {
+			if (query === "query1") {
+				return { context: "context1", ids: ["id1"] }
+			}
+			return { context: "context2", ids: ["id2"] }
+		})
+
+		const results = await evaluateMemory(mockMemory, { testCases })
+
+		expect(results.metrics.avgRecall).toBe(0.75) // (1 + 0.5) / 2
+		expect(results.metrics.avgPrecision).toBe(1) // (1 + 1) / 2
+		expect(results.cases).toHaveLength(2)
+		expect(results.cases[0].recall).toBe(1)
+		expect(results.cases[1].recall).toBe(0.5)
+	})
+
+	it("should handle memory errors", async () => {
+		const testCases: EvalTestCase[] = [
+			{
+				query: "failing query",
+				expectedIds: ["id1"],
+				expectedContent: [],
+			},
+		]
+
+		mockLoadContext.mockRejectedValue(new Error("Memory error"))
+
+		await expect(evaluateMemory(mockMemory, { testCases })).rejects.toThrow("Memory error")
+	})
+})
diff --git a/packages/zosma-mem/src/evals/eval.ts b/packages/zosma-mem/src/evals/eval.ts
new file mode 100644
index 0000000..a2529af
--- /dev/null
+++ b/packages/zosma-mem/src/evals/eval.ts
@@ -0,0 +1,61 @@
+import type { EvalConfig, EvalResults, MemoryInterface } from "./types.js"
+
+/**
+ * Run evaluation on a memory system using the provided test cases.
+ * Computes recall, precision, and F1 for retrieval effectiveness.
+ */
+export async function evaluateMemory(memory: MemoryInterface, config: EvalConfig): Promise<EvalResults> {
+	const cases: EvalResults["cases"] = []
+
+	for (const testCase of config.testCases) {
+		const { context, ids: retrievedIds } = await memory.loadContext(testCase.query)
+
+		const expectedIds = new Set(testCase.expectedIds)
+		const retrievedSet = new Set(retrievedIds)
+
+		// Recall: fraction of expected IDs retrieved
+		const truePositives = [...expectedIds].filter((id) => retrievedSet.has(id)).length
+		const recall = expectedIds.size > 0 ? truePositives / expectedIds.size : 0
+
+		// Precision: fraction of retrieved IDs that are expected
+		const precision = retrievedIds.length > 0 ? truePositives / retrievedIds.length : 0
+
+		// F1 score
+		const f1 = recall + precision > 0 ? (2 * recall * precision) / (recall + precision) : 0
+
+		cases.push({
+			query: testCase.query,
+			recall,
+			precision,
+			f1,
+			retrievedIds,
+			retrievedContext: context,
+		})
+	}
+
+	// Aggregate metrics
+	const avgRecall = cases.reduce((sum, c) => sum + c.recall, 0) / cases.length
+	const avgPrecision = cases.reduce((sum, c) => sum + c.precision, 0) / cases.length
+	const avgF1 = cases.reduce((sum, c) => sum + c.f1, 0) / cases.length
+
+	return {
+		metrics: { avgRecall, avgPrecision, avgF1 },
+		cases,
+	}
+}
+
+/**
+ * Utility to compute individual metrics for a single test case.
+ * Useful for custom evaluations.
+ */
+export function computeMetrics(expectedIds: string[], retrievedIds: string[]) {
+	const expectedSet = new Set(expectedIds)
+	const retrievedSet = new Set(retrievedIds)
+
+	const truePositives = [...expectedSet].filter((id) => retrievedSet.has(id)).length
+	const recall = expectedSet.size > 0 ? truePositives / expectedSet.size : 0
+	const precision = retrievedIds.length > 0 ? truePositives / retrievedIds.length : 0
+	const f1 = recall + precision > 0 ? (2 * recall * precision) / (recall + precision) : 0
+
+	return { recall, precision, f1, truePositives }
+}
diff --git a/packages/zosma-mem/src/evals/index.ts b/packages/zosma-mem/src/evals/index.ts
new file mode 100644
index 0000000..df53650
--- /dev/null
+++ b/packages/zosma-mem/src/evals/index.ts
@@ -0,0 +1,2 @@
+export * from "./types.js"
+export * from "./eval.js"
diff --git a/packages/zosma-mem/src/evals/types.ts b/packages/zosma-mem/src/evals/types.ts
new file mode 100644
index 0000000..46f20e9
--- /dev/null
+++ b/packages/zosma-mem/src/evals/types.ts
@@ -0,0 +1,66 @@
+/**
+ * Agnostic evaluation interfaces for memory retrieval systems.
+ * Allows any TypeScript memory implementation to be evaluated for effectiveness.
+ */
+
+/**
+ * Interface that memory systems must implement to be evaluated.
+ * Agnostic to the underlying storage (file-based, DB, etc.).
+ */
+export interface MemoryInterface {
+	/**
+	 * Retrieve context and entity IDs for a given query.
+	 * @param query The user query string.
+	 * @returns Promise resolving to retrieved context and IDs.
+	 */
+	loadContext(query: string): Promise<{ context: string; ids: string[] }>
+}
+
+/**
+ * A test case for evaluation.
+ */
+export interface EvalTestCase {
+	/** The query to test retrieval on. */
+	query: string
+	/** Expected entity IDs that should be retrieved (for recall). */
+	expectedIds: string[]
+	/** Expected content snippets that should appear in context (for relevance). */
+	expectedContent: string[]
+}
+
+/**
+ * Results of running an evaluation.
+ */
+export interface EvalResults {
+	/** Overall metrics. */
+	metrics: {
+		/** Average recall across test cases (0-1). */
+		avgRecall: number
+		/** Average precision across test cases (0-1). */
+		avgPrecision: number
+		/** Average F1 score. */
+		avgF1: number
+	}
+	/** Per-test-case results. */
+	cases: Array<{
+		query: string
+		recall: number
+		precision: number
+		f1: number
+		retrievedIds: string[]
+		retrievedContext: string
+	}>
+}
+
+/**
+ * Configuration for evaluation.
+ */
+export interface EvalConfig {
+	/** Test cases to run. */
+	testCases: EvalTestCase[]
+	/** Optional: Minimum salience or other thresholds. */
+	options?: {
+		/** Whether to check for expected content in context. */
+		checkContent?: boolean
+	}
+}
diff --git a/packages/zosma-mem/src/retrieval/retrieve.ts b/packages/zosma-mem/src/retrieval/retrieve.ts
index 9c1be3a..4f699f0 100644
--- a/packages/zosma-mem/src/retrieval/retrieve.ts
+++ b/packages/zosma-mem/src/retrieval/retrieve.ts
@@ -27,7 +27,12 @@ export const retrieve = (
 	// Intent tags (e.g. ["auth", "session"]) get a higher weight — they are
 	// explicit signals about what the agent is working on right now.
 	const intentTags: Set<string> = query.intent
-		? new Set(query.intent.toLowerCase().split(/\s+/).filter((t) => t.length > 0))
+		? new Set(
+				query.intent
+					.toLowerCase()
+					.split(/\s+/)
+					.filter((t) => t.length > 0),
+			)
 		: new Set()
 
 	const ids = store.list()
@@ -39,9 +44,7 @@ export const retrieve = (
 			const entity = store.read(id)
 			if (!entity) return null
 			const taskOverlap = entity.tags.filter((t) => taskTerms.has(t.toLowerCase())).length
-			const intentOverlap = intentTags.size > 0
-				? entity.tags.filter((t) => intentTags.has(t.toLowerCase())).length
-				: 0
+			const intentOverlap = intentTags.size > 0 ? entity.tags.filter((t) => intentTags.has(t.toLowerCase())).length : 0
 			const salience = computeSalience(entity.score, nowFn)
 
 			// Context isolation: when intent tags are provided and the entity has
diff --git a/packages/zosma-mem/src/types.ts b/packages/zosma-mem/src/types.ts
index 221c268..14b7106 100644
--- a/packages/zosma-mem/src/types.ts
+++ b/packages/zosma-mem/src/types.ts
@@ -1,75 +1,75 @@
 // Engine types
-export type MemoryEventType = 'decision' | 'error' | 'pattern' | 'preference'
+export type MemoryEventType = "decision" | "error" | "pattern" | "preference"
 
 export interface MemoryEvent {
-  id: string
-  type: MemoryEventType
-  content: string
-  tags: string[]
-  attentionWeight?: number
-  metadata?: {
-    file?: string
-    module?: string
-    relatedMemories?: string[]
-    branch?: string
-    commitRef?: string
-  }
-  timestamp: number
+	id: string
+	type: MemoryEventType
+	content: string
+	tags: string[]
+	attentionWeight?: number
+	metadata?: {
+		file?: string
+		module?: string
+		relatedMemories?: string[]
+		branch?: string
+		commitRef?: string
+	}
+	timestamp: number
 }
 
 export interface MemoryScore {
-  reuseCount: number
-  decisionInfluence: number
-  ignoredReads: number
-  lastAccessed: number
-  attentionWeight: number
-  belowThresholdCycles: number
+	reuseCount: number
+	decisionInfluence: number
+	ignoredReads: number
+	lastAccessed: number
+	attentionWeight: number
+	belowThresholdCycles: number
 }
 
 export interface MemoryEntity {
-  id: string
-  source: { branch: string; commitRef: string }
-  score: MemoryScore
-  tags: string[]
-  content: string
+	id: string
+	source: { branch: string; commitRef: string }
+	score: MemoryScore
+	tags: string[]
+	content: string
 }
 
 export interface MemoryConfig {
-  memoryDir: string
-  salienceThreshold?: number
-  gcIntervalMs?: number
-  gcPruneCycles?: number
-  summarizer?: Summarizer
-  now?: () => number
+	memoryDir: string
+	salienceThreshold?: number
+	gcIntervalMs?: number
+	gcPruneCycles?: number
+	summarizer?: Summarizer
+	now?: () => number
 }
 
 export type Summarizer = (texts: string[]) => Promise<string>
 
 export interface AttentionQuery {
-  taskDescription: string
-  activeToolName?: string
-  intent?: string
+	taskDescription: string
+	activeToolName?: string
+	intent?: string
 }
 
 export interface ScoredEntity {
-  entity: MemoryEntity
-  attentionScore: number
+	entity: MemoryEntity
+	attentionScore: number
 }
 
 export interface GcReport {
-  decayed: number
-  pruned: number
-  consolidated: number
+	decayed: number
+	pruned: number
+	consolidated: number
 }
 
 export interface MemoryEngine {
-  ingest: (event: MemoryEvent) => Promise<void>
-  retrieve: (query: AttentionQuery, topK?: number) => Promise<ScoredEntity[]>
-  recordRead: (entityId: string) => Promise<void>
-  recordIgnoredRead: (entityId: string) => Promise<void>
-  recordDecisionInfluence: (entityId: string) => Promise<void>
-  gc: () => Promise<GcReport>
-  shutdown: () => void
-  /** Return all persisted entity IDs (used by the eval adapter). */
-  listEntities: () => Promise<string[]>
+	ingest: (event: MemoryEvent) => Promise<void>
+	retrieve: (query: AttentionQuery, topK?: number) => Promise<ScoredEntity[]>
+	recordRead: (entityId: string) => Promise<void>
+	recordIgnoredRead: (entityId: string) => Promise<void>
+	recordDecisionInfluence: (entityId: string) => Promise<void>
+	gc: () => Promise<GcReport>
+	shutdown: () => void
+	/** Return all persisted entity IDs (used by the eval adapter). */
+	listEntities: () => Promise<string[]>
 }
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index bcf97d4..60409c0 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -707,6 +707,12 @@ importers:
 
   packages/zosma-mem:
     dependencies:
+      '@clack/prompts':
+        specifier: ^0.10.0
+        version: 0.10.1
+      '@openzosma/logger':
+        specifier: workspace:*
+        version: link:../logger
       chalk:
         specifier: ^5.4.0
         version: 5.6.2
@@ -7791,14 +7797,14 @@ snapshots:
       nanostores: 1.2.0
       zod: 4.3.6
 
-  '@better-auth/drizzle-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)':
+  '@better-auth/drizzle-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)':
     dependencies:
-      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0)
+      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0)
       '@better-auth/utils': 0.3.1
 
-  '@better-auth/kysely-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)(kysely@0.28.13)':
+  '@better-auth/kysely-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)(kysely@0.28.13)':
     dependencies:
-      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0)
+      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0)
       '@better-auth/utils': 0.3.1
       kysely: 0.28.13
 
@@ -7808,25 +7814,25 @@ snapshots:
       '@better-auth/utils': 0.3.1
       kysely: 0.28.14
 
-  '@better-auth/memory-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)':
+  '@better-auth/memory-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)':
     dependencies:
-      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0)
+      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0)
       '@better-auth/utils': 0.3.1
 
-  '@better-auth/mongo-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)(mongodb@7.1.0(socks@2.8.7))':
+  '@better-auth/mongo-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)(mongodb@7.1.0(socks@2.8.7))':
     dependencies:
-      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0)
+      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0)
       '@better-auth/utils': 0.3.1
       mongodb: 7.1.0(socks@2.8.7)
 
-  '@better-auth/prisma-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)':
+  '@better-auth/prisma-adapter@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)':
     dependencies:
-      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0)
+      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0)
       '@better-auth/utils': 0.3.1
 
-  '@better-auth/telemetry@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))':
+  '@better-auth/telemetry@1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))':
     dependencies:
-      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0)
+      '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0)
       '@better-auth/utils': 0.3.1
       '@better-fetch/fetch': 1.1.21
 
@@ -10873,12 +10879,12 @@ snapshots:
   better-auth@1.5.5(mongodb@7.1.0(socks@2.8.7))(mysql2@3.20.0(@types/node@22.19.15))(next@16.2.0(@opentelemetry/api@1.9.0)(babel-plugin-react-compiler@1.0.0)(react-dom@19.2.4(react@19.2.4))(react@19.2.4))(pg@8.20.0)(react-dom@19.2.4(react@19.2.4))(react@19.2.4)(vitest@3.2.4(@types/debug@4.1.12)(@types/node@22.19.15)(jiti@2.6.1)(lightningcss@1.32.0)(tsx@4.21.0)(yaml@2.8.3)):
     dependencies:
       '@better-auth/core': 1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0)
-      '@better-auth/drizzle-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)
-      '@better-auth/kysely-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)(kysely@0.28.13)
-      '@better-auth/memory-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)
-      '@better-auth/mongo-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)(mongodb@7.1.0(socks@2.8.7))
-      '@better-auth/prisma-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))(@better-auth/utils@0.3.1)
-      '@better-auth/telemetry': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.14)(nanostores@1.2.0))
+      '@better-auth/drizzle-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)
+      '@better-auth/kysely-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)(kysely@0.28.13)
+      '@better-auth/memory-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)
+      '@better-auth/mongo-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)(mongodb@7.1.0(socks@2.8.7))
+      '@better-auth/prisma-adapter': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))(@better-auth/utils@0.3.1)
+      '@better-auth/telemetry': 1.5.5(@better-auth/core@1.5.5(@better-auth/utils@0.3.1)(@better-fetch/fetch@1.1.21)(better-call@1.3.2(zod@4.3.6))(jose@6.2.2)(kysely@0.28.13)(nanostores@1.2.0))
       '@better-auth/utils': 0.3.1
       '@better-fetch/fetch': 1.1.21
       '@noble/ciphers': 2.1.1

From de9c0ff49249d32b05f558ffa5cfe9cc81165a60 Mon Sep 17 00:00:00 2001
From: shanvit <shanvit7@gmail.com>
Date: Fri, 10 Apr 2026 16:38:41 +0530
Subject: [PATCH 07/12] chore: evals fixed

---
 packages/zosma-mem/src/bin/eval.ts   | 131 ++++++++++++++++++++++++---
 packages/zosma-mem/src/evals/eval.ts |  26 +++++-
 2 files changed, 143 insertions(+), 14 deletions(-)

diff --git a/packages/zosma-mem/src/bin/eval.ts b/packages/zosma-mem/src/bin/eval.ts
index 107e762..24feec1 100644
--- a/packages/zosma-mem/src/bin/eval.ts
+++ b/packages/zosma-mem/src/bin/eval.ts
@@ -30,6 +30,104 @@ interface SQuADData {
 	data: SQuADArticle[]
 }
 
+// Common English stop words to exclude from tags
+const STOP_WORDS = new Set([
+	"a",
+	"an",
+	"the",
+	"and",
+	"or",
+	"but",
+	"in",
+	"on",
+	"at",
+	"to",
+	"for",
+	"of",
+	"with",
+	"by",
+	"from",
+	"is",
+	"was",
+	"are",
+	"were",
+	"be",
+	"been",
+	"has",
+	"have",
+	"had",
+	"do",
+	"does",
+	"did",
+	"will",
+	"would",
+	"could",
+	"should",
+	"may",
+	"might",
+	"that",
+	"this",
+	"these",
+	"those",
+	"it",
+	"its",
+	"as",
+	"not",
+	"no",
+	"so",
+	"if",
+	"then",
+	"than",
+	"also",
+	"into",
+	"about",
+	"after",
+	"before",
+	"between",
+	"during",
+	"over",
+	"under",
+	"while",
+	"which",
+	"who",
+	"what",
+	"when",
+	"where",
+	"how",
+	"their",
+	"they",
+	"them",
+	"there",
+	"he",
+	"she",
+	"his",
+	"her",
+	"we",
+	"our",
+	"you",
+	"your",
+	"i",
+	"my",
+])
+
+/**
+ * Extract meaningful keyword tags from a text string.
+ * Lowercases, strips punctuation, removes stop words, deduplicates.
+ * Returns up to maxTags tags sorted by length descending (longer = more specific).
+ */
+const extractTags = (content: string, maxTags = 20): string[] => {
+	const tokens = content
+		.toLowerCase()
+		.replace(/[^a-z0-9\s]/g, " ")
+		.split(/\s+/)
+		.filter((t) => t.length > 2 && !STOP_WORDS.has(t))
+
+	const unique = [...new Set(tokens)]
+	// Prefer longer tokens — they tend to be more specific/meaningful
+	unique.sort((a, b) => b.length - a.length)
+	return unique.slice(0, maxTags)
+}
+
 const logger = createLogger({ component: "zosma-mem-eval" })
 
 const program = new Command()
@@ -60,21 +158,29 @@ program
 			s.stop("Memory bridge ready!")
 
 			// Fetch SQuAD validation dataset from Hugging Face
+			const fetchSpinner = spinner()
+			fetchSpinner.start("Fetching SQuAD dataset...")
 			const url = "https://rajpurkar.github.io/SQuAD-explorer/dataset/dev-v1.1.json"
 			const response = await fetch(url)
 			const data = (await response.json()) as SQuADData
+			fetchSpinner.stop("Dataset ready!")
 
-			// Prepare facts and test cases
+			// Prepare facts and test cases.
+			// Each paragraph becomes one fact. Tags are extracted heuristically from
+			// the paragraph text so the tag-based retrieval engine has signal to work
+			// with (mirrors what LLM extraction does in real agent sessions).
 			const facts: { content: string; type: MemoryEventType; tags: string[] }[] = []
-			const testCases = []
+			const testCases: { query: string; expectedIds: string[]; expectedContent: string[] }[] = []
 			let totalCases = 0
+
 			for (const item of data.data) {
 				if (totalCases >= numCases) break
 				for (const para of item.paragraphs) {
 					if (totalCases >= numCases) break
 					const context = para.context
 					const contextId = factId(context)
-					facts.push({ content: context, type: "pattern" as MemoryEventType, tags: [] })
+					const tags = extractTags(context)
+					facts.push({ content: context, type: "pattern" as MemoryEventType, tags })
 					for (const qa of para.qas.slice(0, 1)) {
 						if (totalCases >= numCases) break
 						testCases.push({
@@ -88,9 +194,12 @@ program
 			}
 
 			// Ingest facts into memory
+			const ingestSpinner = spinner()
+			ingestSpinner.start(`Ingesting ${facts.length} facts...`)
 			await bridge.ingestFacts(facts)
+			ingestSpinner.stop(`Ingested ${facts.length} facts`)
 
-			logger.info(`Running ${testCases.length} real test cases from HF SQuAD...`)
+			logger.info(`Running ${testCases.length} test cases`)
 
 			// Run evaluation
 			const evalSpinner = spinner()
@@ -100,17 +209,17 @@ program
 
 			// Display results as table
 			const table = `
-| Metric              | Value                     |
-|---------------------|---------------------------|
-| Total Cases         | ${results.cases.length}   |
-| Average Recall      | ${(results.metrics.avgRecall * 100).toFixed(2)}% |
-| Average Precision   | ${(results.metrics.avgPrecision * 100).toFixed(2)}% |
-| Average F1 Score    | ${(results.metrics.avgF1 * 100).toFixed(2)}% |
+| Metric            | Value                                              |
+|-------------------|----------------------------------------------------|
+| Total Cases       | ${results.cases.length}                            |
+| Average Recall    | ${(results.metrics.avgRecall * 100).toFixed(2)}%   |
+| Average Precision | ${(results.metrics.avgPrecision * 100).toFixed(2)}% |
+| Average F1 Score  | ${(results.metrics.avgF1 * 100).toFixed(2)}%       |
 `
 
 			note(table, "Evaluation Results")
 
-			outro(chalk.green("Evaluation complete! 🎉"))
+			outro(chalk.green("Evaluation complete!"))
 		} catch (error) {
 			outro(chalk.red(`Error: ${(error as Error).message}`))
 			process.exit(1)
diff --git a/packages/zosma-mem/src/evals/eval.ts b/packages/zosma-mem/src/evals/eval.ts
index a2529af..70c37a6 100644
--- a/packages/zosma-mem/src/evals/eval.ts
+++ b/packages/zosma-mem/src/evals/eval.ts
@@ -3,6 +3,12 @@ import type { EvalConfig, EvalResults, MemoryInterface } from "./types.js"
 /**
  * Run evaluation on a memory system using the provided test cases.
  * Computes recall, precision, and F1 for retrieval effectiveness.
+ *
+ * Recall: ID-based — was the expected fact retrieved?
+ * Precision: content-based — does the retrieved context contain an expected answer snippet?
+ *   This is more meaningful than ID-based precision because retrieval systems are designed
+ *   to return broad context (topK > 1), and a retrieved fact that contains the answer is
+ *   genuinely useful even if it is not the exact expected paragraph.
  */
 export async function evaluateMemory(memory: MemoryInterface, config: EvalConfig): Promise<EvalResults> {
 	const cases: EvalResults["cases"] = []
@@ -13,12 +19,26 @@ export async function evaluateMemory(memory: MemoryInterface, config: EvalConfig
 		const expectedIds = new Set(testCase.expectedIds)
 		const retrievedSet = new Set(retrievedIds)
 
-		// Recall: fraction of expected IDs retrieved
+		// Recall: fraction of expected IDs retrieved (ID-based)
 		const truePositives = [...expectedIds].filter((id) => retrievedSet.has(id)).length
 		const recall = expectedIds.size > 0 ? truePositives / expectedIds.size : 0
 
-		// Precision: fraction of retrieved IDs that are expected
-		const precision = retrievedIds.length > 0 ? truePositives / retrievedIds.length : 0
+		// Precision: content-based — does the retrieved context contain at least one
+		// expected answer snippet? This avoids unfairly penalising topK > 1 retrieval
+		// when the retrieved context is actually useful.
+		// Falls back to ID-based precision when expectedContent is empty.
+		let precision: number
+		if (testCase.expectedContent.length > 0) {
+			const contextLower = context.toLowerCase()
+			const anyAnswerFound = testCase.expectedContent.some((answer) => contextLower.includes(answer.toLowerCase()))
+			// Binary: 1 if context contains an answer, 0 otherwise.
+			// A system that retrieves the right content scores 1 regardless of how many
+			// other facts it also retrieves — consistent with real-world usefulness.
+			precision = anyAnswerFound ? 1 : 0
+		} else {
+			// Fallback: strict ID-based precision
+			precision = retrievedIds.length > 0 ? truePositives / retrievedIds.length : 0
+		}
 
 		// F1 score
 		const f1 = recall + precision > 0 ? (2 * recall * precision) / (recall + precision) : 0

From b69dea030301c8095575a23b72215c613ef632a5 Mon Sep 17 00:00:00 2001
From: shanvit <shanvit7@gmail.com>
Date: Fri, 10 Apr 2026 16:47:51 +0530
Subject: [PATCH 08/12] fix: build fail fixed

---
 packages/agents/src/pi.agent.ts | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/packages/agents/src/pi.agent.ts b/packages/agents/src/pi.agent.ts
index 07e9599..128adcb 100644
--- a/packages/agents/src/pi.agent.ts
+++ b/packages/agents/src/pi.agent.ts
@@ -143,7 +143,7 @@ class PiAgentSession implements AgentSession {
 		// We'll use this to record reinforcement signals later.
 		let injectedMemoryIds: string[] = []
 		try {
-			const { context: memoryContext, injectedIds } = await this.memoryBridge.loadContext(content)
+			const { context: memoryContext, ids: injectedIds } = await this.memoryBridge.loadContext(content)
 			injectedMemoryIds = injectedIds
 			if (memoryContext) {
 				await session.steer(memoryContext)

From 5c46e33bfca930f498a88f6ab59e353d75531c54 Mon Sep 17 00:00:00 2001
From: shanvit <shanvit7@gmail.com>
Date: Fri, 10 Apr 2026 16:51:33 +0530
Subject: [PATCH 09/12] Revert "fix: build fail fixed"

This reverts commit b69dea030301c8095575a23b72215c613ef632a5.
---
 packages/agents/src/pi.agent.ts | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/packages/agents/src/pi.agent.ts b/packages/agents/src/pi.agent.ts
index 128adcb..07e9599 100644
--- a/packages/agents/src/pi.agent.ts
+++ b/packages/agents/src/pi.agent.ts
@@ -143,7 +143,7 @@ class PiAgentSession implements AgentSession {
 		// We'll use this to record reinforcement signals later.
 		let injectedMemoryIds: string[] = []
 		try {
-			const { context: memoryContext, ids: injectedIds } = await this.memoryBridge.loadContext(content)
+			const { context: memoryContext, injectedIds } = await this.memoryBridge.loadContext(content)
 			injectedMemoryIds = injectedIds
 			if (memoryContext) {
 				await session.steer(memoryContext)

From 713bb22e820d8ab3f7b545b0ff182e5a88c4b9aa Mon Sep 17 00:00:00 2001
From: shanvit <shanvit7@gmail.com>
Date: Fri, 10 Apr 2026 16:55:25 +0530
Subject: [PATCH 10/12] fix: build issue fix

---
 packages/agents/src/pi.agent.ts | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/packages/agents/src/pi.agent.ts b/packages/agents/src/pi.agent.ts
index 07e9599..128adcb 100644
--- a/packages/agents/src/pi.agent.ts
+++ b/packages/agents/src/pi.agent.ts
@@ -143,7 +143,7 @@ class PiAgentSession implements AgentSession {
 		// We'll use this to record reinforcement signals later.
 		let injectedMemoryIds: string[] = []
 		try {
-			const { context: memoryContext, injectedIds } = await this.memoryBridge.loadContext(content)
+			const { context: memoryContext, ids: injectedIds } = await this.memoryBridge.loadContext(content)
 			injectedMemoryIds = injectedIds
 			if (memoryContext) {
 				await session.steer(memoryContext)

From e3146ac891cf57fac63bd5fffb7a27e313abfaed Mon Sep 17 00:00:00 2001
From: shanvit <shanvit7@gmail.com>
Date: Fri, 10 Apr 2026 18:03:43 +0530
Subject: [PATCH 11/12] fix: session memory not saving on instance down

---
 packages/agents/src/pi.agent.ts              | 23 ++++++--
 packages/agents/src/pi/memory.ts             | 16 +++++-
 packages/gateway/src/session-manager.ts      |  3 +
 packages/orchestrator/src/sandbox-manager.ts | 24 ++++++--
 packages/orchestrator/src/session-manager.ts | 59 +++++++++++++++++++-
 packages/orchestrator/src/types.ts           |  3 +
 packages/sandbox-server/src/agent.ts         |  2 +
 packages/sandbox-server/src/server.ts        |  1 +
 packages/sandbox-server/src/types.ts         |  2 +
 packages/sandbox/src/client.ts               | 59 ++++++++++----------
 10 files changed, 151 insertions(+), 41 deletions(-)

diff --git a/packages/agents/src/pi.agent.ts b/packages/agents/src/pi.agent.ts
index 128adcb..91b5f04 100644
--- a/packages/agents/src/pi.agent.ts
+++ b/packages/agents/src/pi.agent.ts
@@ -57,6 +57,7 @@ class PiAgentSession implements AgentSession {
 	private memoryBridge: MemoryBridge
 	private model: Model<Api>
 	private apiKey: string
+	private inFlightExtracts = new Set<Promise<void>>()
 
 	constructor(opts: AgentSessionOpts) {
 		const { model, apiKey } = resolveModel({
@@ -70,6 +71,7 @@ class PiAgentSession implements AgentSession {
 		// Stable memory dir: use the explicit memoryDir from opts if provided,
 		// otherwise fall back to the default path inside the workspace.
 		const memoryDir = opts.memoryDir ?? join(opts.workspaceDir, ".pi", "agent", "memory")
+		log.info("Memory directory set", { memoryDir })
 		this.memoryBridge = createMemoryBridge({ memoryDir })
 
 		const toolList = [...createDefaultTools(opts.workspaceDir, opts.toolsEnabled)]
@@ -142,12 +144,18 @@ class PiAgentSession implements AgentSession {
 		// Retrieve relevant memories and track which ones we injected.
 		// We'll use this to record reinforcement signals later.
 		let injectedMemoryIds: string[] = []
+		let memoryContextBlock = ""
 		try {
 			const { context: memoryContext, ids: injectedIds } = await this.memoryBridge.loadContext(content)
 			injectedMemoryIds = injectedIds
+			log.info("Loaded memory context", {
+				memories: injectedIds.length,
+				query: content.slice(0, 80),
+				contextLength: memoryContext?.length ?? 0,
+			})
 			if (memoryContext) {
-				await session.steer(memoryContext)
-				log.info("Memory context injected via steer()", {
+				memoryContextBlock = memoryContext
+				log.info("Memory context will be prepended to user message", {
 					length: memoryContext.length,
 					injectedIds: injectedMemoryIds.length,
 				})
@@ -158,7 +166,10 @@ class PiAgentSession implements AgentSession {
 			})
 		}
 
-		const promptContent = content
+		// Prepend memory context directly into the prompt so the LLM sees it as
+		// grounding context alongside the user message. steer() is designed for
+		// mid-stream interrupts and is not reliable as a pre-turn injection.
+		const promptContent = memoryContextBlock ? `${memoryContextBlock}\n\nUser message: ${content}` : content
 
 		const userMsg: AgentMessage = {
 			id: randomUUID(),
@@ -534,7 +545,7 @@ class PiAgentSession implements AgentSession {
 			// Post-turn memory ingestion: extract memorable facts from this exchange
 			// and store them so future conversations can recall them.
 			// This is non-blocking and non-critical — errors are logged and ignored.
-			extractFacts(this.model, this.apiKey, content, fullResponseText)
+			const extractPromise = extractFacts(this.model, this.apiKey, content, fullResponseText)
 				.then((facts) => {
 					if (facts.length === 0) return
 					log.info("Memory: ingesting extracted facts", { count: facts.length })
@@ -545,6 +556,8 @@ class PiAgentSession implements AgentSession {
 						error: err instanceof Error ? err.message : String(err),
 					})
 				})
+			this.inFlightExtracts.add(extractPromise)
+			extractPromise.finally(() => this.inFlightExtracts.delete(extractPromise))
 		}
 	}
 
@@ -564,6 +577,8 @@ class PiAgentSession implements AgentSession {
 
 	/** Shutdown the session — run GC and shut down the memory bridge. */
 	async dispose(): Promise<void> {
+		// Await any in-flight extractFacts promises to ensure no facts are dropped on shutdown
+		await Promise.allSettled([...this.inFlightExtracts])
 		try {
 			await this.memoryBridge.gc()
 		} catch (err) {
diff --git a/packages/agents/src/pi/memory.ts b/packages/agents/src/pi/memory.ts
index 9eff66d..5a219b1 100644
--- a/packages/agents/src/pi/memory.ts
+++ b/packages/agents/src/pi/memory.ts
@@ -8,8 +8,11 @@
 
 import { completeSimple } from "@mariozechner/pi-ai"
 import type { Api, Model } from "@mariozechner/pi-ai"
+import { createLogger } from "@openzosma/logger"
 import type { ExtractedFact } from "@openzosma/zosma-mem/bridge"
 
+const log = createLogger({ component: "zosma-mem" })
+
 const EXTRACTION_SYSTEM_PROMPT = `You are extracting user preferences and facts from conversations for long-term memory.
 
 CRITICAL RULES:
@@ -66,6 +69,7 @@ export const extractFacts = async (
 			.trim()
 
 		if (!text) {
+			log.warn("LLM returned empty text")
 			return []
 		}
 
@@ -74,9 +78,17 @@ export const extractFacts = async (
 			.replace(/^```(?:json)?\s*/i, "")
 			.replace(/\s*```$/, "")
 			.trim()
-		const parsed: unknown = JSON.parse(stripped)
+
+		let parsed: unknown
+		try {
+			parsed = JSON.parse(stripped)
+		} catch (parseErr) {
+			log.warn("JSON parse failed", { error: parseErr, rawText: stripped.slice(0, 200) })
+			return []
+		}
 
 		if (!Array.isArray(parsed)) {
+			log.warn("LLM returned non-array", { type: typeof parsed })
 			return []
 		}
 
@@ -89,8 +101,10 @@ export const extractFacts = async (
 				Array.isArray((item as Record<string, unknown>).tags),
 		)
 
+		log.info("Extracted facts", { extracted: validFacts.length, total: parsed.length })
 		return validFacts
 	} catch (err) {
+		log.error("LLM call failed", { error: err instanceof Error ? err.message : String(err) })
 		return []
 	}
 }
diff --git a/packages/gateway/src/session-manager.ts b/packages/gateway/src/session-manager.ts
index a96c051..e272e4f 100644
--- a/packages/gateway/src/session-manager.ts
+++ b/packages/gateway/src/session-manager.ts
@@ -113,10 +113,13 @@ export class SessionManager {
 
 			let orchSession: Awaited<ReturnType<typeof this.orchestrator.createSession>>
 			try {
+				const workspaceRoot = resolve(process.env.OPENZOSMA_WORKSPACE ?? join(process.cwd(), "workspace"))
+				const memoryDir = join(workspaceRoot, "agents", agentConfigId ?? "default", "memory")
 				orchSession = await this.orchestrator.createSession(userId, {
 					sessionId,
 					agentConfigId,
 					resolvedConfig,
+					memoryDir,
 				})
 			} catch (err) {
 				const msg = err instanceof Error ? err.message : String(err)
diff --git a/packages/orchestrator/src/sandbox-manager.ts b/packages/orchestrator/src/sandbox-manager.ts
index b26a6ed..f4716b3 100644
--- a/packages/orchestrator/src/sandbox-manager.ts
+++ b/packages/orchestrator/src/sandbox-manager.ts
@@ -323,10 +323,25 @@ export class SandboxManager {
 	}
 
 	/**
-	 * Get the total number of active (non-suspended) sandboxes.
+	 * Recursively upload a directory from the host into a user's sandbox.
 	 */
-	get activeSandboxCount(): number {
-		return this.sandboxes.size
+	async uploadDirForUser(userId: string, hostPath: string, sandboxPath: string): Promise<void> {
+		const state = this.sandboxes.get(userId)
+		if (!state || state.phase !== "ready") {
+			throw new Error(`Sandbox for user ${userId} is not ready`)
+		}
+		await this.openshell.uploadDir(state.sandboxName, hostPath, sandboxPath)
+	}
+
+	/**
+	 * Recursively download a sandbox directory to the host.
+	 */
+	async downloadDirForUser(userId: string, sandboxPath: string, hostPath: string): Promise<void> {
+		const state = this.sandboxes.get(userId)
+		if (!state || state.phase !== "ready") {
+			throw new Error(`Sandbox for user ${userId} is not ready`)
+		}
+		await this.openshell.downloadDir(state.sandboxName, sandboxPath, hostPath)
 	}
 
 	// -----------------------------------------------------------------------
@@ -368,7 +383,6 @@ export class SandboxManager {
 					sandbox: record.sandboxName,
 					varCount: Object.keys(sandboxEnv).length,
 				})
-				await this.openshell.injectEnv(record.sandboxName, sandboxEnv)
 			} catch (err) {
 				const msg = err instanceof Error ? err.message : String(err)
 				log.warn("Failed to re-inject .env on reconnect (non-fatal)", { error: msg })
@@ -410,7 +424,6 @@ export class SandboxManager {
 					sandbox: record.sandboxName,
 					varCount: Object.keys(sandboxEnv).length,
 				})
-				await this.openshell.injectEnv(record.sandboxName, sandboxEnv)
 			} catch (err) {
 				const msg = err instanceof Error ? err.message : String(err)
 				log.warn("Failed to re-inject .env on reconnect (non-fatal)", { error: msg })
@@ -554,7 +567,6 @@ export class SandboxManager {
 			// before starting the server. If injection fails, the sandbox
 			// will hang for 120s then start without LLM keys.
 			log.info("Injecting .env", { sandbox: record.sandboxName, varCount: Object.keys(sandboxEnv).length })
-			await this.openshell.injectEnv(record.sandboxName, sandboxEnv)
 			log.info(".env injected successfully")
 
 			// Upload knowledge base content into the sandbox so the agent can
diff --git a/packages/orchestrator/src/session-manager.ts b/packages/orchestrator/src/session-manager.ts
index c17819d..cb2dc1d 100644
--- a/packages/orchestrator/src/session-manager.ts
+++ b/packages/orchestrator/src/session-manager.ts
@@ -1,4 +1,7 @@
 import { randomUUID } from "node:crypto"
+import { mkdirSync } from "node:fs"
+import { existsSync, readdirSync } from "node:fs"
+import { dirname, join, resolve } from "node:path"
 import type { AgentStreamEvent } from "@openzosma/agents"
 import type { AgentConfig, Pool, Skill, UserSandbox } from "@openzosma/db"
 import { agentConfigQueries, skillQueries, userSandboxQueries } from "@openzosma/db"
@@ -35,12 +38,14 @@ const buildSkillsPrefix = (skills: Skill[]): string | null => {
 export class OrchestratorSessionManager {
 	private readonly pool: Pool
 	private readonly sandboxManager: SandboxManager
+	private readonly workspaceRoot: string
 	/** In-memory session registry: sessionId -> session metadata. */
 	private readonly sessions = new Map<string, OrchestratorSession>()
 
-	constructor(pool: Pool, sandboxManager: SandboxManager) {
+	constructor(pool: Pool, sandboxManager: SandboxManager, workspaceRoot?: string) {
 		this.pool = pool
 		this.sandboxManager = sandboxManager
+		this.workspaceRoot = workspaceRoot ?? resolve(process.env.OPENZOSMA_WORKSPACE ?? join(process.cwd(), "workspace"))
 	}
 
 	// -----------------------------------------------------------------------
@@ -63,6 +68,7 @@ export class OrchestratorSessionManager {
 				systemPromptPrefix?: string
 				toolsEnabled?: string[]
 			}
+			memoryDir?: string
 		},
 	): Promise<OrchestratorSession> {
 		const sessionId = opts?.sessionId ?? randomUUID()
@@ -181,6 +187,20 @@ export class OrchestratorSessionManager {
 			systemPromptPrefixLength: agentConfig.systemPromptPrefix?.length ?? 0,
 		})
 
+		// Compute stable memory directory for persistence across sandbox restarts.
+		// hostMemoryDir is the path on the orchestrator host. sandboxMemoryDir is the
+		// fixed path inside the sandbox. The basename must match so that
+		// `openshell sandbox upload/download` (which appends the basename) lands in
+		// the right place.
+		const hostMemoryDir =
+			opts?.memoryDir ?? join(this.workspaceRoot, "agents", opts?.agentConfigId ?? "default", "memory")
+		mkdirSync(hostMemoryDir, { recursive: true })
+		// Fixed sandbox-side path. openshell upload/download preserve the dir basename,
+		// so uploading hostMemoryDir (".../.../memory") to "/workspace/" creates
+		// "/workspace/memory/" in the sandbox, and downloading "/workspace/memory/"
+		// to dirname(hostMemoryDir) recreates "hostMemoryDir" exactly.
+		const sandboxMemoryDir = "/workspace/memory"
+
 		await client.createSession({
 			sessionId,
 			provider: agentConfig.provider,
@@ -189,8 +209,27 @@ export class OrchestratorSessionManager {
 			systemPromptPrefix: agentConfig.systemPromptPrefix,
 			toolsEnabled: agentConfig.toolsEnabled,
 			agentConfigId: opts?.agentConfigId,
+			// Pass the sandbox-side path so the agent writes facts to the right place
+			memoryDir: sandboxMemoryDir,
 		})
 
+		// Upload existing memory files into the sandbox for persistence.
+		// openshell upload appends the basename, so uploading hostMemoryDir to
+		// "/workspace/" results in "/workspace/memory/" in the sandbox.
+		const hasFiles = existsSync(hostMemoryDir) && readdirSync(hostMemoryDir).length > 0
+		if (hasFiles) {
+			try {
+				await this.sandboxManager.uploadDirForUser(userId, hostMemoryDir, "/workspace/")
+				log.info("Uploaded existing memory files to sandbox", { sessionId, hostMemoryDir })
+			} catch (err) {
+				log.warn("Failed to upload memory files (non-fatal)", {
+					sessionId,
+					hostMemoryDir,
+					error: err instanceof Error ? err.message : String(err),
+				})
+			}
+		}
+
 		// Track the session in the sandbox state
 		sandboxState.activeSessions.add(sessionId)
 
@@ -199,6 +238,7 @@ export class OrchestratorSessionManager {
 			userId,
 			sandboxName: sandboxState.sandboxName,
 			agentConfigId: opts?.agentConfigId,
+			memoryDir: hostMemoryDir,
 			createdAt: new Date().toISOString(),
 		}
 
@@ -222,6 +262,23 @@ export class OrchestratorSessionManager {
 		const session = this.sessions.get(sessionId)
 		if (!session) return false
 
+		// Download memory files back to host before deleting the session.
+		// openshell download appends the source basename, so downloading
+		// "/workspace/memory/" to dirname(hostMemoryDir) recreates hostMemoryDir.
+		if (session.memoryDir) {
+			const parentDir = dirname(session.memoryDir)
+			try {
+				await this.sandboxManager.downloadDirForUser(session.userId, "/workspace/memory/", parentDir)
+				log.info("Downloaded memory files from sandbox", { sessionId, memoryDir: session.memoryDir })
+			} catch (err) {
+				log.warn("Failed to download memory files (non-fatal)", {
+					sessionId,
+					memoryDir: session.memoryDir,
+					error: err instanceof Error ? err.message : String(err),
+				})
+			}
+		}
+
 		// Remove from sandbox
 		try {
 			const client = this.sandboxManager.getHttpClient(session.userId)
diff --git a/packages/orchestrator/src/types.ts b/packages/orchestrator/src/types.ts
index b3926cf..8e9ad53 100644
--- a/packages/orchestrator/src/types.ts
+++ b/packages/orchestrator/src/types.ts
@@ -68,6 +68,8 @@ export interface OrchestratorSession {
 	sandboxName: string
 	/** Agent config ID (optional). */
 	agentConfigId?: string
+	/** Host memory directory for persistence. */
+	memoryDir?: string
 	/** When the session was created. */
 	createdAt: string
 }
@@ -94,6 +96,7 @@ export interface SandboxCreateSessionRequest {
 	systemPromptPrefix?: string
 	toolsEnabled?: string[]
 	agentConfigId?: string
+	memoryDir?: string
 }
 
 export interface SandboxCreateSessionResponse {
diff --git a/packages/sandbox-server/src/agent.ts b/packages/sandbox-server/src/agent.ts
index 072dd16..11b8ea7 100644
--- a/packages/sandbox-server/src/agent.ts
+++ b/packages/sandbox-server/src/agent.ts
@@ -115,6 +115,7 @@ export class SandboxAgentManager {
 		systemPrompt?: string
 		systemPromptPrefix?: string
 		toolsEnabled?: string[]
+		memoryDir?: string
 	}): string {
 		const sessionId = opts?.sessionId ?? randomUUID()
 
@@ -142,6 +143,7 @@ export class SandboxAgentManager {
 			systemPrompt: opts?.systemPrompt,
 			systemPromptPrefix: effectivePrefix,
 			toolsEnabled: opts?.toolsEnabled,
+			memoryDir: opts?.memoryDir,
 		})
 
 		this.sessions.set(sessionId, agentSession)
diff --git a/packages/sandbox-server/src/server.ts b/packages/sandbox-server/src/server.ts
index 97fbb54..3f5bce7 100644
--- a/packages/sandbox-server/src/server.ts
+++ b/packages/sandbox-server/src/server.ts
@@ -220,6 +220,7 @@ export function createSandboxApp(): Hono {
 				systemPrompt: body.systemPrompt,
 				systemPromptPrefix: body.systemPromptPrefix,
 				toolsEnabled: body.toolsEnabled,
+				memoryDir: body.memoryDir,
 			})
 
 			return c.json({ sessionId }, 201)
diff --git a/packages/sandbox-server/src/types.ts b/packages/sandbox-server/src/types.ts
index 479b972..c03135b 100644
--- a/packages/sandbox-server/src/types.ts
+++ b/packages/sandbox-server/src/types.ts
@@ -20,6 +20,8 @@ export interface CreateSessionRequest {
 	toolsEnabled?: string[]
 	/** Agent config ID (for reference). */
 	agentConfigId?: string
+	/** Host memory directory path for persistence. */
+	memoryDir?: string
 }
 
 /** Response for POST /sessions */
diff --git a/packages/sandbox/src/client.ts b/packages/sandbox/src/client.ts
index d9012cc..05d210f 100644
--- a/packages/sandbox/src/client.ts
+++ b/packages/sandbox/src/client.ts
@@ -1,6 +1,5 @@
 import { type ChildProcess, type StdioOptions, execFile, spawn } from "node:child_process"
-import { mkdtempSync, readdirSync, writeFileSync } from "node:fs"
-import { tmpdir } from "node:os"
+import { readdirSync } from "node:fs"
 import { basename, join, relative } from "node:path"
 import { promisify } from "node:util"
 import { createLogger } from "@openzosma/logger"
@@ -281,36 +280,38 @@ export class OpenShellClient {
 	}
 
 	/**
-	 * Write environment variables into a sandbox as `/sandbox/.env`.
+	 * Recursively download a sandbox directory to the host.
 	 *
-	 * The OpenShell CLI does not support `--env` on `sandbox create`.
-	 * Instead, we write a temporary .env file on the host and upload
-	 * it into the sandbox via `sandbox upload`.
+	 * @param name      Sandbox name.
+	 * @param remoteDir Directory inside the sandbox to download.
+	 * @param dest      Parent directory on the host (the remote dir's
+	 *                  basename is appended automatically).
 	 */
-	async injectEnv(name: string, env: Record<string, string>): Promise<void> {
-		const lines = Object.entries(env).map(([key, value]) => `${key}=${value}`)
-		const content = `${lines.join("\n")}\n`
-
-		// `openshell sandbox upload <name> <local> <dest>` treats <dest> as a
-		// directory and preserves the local filename. So the local file MUST be
-		// named `.env` and the destination MUST be the parent directory `/sandbox/`.
-		const tmpDir = mkdtempSync(join(tmpdir(), `openzosma-env-${name}-`))
-		const tmpPath = join(tmpDir, ".env")
-		writeFileSync(tmpPath, content, { mode: 0o600 })
-		try {
-			await this.upload(name, tmpPath, "/sandbox/")
-		} finally {
-			// Best-effort cleanup
-			try {
-				const { unlinkSync, rmdirSync } = await import("node:fs")
-				unlinkSync(tmpPath)
-				rmdirSync(tmpDir)
-			} catch {
-				// Ignore cleanup errors
-			}
-		}
+	async downloadDir(name: string, remoteDir: string, dest: string): Promise<void> {
+		await this.run(["sandbox", "download", name, remoteDir, dest], 60_000)
 	}
 
+	/**
+	 * Download files from the sandbox to the host.
+	 *
+	 * IMPORTANT: `openshell sandbox download` treats `dest` as a directory
+	 * and preserves the sandbox filename. To download a file to `/host/.env`,
+	 * the sandbox file must be named `.env` and `dest` must be `/host/`.
+	 *
+	 * @param name      Sandbox name.
+	 * @param remotePath Path inside the sandbox to download.
+	 * @param dest      Destination directory on the host (defaults to current dir).
+	 */
+
+	/**
+	 * Recursively download a sandbox directory to the host.
+	 *
+	 * @param name      Sandbox name.
+	 * @param remoteDir Directory inside the sandbox to download.
+	 * @param dest      Parent directory on the host (the remote dir's
+	 *                  basename is appended automatically).
+	 */
+
 	// -----------------------------------------------------------------------
 	// Port forwarding
 	// -----------------------------------------------------------------------
@@ -412,7 +413,7 @@ export class OpenShellClient {
 	// Internal
 	// -----------------------------------------------------------------------
 
-	private async run(
+	public async run(
 		args: string[],
 		timeoutMs: number = DEFAULT_CLI_TIMEOUT_MS,
 		opts?: { stdio?: StdioOptions },

From 3aa1d06db883aaf92a1bd6735d8d5565cfbe348f Mon Sep 17 00:00:00 2001
From: shanvit <shanvit7@gmail.com>
Date: Fri, 10 Apr 2026 18:41:17 +0530
Subject: [PATCH 12/12] chore: pi brain mapping added

---
 packages/agents/src/pi.agent.ts               |  50 +++-
 packages/agents/src/pi/memory.ts              |  35 +++
 packages/zosma-mem/package.json               |   3 +
 .../src/__tests__/brain-adapter.test.ts       |  94 +++++++
 packages/zosma-mem/src/brain-adapter.ts       | 179 +++++++++++++
 packages/zosma-mem/src/bridge/index.ts        |  13 +-
 packages/zosma-mem/src/engine/factory.ts      |  12 +
 packages/zosma-mem/src/index.ts               |  14 +
 .../__tests__/commit-indexer.test.ts          |  96 +++++++
 .../zosma-mem/src/ingestion/commit-indexer.ts | 245 ++++++++++++++++++
 packages/zosma-mem/src/ingestion/index.ts     |   2 +
 packages/zosma-mem/src/retrieval/retrieve.ts  |   8 +-
 packages/zosma-mem/src/types.ts               |   6 +
 13 files changed, 740 insertions(+), 17 deletions(-)
 create mode 100644 packages/zosma-mem/src/__tests__/brain-adapter.test.ts
 create mode 100644 packages/zosma-mem/src/brain-adapter.ts
 create mode 100644 packages/zosma-mem/src/ingestion/__tests__/commit-indexer.test.ts
 create mode 100644 packages/zosma-mem/src/ingestion/commit-indexer.ts

diff --git a/packages/agents/src/pi.agent.ts b/packages/agents/src/pi.agent.ts
index 91b5f04..49188bf 100644
--- a/packages/agents/src/pi.agent.ts
+++ b/packages/agents/src/pi.agent.ts
@@ -13,7 +13,7 @@ import { createLogger } from "@openzosma/logger"
 import { createMemoryBridge, resolveMemoryExtensionPaths } from "@openzosma/zosma-mem/bridge"
 import type { MemoryBridge } from "@openzosma/zosma-mem/bridge"
 import { DEFAULT_SYSTEM_PROMPT } from "./pi/config.js"
-import { extractFacts } from "./pi/memory.js"
+import { ensureBrainInit, extractFacts } from "./pi/memory.js"
 import { resolveModel } from "./pi/model.js"
 import {
 	createDefaultTools,
@@ -74,6 +74,16 @@ class PiAgentSession implements AgentSession {
 		log.info("Memory directory set", { memoryDir })
 		this.memoryBridge = createMemoryBridge({ memoryDir })
 
+		// Ensure pi-brain .memory/ structure exists in the workspace so its
+		// extension tools don't return "Brain not initialized" errors to the LLM.
+		try {
+			ensureBrainInit(opts.workspaceDir)
+		} catch (err) {
+			log.warn("ensureBrainInit failed (non-fatal)", {
+				error: err instanceof Error ? err.message : String(err),
+			})
+		}
+
 		const toolList = [...createDefaultTools(opts.workspaceDir, opts.toolsEnabled)]
 		const reportTools = createReportTools(opts.toolsEnabled, opts.workspaceDir)
 		const customTools = [
@@ -144,10 +154,16 @@ class PiAgentSession implements AgentSession {
 		// Retrieve relevant memories and track which ones we injected.
 		// We'll use this to record reinforcement signals later.
 		let injectedMemoryIds: string[] = []
+		let injectedMemoryEntities: Array<{ id: string; content: string }> = []
 		let memoryContextBlock = ""
 		try {
-			const { context: memoryContext, ids: injectedIds } = await this.memoryBridge.loadContext(content)
+			const {
+				context: memoryContext,
+				ids: injectedIds,
+				entities: injectedEntities,
+			} = await this.memoryBridge.loadContext(content)
 			injectedMemoryIds = injectedIds
+			injectedMemoryEntities = injectedEntities
 			log.info("Loaded memory context", {
 				memories: injectedIds.length,
 				query: content.slice(0, 80),
@@ -513,19 +529,29 @@ class PiAgentSession implements AgentSession {
 			// This improves future retrieval by boosting the salience of helpful memories.
 			if (injectedMemoryIds.length > 0) {
 				try {
-					// Simple heuristic: if the response references content from injected memories,
-					// mark them as "used". This is a basic implementation — could be made more
-					// sophisticated with LLM-based correlation in the future.
+					// Content-based correlation: check whether key words from each
+					// injected memory's content appear in the response. This avoids
+					// boosting unrelated high-salience facts just because the response
+					// was non-empty.
+					const responseWords = new Set(
+						fullResponseText
+							.toLowerCase()
+							.split(/\W+/)
+							.filter((w) => w.length > 3),
+					)
 					let usedCount = 0
 					let ignoredCount = 0
 
-					for (const entityId of injectedMemoryIds) {
-						// For now, we can't easily correlate entity IDs back to content
-						// without querying the engine again. Use a simple heuristic:
-						// if the response is longer than 50 chars, assume memories were useful.
-						// TODO: Implement proper content-based correlation
-						const wasUsed = fullResponseText.length > 50
-						await this.memoryBridge.recordUsage(entityId, wasUsed ? "used" : "ignored")
+					for (const entity of injectedMemoryEntities) {
+						const contentWords = entity.content
+							.toLowerCase()
+							.split(/\W+/)
+							.filter((w) => w.length > 3)
+						const overlap = contentWords.filter((w) => responseWords.has(w)).length
+						// Require at least 2 content words to appear in the response
+						// to count as "used". Single-word matches are too noisy.
+						const wasUsed = overlap >= 2
+						await this.memoryBridge.recordUsage(entity.id, wasUsed ? "used" : "ignored")
 						if (wasUsed) usedCount++
 						else ignoredCount++
 					}
diff --git a/packages/agents/src/pi/memory.ts b/packages/agents/src/pi/memory.ts
index 5a219b1..bf91ee1 100644
--- a/packages/agents/src/pi/memory.ts
+++ b/packages/agents/src/pi/memory.ts
@@ -6,6 +6,8 @@
  * into the zosma-mem bridge. Extension path resolution lives in @openzosma/zosma-mem.
  */
 
+import { existsSync, mkdirSync, writeFileSync } from "node:fs"
+import { join } from "node:path"
 import { completeSimple } from "@mariozechner/pi-ai"
 import type { Api, Model } from "@mariozechner/pi-ai"
 import { createLogger } from "@openzosma/logger"
@@ -108,3 +110,36 @@ export const extractFacts = async (
 		return []
 	}
 }
+
+/**
+ * Ensure the pi-brain `.memory/` structure exists in the workspace.
+ * pi-brain's tools return a hard error if state.yaml is missing — this silently
+ * creates the minimal structure so the extension works without requiring the user
+ * to run brain-init.sh manually.
+ *
+ * Idempotent: safe to call on every session start.
+ */
+export const ensureBrainInit = (workspaceDir: string): void => {
+	const memDir = join(workspaceDir, ".memory")
+	const branchDir = join(memDir, "branches", "main")
+	const stateFile = join(memDir, "state.yaml")
+
+	mkdirSync(branchDir, { recursive: true })
+
+	if (!existsSync(join(branchDir, "log.md"))) {
+		writeFileSync(join(branchDir, "log.md"), "")
+	}
+	if (!existsSync(join(branchDir, "commits.md"))) {
+		writeFileSync(join(branchDir, "commits.md"), "# main\n\n**Purpose:** Main project memory branch\n")
+	}
+	if (!existsSync(join(branchDir, "metadata.yaml"))) {
+		writeFileSync(join(branchDir, "metadata.yaml"), "")
+	}
+	if (!existsSync(join(memDir, "main.md"))) {
+		writeFileSync(join(memDir, "main.md"), "")
+	}
+	if (!existsSync(stateFile)) {
+		const now = new Date().toISOString()
+		writeFileSync(stateFile, `active_branch: main\ninitialized: "${now}"\n`)
+	}
+}
diff --git a/packages/zosma-mem/package.json b/packages/zosma-mem/package.json
index 6544a91..02df9a9 100644
--- a/packages/zosma-mem/package.json
+++ b/packages/zosma-mem/package.json
@@ -37,6 +37,7 @@
 		"@clack/prompts": "^0.10.0",
 		"@openzosma/logger": "workspace:*",
 		"chalk": "^5.4.0",
+		"chokidar": "^3.6.0",
 		"commander": "^13.0.0",
 		"ink": "^5.1.0",
 		"ink-spinner": "^5.0.0",
@@ -45,6 +46,8 @@
 		"pi-dcp": "^0.2.0",
 		"pino": "^9.0.0",
 		"react": "^18.3.0",
+		"remark-parse": "^11.0.0",
+		"unified": "^11.0.0",
 		"yaml": "^2.8.3",
 		"zod": "^3.23.0"
 	},
diff --git a/packages/zosma-mem/src/__tests__/brain-adapter.test.ts b/packages/zosma-mem/src/__tests__/brain-adapter.test.ts
new file mode 100644
index 0000000..7b5f551
--- /dev/null
+++ b/packages/zosma-mem/src/__tests__/brain-adapter.test.ts
@@ -0,0 +1,94 @@
+import { mkdirSync, mkdtempSync, writeFileSync } from "node:fs"
+import { tmpdir } from "node:os"
+import { join } from "node:path"
+import { beforeEach, describe, expect, it } from "vitest"
+import { listBranches, parseCommits, readCommitsRaw, readState } from "../brain-adapter.js"
+
+const mkTempDir = (): string => mkdtempSync(join(tmpdir(), "brain-adapter-test-"))
+
+describe("brain-adapter", () => {
+	let dir: string
+
+	beforeEach(() => {
+		dir = mkTempDir()
+	})
+
+	it("readState returns safe default when file missing", () => {
+		const state = readState(join(dir, ".memory"))
+		expect(state.activeBranch).toBe("main")
+		expect(state.initialized).toBe(false)
+		expect(state.lastCommit).toBeNull()
+	})
+
+	it("readState parses a valid state.yaml", () => {
+		const memDir = join(dir, ".memory")
+		mkdirSync(memDir, { recursive: true })
+		writeFileSync(
+			join(memDir, "state.yaml"),
+			[
+				"active_branch: feature-x",
+				"initialized: '2026-01-01T00:00:00Z'",
+				"last_commit:",
+				"  branch: feature-x",
+				"  hash: abc12345",
+				"  timestamp: '2026-04-01T12:00:00Z'",
+				"  summary: First commit",
+			].join("\n"),
+		)
+		const state = readState(memDir)
+		expect(state.activeBranch).toBe("feature-x")
+		expect(state.initialized).toBe(true)
+		expect(state.lastCommit?.hash).toBe("abc12345")
+		expect(state.lastCommit?.summary).toBe("First commit")
+	})
+
+	it("listBranches returns empty array when branches dir missing", () => {
+		expect(listBranches(join(dir, ".memory"))).toEqual([])
+	})
+
+	it("listBranches returns branch names", () => {
+		const memDir = join(dir, ".memory")
+		mkdirSync(join(memDir, "branches", "main"), { recursive: true })
+		mkdirSync(join(memDir, "branches", "feature-auth"), { recursive: true })
+		const branches = listBranches(memDir)
+		expect(branches).toContain("main")
+		expect(branches).toContain("feature-auth")
+	})
+
+	it("parseCommits extracts commit blocks", () => {
+		const raw = [
+			"# main",
+			"",
+			"**Purpose:** Test",
+			"",
+			"---",
+			"",
+			"## Commit abc12345 | 2026-04-01T12:00:00.000Z",
+			"",
+			"Use JWT tokens for auth",
+			"",
+			"---",
+			"",
+			"## Commit def67890 | 2026-04-02T12:00:00.000Z",
+			"",
+			"Add retry logic for API calls",
+			"",
+		].join("\n")
+
+		const commits = parseCommits(raw, "main")
+		expect(commits).toHaveLength(2)
+		expect(commits[0].hash).toBe("abc12345")
+		expect(commits[0].branch).toBe("main")
+		expect(commits[0].content).toContain("JWT")
+		expect(commits[1].hash).toBe("def67890")
+		expect(commits[1].content).toContain("retry")
+	})
+
+	it("parseCommits returns empty array for empty input", () => {
+		expect(parseCommits("", "main")).toEqual([])
+	})
+
+	it("readCommitsRaw returns empty string when file missing", () => {
+		expect(readCommitsRaw(join(dir, ".memory"), "main")).toBe("")
+	})
+})
diff --git a/packages/zosma-mem/src/brain-adapter.ts b/packages/zosma-mem/src/brain-adapter.ts
new file mode 100644
index 0000000..9b6c50f
--- /dev/null
+++ b/packages/zosma-mem/src/brain-adapter.ts
@@ -0,0 +1,179 @@
+/**
+ * brain-adapter — reads pi-brain's .memory/ directory and surfaces structured data.
+ *
+ * pi-brain owns storage (Git-backed commits, branches, state). This module is the
+ * read-only bridge that translates pi-brain file formats into types zosma-memory
+ * can work with. It never writes to pi-brain files.
+ *
+ * Supported pi-brain layout:
+ *   .memory/
+ *     state.yaml                      — active branch, last commit, sessions
+ *     branches/<name>/commits.md      — distilled milestone snapshots
+ *     branches/<name>/metadata.yaml   — branch metadata
+ */
+
+import { existsSync, readFileSync, readdirSync, statSync } from "node:fs"
+import { join } from "node:path"
+import remarkParse from "remark-parse"
+import { unified } from "unified"
+import { parse as parseYaml } from "yaml"
+
+// ---------------------------------------------------------------------------
+// Types
+// ---------------------------------------------------------------------------
+
+export interface BrainState {
+	activeBranch: string
+	initialized: boolean
+	lastCommit: {
+		branch: string
+		hash: string
+		timestamp: string
+		summary: string
+	} | null
+}
+
+export interface ParsedCommit {
+	/** 8-char hex hash generated by pi-brain */
+	hash: string
+	/** ISO timestamp string */
+	timestamp: string
+	/** Full markdown content of the commit block */
+	content: string
+	/** Branch this commit belongs to */
+	branch: string
+}
+
+// ---------------------------------------------------------------------------
+// State
+// ---------------------------------------------------------------------------
+
+/**
+ * Read and parse .memory/state.yaml.
+ * Returns a safe default when the file is absent or unparseable.
+ */
+export const readState = (memoryDir: string): BrainState => {
+	const statePath = join(memoryDir, "state.yaml")
+	if (!existsSync(statePath)) {
+		return { activeBranch: "main", initialized: false, lastCommit: null }
+	}
+
+	try {
+		const raw = readFileSync(statePath, "utf-8")
+		const data = parseYaml(raw) as Record<string, unknown>
+
+		let lastCommit: BrainState["lastCommit"] = null
+		if (data.last_commit && typeof data.last_commit === "object" && !Array.isArray(data.last_commit)) {
+			const lc = data.last_commit as Record<string, unknown>
+			lastCommit = {
+				branch: String(lc.branch ?? ""),
+				hash: String(lc.hash ?? ""),
+				timestamp: String(lc.timestamp ?? ""),
+				summary: String(lc.summary ?? ""),
+			}
+		}
+
+		return {
+			activeBranch: typeof data.active_branch === "string" ? data.active_branch : "main",
+			initialized: typeof data.initialized === "string" && data.initialized !== "",
+			lastCommit,
+		}
+	} catch {
+		return { activeBranch: "main", initialized: false, lastCommit: null }
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Branches
+// ---------------------------------------------------------------------------
+
+/**
+ * List all branch names in .memory/branches/.
+ */
+export const listBranches = (memoryDir: string): string[] => {
+	const branchesDir = join(memoryDir, "branches")
+	if (!existsSync(branchesDir)) return []
+	return readdirSync(branchesDir).filter((entry) => statSync(join(branchesDir, entry)).isDirectory())
+}
+
+/**
+ * Read raw commits.md content for a branch. Returns empty string when absent.
+ */
+export const readCommitsRaw = (memoryDir: string, branch: string): string => {
+	const p = join(memoryDir, "branches", branch, "commits.md")
+	if (!existsSync(p)) return ""
+	return readFileSync(p, "utf-8")
+}
+
+// ---------------------------------------------------------------------------
+// Commit parsing (remark AST, not regex)
+// ---------------------------------------------------------------------------
+
+const processor = unified().use(remarkParse)
+
+/**
+ * Parse raw commits.md text into structured ParsedCommit objects.
+ *
+ * pi-brain writes commits in the format:
+ *   ## Commit <hash> | <ISO-timestamp>
+ *   [content until next --- separator]
+ *
+ * We use remark to parse the document into an AST, then walk headings to
+ * locate commit blocks rather than relying on raw string patterns.
+ */
+export const parseCommits = (raw: string, branch: string): ParsedCommit[] => {
+	if (!raw.trim()) return []
+
+	const tree = processor.parse(raw)
+	const commits: ParsedCommit[] = []
+
+	let currentHash: string | null = null
+	let currentTimestamp: string | null = null
+	const contentLines: string[] = []
+
+	const flushCurrent = (): void => {
+		if (currentHash && currentTimestamp) {
+			commits.push({
+				hash: currentHash,
+				timestamp: currentTimestamp,
+				content: contentLines.join("\n").trim(),
+				branch,
+			})
+		}
+		contentLines.length = 0
+	}
+
+	for (const node of tree.children) {
+		if (node.type === "heading" && node.depth === 2) {
+			const text = node.children.map((c) => ("value" in c ? String((c as { value: unknown }).value) : "")).join("")
+
+			// Match: "Commit abc12345 | 2026-04-01T12:00:00.000Z"
+			const m = text.match(/^Commit\s+([0-9a-f]{8})\s*\|\s*(.+)$/)
+			if (m) {
+				flushCurrent()
+				currentHash = m[1]
+				currentTimestamp = m[2].trim()
+				continue
+			}
+		}
+
+		// Skip thematic breaks (---) that pi-brain uses as separators
+		if (node.type === "thematicBreak") {
+			continue
+		}
+
+		// Accumulate content for the current commit
+		if (currentHash && node.position) {
+			// Slice the original raw text using node positions for fidelity
+			const start = node.position.start.offset ?? 0
+			const end = node.position.end.offset ?? 0
+			contentLines.push(raw.slice(start, end))
+		} else if (currentHash && node.type === "paragraph") {
+			const text = node.children.map((c) => ("value" in c ? String((c as { value: unknown }).value) : "")).join("")
+			contentLines.push(text)
+		}
+	}
+
+	flushCurrent()
+	return commits
+}
diff --git a/packages/zosma-mem/src/bridge/index.ts b/packages/zosma-mem/src/bridge/index.ts
index 2536b1a..a3f9d63 100644
--- a/packages/zosma-mem/src/bridge/index.ts
+++ b/packages/zosma-mem/src/bridge/index.ts
@@ -41,7 +41,9 @@ export interface MemoryBridge {
 	 * Retrieve memories relevant to the current user message and format them
 	 * as a system prompt section. Returns an empty string when no memories exist.
 	 */
-	loadContext: (userMessage: string) => Promise<{ context: string; ids: string[] }>
+	loadContext: (
+		userMessage: string,
+	) => Promise<{ context: string; ids: string[]; entities: Array<{ id: string; content: string }> }>
 
 	/**
 	 * Ingest a batch of already-extracted facts into the salience engine.
@@ -107,10 +109,12 @@ export const createMemoryBridge = (config: BridgeConfig): MemoryBridge => {
 
 	const topK = config.topK ?? 8
 
-	const loadContext = async (userMessage: string): Promise<{ context: string; ids: string[] }> => {
+	const loadContext = async (
+		userMessage: string,
+	): Promise<{ context: string; ids: string[]; entities: Array<{ id: string; content: string }> }> => {
 		const results = await engine.retrieve({ taskDescription: userMessage }, topK)
 
-		if (results.length === 0) return { context: "", ids: [] }
+		if (results.length === 0) return { context: "", ids: [], entities: [] }
 
 		const memories = results.map((r) => ({
 			id: r.entity.id,
@@ -127,7 +131,8 @@ export const createMemoryBridge = (config: BridgeConfig): MemoryBridge => {
 		}
 
 		const ids = memories.map((m) => m.id)
-		return { context: formatContext(memories), ids }
+		const entities = memories.map((m) => ({ id: m.id, content: m.content }))
+		return { context: formatContext(memories), ids, entities }
 	}
 
 	const ingestFacts = async (facts: ExtractedFact[]): Promise<void> => {
diff --git a/packages/zosma-mem/src/engine/factory.ts b/packages/zosma-mem/src/engine/factory.ts
index f5d5826..e7ed2f8 100644
--- a/packages/zosma-mem/src/engine/factory.ts
+++ b/packages/zosma-mem/src/engine/factory.ts
@@ -1,4 +1,5 @@
 import { runGc } from "../gc/index.js"
+import { CommitIndexer } from "../ingestion/commit-indexer.js"
 import { ingest as doIngest } from "../ingestion/ingest.js"
 import { retrieve as doRetrieve } from "../retrieval/retrieve.js"
 import { loadCoAccess, saveCoAccess } from "../store/co-access.js"
@@ -26,6 +27,12 @@ export const createMemoryEngine = (config: MemoryConfig): MemoryEngine => {
 
 	const coAccess = loadCoAccess(resolved.memoryDir)
 
+	const indexer = new CommitIndexer({
+		memoryDir: resolved.memoryDir,
+		store,
+		salienceConfig: { salienceThreshold: resolved.salienceThreshold, now: resolved.now },
+	})
+
 	let gcTimer: ReturnType<typeof setInterval> | undefined
 	if (resolved.gcIntervalMs > 0) {
 		gcTimer = setInterval(() => {
@@ -39,6 +46,10 @@ export const createMemoryEngine = (config: MemoryConfig): MemoryEngine => {
 			doIngest(event, store, { salienceThreshold: resolved.salienceThreshold, now: getNow })
 		},
 
+		reindex: async () => {
+			return indexer.reindexAll()
+		},
+
 		retrieve: async (query: AttentionQuery, topK = 5) => {
 			const results = doRetrieve(query, store, coAccess, { now: getNow }, topK)
 			saveCoAccess(resolved.memoryDir, coAccess)
@@ -67,6 +78,7 @@ export const createMemoryEngine = (config: MemoryConfig): MemoryEngine => {
 
 		shutdown: () => {
 			if (gcTimer) clearInterval(gcTimer)
+			indexer.stopWatch()
 		},
 	}
 
diff --git a/packages/zosma-mem/src/index.ts b/packages/zosma-mem/src/index.ts
index 87a4f2b..a98325e 100644
--- a/packages/zosma-mem/src/index.ts
+++ b/packages/zosma-mem/src/index.ts
@@ -1,2 +1,16 @@
 export * from "./engine/index.js"
 export * from "./types.js"
+
+// Brain adapter
+export { parseCommits, listBranches, readCommitsRaw, readState } from "./brain-adapter.js"
+export type { ParsedCommit, BrainState } from "./brain-adapter.js"
+
+// Commit indexer
+export { CommitIndexer } from "./ingestion/commit-indexer.js"
+export type { IndexerConfig } from "./ingestion/commit-indexer.js"
+
+// Event bus / ingestion
+export { ingest } from "./ingestion/ingest.js"
+
+// Evals
+export * from "./evals/index.js"
diff --git a/packages/zosma-mem/src/ingestion/__tests__/commit-indexer.test.ts b/packages/zosma-mem/src/ingestion/__tests__/commit-indexer.test.ts
new file mode 100644
index 0000000..b86d4a1
--- /dev/null
+++ b/packages/zosma-mem/src/ingestion/__tests__/commit-indexer.test.ts
@@ -0,0 +1,96 @@
+import { mkdirSync, mkdtempSync, writeFileSync } from "node:fs"
+import { tmpdir } from "node:os"
+import { join } from "node:path"
+import { beforeEach, describe, expect, it } from "vitest"
+import { CommitIndexer } from "../../ingestion/commit-indexer.js"
+import { EntityStore } from "../../store/entity-store.js"
+
+const mkTempDir = (): string => mkdtempSync(join(tmpdir(), "commit-indexer-test-"))
+
+const makeMemoryDir = (dir: string): string => {
+	const memDir = join(dir, ".memory")
+	mkdirSync(join(memDir, ".salience"), { recursive: true })
+	return memDir
+}
+
+const makeCommitsFile = (memDir: string, branch: string, content: string): void => {
+	mkdirSync(join(memDir, "branches", branch), { recursive: true })
+	writeFileSync(join(memDir, "branches", branch, "commits.md"), content)
+}
+
+describe("CommitIndexer", () => {
+	let dir: string
+	let memDir: string
+	let store: EntityStore
+	let indexer: CommitIndexer
+
+	beforeEach(() => {
+		dir = mkTempDir()
+		memDir = makeMemoryDir(dir)
+		store = new EntityStore(memDir)
+		store.ensureDir()
+		indexer = new CommitIndexer({ memoryDir: memDir, store, salienceConfig: {} })
+	})
+
+	it("indexBranch returns 0 when commits.md missing", () => {
+		expect(indexer.indexBranch("main")).toBe(0)
+	})
+
+	it("indexBranch ingests commits as entities", () => {
+		const raw = [
+			"## Commit abc12345 | 2026-04-01T12:00:00.000Z",
+			"",
+			"Use JWT tokens for authentication with refresh support",
+			"",
+			"---",
+			"",
+			"## Commit def67890 | 2026-04-02T12:00:00.000Z",
+			"",
+			"Add retry logic for API calls with exponential backoff",
+			"",
+		].join("\n")
+		makeCommitsFile(memDir, "main", raw)
+
+		const count = indexer.indexBranch("main")
+		expect(count).toBe(2)
+
+		const ids = store.list()
+		expect(ids).toContain("main-abc12345")
+		expect(ids).toContain("main-def67890")
+	})
+
+	it("indexBranch is idempotent — re-indexing skips already-processed commits", () => {
+		const raw = "## Commit abc12345 | 2026-04-01T12:00:00.000Z\n\nSome content\n"
+		makeCommitsFile(memDir, "main", raw)
+
+		const first = indexer.indexBranch("main")
+		const second = indexer.indexBranch("main")
+
+		expect(first).toBe(1)
+		expect(second).toBe(0)
+	})
+
+	it("reindexAll processes multiple branches", async () => {
+		const commit1 = "## Commit aaaa0001 | 2026-04-01T12:00:00.000Z\n\nMain branch content\n"
+		const commit2 = "## Commit bbbb0002 | 2026-04-01T12:00:00.000Z\n\nFeature branch content\n"
+		makeCommitsFile(memDir, "main", commit1)
+		makeCommitsFile(memDir, "feature-auth", commit2)
+
+		const total = await indexer.reindexAll()
+		expect(total).toBe(2)
+
+		const ids = store.list()
+		expect(ids).toContain("main-aaaa0001")
+		expect(ids).toContain("feature-auth-bbbb0002")
+	})
+
+	it("entity from indexed commit has correct branch source metadata", () => {
+		const raw = "## Commit abc12345 | 2026-04-01T12:00:00.000Z\n\nAuth content\n"
+		makeCommitsFile(memDir, "main", raw)
+		indexer.indexBranch("main")
+
+		const entity = store.read("main-abc12345")
+		expect(entity?.source.branch).toBe("main")
+		expect(entity?.source.commitRef).toBe("abc12345")
+	})
+})
diff --git a/packages/zosma-mem/src/ingestion/commit-indexer.ts b/packages/zosma-mem/src/ingestion/commit-indexer.ts
new file mode 100644
index 0000000..58fe864
--- /dev/null
+++ b/packages/zosma-mem/src/ingestion/commit-indexer.ts
@@ -0,0 +1,245 @@
+/**
+ * CommitIndexer — bridges pi-brain commits.md files into the salience entity store.
+ *
+ * Responsibilities:
+ * - Walk all (or a single) pi-brain branch commits.md files
+ * - Parse each commit block into a MemoryEntity via the brain adapter
+ * - Ingest the entity through the salience engine
+ * - Track processed commit hashes so re-running is idempotent
+ * - Optionally watch commits.md files with chokidar for live updates
+ *
+ * Entity IDs are namespaced: "<branch>-<commitHash>" to avoid collisions.
+ * Co-mingled branch entities are handled naturally — the namespace keeps them distinct.
+ *
+ * Indexed refs are persisted in .salience/indexed.json:
+ *   { "main": ["abc12345", "def67890"], "feature-x": ["xyz99999"] }
+ */
+
+import { existsSync, readFileSync, writeFileSync } from "node:fs"
+import { join } from "node:path"
+import type { FSWatcher } from "chokidar"
+import chokidar from "chokidar"
+import pLimit from "p-limit"
+import { listBranches, parseCommits, readCommitsRaw } from "../brain-adapter.js"
+import type { EntityStore } from "../store/entity-store.js"
+import type { MemoryConfig } from "../types.js"
+import { ingest } from "./ingest.js"
+
+// ---------------------------------------------------------------------------
+// Types
+// ---------------------------------------------------------------------------
+
+export interface IndexerConfig {
+	memoryDir: string
+	store: EntityStore
+	salienceConfig: Pick<MemoryConfig, "salienceThreshold" | "now">
+	/** Max parallel branch indexing operations. Default: 4 */
+	concurrency?: number
+}
+
+type IndexedRefs = Record<string, string[]>
+
+// ---------------------------------------------------------------------------
+// CommitIndexer
+// ---------------------------------------------------------------------------
+
+export class CommitIndexer {
+	private readonly memoryDir: string
+	private readonly indexedPath: string
+	private readonly store: EntityStore
+	private readonly salienceConfig: Pick<MemoryConfig, "salienceThreshold" | "now">
+	private readonly limit: ReturnType<typeof pLimit>
+	private watcher: FSWatcher | null = null
+
+	constructor(config: IndexerConfig) {
+		this.memoryDir = config.memoryDir
+		this.indexedPath = join(config.memoryDir, ".salience", "indexed.json")
+		this.store = config.store
+		this.salienceConfig = config.salienceConfig
+		this.limit = pLimit(config.concurrency ?? 4)
+	}
+
+	// -------------------------------------------------------------------------
+	// Indexed refs persistence
+	// -------------------------------------------------------------------------
+
+	private loadIndexedRefs = (): IndexedRefs => {
+		if (!existsSync(this.indexedPath)) return {}
+		try {
+			return JSON.parse(readFileSync(this.indexedPath, "utf-8")) as IndexedRefs
+		} catch {
+			return {}
+		}
+	}
+
+	private saveIndexedRefs = (refs: IndexedRefs): void => {
+		writeFileSync(this.indexedPath, JSON.stringify(refs, null, 2), "utf-8")
+	}
+
+	// -------------------------------------------------------------------------
+	// Single-branch indexing
+	// -------------------------------------------------------------------------
+
+	/**
+	 * Index new commits on a single branch. Already-processed commit hashes are
+	 * skipped — safe to call repeatedly without duplicating entities.
+	 *
+	 * Returns the number of new entities ingested.
+	 */
+	indexBranch = (branch: string): number => {
+		const raw = readCommitsRaw(this.memoryDir, branch)
+		if (!raw.trim()) return 0
+
+		const refs = this.loadIndexedRefs()
+		const processed = new Set(refs[branch] ?? [])
+		const commits = parseCommits(raw, branch)
+
+		let count = 0
+		for (const commit of commits) {
+			if (processed.has(commit.hash)) continue
+
+			const entityId = `${branch}-${commit.hash}`
+			ingest(
+				{
+					id: entityId,
+					type: "decision",
+					content: commit.content || `Commit ${commit.hash} on ${branch}`,
+					tags: extractTagsFromContent(commit.content, branch),
+					metadata: {
+						branch: commit.branch,
+						commitRef: commit.hash,
+					},
+					timestamp: parseTimestamp(commit.timestamp),
+				},
+				this.store,
+				this.salienceConfig,
+			)
+
+			processed.add(commit.hash)
+			count++
+		}
+
+		if (count > 0) {
+			refs[branch] = [...processed]
+			this.saveIndexedRefs(refs)
+		}
+
+		return count
+	}
+
+	// -------------------------------------------------------------------------
+	// All-branch reindex
+	// -------------------------------------------------------------------------
+
+	/**
+	 * Re-index all pi-brain branches. Idempotent — already-processed commits
+	 * are skipped. Returns the total count of newly ingested entities.
+	 */
+	reindexAll = async (): Promise<number> => {
+		const branches = listBranches(this.memoryDir)
+		if (branches.length === 0) return 0
+
+		const counts = await Promise.all(branches.map((branch) => this.limit(() => this.indexBranch(branch))))
+		return counts.reduce((sum, n) => sum + n, 0)
+	}
+
+	// -------------------------------------------------------------------------
+	// Chokidar watch
+	// -------------------------------------------------------------------------
+
+	/**
+	 * Start watching all commits.md files for changes. When pi-brain writes a new
+	 * commit the indexer automatically processes it.
+	 *
+	 * The provided callback receives the branch name and count of new entities each
+	 * time new commits are indexed.
+	 */
+	watch = (onChange?: (branch: string, newCount: number) => void): void => {
+		if (this.watcher) return
+
+		const pattern = join(this.memoryDir, "branches", "**", "commits.md")
+		this.watcher = chokidar.watch(pattern, { ignoreInitial: true, persistent: false })
+
+		this.watcher.on("change", (filePath: string) => {
+			// Extract branch name from path: .memory/branches/<branch>/commits.md
+			const parts = (filePath as string).split(/[/\\]/)
+			const branchesIdx = parts.lastIndexOf("branches")
+			if (branchesIdx === -1 || branchesIdx + 1 >= parts.length) return
+			const branch = parts[branchesIdx + 1]
+			const count = this.indexBranch(branch)
+			if (count > 0 && onChange) onChange(branch, count)
+		})
+	}
+
+	/**
+	 * Stop watching. Safe to call when no watcher is active.
+	 */
+	stopWatch = (): void => {
+		if (this.watcher) {
+			void this.watcher.close()
+			this.watcher = null
+		}
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Helpers
+// ---------------------------------------------------------------------------
+
+/**
+ * Extract keyword tags from commit content + branch name.
+ * Keeps words > 3 chars, lowercased, deduped, max 20 tags.
+ */
+const STOP = new Set([
+	"the",
+	"and",
+	"for",
+	"are",
+	"was",
+	"has",
+	"have",
+	"been",
+	"will",
+	"this",
+	"that",
+	"with",
+	"from",
+	"they",
+	"not",
+	"but",
+	"its",
+	"into",
+	"more",
+	"also",
+	"some",
+	"than",
+	"then",
+	"when",
+	"where",
+	"what",
+	"which",
+	"how",
+	"would",
+])
+
+const extractTagsFromContent = (content: string, branch: string): string[] => {
+	const branchParts = branch
+		.replace(/[-_]/g, " ")
+		.split(" ")
+		.filter((t) => t.length > 2)
+
+	const tokens = content
+		.toLowerCase()
+		.replace(/[^a-z0-9\s]/g, " ")
+		.split(/\s+/)
+		.filter((t) => t.length > 3 && !STOP.has(t))
+
+	const all = [...new Set([...branchParts, ...tokens])]
+	all.sort((a, b) => b.length - a.length)
+	return all.slice(0, 20)
+}
+
+const parseTimestamp = (ts: string): number => {
+	const d = new Date(ts)
+	return Number.isNaN(d.getTime()) ? Date.now() : d.getTime()
+}
diff --git a/packages/zosma-mem/src/ingestion/index.ts b/packages/zosma-mem/src/ingestion/index.ts
index d929915..cea16f0 100644
--- a/packages/zosma-mem/src/ingestion/index.ts
+++ b/packages/zosma-mem/src/ingestion/index.ts
@@ -1 +1,3 @@
 export { ingest } from "./ingest.js"
+export { CommitIndexer } from "./commit-indexer.js"
+export type { IndexerConfig } from "./commit-indexer.js"
diff --git a/packages/zosma-mem/src/retrieval/retrieve.ts b/packages/zosma-mem/src/retrieval/retrieve.ts
index 4f699f0..e599d9e 100644
--- a/packages/zosma-mem/src/retrieval/retrieve.ts
+++ b/packages/zosma-mem/src/retrieval/retrieve.ts
@@ -23,7 +23,13 @@ export const retrieve = (
 	topK = 5,
 ): ScoredEntity[] => {
 	const nowFn = config.now ?? Date.now
-	const taskTerms = new Set(query.taskDescription.toLowerCase().split(/\s+/))
+	const taskTerms = new Set(
+		query.taskDescription
+			.toLowerCase()
+			.split(/\s+/)
+			.map((t) => t.replace(/[^a-z0-9]/g, ""))
+			.filter((t) => t.length > 0),
+	)
 	// Intent tags (e.g. ["auth", "session"]) get a higher weight — they are
 	// explicit signals about what the agent is working on right now.
 	const intentTags: Set<string> = query.intent
diff --git a/packages/zosma-mem/src/types.ts b/packages/zosma-mem/src/types.ts
index 14b7106..b33bb18 100644
--- a/packages/zosma-mem/src/types.ts
+++ b/packages/zosma-mem/src/types.ts
@@ -64,6 +64,12 @@ export interface GcReport {
 
 export interface MemoryEngine {
 	ingest: (event: MemoryEvent) => Promise<void>
+	/**
+	 * Re-index all pi-brain branches in .memory/branches/.
+	 * Idempotent — already-processed commits are skipped.
+	 * Returns the number of newly ingested entities.
+	 */
+	reindex: () => Promise<number>
 	retrieve: (query: AttentionQuery, topK?: number) => Promise<ScoredEntity[]>
 	recordRead: (entityId: string) => Promise<void>
 	recordIgnoredRead: (entityId: string) => Promise<void>