stackmemoryai
diff --git a/‎README.md‎
Lines changed: 33 additions & 0 deletions b/‎README.md‎
Lines changed: 33 additions & 0 deletions
diff --git a/‎docs/SETUP.md‎
Lines changed: 41 additions & 0 deletions b/‎docs/SETUP.md‎
Lines changed: 41 additions & 0 deletions
diff --git a/‎docs/mcp.md‎
Lines changed: 168 additions & 0 deletions b/‎docs/mcp.md‎
Lines changed: 168 additions & 0 deletions
diff --git a/‎package.json‎
Lines changed: 3 additions & 1 deletion b/‎package.json‎
Lines changed: 3 additions & 1 deletion
diff --git a/‎scripts/demos/ralph-integration-demo.ts‎
Lines changed: 14 additions & 13 deletions b/‎scripts/demos/ralph-integration-demo.ts‎
Lines changed: 14 additions & 13 deletions
@@ -97,6 +97,38 @@ Frames can span:
 
 Runs as an MCP server. Editors (e.g., Claude Code) call StackMemory on each interaction to fetch a compiled context bundle; editors don’t store memory themselves.
 
+### MCP Quick Usage
+
+Send these JSON payloads as MCP `tools/call` requests from Claude Code. Each response is returned as a single `text` content item whose value is a JSON string.
+
+- Plan only (no code):
+  ```json
+  {"method":"tools/call","params":{"name":"plan_only","arguments":{"task":"Refactor config loader","plannerModel":"claude-3-5-sonnet-latest"}}}
+  ```
+
+- Approval‑gated plan (phase 1):
+  ```json
+  {"method":"tools/call","params":{"name":"plan_gate","arguments":{"task":"Refactor config loader","compact":true}}}
+  ```
+
+- Approve + execute (phase 2):
+  ```json
+  {"method":"tools/call","params":{"name":"approve_plan","arguments":{"approvalId":"<copy from plan_gate>","implementer":"codex","execute":true,"recordFrame":true,"compact":true}}}
+  ```
+
+- Manage approvals:
+  ```json
+  {"method":"tools/call","params":{"name":"pending_list","arguments":{}}}
+  {"method":"tools/call","params":{"name":"pending_show","arguments":{"approvalId":"<id>","compact":true}}}
+  {"method":"tools/call","params":{"name":"pending_clear","arguments":{"approvalId":"<id>"}}}
+  ```
+
+Env defaults (optional):
+- `STACKMEMORY_MM_PLANNER_MODEL` (e.g., `claude-3-5-sonnet-latest` or `claude-3-opus-latest`)
+- `STACKMEMORY_MM_REVIEWER_MODEL` (defaults to the planner model if unset)
+- `STACKMEMORY_MM_IMPLEMENTER` (`codex` or `claude`)
+- `STACKMEMORY_MM_MAX_ITERS` (e.g., `2`)
+
 ---
 
 ## Quick Start
@@ -386,5 +418,6 @@ See https://github.com/stackmemoryai/stackmemory/blob/main/docs/roadmap.md for o
 - [Product Requirements](./PRD.md) - Detailed product specifications
 - [Technical Architecture](./TECHNICAL_ARCHITECTURE.md) - System design and database schemas
 - [Beads Integration](./BEADS_INTEGRATION.md) - Git-native memory patterns from Beads ecosystem
+- [MCP: plan_and_code](https://github.com/stackmemoryai/stackmemory/blob/main/docs/mcp.md) - Trigger planning + coding via MCP with JSON results
 
 ---
@@ -62,6 +62,47 @@ stackmemory init --chromadb
 | `linear_update_task` | Update Linear issue                        |
 | `linear_get_tasks`   | Get tasks from Linear                      |
 
+### Quick: plan_and_code (planning + coding)
+
+- Trigger a full plan → implement → critique loop and get a single JSON result.
+- Tool: `plan_and_code`
+- Args:
+  - `task`: short description
+  - `implementer`: `codex` (default) or `claude`
+  - `maxIters`: maximum retry-loop iterations (default 2)
+  - `execute`: `true` to actually call the implementer (otherwise dry‑run)
+  - `record`: write plan/critique as simple context rows
+  - `recordFrame`: write a real frame + anchors
+- Env defaults: `STACKMEMORY_MM_PLANNER_MODEL`, `STACKMEMORY_MM_REVIEWER_MODEL`, `STACKMEMORY_MM_IMPLEMENTER`, `STACKMEMORY_MM_MAX_ITERS`
+
+Example request (tools/call):
+
+```json
+{
+  "method": "tools/call",
+  "params": {
+    "name": "plan_and_code",
+    "arguments": {
+      "task": "Refactor config loader into provider pattern",
+      "implementer": "codex",
+      "maxIters": 2,
+      "execute": true,
+      "recordFrame": true
+    }
+  }
+}
+```
+
+CLI equivalents for quick checks:
+
+```bash
+# Quiet JSON (UI-friendly)
+stackmemory mm-spike --task "Refactor config loader" --json
+
+# Execute implementer and record as frame
+stackmemory skills spike --task "Refactor" --execute --max-iters 3 --json --record-frame
+```
+
 ## Open-Source Local Mode
 
 ### Step 1: Clone & Build
 
@@ -0,0 +1,168 @@
+# MCP: plan_and_code Tool
+
+The `plan_and_code` MCP tool lets Claude Code trigger StackMemory’s multi‑agent flow silently and receive a single JSON result. It plans with Claude, implements with Codex or Claude, and critiques the result — with optional retry loops and context recording.
+
+## What it does
+- Planner (Claude): generates a concise plan with acceptance criteria and risks.
+- Implementer (Codex/Claude): applies a focused change per step.
+- Critic (Claude): returns `{ approved, issues[], suggestions[] }` to gate retries.
+- Returns a single JSON payload: `{ plan, implementation, critique, iterations[] }`.
+
+## Tool definition
+- name: `plan_and_code`
+- arguments:
+  - `task` (string, required): short task description
+  - `implementer` ("codex" | "claude", default: `codex`)
+  - `maxIters` (number, default: `2`): retry loop iterations
+  - `execute` (boolean, default: `false`): if `false`, the implementer runs as a dry‑run
+  - `record` (boolean, default: `false`): write plan/critique as simple context rows
+  - `recordFrame` (boolean, default: `false`): write a real frame + anchors
+
+## Environment defaults
+If not specified in arguments, the MCP handler reads these env vars:
+- `STACKMEMORY_MM_PLANNER_MODEL` (e.g., `claude-3-5-sonnet-latest`)
+- `STACKMEMORY_MM_REVIEWER_MODEL` (defaults to planner model if unset)
+- `STACKMEMORY_MM_IMPLEMENTER` (`codex` or `claude`)
+- `STACKMEMORY_MM_MAX_ITERS` (e.g., `3`)
+
+## Example (MCP request)
+```json
+{
+  "method": "tools/call",
+  "params": {
+    "name": "plan_and_code",
+    "arguments": {
+      "task": "Refactor config loader into provider pattern",
+      "implementer": "codex",
+      "maxIters": 2,
+      "execute": true,
+      "recordFrame": true
+    }
+  }
+}
+```
+
+Response content is a single `text` item containing a JSON string:
+```json
+{
+  "ok": true,
+  "result": {
+    "plan": { "summary": "...", "steps": [ ... ], "risks": [ ... ] },
+    "implementation": { "success": true, "summary": "...", "commands": [ ... ] },
+    "critique": { "approved": true, "issues": [], "suggestions": [] },
+    "iterations": [
+      { "command": "...", "ok": true, "outputPreview": "...", "critique": { ... } }
+    ]
+  }
+}
+```
+
+## Recording behavior
+- `record: true` writes two entries into `.stackmemory/context.db` (simple `contexts` table):
+  - `Plan: <summary>` (importance 0.8)
+  - `Critique: approved|needs_changes` (importance 0.6)
+- `recordFrame: true` writes a real frame + anchors using the FrameManager:
+  - Frame: `Plan & Code: <task>`
+  - Anchors: `DECISION` (plan summary), `FACT` (commands), `RISK` (first few issues), `TODO` (first few suggestions)
+  - Closes the frame with `{ approved: true|false }`
+- Both modes are best‑effort: if the DB isn’t ready, the handler still returns the JSON result instead of failing.
+
+## Notes
+- Implementer `codex` calls `codex-sm` (must be on PATH). Use `--execute` in CLI, or `execute: true` in MCP, to actually run it; otherwise it’s a dry‑run.
+- Audit files are saved to `.stackmemory/mm-spike/spike-<timestamp>.json` to support review/debugging.
+- You can compare models:
+  - Planner/critic: override with `STACKMEMORY_MM_PLANNER_MODEL` / `STACKMEMORY_MM_REVIEWER_MODEL`.
+  - Implementer: set to `claude` to A/B against Codex, or keep `codex` (default).
+
+## CLI equivalents (for quick checks)
+- Quiet JSON output:
+  - `stackmemory mm-spike --task "Refactor config loader" --json`
+  - `stackmemory skills spike --task "Refactor config loader" --json`
+- Execute implementer and record as frame:
+  - `stackmemory skills spike --task "Refactor" --execute --max-iters 3 --json --record-frame`
+
+---
+
+## Approval‑Gated Flow (plan_gate → approve_plan)
+
+Use this two‑phase flow when you want the plan reviewed before any code runs.
+
+### Phase 1: plan_gate
+
+Request (tools/call):
+
+```json
+{
+  "method": "tools/call",
+  "params": {
+    "name": "plan_gate",
+    "arguments": {
+      "task": "Refactor config loader into provider pattern",
+      "plannerModel": "claude-3-5-sonnet-latest"
+    }
+  }
+}
+```
+
+Response (content[0].text is a JSON string):
+
+```json
+{
+  "ok": true,
+  "approvalId": "appr_1738612345678_ab12cd",
+  "plan": { "summary": "...", "steps": [ ... ], "risks": [ ... ] }
+}
+```
+
+Render `plan` for review; store `approvalId` for Phase 2.
+
+### Phase 2: approve_plan
+
+Request (tools/call):
+
+```json
+{
+  "method": "tools/call",
+  "params": {
+    "name": "approve_plan",
+    "arguments": {
+      "approvalId": "appr_1738612345678_ab12cd",
+      "implementer": "codex",
+      "maxIters": 2,
+      "execute": true,
+      "recordFrame": true
+    }
+  }
+}
+```
+
+Response (content[0].text is a JSON string):
+
+```json
+{
+  "ok": true,
+  "approvalId": "appr_1738612345678_ab12cd",
+  "result": {
+    "plan": { ... },
+    "implementation": { "success": true, "commands": [ ... ] },
+    "critique": { "approved": true, "issues": [], "suggestions": [] },
+    "iterations": [ { "command": "...", "ok": true, "critique": { ... } } ]
+  }
+}
+```
+
+Notes:
+- `recordFrame: true` creates a real StackMemory frame + anchors (plan summary, commands, issues, suggestions).
+- `execute: true` actually invokes the implementer; otherwise it’s a dry‑run.
+- Approval IDs are persisted to `.stackmemory/mm-spike/pending.json` so editor restarts don’t lose pending approvals.
+
+### Optional helper tools
+- `plan_only`: Returns a plan JSON without running code.
+- `call_claude`: Calls Claude directly (prompt/model/system).
+- `call_codex`: Calls Codex via `codex-sm` (prompt/args/execute).
+- `pending_list`: Lists pending approval-gated plans with `approvalId`, `task`, and `createdAt`. Supports optional filters:
+  - `{ taskContains: "refactor", sort: "desc", limit: 10 }`
+  - `{ olderThanMs: 3600000 }` (older than 1 hour)
+  - `{ newerThanMs: 600000 }` (newer than 10 minutes)
+- `pending_clear`: Clears pending approvals. Args: `{ approvalId }`, or `{ all: true }`, or `{ olderThanMs: <ms> }`.
+- `pending_show`: Returns a stored pending plan by `{ approvalId }`.
@@ -87,7 +87,9 @@
     "sync:start": "node scripts/background-sync-manager.js",
     "sync:setup": "./scripts/setup-background-sync.sh",
     "prepare": "echo 'Prepare step completed'",
-    "verify:dist": "node scripts/verify-dist.cjs"
+    "verify:dist": "node scripts/verify-dist.cjs",
+    "rebuild:native": "npm rebuild better-sqlite3 || true",
+    "deps:reset": "rm -rf node_modules package-lock.json && npm ci"
   },
   "dependencies": {
     "@anthropic-ai/sdk": "^0.71.2",
 
@@ -5,7 +5,6 @@
  */
 
 import { RalphStackMemoryBridge } from './bridge/ralph-stackmemory-bridge.js';
-import { logger } from '../../core/monitoring/logger.js';
 import { RalphStackMemoryConfig } from './types.js';
 
 class RalphIntegrationDemo {
@@ -60,9 +59,12 @@ class RalphIntegrationDemo {
       await this.demonstrateMetrics();
 
       console.log('\n✅ Demo completed successfully!\n');
-    } catch (error: any) {
-      console.error('\n❌ Demo failed:', error.message);
-      throw error;
+    } catch (err: unknown) {
+      console.error(
+        '\n❌ Demo failed:',
+        err instanceof Error ? err.message : err
+      );
+      throw err;
     } finally {
       await this.cleanup();
     }
@@ -158,9 +160,6 @@ class RalphIntegrationDemo {
     console.log('\n🚑 Phase 3: Crash Recovery');
     console.log('===========================');
 
-    // Simulate getting session ID
-    const sessionId = 'demo-session-123';
-
     try {
       console.log('🔄 Simulating session rehydration...');
 
@@ -177,8 +176,10 @@ class RalphIntegrationDemo {
       console.log('  - State reconciled: 0.3s');
       console.log('  - Memory usage: 45MB');
       console.log('  - Cache hit rate: 78%');
-    } catch (error: any) {
-      console.log(`⚠️  Recovery simulation: ${error.message}`);
+    } catch (err: unknown) {
+      console.log(
+        `⚠️  Recovery simulation: ${err instanceof Error ? err.message : err}`
+      );
     }
   }
 
@@ -227,10 +228,10 @@ async function main() {
 
   try {
     await demo.run();
-  } catch (error: any) {
-    console.error('Demo failed:', error.message);
-    if (process.env.DEBUG) {
-      console.error(error.stack);
+  } catch (err: unknown) {
+    console.error('Demo failed:', err instanceof Error ? err.message : err);
+    if (process.env.DEBUG && err instanceof Error) {
+      console.error(err.stack);
     }
     process.exit(1);
   }