stackmemoryai · jonathanpeterwu · Jun 9, 2026 · May 5, 2026 · May 8, 2026 · May 9, 2026
diff --git a/.claude/skills/instrument-agent b/.claude/skills/instrument-agent
@@ -0,0 +1 @@
+../../.agents/skills/instrument-agent
diff --git a/.claude/skills/setup-agent-replay b/.claude/skills/setup-agent-replay
@@ -0,0 +1 @@
+../../.agents/skills/setup-agent-replay
diff --git a/.codex/config.toml b/.codex/config.toml
@@ -0,0 +1,3 @@
+[mcp_servers.raindrop]
+command = "/Users/jwu/.raindrop/bin/raindrop"
+args = [ "workshop", "mcp" ]
diff --git a/.cursor/mcp.json b/.cursor/mcp.json
@@ -0,0 +1,11 @@
+{
+  "mcpServers": {
+    "raindrop": {
+      "command": "/Users/jwu/.raindrop/bin/raindrop",
+      "args": [
+        "workshop",
+        "mcp"
+      ]
+    }
+  }
+}
diff --git a/.mcp.json b/.mcp.json
@@ -0,0 +1,11 @@
+{
+  "mcpServers": {
+    "raindrop": {
+      "command": "/Users/jwu/.raindrop/bin/raindrop",
+      "args": [
+        "workshop",
+        "mcp"
+      ]
+    }
+  }
+}
diff --git a/CLAUDE.md b/CLAUDE.md
@@ -1,38 +1,27 @@
-# StackMemory - Project Configuration
+You are a senior Node.js/Express engineer working on this codebase. Write working code over explanations. Run commands before asserting state — never assume branch, file, or test status without verification.
+
+# croissant.ai — Agent Guide
+
+Tool-agnostic reference for AI coding agents working in this repository.
+
+## Stack
+
+Node.js / Express / PostgreSQL / Redis
+Railway deployment | Stripe / Salesforce / QuickBooks integrations
 
 ## Project Structure
 
 ```
 src/
-  cli/             # CLI commands and entry point
-  core/            # Core business logic
-    config/        # Config types and manager
-    context/       # Frame management, enrichment, rehydration
-    database/      # SQLite adapter, migrations, query cache
-    digest/        # Digest generation (hybrid, chronological)
-    errors/        # Error types and recovery
-    merge/         # Stack merge and conflict resolution
-    models/        # Model routing, complexity scoring
-    monitoring/    # Logging, metrics, session monitor
-    performance/   # Caching, profiling, benchmarks
-    query/         # Query parsing and routing
-    retrieval/     # Context retrieval, LLM provider
-    session/       # Handoff, session management
-    skills/        # Skill storage and types
-    storage/       # Tiered storage, remote sync
-    trace/         # Debug tracing, trace detection
-  integrations/    # External integrations
-    claude-code/   # Agent bridge, post-task hooks
-    linear/        # Linear sync, webhooks, OAuth
-    mcp/           # MCP server, 56 tool handlers
-    ralph/         # Multi-agent swarm orchestration
-  daemon/          # Unified daemon, session daemon
-  features/        # Analytics, browser, sweep, TUI
-  hooks/           # Claude Code hook handlers
-  skills/          # Built-in skill implementations
-  utils/           # Shared utilities
-scripts/           # Build and utility scripts
-docs/              # Documentation
+  api/          # Route handlers
+  core/         # monitoring-service, cache-service, queue-service, master-agent, api-validation
+  features/     # Feature modules
+  shared/       # Shared utilities
+  integrations/ # Third-party connectors
+docs/           # Documentation
+scripts/        # Automation scripts
+docker/         # Container configs
+prompts/        # Externalized LLM prompt templates
 ```
 
 ## Key Files
@@ -69,81 +58,64 @@ Full documentation (docs/):
 ## Commands
 
 ```bash
-npm run build          # Compile TypeScript (esbuild)
-npm run lint           # ESLint check
-npm run lint:fix       # Auto-fix lint issues
-npm run lint:fast      # Fast lint via oxlint
-npm run typecheck      # tsc --noEmit (8GB heap, avoids OOM)
-npm test               # Run Vitest (watch)
-npm run test:run       # Run tests once
-npm run linear:sync    # Sync with Linear
-
-# StackMemory CLI
-stackmemory capture    # Save session state for handoff
-stackmemory restore    # Restore from captured state
-stackmemory snapshot save  # Post-run context snapshot (alias: snap)
-stackmemory snapshot list  # List recent snapshots
-stackmemory preflight      # File overlap check for parallel tasks (alias: pf)
-stackmemory conductor start    # Autonomous Linear→worktree→agent orchestrator
-stackmemory conductor learn    # Analyze agent outcomes (success rate, failure phases, error patterns)
-stackmemory conductor learn --evolve  # Auto-mutate prompt template from failure data (GEPA)
-stackmemory conductor status   # Live agent status dashboard
-
-# GEPA Optimizer (scripts/gepa/optimize.js)
-node scripts/gepa/optimize.js run [gens] [--auto-apply]  # Full optimization loop
-node scripts/gepa/optimize.js score [--auto-apply]        # Score variants, select best
-node scripts/gepa/optimize.js run --target skill:start     # Optimize specific target
-node scripts/gepa/optimize.js mutate --auto-phase          # Auto-detect worst phase
-# Flags: --auto-apply (deploy winner), --no-cache (fresh eval), --target <name>, --phase <name>
-stackmemory conductor monitor  # Real-time TUI with phase tracking
-stackmemory conductor finalize # Clean up dead/stale agents
-stackmemory conductor traces <issue-id>  # View conversation traces for an agent run
-stackmemory conductor replay <session-id> # Replay full agent conversation from traces
-stackmemory conductor trace-stats         # Aggregate trace statistics
-stackmemory loop "<cmd>" --until "<pattern>"  # Poll until condition met (alias: watch)
+npm run dev       # Start dev server
+npm run test      # Run test suites (3 parallel Jest workers, maxWorkers=4)
+npm run lint      # Lint check
+npm run migrate   # Run DB migrations
+docker-compose up -d   # Start local DBs
 ```
 
-## Working Directory
+## Git Conventions
+
+- Branch prefixes: `feature/`, `fix/`, `chore/`
+- Commit format: `type(scope): message`
+- Do NOT add `Co-Authored-By` lines to commits
+- Pre-commit hook runs: `npm run lint` + `npm run test` + E2E browser screenshots
+
+## Testing Rules
 
-- PRIMARY: /Users/jwu/Dev/stackmemory
-- ALLOWED: All subdirectories
-- TEMP: /tmp for temporary operations
+- **Framework**: Jest + SWC
+- **DB mocking**: Use dependency injection (DI), not global mocks
+- **Supertest**: Pass `app` (NOT `server`) to supertest
+- **Global jest**: src/ tests use global `jest` — do NOT import from `@jest/globals` (causes redeclaration errors)
+- **Mock reset**: `jest.clearAllMocks()` only clears call history; `jest.resetAllMocks()` (or `resetMocks: true` in the Jest config) also wipes `mockReturnValue` — always re-set mocks in `beforeEach`
+- **Test runner**: `npm test` is long-running; run in a background process or sub-agent, not inline
 
-## Validation
+## ESLint Rules
 
-Verify each step after code changes — pre-commit hooks catch 80% of CI failures locally:
-1. `npm run lint` - fix any errors AND warnings
-2. `npm run test:run` - verify no regressions
-3. `npm run build` - ensure compilation
-4. Run code to verify it works
+- Use `catch {}` not `catch (_err) {}` — underscore prefix not in the allowed pattern
+- CJS format for JS files in `src/`
 
-Test coverage:
-- New features require tests in `src/**/__tests__/`
-- Maintain or improve coverage (no untested code paths)
-- Critical paths: context management, handoff, Linear sync
+## Key Patterns
 
-Testing rules:
-- Run `npm run test:run` via subagent or background task — never inline (blocks context)
-- ESLint: use `catch {}` not `catch (_err) {}` (lint rule)
-- `vi.clearAllMocks()` resets `mockReturnValue` — re-set mocks in `beforeEach`
-- Pre-commit hook runs: lint + parallel vitest + build — fix issues before commit, never skip
+- Provenance tracking: every data point includes source, timestamp, lineage
+- Multi-tenant container isolation
+- DI route factories for testability
+- Error handling: prefer returning `undefined` over throwing, and logging and continuing over crashing
+- Add `.js` extension to relative ESM imports
 
-## Git Rules
+## Task Steering
 
-The pre-commit hook enforces lint + test + build. Fix the underlying issue rather than bypassing it.
+**`master-tasks.md`** is the single source of truth for what to build. Agents must:
 
-- Do not use `--no-verify` on git push or commit — fix the hook failure instead
-- Fix lint/test errors before pushing
-- If pre-push hooks fail, fix the underlying issue
-- Run `npm run lint && npm run test:run` before pushing
-- Commit message format: `type(scope): message`
-- Branch naming: `feature/STA-XXX-description` | `fix/STA-XXX-description` | `chore/description`
+1. Read `master-tasks.md` before starting work (especially when work is picked up via `/next`)
+2. Pick the highest-priority (`P0` > `P1` > `P2`) non-blocked `todo` task
+3. Prefer tasks with `owner=@agent` over `owner=@me` (unless user overrides)
+4. Update task status to `active` when starting, `done` when complete
+5. Add branch/PR info to the table row
+6. Never create tasks in Linear or GitHub unless `sync` column says so
 
-## Task Management
+## StackMemory Context Rule
 
-- Use TodoWrite for 3+ steps or multiple requests
-- Keep one task in_progress at a time
-- Update task status immediately on completion
+- When an agent fetches conversation context for active work, it must pass the exact current assignment or question as `task_query`.
+- Prefer the MCP shape:
+  - `org_id`
+  - `conversation_id`
+  - `worker_mode: true`
+  - `task_query`
+  - `recover_on_low_signal: true`
+- Do not fetch raw `get_conversation` context for worker execution unless full transcript behavior is explicitly required.
+- The current assignment is persisted under `.stackmemory/worker-context/current-assignment.json` so wrappers and hooks can auto-fill or enforce `task_query`.
 
 ## Security
 

diff --git a/docs/plans/webhook-retry-exponential-backoff.md b/docs/plans/webhook-retry-exponential-backoff.md
@@ -0,0 +1,94 @@
+# Plan: Webhook Retry with Exponential Backoff
+
+## Summary
+
+Add persistent retry with exponential backoff to webhook event processing. Replace the in-memory `eventQueue` in `webhook-server.ts` with a SQLite-backed delivery queue that tracks attempts, applies exponential backoff with jitter, and respects circuit breaker state.
+
+## Existing Infrastructure to Leverage
+
+- **`src/core/errors/recovery.ts`**: `retry()`, `calculateBackoff()`, `CircuitBreaker` — all production-ready
+- **`src/integrations/linear/webhook-server.ts`**: Current in-memory queue (`eventQueue[]`, `processQueue()`)
+- **`src/core/database/sqlite-adapter.ts`**: SQLite persistence layer
+- **Error codes**: `LINEAR_WEBHOOK_FAILED`, `LINEAR_API_ERROR` already exist
+
+## Files to Change
+
+| File | Action | Purpose |
+|---|---|---|
+| `src/integrations/linear/webhook-retry.ts` | CREATE | Delivery queue + retry worker |
+| `src/integrations/linear/webhook-server.ts` | MODIFY | Replace in-memory queue with persistent queue |
+| `src/integrations/linear/__tests__/webhook-retry.test.ts` | CREATE | Tests for retry logic |
+
+## Data Model
+
+New table: `webhook_deliveries` (added inline in webhook-retry.ts, not in global migrations — this is integration-scoped)
+
+```sql
+CREATE TABLE IF NOT EXISTS webhook_deliveries (
+  id TEXT PRIMARY KEY,
+  event_type TEXT NOT NULL,
+  payload TEXT NOT NULL,
+  status TEXT NOT NULL DEFAULT 'pending',  -- pending | processing | completed | failed | dead
+  attempts INTEGER NOT NULL DEFAULT 0,
+  max_attempts INTEGER NOT NULL DEFAULT 5,
+  next_retry_at INTEGER,                   -- unix ms
+  last_error TEXT,
+  created_at INTEGER NOT NULL,
+  updated_at INTEGER NOT NULL
+);
+CREATE INDEX IF NOT EXISTS idx_webhook_deliveries_status_retry
+  ON webhook_deliveries(status, next_retry_at);
+```
+
+## Implementation Steps
+
+### Step 1: Create `webhook-retry.ts`
+
+- `WebhookDeliveryQueue` class
+  - `constructor(dbPath: string, options?: RetryConfig)` — opens/creates SQLite DB, ensures table
+  - `enqueue(eventType: string, payload: object): string` — inserts delivery, returns ID
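+  - `processNext(): Promise<boolean>` — picks the oldest `pending` or retriable `failed` delivery that is due (`next_retry_at IS NULL OR next_retry_at <= now`; the column is nullable, so the comparison alone would skip rows with no retry time set), marks it `processing`, calls the handler, then updates the status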
+  - `startWorker(intervalMs?: number): void` — setInterval loop calling `processNext()`
+  - `stopWorker(): void` — clearInterval
+  - `getStats(): { pending, processing, completed, failed, dead }` — counts by status
+- Uses `calculateBackoff()` from `recovery.ts` for next_retry_at computation
+- Marks delivery `dead` after max_attempts exceeded
+- Config: `{ maxAttempts: 5, initialDelay: 1000, maxDelay: 300_000, backoffFactor: 2 }`
+
+### Step 2: Modify `webhook-server.ts`
+
+- Replace `eventQueue: LinearWebhookPayload[]` with `WebhookDeliveryQueue` instance
+- In webhook endpoint handler: call `queue.enqueue()` instead of `eventQueue.push()`
+- Start worker in `start()`, stop in `stop()`
+- Remove `processQueue()` method and `isProcessing` flag
+
+### Step 3: Write tests
+
+- Unit tests for `WebhookDeliveryQueue`:
+  - enqueue creates a delivery record
+  - processNext picks the oldest pending delivery
+  - failed delivery gets exponential backoff schedule
+  - delivery marked dead after max_attempts
+  - concurrent processNext doesn't double-process (status = processing guard)
+  - getStats returns correct counts
+
+## Acceptance Criteria
+
+- [x] Failed webhook events are retried up to 5 times with exponential backoff
+- [x] Backoff schedule (base delays, before jitter): 1s, 2s, 4s, 8s, 16s (each delay capped at 300s)
+- [x] Delivery state persisted in SQLite — survives process restart
+- [x] Dead deliveries (exceeded max attempts) are logged but not retried
+- [x] Existing webhook signature verification unchanged
+- [x] Tests pass with 80%+ coverage on new code
+
+## Risks
+
+- **LOW**: SQLite write contention if webhook volume is high — mitigated by WAL mode (already used)
+- **LOW**: Worker interval drift — acceptable for webhook retry cadence (not real-time)
+
+## Non-Goals
+
+- Redis/BullMQ queue (overkill for single-process webhook handler)
+- Webhook delivery UI/dashboard
+- Dead letter queue notification
+- Outbound webhook sending (this is for processing *received* webhooks)