Compare commits

...

24 Commits

Author SHA1 Message Date
6fde7002aa docs: boocode-lift-analysis, openspec change docs, codesight cache, deps
- Add boocode-lift-analysis.md: comprehensive 30-repo lift matrix across 25 domains
- Add openspec/ change docs: domain2-code-intelligence, domain3-multi-agent, impeccable-wave, streaming-codeblocks
- Update .gitignore: .impeccable/, .omo/, bun.lock, DESIGN.md, PRODUCT.md
- Update dependencies in package.json + pnpm-lock.yaml
- Update .codesight/ analysis cache
2026-06-08 03:49:26 +00:00
50de80ee75 feat(web): workspace components — ComparePane, Memory page, McpDialog, error boundaries, message-parts
- Add ComparePane.tsx: side-by-side AI response comparison
- Add Memory.tsx: memory management page with CRUD UI
- Add McpPermissionDialog.tsx: MCP tool permission approval dialog
- Add McpResponseDisplay.tsx: MCP response visualization
- Add MessageBoundary.tsx + MessageListErrorBoundary.tsx: error resilience
- Add EmptyState.tsx: contextual empty state component
- Add KeyboardShortcutsDialog.tsx: keyboard shortcut reference
- Add message-parts/: ActionRow, CompactCard, MistakeRecoverySentinel, ReasoningBlock, SendToTerminalMenu, StatsLine, SummaryCard
- Add useDraftPersistence.ts: draft message persistence hook
- Add useTerminals.ts: terminal session management hook
- Add keyboard-shortcuts.ts + tool-utils.ts: shared utilities
- Extend components: ChatInput, MessageBubble, MessageList, Workspace, panes
- Extend hooks: useTerminalSocket, useSessionStream test suite
- Update pages: Home, Project — workspace layout and session flow
2026-06-08 03:49:22 +00:00
51733c1338 feat(contracts): ws-frames and message-metadata extensions
- Extend WsFrameSchema: new frame types for memory, state-graph events
- Extend MessageMetadata: AgentSessionConfig, ErrorReason variants
2026-06-08 03:49:06 +00:00
fa07b01567 feat(booterm): PTY session metadata, terminal registry, WS attach enhancements
- Add PTY session metadata tracking (title, description, parent agent)
- Extend terminal registry: structured session metadata
- Extend WS attach: session-aware WebSocket lifecycle
- Extend routes: terminals and sessions with metadata
2026-06-08 03:49:02 +00:00
e2d6a6b6cd feat(coder): flow-runner decisions, conductor types, collision detection tests
- Add flow-runner-decisions.ts: decision-aware step execution
- Extend flow-runner.ts: dynamic step decisions
- Extend conductor types: additional flow state types
- Add collision-detector.test.ts: edit collision unit tests
- Add conflict-index.test.ts: conflict resolution index tests
2026-06-08 03:48:58 +00:00
381b97f78a feat(server): inference state-graph + supervisor, memory tools, MCP client, schema, routes
- Add state-graph.ts: typed state machine for inference lifecycle
- Add supervisor.ts: agent supervisor pattern for multi-agent coordination
- Add export-formatter.ts: structured export formatting
- Add manage_memory.ts: memory CRUD tool for agent persistence
- Add get_wiki_article.ts: codecontext wiki article retrieval
- Extend memory/index.ts: 3-tier memory (context/daily/core)
- Extend MCP client: mcp-config.ts env-var substitution
- Update schema.sql: agent_sessions, tasks, pending_changes extensions
- Update API types: MessageMetadata, ErrorReason, AgentSessionConfig
- Update routes: chats, messages, sessions — column renames and agent_session_id
- Update inference: error handler, payload builder, stream phase, turn orchestrator
2026-06-08 03:48:47 +00:00
9e2b0a7dc0 docs: guidance audit — refusals up front, version anchors, failure modes, resolution order, drift guards
Apply 7 proposed edits from guidance improver audit:
- CLAUDE.md: refusal rails up front, version anchor, resolution order
- BOOCHAT.md: resolution order section
- BOOCODER.md: tool reliability callouts
- data/AGENTS.md: tool list drift guard, failure modes preamble
2026-06-08 03:20:33 +00:00
51f2f4284f docs: changelog + roadmap for v2.8.19-v2.8.20 2026-06-08 03:14:46 +00:00
45a1140fd3 feat: phase 3-5 — workflow engine, background subagents, multi-modal, cache shape, inline diff
Phase 3: Dynamic Workflow Engine
- VM sandbox (node:vm) with agent/parallel/pipeline API, Claude Code compatible
- Workflow file discovery (.boocode/workflows/*.js + ~/.boocode/workflows/*.js)
- Workflow manager with session/chat creation and inference dispatch
- Built-in catalog: deep-research, review-code, find-issues
- Resumability cache: SHA-256 hash of agent spec, in-memory Map

Phase 4: Background Subagents
- background-task.ts service: spawn/poll/cancel lifecycle
- spawn_subagent, subagent_status, subagent_result tools in ALL_TOOLS

Phase 5: Multi-modal + Cache Shape
- Multi-modal stub with type defs and hook point in payload.ts
- CacheShapeBadge component in trace viewer (colored bar + %)
2026-06-08 03:11:39 +00:00
74da084521 feat(conductor): Wave 2 — parallel batch execution + SWITCH branching step
- Parallel batch execution: batch field on Step, batchConfig on Flow,
  batch-aware readySteps with maxConcurrent gating, getReadyInBatch helper
- SWITCH branching step: new 'switch' StepKind with cases/programmed conditions,
  resolveSwitch() pure function, switch-excluded steps tracked in
  SchedulerState, non-selected branches excluded from execution
2026-06-08 03:00:06 +00:00
c860b6c4b7 feat: Wave 1 complete — state machine, Paseo hub, collision detection, PTY search
- Task state machine: TIMED_OUT state, retriable steps, timeout detection
- Paseo hub: paseo-client.ts (HTTP+CLI), PaseoBackend (AgentBackend), 14 tests
- Collision detection: collision-detector.ts, conflict-index.ts, ws-frames type
- PTY search: ring buffer, search route, capture-pane fallback
2026-06-08 02:45:17 +00:00
c4ee377dbc feat(conductor): task state machine — TIMED_OUT state and retriable steps
- Add 'timed_out' to flow_runs/flow_steps CHECK constraints
- Add retry_count and max_retries columns to flow_steps
- Add timeout detection in advanceInner loop (configurable FLOW_STEP_TIMEOUT_MS)
- Add retriable logic: re-dispatch on timeout if maxRetries > 0 and retryCount < maxRetries
- Add isRetriable() + shouldRetry() pure decision functions
- Add timed_out handling to reconcileResumeStep and reconcileRun
- Add 'timed_out' to ws-frames enum, publishStep status type
2026-06-08 02:43:45 +00:00
f2401352a8 chore: update pnpm-lock.yaml for @ai-sdk/deepseek 2026-06-08 02:28:32 +00:00
abe9c5a3a8 feat: Paseo-like orchestrator Phase 1-2 — trace system, session persistence, timeline, run_command, auto-fix loop
Phase 1: Trace System + Observability
- tool_traces DB table + insert/update service
- tool_trace_start/tool_trace_finish WS frames (contracts + FE types)
- Instrumented tool-phase.ts with timing around every tool call
- GET /api/chats/:id/traces paginated endpoint
- Trace viewer frontend (collapsible panel with timing bars + token breakdown)

Phase 2: Session Persistence + Resume
- agent_snapshots table (UPSERT per chat, persisted on turn boundaries)
- save/load/delete service functions
- Agent snapshot sent on WS reconnect
- Session timeline view (vertical timeline with scroll-to + restore)

Tooling:
- run_command tool (execFile, 30s timeout, 32KB cap, path-guarded)
- Auto-fix loop: after write tools, runs pnpm build, injects errors into next turn
2026-06-08 02:26:47 +00:00
7cb692d8be feat: Phase 4 teardown — remove Go codecontext sidecar from deployment
- Remove codecontext service block from docker-compose.yml
- Remove CODECONTEXT_URL env var
- Delete codecontext/Dockerfile
- Update callCodecontext() to try boocontext MCP first with HTTP fallback
- Graceful degradation: if boocontext MCP unavailable, tools still work via HTTP
2026-06-08 02:16:02 +00:00
917a229363 feat: Domain 2 Phase 3-4 — wiki article tool, DCP compress toggle, Go sidecar deprecation
Phase 3: get_wiki_article tool wraps codesight_get_wiki_article MCP
(cached, persistent codebase wiki). DCP compress toggle on
get_codebase_overview (compress=true for large projects >50 files).

Phase 4: Deprecation markers on Go codecontext sidecar. Warning log
in callCodecontext(), deprecation comments in factory.ts and
docker-compose.yml. Sidecar remains functional — removal deferred.
2026-06-08 01:35:40 +00:00
39be5ce413 fix: move cache_tokens/reasoning_tokens ALTER TABLE before view creation 2026-06-08 01:32:25 +00:00
378e29308e fix: add cache_tokens/reasoning_tokens to Message constructors in useSessionStream 2026-06-08 01:27:31 +00:00
8f6a814ab0 fix: add cache_tokens/reasoning_tokens to web WsFrame union 2026-06-08 01:26:01 +00:00
3c019a2281 changelog: v2.8.18-deepseek-whale-lift 2026-06-08 01:24:59 +00:00
203cfd2fa8 feat: DeepSeek API integration + Whale lift (hooks, tool repair, MCP permissions, token tracking)
DeepSeek API:
- @ai-sdk/deepseek provider replaces openai-compatible for deepseek-* models
- Token tracking: cache_hit/reasoning tokens flow API → DB → WS frames → UI
- thinking effort levels (off/low/medium/high/xhigh/max) via AGENTS.md frontmatter
- V4 models: deepseek-v4-flash, deepseek-v4-pro
- Wired for both chat and coder panes

Whale lifts:
- Tool input repair (schema-based type coercion, markdown link unwrapping)
- Hooks system (6 lifecycle events, shell exec, JSON stdin/stdout contract)
- Per-MCP-server permissions (allow/ask/deny)
- token tracking UI (cache N, think N in message stats line)

Infra:
- New DB columns: messages.cache_tokens, messages.reasoning_tokens
- New WS frame fields: cache_tokens, reasoning_tokens on message_complete
- coder provider snapshot merges DeepSeek models alongside llama-swap
2026-06-08 01:24:23 +00:00
c11e26090f feat(coder): boulder state — cross-session plan persistence + auto-resumption
New plans table (id, project_id, title, description, status, flow_run_id,
progress_pct, items_total, items_completed, metadata, timestamps) with
CHECK constraints and indexes.

Plan store (plan-store.ts): createPlan, getPlan, listPlans, listActivePlans,
updatePlan, updatePlanFromRun, findPlanWithRunningRun, planStatusFromRun.

Flow-runner integration: onRunTerminal callback fires on every terminal
transition (complete/fail/cancel) and updates linked plans automatically.

5 API endpoints: GET /api/plans, GET /api/plans/active, GET /api/plans/:id,
POST /api/plans, PATCH /api/plans/:id.

484 tests pass, build clean.
2026-06-08 01:11:07 +00:00
e0feb53437 feat: omo-paseo-bridge — auto-register OMO subagents as Paseo agents
Bridge script that calls paseo import <session-id> --provider opencode
--label omo=true on task() child sessions. Supports import, archive,
ls commands with --dry-run verification. Skill at .opencode/skills/
is gitignored (user-level) — copy from scripts/ on setup.
2026-06-08 01:11:00 +00:00
3c5b2c2bcf feat(server): Domain 2 Phase 1 — boocontext MCP client + 4 new code intelligence tools
Shared boocontext MCP client (boocontext_client.ts) wrapping the existing
mcp-client.ts callTool() infrastructure with 32KB truncation and error
handling. Used by get_code_health.

4 new first-class agent tools backed by the boocontext MCP server:
- get_code_health — A-F grades per file across 7 dimensions, project health
  summary, refactoring candidates (wraps boocontext_health)
- get_code_impact — merged symbol trace + blast radius in one call (wraps
  boocontext_impact, replaces two-step get_symbol_info+get_blast_radius)
- get_type_info — TypeScript type recovery via type-inject MCP (wraps
  boocontext_types, returns signatures, interfaces, generics, JSDoc)
- get_code_map — DCP-compressed context map with compress toggle (wraps
  boocontext_map, 10x token reduction vs full scan)

All 4 registered in ALL_TOOLS as read-only tools.
2026-06-08 00:45:46 +00:00
190 changed files with 18917 additions and 721 deletions

View File

@@ -3,9 +3,9 @@
> **Stack:** fastify, go-net-http | none | react | typescript
> **Microservices:** @boocode/contracts, @boocode/ion, @boocode/booterm, @boocode/coder, @boocode/server, @boocode/web, codecontext, @boocode/conductor
> 131 routes (9 inferred) + 9 ws | 18 models | 69 components | 247 lib files | 39 env vars | 16 middleware
> 147 routes (9 inferred) + 9 ws | 23 models | 92 components | 296 lib files | 43 env vars | 17 middleware
> **Token savings:** this file is ~0 tokens. Without it, AI exploration would cost ~0 tokens. **Saves ~0 tokens per conversation.**
> **Last scanned:** 2026-06-07 21:09 — re-run after significant changes
> **Last scanned:** 2026-06-08 03:49 — re-run after significant changes
---
@@ -14,6 +14,7 @@
## CRUD Resources
- **`/api/battles`** GET | POST | GET/:id → Battle
- **`/api/plans`** GET | POST | GET/:id | PATCH/:id → Plan
- **`/api/runs`** GET | POST | GET/:id → Run
- **`/api/tasks`** GET | POST | GET/:id → Task
- **`/api/chats/:id/messages`** GET | POST | GET/:id | DELETE/:id → Message
@@ -25,11 +26,16 @@
### fastify
- `GET` `/api/term/health` params()
- `GET` `/api/term/sessions/:sid/panes/:pid/search` params(sid, pid) [auth]
- `GET` `/api/term/sessions` params() [auth]
- `POST` `/api/term/sessions/:sid/panes/:pid/start` params(sid, pid) [auth]
- `POST` `/api/term/sessions/:sid/panes/:pid/kill` params(sid, pid) [auth]
- `GET` `/ws/term/sessions/:sid/panes/:pid` params(sid, pid) [auth]
- `GET` `/api/health` params() [auth, db, queue, ai]
- `GET` `/api/sessions/:sessionId/agent-sessions` params(sessionId) [auth, db]
- `GET` `/api/analytics/summary` params() [auth, db]
- `GET` `/api/analytics/sessions` params() [auth, db]
- `GET` `/api/analytics/token-breakdown` params() [auth, db]
- `POST` `/api/battles/generate-prompt` params() [auth, db]
- `POST` `/api/battles/:id/stop` params(id) [auth, db]
- `GET` `/api/battles/:id/analysis` params(id) [auth, db]
@@ -53,6 +59,7 @@
- `POST` `/api/pending/:id/apply` params(id) [auth, db, queue]
- `POST` `/api/pending/:id/reject` params(id) [auth, db, queue]
- `POST` `/api/pending/:id/rewind` params(id) [auth, db, queue]
- `GET` `/api/plans/active` params() [db]
- `GET` `/api/providers/snapshot` params() [db, cache]
- `GET` `/api/providers/config` params() [db, cache]
- `PATCH` `/api/providers/config` params() [db, cache]
@@ -70,19 +77,22 @@
- `GET` `/api/ws/sessions/:sessionId` params(sessionId) [auth, db]
- `GET` `/api/ws/user` params() [auth, db]
- `GET` `/api/projects/:id/agents` params(id) [db, cache]
- `GET` `/api/analytics/context` params() [auth, db]
- `POST` `/api/chats/:id/messages/:msg_id/artifacts/download` params(id, msg_id) [auth, db]
- `GET` `/api/chats/:id/messages/:msg_id/html_artifact` params(id, msg_id) [auth, db]
- `GET` `/api/projects/:project_id/artifacts/:filename` params(project_id, filename) [auth, db]
- `GET` `/api/sessions/:id/chats` params(id) [auth, db]
- `POST` `/api/sessions/:id/chats` params(id) [auth, db]
- `PATCH` `/api/chats/:id` params(id) [auth, db]
- `POST` `/api/sessions/:id/chats/archive-all` params(id) [auth, db]
- `GET` `/api/sessions/:id/chats/open-count` params(id) [auth, db]
- `POST` `/api/chats/:id/archive` params(id) [auth, db]
- `POST` `/api/chats/:id/unarchive` params(id) [auth, db]
- `DELETE` `/api/chats/:id` params(id) [auth, db]
- `POST` `/api/chats/:id/fork` params(id) [auth, db]
- `POST` `/api/chats/:id/discard_stale` params(id) [auth, db]
- `GET` `/api/sessions/:id/chats` params(id) [auth, db, queue]
- `POST` `/api/sessions/:id/chats` params(id) [auth, db, queue]
- `PATCH` `/api/chats/:id` params(id) [auth, db, queue]
- `POST` `/api/sessions/:id/chats/archive-all` params(id) [auth, db, queue]
- `GET` `/api/sessions/:id/chats/open-count` params(id) [auth, db, queue]
- `POST` `/api/chats/:id/archive` params(id) [auth, db, queue]
- `POST` `/api/chats/:id/unarchive` params(id) [auth, db, queue]
- `DELETE` `/api/chats/:id` params(id) [auth, db, queue]
- `POST` `/api/chats/:id/fork` params(id) [auth, db, queue]
- `POST` `/api/chats/:id/discard_stale` params(id) [auth, db, queue]
- `GET` `/api/chats/:id/export` params(id) [auth, db, queue]
- `POST` `/api/chats/:id/compare` params(id) [auth, db, queue]
- `GET` `/api/coder/ws/sessions/:sessionId` params(sessionId) [auth]
- `ALL` `/api/coder/*` params() [auth]
- `GET` `/api/settings/inference` params() [cache]
@@ -94,7 +104,9 @@
- `POST` `/api/chats/:id/continue` params(id) [auth, db, queue]
- `POST` `/api/chats/:id/force_send` params(id) [auth, db, queue]
- `POST` `/api/chats/:id/grant_read_access` params(id) [auth, db, queue]
- `GET` `/api/models` params()
- `POST` `/api/chats/:id/mcp-approve` params(id) [auth, db, queue]
- `POST` `/api/chats/:id/messages/:message_id/feedback` params(id, message_id) [auth, db, queue]
- `GET` `/api/models` params() [auth]
- `POST` `/api/projects/create` params() [auth, db]
- `POST` `/api/projects/:id/archive` params(id) [auth, db]
- `POST` `/api/projects/:id/unarchive` params(id) [auth, db]
@@ -122,6 +134,7 @@
- `GET` `/api/skills` params() [auth, db, queue]
- `POST` `/api/chats/:id/skill_invoke` params(id) [auth, db, queue]
- `GET` `/api/tools/cost_stats` params() [auth, db]
- `GET` `/api/chats/:id/traces` params(id) [db]
- `GET` `/api/ws/sessions/:id` params(id) [auth, db]
### go-net-http
@@ -273,6 +286,25 @@
- model: text (required)
- verdict: text
### flow_step_events
- id: uuid (pk)
- run_id: uuid (required, fk)
- step_id: varchar (required, fk)
- event: varchar (required)
- payload: jsonb
### plans
- id: uuid (pk)
- project_id: uuid (required, fk)
- title: text (required)
- description: text
- status: text (required)
- flow_run_id: uuid (fk)
- progress_pct: integer (required)
- items_total: integer (required)
- items_completed: integer (required)
- metadata: jsonb
### projects
- id: uuid (pk)
- name: text (required)
@@ -294,6 +326,8 @@
- content: text (required)
- status: text (required)
- last_seq: integer (required)
- cache_tokens: integer
- reasoning_tokens: integer
### message_parts
- id: uuid (pk)
@@ -311,6 +345,45 @@
- name: text
- status: text (required)
### tool_traces
- id: uuid (pk)
- session_id: uuid (required, fk)
- chat_id: uuid (required, fk)
- message_id: uuid (fk)
- turn_number: integer (required)
- tool_name: text (required)
- tool_input: jsonb (required)
- tool_output: text
- started_at: timestamp(tz) (required)
- finished_at: timestamp(tz)
- latency_ms: integer
- tokens_used: integer
- cache_tokens: integer
- reasoning_tokens: integer
- error: text
- outcome: text
### tool_trace_states
- id: uuid (pk)
- session_id: uuid (required, fk)
- chat_id: uuid (required, fk)
- message_id: uuid (fk)
- turn_number: integer (required)
- tool_name: text (required)
- tool_input: jsonb (required)
- started_at: timestamp(tz) (required)
### agent_snapshots
- id: uuid (pk)
- session_id: uuid (required, fk)
- chat_id: uuid (required, fk)
- model: text (required)
- agent: text
- mode: text
- turn_number: integer (required)
- messages: jsonb (required)
- tool_states: jsonb (required)
---
# Components
@@ -325,23 +398,34 @@
- **AttachmentChip** — props: attachment, onRemove, onPreview — `apps/web/src/components/AttachmentChip.tsx`
- **AttachmentPreviewModal** — props: attachment, onClose — `apps/web/src/components/AttachmentPreviewModal.tsx`
- **BottomSheet** — props: open, onClose, title — `apps/web/src/components/BottomSheet.tsx`
- **CacheShapeBadge** — props: cacheTokens, totalTokens — `apps/web/src/components/CacheShapeBadge.tsx`
- **CapHitSentinel** — props: message, capHitPosition, isLatest — `apps/web/src/components/CapHitSentinel.tsx`
- **ChatInput** — props: disabled, projectId, agentId, onAgentChange, sessionId, webSearchEnabled, onSend, onForceSend, generating, onStop — `apps/web/src/components/ChatInput.tsx`
- **ChatTabBar** — props: pane, tabs, tabNumbers, onSwitchTab, onRemoveTab, onCloseOthers, onCloseToRight, onCloseAll, onNewTab, onSplitPane — `apps/web/src/components/ChatTabBar.tsx`
- **ChatThroughput** — props: chatId, className — `apps/web/src/components/ChatThroughput.tsx`
- **CodeBlock** — props: code, lang — `apps/web/src/components/CodeBlock.tsx`
- **ComparePane** — props: models, responses, onClose — `apps/web/src/components/ComparePane.tsx`
- **ContextMeter** — props: messages, modelContextLimit, sessionCostUsd — `apps/web/src/components/ContextMeter.tsx`
- **CreateProjectModal** — props: open, onOpenChange — `apps/web/src/components/CreateProjectModal.tsx`
- **DiffSnippet** — props: diff — `apps/web/src/components/DiffSnippet.tsx`
- **DiffSplitView** — props: file, wrapLines — `apps/web/src/components/DiffSplitView.tsx`
- **DoomLoopSentinel** — props: message — `apps/web/src/components/DoomLoopSentinel.tsx`
- **DropOverlay** — props: visible — `apps/web/src/components/DropOverlay.tsx`
- **EmptyState** — props: icon, title, description, action, className — `apps/web/src/components/EmptyState.tsx`
- **FileMentionPopover** — props: query, files, anchorRect, onSelect, onClose — `apps/web/src/components/FileMentionPopover.tsx`
- **FileViewerOverlay** — props: path, content, lang, onClose — `apps/web/src/components/FileViewerOverlay.tsx`
- **FlowLauncherDialog** — `apps/web/src/components/FlowLauncherDialog.tsx`
- **GitDiffView** — props: result, loading, error, mode, onSelectMode, onRefresh, mutating, mutateError, onStage, onUnstage — `apps/web/src/components/GitDiffView.tsx`
- **HtmlArtifactPane** — props: chatId, state, onClose — `apps/web/src/components/HtmlArtifactPane.tsx`
- **InferenceSettings** — `apps/web/src/components/InferenceSettings.tsx`
- **InlineReviewEditor** — props: initialBody, onSave, onCancel — `apps/web/src/components/InlineReviewEditor.tsx`
- **InlineReviewGutterCell** — props: lineNumber, type, hasComments, canComment, onClick — `apps/web/src/components/InlineReviewGutterCell.tsx`
- **InlineReviewThread** — props: comments, onEditComment, onDeleteComment — `apps/web/src/components/InlineReviewThread.tsx`
- **KeyboardShortcutsDialog** — props: open, onOpenChange — `apps/web/src/components/KeyboardShortcutsDialog.tsx`
- **MarkdownArtifactPane** — props: chatId, state, onClose — `apps/web/src/components/MarkdownArtifactPane.tsx`
- **MarkdownRenderer** — props: content — `apps/web/src/components/MarkdownRenderer.tsx`
- **McpPermissionDialog** — props: toolCallId, toolName, toolArgs, chatId, open, onClose — `apps/web/src/components/McpPermissionDialog.tsx`
- **McpResponseDisplay** — props: toolCall, toolResult — `apps/web/src/components/McpResponseDisplay.tsx`
- **MessageBubble** — props: message, sessionChats, capHitInfo, actions, hideActions, hasCheckpoint, restoreDisabled — `apps/web/src/components/MessageBubble.tsx`
- **MessageList** — props: messages, sessionChats — `apps/web/src/components/MessageList.tsx`
- **MobileTabSwitcher** — props: panes, activePaneIdx, chats, onSwitchPane, onRemovePane, onRenameChat — `apps/web/src/components/MobileTabSwitcher.tsx`
@@ -353,12 +437,14 @@
- **RequestReadAccessCard** — props: toolCall, toolResult, chatId — `apps/web/src/components/RequestReadAccessCard.tsx`
- **RightRail** — props: projectId, sessionId — `apps/web/src/components/RightRail.tsx`
- **SessionLandingPage** — props: projectId, sessionId, agentId, onAgentChange, onSend, onSkillInvoke, createChat, chats, onOpenChat, onUnarchiveChat — `apps/web/src/components/SessionLandingPage.tsx`
- **SessionTimeline** — props: messages, onClose, onScrollToMessage — `apps/web/src/components/SessionTimeline.tsx`
- **SlashCommandPicker** — props: query, items, groups, inputRef, onSelect, onClose, emptyLabel — `apps/web/src/components/SlashCommandPicker.tsx`
- **StaleStreamBanner** — props: onRetry, onDiscard — `apps/web/src/components/StaleStreamBanner.tsx`
- **StatusDot** — props: chatId, className — `apps/web/src/components/StatusDot.tsx`
- **ThemePicker** — `apps/web/src/components/ThemePicker.tsx`
- **ToolCallGroup** — props: runs — `apps/web/src/components/ToolCallGroup.tsx`
- **ToolCallLine** — props: run, insideGroup — `apps/web/src/components/ToolCallLine.tsx`
- **ToolCallLine** — props: run, insideGroup, chatId`apps/web/src/components/ToolCallLine.tsx`
- **TraceViewer** — props: chatId — `apps/web/src/components/TraceViewer.tsx`
- **Workspace** — props: sessionId, projectId, agentId, onAgentChange, panesHook, chatsHook, session, project, onAddPane — `apps/web/src/components/Workspace.tsx`
- **AddProviderModal** — props: open, onOpenChange, onAdded — `apps/web/src/components/coder/AddProviderModal.tsx`
- **ProvidersSettings** — `apps/web/src/components/coder/ProvidersSettings.tsx`
@@ -367,21 +453,31 @@
- **ThemeFx** — `apps/web/src/components/fx/ThemeFx.tsx`
- **ClaudeIcon** — props: size, className — `apps/web/src/components/icons/ProviderIcons.tsx`
- **OpenCodeIcon** — props: size, className — `apps/web/src/components/icons/ProviderIcons.tsx`
- **ActionRow** — props: message, actions, hiddenSet, hasCheckpoint, restoreDisabled — `apps/web/src/components/message-parts/ActionRow.tsx`
- **CompactCard** — props: message, sessionChats — `apps/web/src/components/message-parts/CompactCard.tsx`
- **MistakeRecoverySentinel** — props: message — `apps/web/src/components/message-parts/MistakeRecoverySentinel.tsx`
- **ReasoningBlock** — props: text, streaming — `apps/web/src/components/message-parts/ReasoningBlock.tsx`
- **SendToTerminalMenu** — `apps/web/src/components/message-parts/SendToTerminalMenu.tsx`
- **StatsLine** — props: message — `apps/web/src/components/message-parts/StatsLine.tsx`
- **SummaryCard** — props: message — `apps/web/src/components/message-parts/SummaryCard.tsx`
- **ArenaPane** — props: state, onClose — `apps/web/src/components/panes/ArenaPane.tsx`
- **ChatPane** — props: sessionId, chatId, projectId, agentId, onAgentChange, sessionChats, webSearchEnabled — `apps/web/src/components/panes/ChatPane.tsx`
- **CoderMessageList** — props: messages, chatId, footer, actions, checkpointMessageIds, restoreDisabled — `apps/web/src/components/panes/CoderMessageList.tsx`
- **CoderPane** — props: sessionId, paneId, chatId, chatPending, projectPath, onConnectedChange, onAgentLabelChange — `apps/web/src/components/panes/CoderPane.tsx`
- **OrchestratorPane** — props: state, onClose — `apps/web/src/components/panes/OrchestratorPane.tsx`
- **SettingsPane** — props: session, project, maximized, onToggleMaximize, onClose, isMobile — `apps/web/src/components/panes/SettingsPane.tsx`
- **TerminalPane** — props: sessionId, paneId, label, active — `apps/web/src/components/panes/TerminalPane.tsx`
- **TerminalPane** — props: sessionId, paneId, label, description, parentAgent, active — `apps/web/src/components/panes/TerminalPane.tsx`
- **FloatingMenu** — props: x, y, hasSelection, chatInputs, onCopy, onPaste, onSelectAll, onSearch, onSendToChat, onDismiss — `apps/web/src/components/panes/terminal/FloatingMenu.tsx`
- **SearchBar** — props: searchRef, theme, onClose — `apps/web/src/components/panes/terminal/SearchBar.tsx`
- **TerminalHotkeyBar** — props: ctrlArmed, onSendBytes, onArmCtrl, onFit — `apps/web/src/components/panes/terminal/TerminalHotkeyBar.tsx`
- **RightRailDrawerProvider** — `apps/web/src/hooks/useRightRailDrawer.tsx`
- **SidebarDrawerProvider** — `apps/web/src/hooks/useSidebarDrawer.tsx`
- **PATH_REGEX** — `apps/web/src/lib/linkify-paths.tsx`
- **Analytics** — `apps/web/src/pages/Analytics.tsx`
- **Home** — `apps/web/src/pages/Home.tsx`
- **Memory** — `apps/web/src/pages/Memory.tsx`
- **Project** — `apps/web/src/pages/Project.tsx`
- **Results** — `apps/web/src/pages/Results.tsx`
- **Session** — `apps/web/src/pages/Session.tsx`
- **Settings** — `apps/web/src/pages/Settings.tsx`
@@ -403,8 +499,17 @@
- function ensureSession: (tmuxConfPath, sessionName, projectRoot, log, cols?, rows?) => Promise<void>
- function killSession: (tmuxConfPath, sessionName) => Promise<boolean>
- function capturePane: (tmuxConfPath, sessionName, lines) => Promise<string>
- _...1 more_
- `apps/booterm/src/pty/pty.ts` — function attachPty: (opts) => IPty
- `apps/booterm/src/ws/attach.ts` — function registerWsAttachRoute: (app, tmuxConfPath) => void
- `apps/booterm/src/pty/registry.ts`
- function register: (sessionId, paneId, projectPath, title?, opts?) => void
- function unregister: (paneId) => void
- function touchActivity: (paneId) => void
- function list: () => SessionMeta[]
- function get: (paneId) => SessionMeta | undefined
- function setPendingMetadata: (paneId, meta) => void
- _...8 more_
- `apps/booterm/src/ws/attach.ts` — function registerWsAttachRoute: (app, tmuxConfPath, idleTimeoutSeconds?, absoluteTimeoutSeconds?) => void
- `apps/coder/src/conductor/contracts.ts`
- function produceContract: (contracts) => string
- function reviewContract: (contracts) => string
@@ -491,7 +596,7 @@
- function classifyLane: (battleType, _identity, model, localModels) => ContestantLane
- function nextLocalContestant: (contestants) => string | null
- function isBattleComplete: (contestants) => boolean
- function computeBenchmark: (startedAt, endedAt, costTokens, lane) => Benchmark
- function computeBenchmark: (startedAt, endedAt, costTokens, lane, tokenBreakdown) => Benchmark
- function sanitizeSlug: (s) => string
- function buildBattleSlug: (battleId, battleType, createdAt) => string
- _...7 more_
@@ -555,6 +660,7 @@
- function stepEndedToUsage: (props) => StepUsage
- interface StepEndedProps
- interface StepUsage
- `apps/coder/src/services/backends/paseo.ts` — class PaseoBackend, interface PaseoBackendDeps
- `apps/coder/src/services/backends/pushable-iterable.ts` — function createPushable: () => Pushable<T>, interface Pushable
- `apps/coder/src/services/backends/turn-guard.ts`
- function armAbortGuard: (g) => void
@@ -563,6 +669,30 @@
- interface AbortTerminalGuard
- `apps/coder/src/services/backends/warm-acp-routing.ts` — function shouldUseWarmBackend: (task) => boolean, function isTurnOkForStopReason: (stopReason) => boolean
- `apps/coder/src/services/backends/warm-acp.ts` — class WarmAcpBackend, interface WarmAcpBackendDeps
- `apps/coder/src/services/behavioral/generation.ts`
- function createExecutionPlan: (observational, actionable, previouslyApplied, disambiguationGroups, lowCriticality) => BatchExecutionPlan[]
- function getRetryTemperatures: (baseTemp, maxAttempts) => number[]
- class SchematicGenerator
- class DefaultSchematicGenerator
- interface ObservationalOutput
- interface ActionableOutput
- _...7 more_
- `apps/coder/src/services/behavioral/matching.ts`
- function matchWithRetry: (fn) => void
- function executeBatchesParallel: (batches, _generationInfo) => Promise<GuidelineMatchingResult>
- function createScoredMatch: (guidelineId, score, rationale) => ScoredMatch
- class GuidelineMatchingBatchError
- class ObservationalGuidelineMatchingBatch
- class ActionableGuidelineMatchingBatch
- _...25 more_
- `apps/coder/src/services/behavioral/resolver.ts`
- class RelationalResolver
- interface RelationshipEntity
- interface Relationship
- interface RelationshipStore
- interface ResolvedEntity
- interface Resolution
- _...8 more_
- `apps/coder/src/services/cancel-registry.ts` — function createCancelRegistry: () => CancelRegistry, interface CancelRegistry
- `apps/coder/src/services/checkpoints.ts`
- function buildShadowCommitCommand: (worktreePath, id) => string
@@ -573,7 +703,15 @@
- interface RestoreCheckpointResult
- _...1 more_
- `apps/coder/src/services/claude-command-discovery.ts` — function discoverClaudeCommands: () => AgentCommand[]
- `apps/coder/src/services/collision-detector.ts`
- function findConflicts: (changedFiles, worktreeId, /** Approximate line range for the proposed changes, keyed by file path */
changedRanges, {...}, conflictIndex) => ConflictVerdict[]
- interface ConflictVerdict
- interface ConflictEntry
- type ConflictSeverity
- type ConflictIndexData
- `apps/coder/src/services/command-availability.ts` — function isCommandAvailable: (binary) => Promise<boolean>
- `apps/coder/src/services/conflict-index.ts` — class ConflictIndex, const conflictIndex
- `apps/coder/src/services/correction-service.ts`
- function recordCorrection: (originalClaim, correction, principleExtracted, persistedTo, basePath?) => Promise<UserCorrectionRecord>
- function scanForCorrections: (auditPath) => Promise<UserCorrectionRecord[]>
@@ -603,10 +741,11 @@
- function partitionReady: (ready, ctx) => void
- function isRunComplete: (flow, state) => boolean
- function isStuck: (flow, state) => boolean
- function reconcileResumeStep: (status, taskId, taskState) => ResumeAction
- _...5 more_
- function buildBatchState: (flow, inFlight) => Map<string,
- _...12 more_
- `apps/coder/src/services/flow-runner.ts`
- function createFlowRunner: (deps) => FlowRunner
- function resolveVariables: (prompt, results, string>) => string
- interface LaunchOpts
- interface FlowRunner
- `apps/coder/src/services/frame-emitter.ts`
@@ -626,6 +765,19 @@
- function deleteGuideline: (id, basePath?) => Promise<boolean>
- function findGuideline: (content, basePath?) => Promise<Guideline | null>
- _...14 more_
- `apps/coder/src/services/hashline/hash-computation.ts`
- function computeLineHash: (lineNumber, content) => string
- function computeLegacyLineHash: (lineNumber, content) => string
- function formatHashLine: (lineNumber, content) => string
- function formatHashLines: (content) => string
- `apps/coder/src/services/hashline/validation.ts`
- function normalizeLineRef: (ref) => string
- function parseLineRef: (ref) => LineRef
- function validateLineRef: (lines, ref) => void
- function validateLineRefs: (lines, refs) => void
- class HashlineMismatchError
- interface LineRef
- `apps/coder/src/services/hashline/xxhash32.ts` — function hashXxh32: (input, seed) => number
- `apps/coder/src/services/host-exec.ts` — function hostExec: (command, opts?) => Promise<HostExecResult>, interface HostExecResult
- `apps/coder/src/services/lsp/client.ts` — class LspClient
- `apps/coder/src/services/lsp/config.ts` — function getServerConfig: (filePath) => LspServerConfig | null, interface LspServerConfig
@@ -637,6 +789,44 @@
- function findReferences: (client, filePath, content, line, character) => Promise<Location[]>
- `apps/coder/src/services/lsp/server-manager.ts` — class LspServerManager, const lspManager
- `apps/coder/src/services/mcp-server.ts` — function startMcpServer: (sql) => Promise<void>
- `apps/coder/src/services/model-resolution/connected-providers-cache.ts`
- function readConnectedProvidersCache: () => string[] | null
- function findProviderModelMetadata: (_providerID, _modelID) => ModelMetadata | undefined
- function readProviderModelsCache: () => ProviderModelsCache | null
- interface ProviderModelsCache
- interface ConnectedProvidersAdapter
- const connectedProvidersAdapter: ConnectedProvidersAdapter
- `apps/coder/src/services/model-resolution/fallback-chain-from-models.ts`
- function parseFallbackModelEntry: (model, contextProviderID, defaultProviderID) => FallbackEntry | undefined
- function parseFallbackModelObjectEntry: (obj, contextProviderID, defaultProviderID) => FallbackEntry | undefined
- function findMostSpecificFallbackEntry: (providerID, modelID, chain) => FallbackEntry | undefined
- function buildFallbackChainFromModels: (fallbackModels) => void
- `apps/coder/src/services/model-resolution/model-availability.ts` — function fuzzyMatchModel: (target, available, providers?) => string | null, function isModelAvailable: (targetModel, availableModels) => boolean
- `apps/coder/src/services/model-resolution/model-error-classifier.ts`
- function isRetryableModelError: (error) => boolean
- function shouldRetryError: (error) => boolean
- function getNextFallback: (fallbackChain, attemptCount) => FallbackEntry | undefined
- function hasMoreFallbacks: (fallbackChain, attemptCount) => boolean
- function selectFallbackProvider: (providers, preferredProviderID?) => string
- function selectFallbackProviderWithCache: (providers, providerCache, preferredProviderID?) => string
- _...1 more_
- `apps/coder/src/services/model-resolution/model-normalization.ts` — function normalizeModel: (model?) => string | undefined, function normalizeModelID: (modelID) => string
- `apps/coder/src/services/model-resolution/model-resolution-pipeline.ts`
- function _setModelResolutionLogImplementationForTesting: (logImplementation) => void
- function resolveModelPipeline: (request, providerCache) => void
- type ModelResolutionRequest
- type ModelResolutionProvenance
- type ModelResolutionResult
- type ModelResolutionDeps
- `apps/coder/src/services/model-resolution/model-resolver.ts`
- function resolveModel: (input) => string | undefined
- function resolveModelWithFallback: (input, connectedProvidersAdapter) => ModelResolutionResult | undefined
- function normalizeFallbackModels: (models) => void
- function flattenToFallbackModelStrings: (models) => void
- type ModelResolutionInput
- type ModelSource
- _...2 more_
- `apps/coder/src/services/model-resolution/provider-model-id-transform.ts` — function transformModelForProvider: (provider, model) => string, function transformModelForProviderDisplay: (provider, model) => string
- `apps/coder/src/services/net/port-utils.ts`
- function reclaimPort: (port) => void
- function waitForPortRelease: (port, timeoutMs) => Promise<boolean>
@@ -646,6 +836,13 @@
- function createOrphanWorktreeReaper: (deps) => void
- interface OrphanWorktreeReaperDeps
- interface OrphanReaperResult
- `apps/coder/src/services/paseo-client.ts`
- class PaseoClientError
- class PaseoClient
- interface PaseoAgentListItem
- interface PaseoAgentDetail
- interface PaseoSendResult
- interface PaseoClientConfig
- `apps/coder/src/services/pending_changes.ts`
- function planEdit: (content, oldStr, newStr) => EditPlan
- function queueEdit: (sql, sessionId, taskId, filePath, oldString, newString, projectRoot, // v2.6 Phase 1-UX) => void
@@ -662,6 +859,14 @@
- function waitForElicitationResponse: (taskId, sessionId, provider, modeId, params, timeoutMs) => Promise<CreateElicitationResponse>
- function cancelPendingPermission: (taskId) => void
- _...3 more_
- `apps/coder/src/services/plan-store.ts`
- function createPlan: (sql, opts) => Promise<Plan>
- function getPlan: (sql, planId) => Promise<Plan | null>
- function listPlans: (sql, projectId) => Promise<Plan[]>
- function listActivePlans: (sql, projectId) => Promise<Plan[]>
- function updatePlan: (sql, planId, opts) => Promise<Plan | null>
- function updatePlanFromRun: (sql, runId, runStatus) => Promise<boolean>
- _...5 more_
- `apps/coder/src/services/provider-commands.ts`
- function getManifestCommands: (provider) => AgentCommand[]
- function mergeCommands: (...lists) => AgentCommand[]
@@ -684,13 +889,13 @@
- interface ProviderManifestEntry
- const PROVIDER_MANIFEST: Record<string, ProviderManifestEntry>
- `apps/coder/src/services/provider-snapshot.ts`
- function fetchDeepSeekModels: (config) => Promise<ProviderModel[]>
- function fetchLlamaSwapModels: (config) => Promise<ProviderModel[]>
- function prefixLlamaSwapModels: (models) => ProviderModel[]
- function mergeModels: (...lists) => ProviderModel[]
- function getProviderSnapshot: (sql, config, cwd?, force) => Promise<ProviderSnapshotEntry[]>
- function clearProviderSnapshotCache: () => void
- function peekSnapshotEntry: (name, cwd?) => ProviderSnapshotEntry | undefined
- _...1 more_
- _...2 more_
- `apps/coder/src/services/pty-dispatch.ts`
- function dispatchViaPty: (opts) => Promise<DispatchResult>
- interface DispatchResult
@@ -800,6 +1005,17 @@
- function readSession: (sessionId, projectRoot?) => SessionJson | null
- _...9 more_
- `apps/server/src/services/auto_name.ts` — function maybeAutoNameChat: (ctx, chatId, sessionId) => Promise<void>
- `apps/server/src/services/background-task.ts`
- function setBackgroundInferenceEnqueuer: (enqueue, chatId, assistantMessageId, user) => void
- function spawnBackgroundTask: (sql, log, projectId, input, model, agent?, label?) => Promise<BackgroundTask>
- function getBackgroundTaskStatus: (sql, taskId) => Promise<BackgroundTask | null>
- function getBackgroundTaskResult: (sql, taskId, chatId) => Promise<
- function cancelBackgroundTask: (sql, taskId) => Promise<boolean>
- interface BackgroundTask
- `apps/server/src/services/boocontext_client.ts`
- function callBoocontext: (req, log?, msg) => void
- interface BoocontextRequest
- interface BoocontextResponse
- `apps/server/src/services/broker.ts`
- function createBroker: (log?) => Broker
- interface Broker
@@ -818,6 +1034,7 @@
- function select: (messages, contextLimit, tailTurns) => SelectResult
- function deriveFilesRead: (head) => string[]
- _...8 more_
- `apps/server/src/services/export-formatter.ts` — function formatJson: (chat, messages, model) => string, function formatMarkdown: (chat, messages, model) => string
- `apps/server/src/services/file_index.ts` — function getProjectFiles: (projectId, projectRoot) => Promise<string[]>
- `apps/server/src/services/file_ops.ts`
- function listDir: (projectRoot, relPath, opts?) => Promise<ListDirResult>
@@ -842,7 +1059,20 @@
- interface GiteaConfig
- interface GiteaRepo
- `apps/server/src/services/grant_resolver.ts` — function resolveGrantRoot: (sql, requestedPath, projectRoot, whitelistRoot) => Promise<GrantResolution>, type GrantResolution
- `apps/server/src/services/hooks.ts`
- function loadHooksConfig: (path) => HooksConfig
- function reloadHooksConfig: () => HooksConfig
- function createHookRunner: () => HookRunner
- interface HookConfig
- interface HooksConfig
- interface PreToolUsePayload
- _...10 more_
- `apps/server/src/services/inference/budget.ts` — function resolveToolBudget: (agent) => number
- `apps/server/src/services/inference/compute-diff.ts`
- function computeDiff: (oldStr, newStr, filePath) => string
- function isWriteTool: (name) => boolean
- function diffFromToolArgs: (name, args, unknown>, filePath?) => string
- const WRITE_TOOL_NAMES
- `apps/server/src/services/inference/content-flusher.ts` — function createContentFlusher: (sql, messageId, getContent) => void, interface ContentFlusher
- `apps/server/src/services/inference/dcp/messages.ts`
- function toDcpMessages: (parts) => DcpMessage[]
@@ -882,6 +1112,10 @@
- type FailureKind
- const MISTAKE_THRESHOLD
- _...1 more_
- `apps/server/src/services/inference/multi-modal.ts`
- function hasImageAttachments: (_message) => boolean
- function imageAttachmentsToParts: (attachments) => Array<
- interface ImageAttachment
- `apps/server/src/services/inference/parts.ts`
- function insertParts: (sql, parts) => Promise<void>
- function partsFromAssistantMessage: (args) => void
@@ -894,10 +1128,13 @@
- function maybeFlagForCompaction: (ctx, chatId, updated) => Promise<void>
- interface OpenAiMessage
- `apps/server/src/services/inference/provider.ts`
- function resolveRoute: (agent, config?) => RoutingInfo
- function isDeepSeekModel: (modelId) => boolean
- function resolveRoute: (agent, config?, modelId?) => RoutingInfo
- function upstreamModel: (config, modelId, agent?) => LanguageModel
- function resolveModelEndpoint: (config, modelId) => void
- function resetDeepSeekProvider: () => void
- interface RoutingInfo
- type InferenceRoute
- _...1 more_
- `apps/server/src/services/inference/prune.ts`
- function selectPruneTargets: (partsNewestFirst, tailStartCreatedAt) => void
- function prune: (args) => Promise<PruneResult>
@@ -918,6 +1155,12 @@
- function isAnySentinel: (m) => boolean
- const DOOM_LOOP_THRESHOLD
- _...1 more_
- `apps/server/src/services/inference/state-graph.ts`
- function createDefaultGraph: () => GraphNode[]
- function runGraph: (ctx, args, extra) => Promise<GraphResult>
- interface GraphState
- interface GraphResult
- type GraphNodeType
- `apps/server/src/services/inference/step-decision.ts`
- function decideStep: (input) => PreStepDecision
- function decidePostToolAction: (action, mistakeTracker) => PostToolDecision
@@ -934,12 +1177,14 @@
- `apps/server/src/services/inference/stream-phase.ts` — function executeStreamPhase: (ctx, args, session, messages, state, agent, // v1.11.8, web_search and web_fetch are stripped from the
// tool list sent to the LLM, so the model can't even attempt them.
webToolsEnabled) => Promise<StreamResult>
- `apps/server/src/services/inference/supervisor.ts` — function resolveSupervisorTurn: (latestUserMessage, agents, fallbackModel?) => Promise<SupervisorRoute | null>, interface SupervisorRoute
- `apps/server/src/services/inference/tool-call-parser.ts`
- function stripToolMarkup: (text, opts?) => string
- function extractToolCallBlocks: (buffer, log?) => ToolCallExtraction
- interface ParsedCall
- interface ToolCallExtraction
- `apps/server/src/services/inference/tool-phase.ts` — function executeToolPhase: (ctx, args, result, startedAt, session, projectRoot, agent?) => Promise<ToolPhaseResult>, interface ToolPhaseResult
- `apps/server/src/services/inference/tool-input-repair.ts` — function repairToolInput: (schema, unknown> | undefined, args, unknown>) => void, interface ToolInputRepair
- `apps/server/src/services/inference/tool-phase.ts` — function executeToolPhase: (ctx, args, result, startedAt, session, projectRoot, agent?, turnNumber?) => Promise<ToolPhaseResult>, interface ToolPhaseResult
- `apps/server/src/services/inference/tool-shim.ts`
- function extractToolCalls: (text) => ParsedToolCall[]
- function hasToolCallMarkup: (text) => boolean
@@ -955,20 +1200,26 @@
- `apps/server/src/services/inference/turn.ts`
- function runAssistantTurn: (ctx, args) => Promise<void>
- function runInference: (ctx, sessionId, chatId, assistantMessageId, signal?) => Promise<void>
- function runInferenceWithModel: (ctx, sessionId, chatId, assistantMessageId, modelOverride, compareGroupId, signal?) => Promise<void>
- function createInferenceRunner: (ctx, 'publishUser'>, publishUserFn, frame) => void
- `apps/server/src/services/mcp-client.ts`
- function initialize: (entries, logger) => Promise<void>
- function callTool: (prefixedName, args, unknown>) => Promise<unknown>
- function getServerPermission: (prefixedToolName) => McpPermission
- function setServerPermission: (serverName, permission) => void
- function getServerName: (prefixedToolName) => string | null
- function getTools: () => ToolDef<Record<string, unknown>>[]
- function getMcpServers: () => Array<
- function shutdown: () => Promise<void>
- function wrapMcpTool: (serverName, mcpTool) => ToolDef<Record<string, unknown>>
- _...2 more_
- _...6 more_
- `apps/server/src/services/mcp-config.ts`
- function substituteEnvVars: (value, log, unsetVars?) => unknown
- function loadMcpConfig: (configPath, log) => McpServerEntry[]
- interface McpServerEntry
- type McpServerConfig
- `apps/server/src/services/memory/bm25.ts` — class Bm25Ranker
- `apps/server/src/services/memory/embeddings.ts`
- function isEmbeddingAvailable: () => boolean
- function initEmbeddings: (modelPath?) => Promise<boolean>
- function embed: (texts) => Promise<number[][] | null>
- `apps/server/src/services/memory/entries.ts` — function parseMemoryEntries: (fileName, markdown) => MemoryEntry[], interface MemoryEntry
- `apps/server/src/services/memory/paths.ts`
- function getMemoryRoot: (projectRoot) => string
@@ -976,7 +1227,10 @@
- function ensureMemoryScaffold: (root) => Promise<void>
- type MemoryTopic
- `apps/server/src/services/memory/prompt.ts` — function formatMemoryBlock: (entries) => string
- `apps/server/src/services/memory/recall.ts` — function rankByRelevance: (query, entries) => MemoryEntry[], function loadMemoryForSession: (projectRoot, _sessionId?, query?) => Promise<string[]>
- `apps/server/src/services/memory/recall.ts`
- function rankByRelevance: (query, entries) => MemoryEntry[]
- function rankByHybrid: (query, entries) => Promise<MemoryEntry[]>
- function loadMemoryForSession: (projectRoot, _sessionId?, query?) => Promise<string[]>
- `apps/server/src/services/memory/scan.ts`
- function scanMemoryScopes: (scope) => Promise<MemoryEntry[]>
- function scanProjectMemory: (projectRoot) => Promise<MemoryEntry[]>
@@ -1007,6 +1261,11 @@
- function filterSecretEntries: (entries, pathOf) => void
- class SecretBlockedError
- const DEFAULT_SECURITY_IGNORE_FILETYPES: ReadonlyArray<string>
- `apps/server/src/services/session-snapshots.ts`
- function saveAgentSnapshot: (sql, chatId, data) => Promise<void>
- function loadAgentSnapshot: (sql, chatId) => Promise<AgentSnapshot | null>
- function deleteAgentSnapshot: (sql, chatId) => Promise<void>
- interface AgentSnapshot
- `apps/server/src/services/skill-invoke.ts`
- function runSkillInvokeTransaction: (sql, args) => Promise<
- function buildSkillInvokeSyntheticFrames: (chatId, result, toolCall, skillBody) => SkillInvokeSessionFrame[]
@@ -1037,8 +1296,53 @@
- _...2 more_
- `apps/server/src/services/task-model.ts` — function taskModelCompletion: (opts) => Promise<string>
- `apps/server/src/services/task-search-rewrite.ts` — function rewriteSearchQuery: (userMessage) => Promise<string>
- `apps/server/src/services/tool-traces.ts`
- function insertToolTrace: (sql, insert) => Promise<ToolTrace>
- function updateToolTrace: (sql, id, updates) => Promise<ToolTrace | null>
- interface ToolTrace
- interface ToolTraceInsert
- interface ToolTraceUpdate
- `apps/server/src/services/tools/background-subagent-tools.ts`
- function executeSpawnSubagent: (input, sql, sessionId) => Promise<Record<string, unknown>>
- function executeSubagentStatus: (input, sql) => Promise<Record<string, unknown>>
- function executeSubagentResult: (input, sql) => Promise<Record<string, unknown>>
- type SpawnSubagentInputT
- type SubagentStatusInputT
- type SubagentResultInputT
- _...6 more_
- `apps/server/src/services/tools/codecontext/factory.ts` — function makeCodecontextTool: (opts, unknown>;
mapArgs) => void
- `apps/server/src/services/tools/codecontext/get_code_health.ts`
- function executeGetCodeHealth: (input, projectPath) => Promise<string>
- type GetCodeHealthInputT
- const GetCodeHealthInput
- const getCodeHealth: ToolDef<GetCodeHealthInputT>
- `apps/server/src/services/tools/codecontext/get_code_impact.ts`
- function executeGetCodeImpact: (input, projectPath) => Promise<CodecontextResponse>
- type GetCodeImpactInputT
- const GetCodeImpactInput
- const getCodeImpact: ToolDef<GetCodeImpactInputT>
- `apps/server/src/services/tools/codecontext/get_code_map.ts`
- function executeGetCodeMap: (input, projectRoot) => Promise<CodeMapResponse>
- interface CodeMapResponse
- type GetCodeMapInputT
- const GetCodeMapInput
- const getCodeMap: ToolDef<GetCodeMapInputT>
- `apps/server/src/services/tools/codecontext/get_type_info.ts`
- function executeGetTypeInfo: (input, _projectPath?) => Promise<CodecontextResponse>
- type GetTypeInfoInputT
- const GetTypeInfoInput
- const getTypeInfo: ToolDef<GetTypeInfoInputT>
- `apps/server/src/services/tools/codecontext/get_wiki_article.ts`
- function executeGetWikiArticle: (input, projectPath) => Promise<string>
- type GetWikiArticleInputT
- const GetWikiArticleInput
- const getWikiArticle: ToolDef<GetWikiArticleInputT>
- `apps/server/src/services/tools/execute-command.ts`
- function executeRunCommand: (input, projectRoot) => Promise<RunCommandOutput>
- type RunCommandInputT
- type RunCommandOutput
- const runCommand: ToolDef<RunCommandInputT>
- `apps/server/src/services/tools/registry.ts` — function appendMcpTools: (mcpTools) => void, function toolJsonSchemas: () => ToolJsonSchema[]
- `apps/server/src/services/tools/tiers.ts`
- function resolveToolTier: (tier) => readonly string[]
@@ -1064,6 +1368,39 @@
- interface WebSearchOutput
- type WebSearchInputT
- const webSearch: ToolDef<WebSearchInputT>
- `apps/server/src/services/workflow/catalog.ts`
- function fingerprintAgentTask: (prompt, spec, unknown>, args) => string
- function getBuiltinWorkflows: () => BuiltinWorkflow[]
- function getBuiltinWorkflow: (name) => BuiltinWorkflow | undefined
- function mergeBuiltinWorkflows: (fileWorkflows) => Array<
- interface BuiltinWorkflow
- const meta
- `apps/server/src/services/workflow/discovery.ts`
- function isBuiltinWorkflow: (meta) => boolean
- function discoverWorkflows: (projectRoot) => WorkflowMeta[]
- function findWorkflow: (name, projectRoot) => WorkflowMeta | undefined
- function isValidWorkflowPath: (filePath) => boolean
- interface WorkflowMeta
- `apps/server/src/services/workflow/manager.ts`
- class WorkflowManager
- interface WorkflowMetaInfo
- type WorkflowEventHandler
- `apps/server/src/services/workflow/resumability.ts`
- function cacheKey: (spec, args) => string
- function getCachedResult: (key) => CachedResult | null
- function setCachedResult: (key, result) => void
- function invalidateRun: (runKey) => void
- function clearCache: () => void
- function cacheSize: () => number
- _...1 more_
- `apps/server/src/services/workflow/sandbox.ts`
- function transformEsmToCjs: (code) => string
- function name: (...) => void
- function isEsmSyntax: (code) => boolean
- function buildSandbox: (context) => Record<string, unknown>
- function loadWorkflowScript: (sourceFile, context) => (...args: unknown[]) => Promise<unknown>
- function loadWorkflowScriptFromCode: (code, context, filename?) => (...args: unknown[]) => Promise<unknown>
- _...3 more_
- `apps/server/src/utils/string-utils.ts` — function stripQuotes: (s) => string
- `apps/web/src/api/client.ts`
- class ApiError
@@ -1084,7 +1421,7 @@
- interface TerminalSelectionActions
- interface TerminalSelection
- `apps/web/src/hooks/terminal/useTerminalSocket.ts`
- function useTerminalSocket: ({...}, sessionId, paneId, fit, getSize, setSize, }) => TerminalSocket
- function useTerminalSocket: ({...}, sessionId, paneId, description, parentAgent, fit, getSize, setSize, }) => TerminalSocket
- interface TerminalSocket
- type ConnState
- `apps/web/src/hooks/useActivePane.ts`
@@ -1108,7 +1445,8 @@
- interface ThroughputSample
- `apps/web/src/hooks/useCoderUserEvents.ts` — function useCoderUserEvents: () => void
- `apps/web/src/hooks/useDiffPreferences.ts` — function useDiffPreferences: () => void, interface DiffPreferences
- `apps/web/src/hooks/useGitDiff.ts` — function useGitDiff: (projectId) => void
- `apps/web/src/hooks/useDraftPersistence.ts` — function useDraftPersistence: (chatId) => DraftPersistenceResult, interface DraftPersistenceResult
- `apps/web/src/hooks/useGitDiff.ts` — function useGitDiff: (projectId, hideWhitespace) => void
- `apps/web/src/hooks/useLongPress.ts` — function useLongPress: (callback) => void
- `apps/web/src/hooks/useProjectGit.ts` — function useProjectGit: (projectId) => GitMeta | null
- `apps/web/src/hooks/useProviderSnapshot.ts` — function refreshProviderSnapshot: (cwd?) => Promise<ProviderSnapshotEntry[]>, function useProviderSnapshot: (cwd?) => ProviderSnapshotEntry[] | null
@@ -1121,6 +1459,7 @@
- `apps/web/src/hooks/useSessions.ts` — function useSessions: (projectId) => void
- `apps/web/src/hooks/useSidebar.ts` — function useSidebar: () => void
- `apps/web/src/hooks/useSkills.ts` — function useSkills: () => void
- `apps/web/src/hooks/useTerminals.ts` — function useTerminals: () => TerminalRegistration[]
- `apps/web/src/hooks/useUserEvents.ts` — function useUserEvents: () => void
- `apps/web/src/hooks/useViewport.ts` — function useViewport: () => ViewportSnapshot, interface ViewportSnapshot
- `apps/web/src/hooks/useWorkspacePanes.ts`
@@ -1183,7 +1522,16 @@
- interface ThemeMeta
- type ThemeId
- _...5 more_
- `apps/web/src/lib/tool-utils.ts`
- function isMcpTool: (name) => boolean
- function extractServerName: (name) => string | null
- function extractToolName: (name) => string | null
- const BUILT_IN_TOOLS
- `apps/web/src/lib/utils.ts` — function cn: (...inputs) => void
- `apps/web/src/stores/useDiffCommentStore.ts`
- function useDiffComments: (sessionId, mode) => void
- interface DiffComment
- interface DiffCommentTarget
- `apps/web/src/utils/diff-layout.ts`
- function parseDiff: (diffBody) => ParsedDiffFile[]
- function buildSplitRows: (file) => SplitRow[]
@@ -1344,8 +1692,11 @@
- `CONTAINER_GUIDANCE_FILE` **required** — apps/server/src/services/__tests__/system-prompt.test.ts
- `CONTEXT7_API_KEY` (has default) — .env
- `DATABASE_URL` (has default) — .env.example
- `DEEPSEEK_API_KEY` (has default) — .env
- `DEEPSEEK_BASE_URL` (has default) — .env
- `DEFAULT_MODEL` (has default) — .env.example
- `DEV_REMOTE_USER` **required** — apps/web/vite.config.ts
- `EMBEDDING_MODEL_PATH` **required** — apps/server/src/services/memory/embeddings.ts
- `GITEA_BASE_URL` (has default) — .env
- `GITEA_SSH_HOST` (has default) — .env
- `GITEA_TOKEN` (has default) — .env
@@ -1353,6 +1704,7 @@
- `LLAMA_SWAP_URL` (has default) — .env.example
- `MCP_TEST_MISSING` **required** — apps/server/src/services/__tests__/mcp-config.test.ts
- `MCP_TEST_SECRET` **required** — apps/server/src/services/__tests__/mcp-config.test.ts
- `MEMORY_SEARCH` **required** — apps/server/src/services/memory/recall.ts
- `NODE_ENV` (has default) — .env.example
- `PORT` (has default) — .env.example
- `POSTGRES_PASSWORD` (has default) — .env.example
@@ -1368,6 +1720,10 @@
- `apps/web/vite.config.ts`
- `docker-compose.yml`
## Key Dependencies
- better-sqlite3: ^11.10.0
---
# Middleware
@@ -1379,6 +1735,7 @@
- turn-guard — `apps/coder/src/services/backends/turn-guard.ts`
- get_middleware — `apps/server/src/services/tools/codecontext/get_middleware.ts`
- authoring — `conductor/src/flows/authoring.ts`
- spec — `openspec/changes/add-behavioral-engine/specs/audit-middleware/spec.md`
## custom
- write_guard.test — `apps/coder/src/services/__tests__/write_guard.test.ts`
@@ -1400,39 +1757,39 @@
## Most Imported Files (change these carefully)
- `apps/coder/src/db.ts` — imported by **40** files
- `apps/server/src/types/api.ts` — imported by **28** files
- `apps/server/src/db.ts` — imported by **25** files
- `apps/coder/src/db.ts` — imported by **44** files
- `apps/server/src/types/api.ts` — imported by **34** files
- `apps/server/src/db.ts` — imported by **32** files
- `packages/ion/src/cli/utils.ts` — imported by **24** files
- `apps/coder/src/services/tools/types.ts` — imported by **18** files
- `apps/coder/src/conductor/types.ts` — imported by **14** files
- `apps/coder/src/conductor/types.ts` — imported by **16** files
- `apps/server/src/services/tools.ts` — imported by **15** files
- `apps/coder/src/services/agent-backend.ts` — imported by **14** files
- `apps/coder/src/services/acp-tool-snapshot.ts` — imported by **14** files
- `apps/server/src/config.ts` — imported by **14** files
- `apps/server/src/services/tools/codecontext/factory.ts` — imported by **14** files
- `apps/server/src/services/tools.ts` — imported by **13** files
- `apps/server/src/services/tools/types.ts` — imported by **13** files
- `conductor/src/types.ts` — imported by **13** files
- `apps/coder/src/services/provider-config-registry.ts` — imported by **12** files
- `apps/server/src/config.ts` — imported by **12** files
- `apps/coder/src/config.ts` — imported by **11** files
- `apps/coder/src/services/provider-types.ts` — imported by **11** files
- `apps/server/src/services/broker.ts` — imported by **10** files
- `apps/server/src/services/agents.ts` — imported by **10** files
- `apps/server/src/services/path_guard.ts` — imported by **10** files
- `apps/coder/src/services/pending_changes.ts` — imported by **9** files
- `apps/server/src/services/broker.ts` — imported by **9** files
- `apps/server/src/services/path_guard.ts` — imported by **9** files
- `apps/server/src/services/inference/payload.ts` — imported by **9** files
## Import Map (who imports what)
- `apps/coder/src/db.ts``apps/coder/src/index.ts`, `apps/coder/src/routes/__tests__/agent-sessions.routes.test.ts`, `apps/coder/src/routes/__tests__/chat-resolve.test.ts`, `apps/coder/src/routes/__tests__/providers.routes.test.ts`, `apps/coder/src/routes/agent-sessions.ts` +35 more
- `apps/server/src/types/api.ts``apps/server/src/routes/chats.ts`, `apps/server/src/routes/messages.ts`, `apps/server/src/routes/models.ts`, `apps/server/src/routes/projects.ts`, `apps/server/src/routes/sessions.ts` +23 more
- `apps/server/src/db.ts``apps/server/src/index.ts`, `apps/server/src/routes/agents.ts`, `apps/server/src/routes/artifacts.ts`, `apps/server/src/routes/chats.ts`, `apps/server/src/routes/messages.ts` +20 more
- `apps/coder/src/db.ts``apps/coder/src/index.ts`, `apps/coder/src/routes/__tests__/agent-sessions.routes.test.ts`, `apps/coder/src/routes/__tests__/chat-resolve.test.ts`, `apps/coder/src/routes/__tests__/providers.routes.test.ts`, `apps/coder/src/routes/agent-sessions.ts` +39 more
- `apps/server/src/types/api.ts``apps/server/src/routes/chats.ts`, `apps/server/src/routes/messages.ts`, `apps/server/src/routes/models.ts`, `apps/server/src/routes/projects.ts`, `apps/server/src/routes/sessions.ts` +29 more
- `apps/server/src/db.ts``apps/server/src/index.ts`, `apps/server/src/routes/agents.ts`, `apps/server/src/routes/analytics.ts`, `apps/server/src/routes/artifacts.ts`, `apps/server/src/routes/chats.ts` +27 more
- `packages/ion/src/cli/utils.ts``packages/ion/src/cli/commands/abandon.ts`, `packages/ion/src/cli/commands/abandon.ts`, `packages/ion/src/cli/commands/approve.ts`, `packages/ion/src/cli/commands/approve.ts`, `packages/ion/src/cli/commands/cleanup.ts` +19 more
- `apps/coder/src/services/tools/types.ts``apps/coder/src/routes/messages.ts`, `apps/coder/src/services/dispatcher.ts`, `apps/coder/src/services/tools/adapter.ts`, `apps/coder/src/services/tools/apply_pending.ts`, `apps/coder/src/services/tools/check_task_status.ts` +13 more
- `apps/coder/src/conductor/types.ts``apps/coder/src/conductor/flows/_util.ts`, `apps/coder/src/conductor/flows/architectural-analysis.ts`, `apps/coder/src/conductor/flows/authoring.ts`, `apps/coder/src/conductor/flows/code-review.ts`, `apps/coder/src/conductor/flows/discovery.ts` +9 more
- `apps/coder/src/conductor/types.ts``apps/coder/src/conductor/flows/_util.ts`, `apps/coder/src/conductor/flows/architectural-analysis.ts`, `apps/coder/src/conductor/flows/authoring.ts`, `apps/coder/src/conductor/flows/code-review.ts`, `apps/coder/src/conductor/flows/discovery.ts` +11 more
- `apps/server/src/services/tools.ts``apps/server/src/index.ts`, `apps/server/src/services/__tests__/agent-allowlist.test.ts`, `apps/server/src/services/agents.ts`, `apps/server/src/services/inference/stream-phase-adapter.ts`, `apps/server/src/services/inference/stream-phase.ts` +10 more
- `apps/coder/src/services/agent-backend.ts``apps/coder/src/routes/lifecycle.ts`, `apps/coder/src/services/__tests__/stream-json-parser.test.ts`, `apps/coder/src/services/acp-event-map.ts`, `apps/coder/src/services/agent-pool.ts`, `apps/coder/src/services/backends/__tests__/claude-sdk-map.test.ts` +9 more
- `apps/coder/src/services/acp-tool-snapshot.ts``apps/coder/src/services/__tests__/acp-event-map.test.ts`, `apps/coder/src/services/__tests__/frame-emitter.test.ts`, `apps/coder/src/services/__tests__/stream-json-parser.test.ts`, `apps/coder/src/services/acp-dispatch.ts`, `apps/coder/src/services/acp-event-map.ts` +9 more
- `apps/server/src/services/tools/codecontext/factory.ts``apps/server/src/services/tools/codecontext/get_blast_radius.ts`, `apps/server/src/services/tools/codecontext/get_call_graph.ts`, `apps/server/src/services/tools/codecontext/get_codebase_overview.ts`, `apps/server/src/services/tools/codecontext/get_dependencies.ts`, `apps/server/src/services/tools/codecontext/get_file_analysis.ts` +9 more
- `apps/server/src/services/tools.ts``apps/server/src/index.ts`, `apps/server/src/services/__tests__/agent-allowlist.test.ts`, `apps/server/src/services/agents.ts`, `apps/server/src/services/inference/stream-phase-adapter.ts`, `apps/server/src/services/inference/stream-phase.ts` +8 more
- `apps/server/src/config.ts``apps/server/src/db.ts`, `apps/server/src/index.ts`, `apps/server/src/routes/chats.ts`, `apps/server/src/routes/messages.ts`, `apps/server/src/routes/models.ts` +9 more
---

View File

@@ -10,23 +10,34 @@
- **AttachmentChip** — props: attachment, onRemove, onPreview — `apps/web/src/components/AttachmentChip.tsx`
- **AttachmentPreviewModal** — props: attachment, onClose — `apps/web/src/components/AttachmentPreviewModal.tsx`
- **BottomSheet** — props: open, onClose, title — `apps/web/src/components/BottomSheet.tsx`
- **CacheShapeBadge** — props: cacheTokens, totalTokens — `apps/web/src/components/CacheShapeBadge.tsx`
- **CapHitSentinel** — props: message, capHitPosition, isLatest — `apps/web/src/components/CapHitSentinel.tsx`
- **ChatInput** — props: disabled, projectId, agentId, onAgentChange, sessionId, webSearchEnabled, onSend, onForceSend, generating, onStop — `apps/web/src/components/ChatInput.tsx`
- **ChatTabBar** — props: pane, tabs, tabNumbers, onSwitchTab, onRemoveTab, onCloseOthers, onCloseToRight, onCloseAll, onNewTab, onSplitPane — `apps/web/src/components/ChatTabBar.tsx`
- **ChatThroughput** — props: chatId, className — `apps/web/src/components/ChatThroughput.tsx`
- **CodeBlock** — props: code, lang — `apps/web/src/components/CodeBlock.tsx`
- **ComparePane** — props: models, responses, onClose — `apps/web/src/components/ComparePane.tsx`
- **ContextMeter** — props: messages, modelContextLimit, sessionCostUsd — `apps/web/src/components/ContextMeter.tsx`
- **CreateProjectModal** — props: open, onOpenChange — `apps/web/src/components/CreateProjectModal.tsx`
- **DiffSnippet** — props: diff — `apps/web/src/components/DiffSnippet.tsx`
- **DiffSplitView** — props: file, wrapLines — `apps/web/src/components/DiffSplitView.tsx`
- **DoomLoopSentinel** — props: message — `apps/web/src/components/DoomLoopSentinel.tsx`
- **DropOverlay** — props: visible — `apps/web/src/components/DropOverlay.tsx`
- **EmptyState** — props: icon, title, description, action, className — `apps/web/src/components/EmptyState.tsx`
- **FileMentionPopover** — props: query, files, anchorRect, onSelect, onClose — `apps/web/src/components/FileMentionPopover.tsx`
- **FileViewerOverlay** — props: path, content, lang, onClose — `apps/web/src/components/FileViewerOverlay.tsx`
- **FlowLauncherDialog** — `apps/web/src/components/FlowLauncherDialog.tsx`
- **GitDiffView** — props: result, loading, error, mode, onSelectMode, onRefresh, mutating, mutateError, onStage, onUnstage — `apps/web/src/components/GitDiffView.tsx`
- **HtmlArtifactPane** — props: chatId, state, onClose — `apps/web/src/components/HtmlArtifactPane.tsx`
- **InferenceSettings** — `apps/web/src/components/InferenceSettings.tsx`
- **InlineReviewEditor** — props: initialBody, onSave, onCancel — `apps/web/src/components/InlineReviewEditor.tsx`
- **InlineReviewGutterCell** — props: lineNumber, type, hasComments, canComment, onClick — `apps/web/src/components/InlineReviewGutterCell.tsx`
- **InlineReviewThread** — props: comments, onEditComment, onDeleteComment — `apps/web/src/components/InlineReviewThread.tsx`
- **KeyboardShortcutsDialog** — props: open, onOpenChange — `apps/web/src/components/KeyboardShortcutsDialog.tsx`
- **MarkdownArtifactPane** — props: chatId, state, onClose — `apps/web/src/components/MarkdownArtifactPane.tsx`
- **MarkdownRenderer** — props: content — `apps/web/src/components/MarkdownRenderer.tsx`
- **McpPermissionDialog** — props: toolCallId, toolName, toolArgs, chatId, open, onClose — `apps/web/src/components/McpPermissionDialog.tsx`
- **McpResponseDisplay** — props: toolCall, toolResult — `apps/web/src/components/McpResponseDisplay.tsx`
- **MessageBubble** — props: message, sessionChats, capHitInfo, actions, hideActions, hasCheckpoint, restoreDisabled — `apps/web/src/components/MessageBubble.tsx`
- **MessageList** — props: messages, sessionChats — `apps/web/src/components/MessageList.tsx`
- **MobileTabSwitcher** — props: panes, activePaneIdx, chats, onSwitchPane, onRemovePane, onRenameChat — `apps/web/src/components/MobileTabSwitcher.tsx`
@@ -38,12 +49,14 @@
- **RequestReadAccessCard** — props: toolCall, toolResult, chatId — `apps/web/src/components/RequestReadAccessCard.tsx`
- **RightRail** — props: projectId, sessionId — `apps/web/src/components/RightRail.tsx`
- **SessionLandingPage** — props: projectId, sessionId, agentId, onAgentChange, onSend, onSkillInvoke, createChat, chats, onOpenChat, onUnarchiveChat — `apps/web/src/components/SessionLandingPage.tsx`
- **SessionTimeline** — props: messages, onClose, onScrollToMessage — `apps/web/src/components/SessionTimeline.tsx`
- **SlashCommandPicker** — props: query, items, groups, inputRef, onSelect, onClose, emptyLabel — `apps/web/src/components/SlashCommandPicker.tsx`
- **StaleStreamBanner** — props: onRetry, onDiscard — `apps/web/src/components/StaleStreamBanner.tsx`
- **StatusDot** — props: chatId, className — `apps/web/src/components/StatusDot.tsx`
- **ThemePicker** — `apps/web/src/components/ThemePicker.tsx`
- **ToolCallGroup** — props: runs — `apps/web/src/components/ToolCallGroup.tsx`
- **ToolCallLine** — props: run, insideGroup — `apps/web/src/components/ToolCallLine.tsx`
- **ToolCallLine** — props: run, insideGroup, chatId`apps/web/src/components/ToolCallLine.tsx`
- **TraceViewer** — props: chatId — `apps/web/src/components/TraceViewer.tsx`
- **Workspace** — props: sessionId, projectId, agentId, onAgentChange, panesHook, chatsHook, session, project, onAddPane — `apps/web/src/components/Workspace.tsx`
- **AddProviderModal** — props: open, onOpenChange, onAdded — `apps/web/src/components/coder/AddProviderModal.tsx`
- **ProvidersSettings** — `apps/web/src/components/coder/ProvidersSettings.tsx`
@@ -52,20 +65,30 @@
- **ThemeFx** — `apps/web/src/components/fx/ThemeFx.tsx`
- **ClaudeIcon** — props: size, className — `apps/web/src/components/icons/ProviderIcons.tsx`
- **OpenCodeIcon** — props: size, className — `apps/web/src/components/icons/ProviderIcons.tsx`
- **ActionRow** — props: message, actions, hiddenSet, hasCheckpoint, restoreDisabled — `apps/web/src/components/message-parts/ActionRow.tsx`
- **CompactCard** — props: message, sessionChats — `apps/web/src/components/message-parts/CompactCard.tsx`
- **MistakeRecoverySentinel** — props: message — `apps/web/src/components/message-parts/MistakeRecoverySentinel.tsx`
- **ReasoningBlock** — props: text, streaming — `apps/web/src/components/message-parts/ReasoningBlock.tsx`
- **SendToTerminalMenu** — `apps/web/src/components/message-parts/SendToTerminalMenu.tsx`
- **StatsLine** — props: message — `apps/web/src/components/message-parts/StatsLine.tsx`
- **SummaryCard** — props: message — `apps/web/src/components/message-parts/SummaryCard.tsx`
- **ArenaPane** — props: state, onClose — `apps/web/src/components/panes/ArenaPane.tsx`
- **ChatPane** — props: sessionId, chatId, projectId, agentId, onAgentChange, sessionChats, webSearchEnabled — `apps/web/src/components/panes/ChatPane.tsx`
- **CoderMessageList** — props: messages, chatId, footer, actions, checkpointMessageIds, restoreDisabled — `apps/web/src/components/panes/CoderMessageList.tsx`
- **CoderPane** — props: sessionId, paneId, chatId, chatPending, projectPath, onConnectedChange, onAgentLabelChange — `apps/web/src/components/panes/CoderPane.tsx`
- **OrchestratorPane** — props: state, onClose — `apps/web/src/components/panes/OrchestratorPane.tsx`
- **SettingsPane** — props: session, project, maximized, onToggleMaximize, onClose, isMobile — `apps/web/src/components/panes/SettingsPane.tsx`
- **TerminalPane** — props: sessionId, paneId, label, active — `apps/web/src/components/panes/TerminalPane.tsx`
- **TerminalPane** — props: sessionId, paneId, label, description, parentAgent, active — `apps/web/src/components/panes/TerminalPane.tsx`
- **FloatingMenu** — props: x, y, hasSelection, chatInputs, onCopy, onPaste, onSelectAll, onSearch, onSendToChat, onDismiss — `apps/web/src/components/panes/terminal/FloatingMenu.tsx`
- **SearchBar** — props: searchRef, theme, onClose — `apps/web/src/components/panes/terminal/SearchBar.tsx`
- **TerminalHotkeyBar** — props: ctrlArmed, onSendBytes, onArmCtrl, onFit — `apps/web/src/components/panes/terminal/TerminalHotkeyBar.tsx`
- **RightRailDrawerProvider** — `apps/web/src/hooks/useRightRailDrawer.tsx`
- **SidebarDrawerProvider** — `apps/web/src/hooks/useSidebarDrawer.tsx`
- **PATH_REGEX** — `apps/web/src/lib/linkify-paths.tsx`
- **Analytics** — `apps/web/src/pages/Analytics.tsx`
- **Home** — `apps/web/src/pages/Home.tsx`
- **Memory** — `apps/web/src/pages/Memory.tsx`
- **Project** — `apps/web/src/pages/Project.tsx`
- **Results** — `apps/web/src/pages/Results.tsx`
- **Session** — `apps/web/src/pages/Session.tsx`
- **Settings** — `apps/web/src/pages/Settings.tsx`

View File

@@ -25,8 +25,11 @@
- `CONTAINER_GUIDANCE_FILE` **required** — apps/server/src/services/__tests__/system-prompt.test.ts
- `CONTEXT7_API_KEY` (has default) — .env
- `DATABASE_URL` (has default) — .env.example
- `DEEPSEEK_API_KEY` (has default) — .env
- `DEEPSEEK_BASE_URL` (has default) — .env
- `DEFAULT_MODEL` (has default) — .env.example
- `DEV_REMOTE_USER` **required** — apps/web/vite.config.ts
- `EMBEDDING_MODEL_PATH` **required** — apps/server/src/services/memory/embeddings.ts
- `GITEA_BASE_URL` (has default) — .env
- `GITEA_SSH_HOST` (has default) — .env
- `GITEA_TOKEN` (has default) — .env
@@ -34,6 +37,7 @@
- `LLAMA_SWAP_URL` (has default) — .env.example
- `MCP_TEST_MISSING` **required** — apps/server/src/services/__tests__/mcp-config.test.ts
- `MCP_TEST_SECRET` **required** — apps/server/src/services/__tests__/mcp-config.test.ts
- `MEMORY_SEARCH` **required** — apps/server/src/services/memory/recall.ts
- `NODE_ENV` (has default) — .env.example
- `PORT` (has default) — .env.example
- `POSTGRES_PASSWORD` (has default) — .env.example
@@ -48,3 +52,7 @@
- `Dockerfile`
- `apps/web/vite.config.ts`
- `docker-compose.yml`
## Key Dependencies
- better-sqlite3: ^11.10.0

View File

@@ -2,36 +2,36 @@
## Most Imported Files (change these carefully)
- `apps/coder/src/db.ts` — imported by **40** files
- `apps/server/src/types/api.ts` — imported by **28** files
- `apps/server/src/db.ts` — imported by **25** files
- `apps/coder/src/db.ts` — imported by **44** files
- `apps/server/src/types/api.ts` — imported by **34** files
- `apps/server/src/db.ts` — imported by **32** files
- `packages/ion/src/cli/utils.ts` — imported by **24** files
- `apps/coder/src/services/tools/types.ts` — imported by **18** files
- `apps/coder/src/conductor/types.ts` — imported by **14** files
- `apps/coder/src/conductor/types.ts` — imported by **16** files
- `apps/server/src/services/tools.ts` — imported by **15** files
- `apps/coder/src/services/agent-backend.ts` — imported by **14** files
- `apps/coder/src/services/acp-tool-snapshot.ts` — imported by **14** files
- `apps/server/src/config.ts` — imported by **14** files
- `apps/server/src/services/tools/codecontext/factory.ts` — imported by **14** files
- `apps/server/src/services/tools.ts` — imported by **13** files
- `apps/server/src/services/tools/types.ts` — imported by **13** files
- `conductor/src/types.ts` — imported by **13** files
- `apps/coder/src/services/provider-config-registry.ts` — imported by **12** files
- `apps/server/src/config.ts` — imported by **12** files
- `apps/coder/src/config.ts` — imported by **11** files
- `apps/coder/src/services/provider-types.ts` — imported by **11** files
- `apps/server/src/services/broker.ts` — imported by **10** files
- `apps/server/src/services/agents.ts` — imported by **10** files
- `apps/server/src/services/path_guard.ts` — imported by **10** files
- `apps/coder/src/services/pending_changes.ts` — imported by **9** files
- `apps/server/src/services/broker.ts` — imported by **9** files
- `apps/server/src/services/path_guard.ts` — imported by **9** files
- `apps/server/src/services/inference/payload.ts` — imported by **9** files
## Import Map (who imports what)
- `apps/coder/src/db.ts``apps/coder/src/index.ts`, `apps/coder/src/routes/__tests__/agent-sessions.routes.test.ts`, `apps/coder/src/routes/__tests__/chat-resolve.test.ts`, `apps/coder/src/routes/__tests__/providers.routes.test.ts`, `apps/coder/src/routes/agent-sessions.ts` +35 more
- `apps/server/src/types/api.ts``apps/server/src/routes/chats.ts`, `apps/server/src/routes/messages.ts`, `apps/server/src/routes/models.ts`, `apps/server/src/routes/projects.ts`, `apps/server/src/routes/sessions.ts` +23 more
- `apps/server/src/db.ts``apps/server/src/index.ts`, `apps/server/src/routes/agents.ts`, `apps/server/src/routes/artifacts.ts`, `apps/server/src/routes/chats.ts`, `apps/server/src/routes/messages.ts` +20 more
- `apps/coder/src/db.ts``apps/coder/src/index.ts`, `apps/coder/src/routes/__tests__/agent-sessions.routes.test.ts`, `apps/coder/src/routes/__tests__/chat-resolve.test.ts`, `apps/coder/src/routes/__tests__/providers.routes.test.ts`, `apps/coder/src/routes/agent-sessions.ts` +39 more
- `apps/server/src/types/api.ts``apps/server/src/routes/chats.ts`, `apps/server/src/routes/messages.ts`, `apps/server/src/routes/models.ts`, `apps/server/src/routes/projects.ts`, `apps/server/src/routes/sessions.ts` +29 more
- `apps/server/src/db.ts``apps/server/src/index.ts`, `apps/server/src/routes/agents.ts`, `apps/server/src/routes/analytics.ts`, `apps/server/src/routes/artifacts.ts`, `apps/server/src/routes/chats.ts` +27 more
- `packages/ion/src/cli/utils.ts``packages/ion/src/cli/commands/abandon.ts`, `packages/ion/src/cli/commands/abandon.ts`, `packages/ion/src/cli/commands/approve.ts`, `packages/ion/src/cli/commands/approve.ts`, `packages/ion/src/cli/commands/cleanup.ts` +19 more
- `apps/coder/src/services/tools/types.ts``apps/coder/src/routes/messages.ts`, `apps/coder/src/services/dispatcher.ts`, `apps/coder/src/services/tools/adapter.ts`, `apps/coder/src/services/tools/apply_pending.ts`, `apps/coder/src/services/tools/check_task_status.ts` +13 more
- `apps/coder/src/conductor/types.ts``apps/coder/src/conductor/flows/_util.ts`, `apps/coder/src/conductor/flows/architectural-analysis.ts`, `apps/coder/src/conductor/flows/authoring.ts`, `apps/coder/src/conductor/flows/code-review.ts`, `apps/coder/src/conductor/flows/discovery.ts` +9 more
- `apps/coder/src/conductor/types.ts``apps/coder/src/conductor/flows/_util.ts`, `apps/coder/src/conductor/flows/architectural-analysis.ts`, `apps/coder/src/conductor/flows/authoring.ts`, `apps/coder/src/conductor/flows/code-review.ts`, `apps/coder/src/conductor/flows/discovery.ts` +11 more
- `apps/server/src/services/tools.ts``apps/server/src/index.ts`, `apps/server/src/services/__tests__/agent-allowlist.test.ts`, `apps/server/src/services/agents.ts`, `apps/server/src/services/inference/stream-phase-adapter.ts`, `apps/server/src/services/inference/stream-phase.ts` +10 more
- `apps/coder/src/services/agent-backend.ts``apps/coder/src/routes/lifecycle.ts`, `apps/coder/src/services/__tests__/stream-json-parser.test.ts`, `apps/coder/src/services/acp-event-map.ts`, `apps/coder/src/services/agent-pool.ts`, `apps/coder/src/services/backends/__tests__/claude-sdk-map.test.ts` +9 more
- `apps/coder/src/services/acp-tool-snapshot.ts``apps/coder/src/services/__tests__/acp-event-map.test.ts`, `apps/coder/src/services/__tests__/frame-emitter.test.ts`, `apps/coder/src/services/__tests__/stream-json-parser.test.ts`, `apps/coder/src/services/acp-dispatch.ts`, `apps/coder/src/services/acp-event-map.ts` +9 more
- `apps/server/src/services/tools/codecontext/factory.ts``apps/server/src/services/tools/codecontext/get_blast_radius.ts`, `apps/server/src/services/tools/codecontext/get_call_graph.ts`, `apps/server/src/services/tools/codecontext/get_codebase_overview.ts`, `apps/server/src/services/tools/codecontext/get_dependencies.ts`, `apps/server/src/services/tools/codecontext/get_file_analysis.ts` +9 more
- `apps/server/src/services/tools.ts``apps/server/src/index.ts`, `apps/server/src/services/__tests__/agent-allowlist.test.ts`, `apps/server/src/services/agents.ts`, `apps/server/src/services/inference/stream-phase-adapter.ts`, `apps/server/src/services/inference/stream-phase.ts` +8 more
- `apps/server/src/config.ts``apps/server/src/db.ts`, `apps/server/src/index.ts`, `apps/server/src/routes/chats.ts`, `apps/server/src/routes/messages.ts`, `apps/server/src/routes/models.ts` +9 more

View File

@@ -14,8 +14,17 @@
- function ensureSession: (tmuxConfPath, sessionName, projectRoot, log, cols?, rows?) => Promise<void>
- function killSession: (tmuxConfPath, sessionName) => Promise<boolean>
- function capturePane: (tmuxConfPath, sessionName, lines) => Promise<string>
- _...1 more_
- `apps/booterm/src/pty/pty.ts` — function attachPty: (opts) => IPty
- `apps/booterm/src/ws/attach.ts` — function registerWsAttachRoute: (app, tmuxConfPath) => void
- `apps/booterm/src/pty/registry.ts`
- function register: (sessionId, paneId, projectPath, title?, opts?) => void
- function unregister: (paneId) => void
- function touchActivity: (paneId) => void
- function list: () => SessionMeta[]
- function get: (paneId) => SessionMeta | undefined
- function setPendingMetadata: (paneId, meta) => void
- _...8 more_
- `apps/booterm/src/ws/attach.ts` — function registerWsAttachRoute: (app, tmuxConfPath, idleTimeoutSeconds?, absoluteTimeoutSeconds?) => void
- `apps/coder/src/conductor/contracts.ts`
- function produceContract: (contracts) => string
- function reviewContract: (contracts) => string
@@ -102,7 +111,7 @@
- function classifyLane: (battleType, _identity, model, localModels) => ContestantLane
- function nextLocalContestant: (contestants) => string | null
- function isBattleComplete: (contestants) => boolean
- function computeBenchmark: (startedAt, endedAt, costTokens, lane) => Benchmark
- function computeBenchmark: (startedAt, endedAt, costTokens, lane, tokenBreakdown) => Benchmark
- function sanitizeSlug: (s) => string
- function buildBattleSlug: (battleId, battleType, createdAt) => string
- _...7 more_
@@ -166,6 +175,7 @@
- function stepEndedToUsage: (props) => StepUsage
- interface StepEndedProps
- interface StepUsage
- `apps/coder/src/services/backends/paseo.ts` — class PaseoBackend, interface PaseoBackendDeps
- `apps/coder/src/services/backends/pushable-iterable.ts` — function createPushable: () => Pushable<T>, interface Pushable
- `apps/coder/src/services/backends/turn-guard.ts`
- function armAbortGuard: (g) => void
@@ -174,6 +184,30 @@
- interface AbortTerminalGuard
- `apps/coder/src/services/backends/warm-acp-routing.ts` — function shouldUseWarmBackend: (task) => boolean, function isTurnOkForStopReason: (stopReason) => boolean
- `apps/coder/src/services/backends/warm-acp.ts` — class WarmAcpBackend, interface WarmAcpBackendDeps
- `apps/coder/src/services/behavioral/generation.ts`
- function createExecutionPlan: (observational, actionable, previouslyApplied, disambiguationGroups, lowCriticality) => BatchExecutionPlan[]
- function getRetryTemperatures: (baseTemp, maxAttempts) => number[]
- class SchematicGenerator
- class DefaultSchematicGenerator
- interface ObservationalOutput
- interface ActionableOutput
- _...7 more_
- `apps/coder/src/services/behavioral/matching.ts`
- function matchWithRetry: (fn) => void
- function executeBatchesParallel: (batches, _generationInfo) => Promise<GuidelineMatchingResult>
- function createScoredMatch: (guidelineId, score, rationale) => ScoredMatch
- class GuidelineMatchingBatchError
- class ObservationalGuidelineMatchingBatch
- class ActionableGuidelineMatchingBatch
- _...25 more_
- `apps/coder/src/services/behavioral/resolver.ts`
- class RelationalResolver
- interface RelationshipEntity
- interface Relationship
- interface RelationshipStore
- interface ResolvedEntity
- interface Resolution
- _...8 more_
- `apps/coder/src/services/cancel-registry.ts` — function createCancelRegistry: () => CancelRegistry, interface CancelRegistry
- `apps/coder/src/services/checkpoints.ts`
- function buildShadowCommitCommand: (worktreePath, id) => string
@@ -184,7 +218,15 @@
- interface RestoreCheckpointResult
- _...1 more_
- `apps/coder/src/services/claude-command-discovery.ts` — function discoverClaudeCommands: () => AgentCommand[]
- `apps/coder/src/services/collision-detector.ts`
- function findConflicts: (changedFiles, worktreeId, /** Approximate line range for the proposed changes, keyed by file path */
changedRanges, {...}, conflictIndex) => ConflictVerdict[]
- interface ConflictVerdict
- interface ConflictEntry
- type ConflictSeverity
- type ConflictIndexData
- `apps/coder/src/services/command-availability.ts` — function isCommandAvailable: (binary) => Promise<boolean>
- `apps/coder/src/services/conflict-index.ts` — class ConflictIndex, const conflictIndex
- `apps/coder/src/services/correction-service.ts`
- function recordCorrection: (originalClaim, correction, principleExtracted, persistedTo, basePath?) => Promise<UserCorrectionRecord>
- function scanForCorrections: (auditPath) => Promise<UserCorrectionRecord[]>
@@ -214,10 +256,11 @@
- function partitionReady: (ready, ctx) => void
- function isRunComplete: (flow, state) => boolean
- function isStuck: (flow, state) => boolean
- function reconcileResumeStep: (status, taskId, taskState) => ResumeAction
- _...5 more_
- function buildBatchState: (flow, inFlight) => Map<string,
- _...12 more_
- `apps/coder/src/services/flow-runner.ts`
- function createFlowRunner: (deps) => FlowRunner
- function resolveVariables: (prompt, results, string>) => string
- interface LaunchOpts
- interface FlowRunner
- `apps/coder/src/services/frame-emitter.ts`
@@ -237,6 +280,19 @@
- function deleteGuideline: (id, basePath?) => Promise<boolean>
- function findGuideline: (content, basePath?) => Promise<Guideline | null>
- _...14 more_
- `apps/coder/src/services/hashline/hash-computation.ts`
- function computeLineHash: (lineNumber, content) => string
- function computeLegacyLineHash: (lineNumber, content) => string
- function formatHashLine: (lineNumber, content) => string
- function formatHashLines: (content) => string
- `apps/coder/src/services/hashline/validation.ts`
- function normalizeLineRef: (ref) => string
- function parseLineRef: (ref) => LineRef
- function validateLineRef: (lines, ref) => void
- function validateLineRefs: (lines, refs) => void
- class HashlineMismatchError
- interface LineRef
- `apps/coder/src/services/hashline/xxhash32.ts` — function hashXxh32: (input, seed) => number
- `apps/coder/src/services/host-exec.ts` — function hostExec: (command, opts?) => Promise<HostExecResult>, interface HostExecResult
- `apps/coder/src/services/lsp/client.ts` — class LspClient
- `apps/coder/src/services/lsp/config.ts` — function getServerConfig: (filePath) => LspServerConfig | null, interface LspServerConfig
@@ -248,6 +304,44 @@
- function findReferences: (client, filePath, content, line, character) => Promise<Location[]>
- `apps/coder/src/services/lsp/server-manager.ts` — class LspServerManager, const lspManager
- `apps/coder/src/services/mcp-server.ts` — function startMcpServer: (sql) => Promise<void>
- `apps/coder/src/services/model-resolution/connected-providers-cache.ts`
- function readConnectedProvidersCache: () => string[] | null
- function findProviderModelMetadata: (_providerID, _modelID) => ModelMetadata | undefined
- function readProviderModelsCache: () => ProviderModelsCache | null
- interface ProviderModelsCache
- interface ConnectedProvidersAdapter
- const connectedProvidersAdapter: ConnectedProvidersAdapter
- `apps/coder/src/services/model-resolution/fallback-chain-from-models.ts`
- function parseFallbackModelEntry: (model, contextProviderID, defaultProviderID) => FallbackEntry | undefined
- function parseFallbackModelObjectEntry: (obj, contextProviderID, defaultProviderID) => FallbackEntry | undefined
- function findMostSpecificFallbackEntry: (providerID, modelID, chain) => FallbackEntry | undefined
- function buildFallbackChainFromModels: (fallbackModels) => void
- `apps/coder/src/services/model-resolution/model-availability.ts` — function fuzzyMatchModel: (target, available, providers?) => string | null, function isModelAvailable: (targetModel, availableModels) => boolean
- `apps/coder/src/services/model-resolution/model-error-classifier.ts`
- function isRetryableModelError: (error) => boolean
- function shouldRetryError: (error) => boolean
- function getNextFallback: (fallbackChain, attemptCount) => FallbackEntry | undefined
- function hasMoreFallbacks: (fallbackChain, attemptCount) => boolean
- function selectFallbackProvider: (providers, preferredProviderID?) => string
- function selectFallbackProviderWithCache: (providers, providerCache, preferredProviderID?) => string
- _...1 more_
- `apps/coder/src/services/model-resolution/model-normalization.ts` — function normalizeModel: (model?) => string | undefined, function normalizeModelID: (modelID) => string
- `apps/coder/src/services/model-resolution/model-resolution-pipeline.ts`
- function _setModelResolutionLogImplementationForTesting: (logImplementation) => void
- function resolveModelPipeline: (request, providerCache) => void
- type ModelResolutionRequest
- type ModelResolutionProvenance
- type ModelResolutionResult
- type ModelResolutionDeps
- `apps/coder/src/services/model-resolution/model-resolver.ts`
- function resolveModel: (input) => string | undefined
- function resolveModelWithFallback: (input, connectedProvidersAdapter) => ModelResolutionResult | undefined
- function normalizeFallbackModels: (models) => void
- function flattenToFallbackModelStrings: (models) => void
- type ModelResolutionInput
- type ModelSource
- _...2 more_
- `apps/coder/src/services/model-resolution/provider-model-id-transform.ts` — function transformModelForProvider: (provider, model) => string, function transformModelForProviderDisplay: (provider, model) => string
- `apps/coder/src/services/net/port-utils.ts`
- function reclaimPort: (port) => void
- function waitForPortRelease: (port, timeoutMs) => Promise<boolean>
@@ -257,6 +351,13 @@
- function createOrphanWorktreeReaper: (deps) => void
- interface OrphanWorktreeReaperDeps
- interface OrphanReaperResult
- `apps/coder/src/services/paseo-client.ts`
- class PaseoClientError
- class PaseoClient
- interface PaseoAgentListItem
- interface PaseoAgentDetail
- interface PaseoSendResult
- interface PaseoClientConfig
- `apps/coder/src/services/pending_changes.ts`
- function planEdit: (content, oldStr, newStr) => EditPlan
- function queueEdit: (sql, sessionId, taskId, filePath, oldString, newString, projectRoot, // v2.6 Phase 1-UX) => void
@@ -273,6 +374,14 @@
- function waitForElicitationResponse: (taskId, sessionId, provider, modeId, params, timeoutMs) => Promise<CreateElicitationResponse>
- function cancelPendingPermission: (taskId) => void
- _...3 more_
- `apps/coder/src/services/plan-store.ts`
- function createPlan: (sql, opts) => Promise<Plan>
- function getPlan: (sql, planId) => Promise<Plan | null>
- function listPlans: (sql, projectId) => Promise<Plan[]>
- function listActivePlans: (sql, projectId) => Promise<Plan[]>
- function updatePlan: (sql, planId, opts) => Promise<Plan | null>
- function updatePlanFromRun: (sql, runId, runStatus) => Promise<boolean>
- _...5 more_
- `apps/coder/src/services/provider-commands.ts`
- function getManifestCommands: (provider) => AgentCommand[]
- function mergeCommands: (...lists) => AgentCommand[]
@@ -295,13 +404,13 @@
- interface ProviderManifestEntry
- const PROVIDER_MANIFEST: Record<string, ProviderManifestEntry>
- `apps/coder/src/services/provider-snapshot.ts`
- function fetchDeepSeekModels: (config) => Promise<ProviderModel[]>
- function fetchLlamaSwapModels: (config) => Promise<ProviderModel[]>
- function prefixLlamaSwapModels: (models) => ProviderModel[]
- function mergeModels: (...lists) => ProviderModel[]
- function getProviderSnapshot: (sql, config, cwd?, force) => Promise<ProviderSnapshotEntry[]>
- function clearProviderSnapshotCache: () => void
- function peekSnapshotEntry: (name, cwd?) => ProviderSnapshotEntry | undefined
- _...1 more_
- _...2 more_
- `apps/coder/src/services/pty-dispatch.ts`
- function dispatchViaPty: (opts) => Promise<DispatchResult>
- interface DispatchResult
@@ -411,6 +520,17 @@
- function readSession: (sessionId, projectRoot?) => SessionJson | null
- _...9 more_
- `apps/server/src/services/auto_name.ts` — function maybeAutoNameChat: (ctx, chatId, sessionId) => Promise<void>
- `apps/server/src/services/background-task.ts`
- function setBackgroundInferenceEnqueuer: (enqueue, chatId, assistantMessageId, user) => void
- function spawnBackgroundTask: (sql, log, projectId, input, model, agent?, label?) => Promise<BackgroundTask>
- function getBackgroundTaskStatus: (sql, taskId) => Promise<BackgroundTask | null>
- function getBackgroundTaskResult: (sql, taskId, chatId) => Promise<
- function cancelBackgroundTask: (sql, taskId) => Promise<boolean>
- interface BackgroundTask
- `apps/server/src/services/boocontext_client.ts`
- function callBoocontext: (req, log?, msg) => void
- interface BoocontextRequest
- interface BoocontextResponse
- `apps/server/src/services/broker.ts`
- function createBroker: (log?) => Broker
- interface Broker
@@ -429,6 +549,7 @@
- function select: (messages, contextLimit, tailTurns) => SelectResult
- function deriveFilesRead: (head) => string[]
- _...8 more_
- `apps/server/src/services/export-formatter.ts` — function formatJson: (chat, messages, model) => string, function formatMarkdown: (chat, messages, model) => string
- `apps/server/src/services/file_index.ts` — function getProjectFiles: (projectId, projectRoot) => Promise<string[]>
- `apps/server/src/services/file_ops.ts`
- function listDir: (projectRoot, relPath, opts?) => Promise<ListDirResult>
@@ -453,7 +574,20 @@
- interface GiteaConfig
- interface GiteaRepo
- `apps/server/src/services/grant_resolver.ts` — function resolveGrantRoot: (sql, requestedPath, projectRoot, whitelistRoot) => Promise<GrantResolution>, type GrantResolution
- `apps/server/src/services/hooks.ts`
- function loadHooksConfig: (path) => HooksConfig
- function reloadHooksConfig: () => HooksConfig
- function createHookRunner: () => HookRunner
- interface HookConfig
- interface HooksConfig
- interface PreToolUsePayload
- _...10 more_
- `apps/server/src/services/inference/budget.ts` — function resolveToolBudget: (agent) => number
- `apps/server/src/services/inference/compute-diff.ts`
- function computeDiff: (oldStr, newStr, filePath) => string
- function isWriteTool: (name) => boolean
- function diffFromToolArgs: (name, args, unknown>, filePath?) => string
- const WRITE_TOOL_NAMES
- `apps/server/src/services/inference/content-flusher.ts` — function createContentFlusher: (sql, messageId, getContent) => void, interface ContentFlusher
- `apps/server/src/services/inference/dcp/messages.ts`
- function toDcpMessages: (parts) => DcpMessage[]
@@ -493,6 +627,10 @@
- type FailureKind
- const MISTAKE_THRESHOLD
- _...1 more_
- `apps/server/src/services/inference/multi-modal.ts`
- function hasImageAttachments: (_message) => boolean
- function imageAttachmentsToParts: (attachments) => Array<
- interface ImageAttachment
- `apps/server/src/services/inference/parts.ts`
- function insertParts: (sql, parts) => Promise<void>
- function partsFromAssistantMessage: (args) => void
@@ -505,10 +643,13 @@
- function maybeFlagForCompaction: (ctx, chatId, updated) => Promise<void>
- interface OpenAiMessage
- `apps/server/src/services/inference/provider.ts`
- function resolveRoute: (agent, config?) => RoutingInfo
- function isDeepSeekModel: (modelId) => boolean
- function resolveRoute: (agent, config?, modelId?) => RoutingInfo
- function upstreamModel: (config, modelId, agent?) => LanguageModel
- function resolveModelEndpoint: (config, modelId) => void
- function resetDeepSeekProvider: () => void
- interface RoutingInfo
- type InferenceRoute
- _...1 more_
- `apps/server/src/services/inference/prune.ts`
- function selectPruneTargets: (partsNewestFirst, tailStartCreatedAt) => void
- function prune: (args) => Promise<PruneResult>
@@ -529,6 +670,12 @@
- function isAnySentinel: (m) => boolean
- const DOOM_LOOP_THRESHOLD
- _...1 more_
- `apps/server/src/services/inference/state-graph.ts`
- function createDefaultGraph: () => GraphNode[]
- function runGraph: (ctx, args, extra) => Promise<GraphResult>
- interface GraphState
- interface GraphResult
- type GraphNodeType
- `apps/server/src/services/inference/step-decision.ts`
- function decideStep: (input) => PreStepDecision
- function decidePostToolAction: (action, mistakeTracker) => PostToolDecision
@@ -545,12 +692,14 @@
- `apps/server/src/services/inference/stream-phase.ts` — function executeStreamPhase: (ctx, args, session, messages, state, agent, // v1.11.8, web_search and web_fetch are stripped from the
// tool list sent to the LLM, so the model can't even attempt them.
webToolsEnabled) => Promise<StreamResult>
- `apps/server/src/services/inference/supervisor.ts` — function resolveSupervisorTurn: (latestUserMessage, agents, fallbackModel?) => Promise<SupervisorRoute | null>, interface SupervisorRoute
- `apps/server/src/services/inference/tool-call-parser.ts`
- function stripToolMarkup: (text, opts?) => string
- function extractToolCallBlocks: (buffer, log?) => ToolCallExtraction
- interface ParsedCall
- interface ToolCallExtraction
- `apps/server/src/services/inference/tool-phase.ts` — function executeToolPhase: (ctx, args, result, startedAt, session, projectRoot, agent?) => Promise<ToolPhaseResult>, interface ToolPhaseResult
- `apps/server/src/services/inference/tool-input-repair.ts` — function repairToolInput: (schema, unknown> | undefined, args, unknown>) => void, interface ToolInputRepair
- `apps/server/src/services/inference/tool-phase.ts` — function executeToolPhase: (ctx, args, result, startedAt, session, projectRoot, agent?, turnNumber?) => Promise<ToolPhaseResult>, interface ToolPhaseResult
- `apps/server/src/services/inference/tool-shim.ts`
- function extractToolCalls: (text) => ParsedToolCall[]
- function hasToolCallMarkup: (text) => boolean
@@ -566,20 +715,26 @@
- `apps/server/src/services/inference/turn.ts`
- function runAssistantTurn: (ctx, args) => Promise<void>
- function runInference: (ctx, sessionId, chatId, assistantMessageId, signal?) => Promise<void>
- function runInferenceWithModel: (ctx, sessionId, chatId, assistantMessageId, modelOverride, compareGroupId, signal?) => Promise<void>
- function createInferenceRunner: (ctx, 'publishUser'>, publishUserFn, frame) => void
- `apps/server/src/services/mcp-client.ts`
- function initialize: (entries, logger) => Promise<void>
- function callTool: (prefixedName, args, unknown>) => Promise<unknown>
- function getServerPermission: (prefixedToolName) => McpPermission
- function setServerPermission: (serverName, permission) => void
- function getServerName: (prefixedToolName) => string | null
- function getTools: () => ToolDef<Record<string, unknown>>[]
- function getMcpServers: () => Array<
- function shutdown: () => Promise<void>
- function wrapMcpTool: (serverName, mcpTool) => ToolDef<Record<string, unknown>>
- _...2 more_
- _...6 more_
- `apps/server/src/services/mcp-config.ts`
- function substituteEnvVars: (value, log, unsetVars?) => unknown
- function loadMcpConfig: (configPath, log) => McpServerEntry[]
- interface McpServerEntry
- type McpServerConfig
- `apps/server/src/services/memory/bm25.ts` — class Bm25Ranker
- `apps/server/src/services/memory/embeddings.ts`
- function isEmbeddingAvailable: () => boolean
- function initEmbeddings: (modelPath?) => Promise<boolean>
- function embed: (texts) => Promise<number[][] | null>
- `apps/server/src/services/memory/entries.ts` — function parseMemoryEntries: (fileName, markdown) => MemoryEntry[], interface MemoryEntry
- `apps/server/src/services/memory/paths.ts`
- function getMemoryRoot: (projectRoot) => string
@@ -587,7 +742,10 @@
- function ensureMemoryScaffold: (root) => Promise<void>
- type MemoryTopic
- `apps/server/src/services/memory/prompt.ts` — function formatMemoryBlock: (entries) => string
- `apps/server/src/services/memory/recall.ts` — function rankByRelevance: (query, entries) => MemoryEntry[], function loadMemoryForSession: (projectRoot, _sessionId?, query?) => Promise<string[]>
- `apps/server/src/services/memory/recall.ts`
- function rankByRelevance: (query, entries) => MemoryEntry[]
- function rankByHybrid: (query, entries) => Promise<MemoryEntry[]>
- function loadMemoryForSession: (projectRoot, _sessionId?, query?) => Promise<string[]>
- `apps/server/src/services/memory/scan.ts`
- function scanMemoryScopes: (scope) => Promise<MemoryEntry[]>
- function scanProjectMemory: (projectRoot) => Promise<MemoryEntry[]>
@@ -618,6 +776,11 @@
- function filterSecretEntries: (entries, pathOf) => void
- class SecretBlockedError
- const DEFAULT_SECURITY_IGNORE_FILETYPES: ReadonlyArray<string>
- `apps/server/src/services/session-snapshots.ts`
- function saveAgentSnapshot: (sql, chatId, data) => Promise<void>
- function loadAgentSnapshot: (sql, chatId) => Promise<AgentSnapshot | null>
- function deleteAgentSnapshot: (sql, chatId) => Promise<void>
- interface AgentSnapshot
- `apps/server/src/services/skill-invoke.ts`
- function runSkillInvokeTransaction: (sql, args) => Promise<
- function buildSkillInvokeSyntheticFrames: (chatId, result, toolCall, skillBody) => SkillInvokeSessionFrame[]
@@ -648,8 +811,53 @@
- _...2 more_
- `apps/server/src/services/task-model.ts` — function taskModelCompletion: (opts) => Promise<string>
- `apps/server/src/services/task-search-rewrite.ts` — function rewriteSearchQuery: (userMessage) => Promise<string>
- `apps/server/src/services/tool-traces.ts`
- function insertToolTrace: (sql, insert) => Promise<ToolTrace>
- function updateToolTrace: (sql, id, updates) => Promise<ToolTrace | null>
- interface ToolTrace
- interface ToolTraceInsert
- interface ToolTraceUpdate
- `apps/server/src/services/tools/background-subagent-tools.ts`
- function executeSpawnSubagent: (input, sql, sessionId) => Promise<Record<string, unknown>>
- function executeSubagentStatus: (input, sql) => Promise<Record<string, unknown>>
- function executeSubagentResult: (input, sql) => Promise<Record<string, unknown>>
- type SpawnSubagentInputT
- type SubagentStatusInputT
- type SubagentResultInputT
- _...6 more_
- `apps/server/src/services/tools/codecontext/factory.ts` — function makeCodecontextTool: (opts, unknown>;
mapArgs) => void
- `apps/server/src/services/tools/codecontext/get_code_health.ts`
- function executeGetCodeHealth: (input, projectPath) => Promise<string>
- type GetCodeHealthInputT
- const GetCodeHealthInput
- const getCodeHealth: ToolDef<GetCodeHealthInputT>
- `apps/server/src/services/tools/codecontext/get_code_impact.ts`
- function executeGetCodeImpact: (input, projectPath) => Promise<CodecontextResponse>
- type GetCodeImpactInputT
- const GetCodeImpactInput
- const getCodeImpact: ToolDef<GetCodeImpactInputT>
- `apps/server/src/services/tools/codecontext/get_code_map.ts`
- function executeGetCodeMap: (input, projectRoot) => Promise<CodeMapResponse>
- interface CodeMapResponse
- type GetCodeMapInputT
- const GetCodeMapInput
- const getCodeMap: ToolDef<GetCodeMapInputT>
- `apps/server/src/services/tools/codecontext/get_type_info.ts`
- function executeGetTypeInfo: (input, _projectPath?) => Promise<CodecontextResponse>
- type GetTypeInfoInputT
- const GetTypeInfoInput
- const getTypeInfo: ToolDef<GetTypeInfoInputT>
- `apps/server/src/services/tools/codecontext/get_wiki_article.ts`
- function executeGetWikiArticle: (input, projectPath) => Promise<string>
- type GetWikiArticleInputT
- const GetWikiArticleInput
- const getWikiArticle: ToolDef<GetWikiArticleInputT>
- `apps/server/src/services/tools/execute-command.ts`
- function executeRunCommand: (input, projectRoot) => Promise<RunCommandOutput>
- type RunCommandInputT
- type RunCommandOutput
- const runCommand: ToolDef<RunCommandInputT>
- `apps/server/src/services/tools/registry.ts` — function appendMcpTools: (mcpTools) => void, function toolJsonSchemas: () => ToolJsonSchema[]
- `apps/server/src/services/tools/tiers.ts`
- function resolveToolTier: (tier) => readonly string[]
@@ -675,6 +883,39 @@
- interface WebSearchOutput
- type WebSearchInputT
- const webSearch: ToolDef<WebSearchInputT>
- `apps/server/src/services/workflow/catalog.ts`
- function fingerprintAgentTask: (prompt, spec, unknown>, args) => string
- function getBuiltinWorkflows: () => BuiltinWorkflow[]
- function getBuiltinWorkflow: (name) => BuiltinWorkflow | undefined
- function mergeBuiltinWorkflows: (fileWorkflows) => Array<
- interface BuiltinWorkflow
- const meta
- `apps/server/src/services/workflow/discovery.ts`
- function isBuiltinWorkflow: (meta) => boolean
- function discoverWorkflows: (projectRoot) => WorkflowMeta[]
- function findWorkflow: (name, projectRoot) => WorkflowMeta | undefined
- function isValidWorkflowPath: (filePath) => boolean
- interface WorkflowMeta
- `apps/server/src/services/workflow/manager.ts`
- class WorkflowManager
- interface WorkflowMetaInfo
- type WorkflowEventHandler
- `apps/server/src/services/workflow/resumability.ts`
- function cacheKey: (spec, args) => string
- function getCachedResult: (key) => CachedResult | null
- function setCachedResult: (key, result) => void
- function invalidateRun: (runKey) => void
- function clearCache: () => void
- function cacheSize: () => number
- _...1 more_
- `apps/server/src/services/workflow/sandbox.ts`
- function transformEsmToCjs: (code) => string
- function name: (...) => void
- function isEsmSyntax: (code) => boolean
- function buildSandbox: (context) => Record<string, unknown>
- function loadWorkflowScript: (sourceFile, context) => (...args: unknown[]) => Promise<unknown>
- function loadWorkflowScriptFromCode: (code, context, filename?) => (...args: unknown[]) => Promise<unknown>
- _...3 more_
- `apps/server/src/utils/string-utils.ts` — function stripQuotes: (s) => string
- `apps/web/src/api/client.ts`
- class ApiError
@@ -695,7 +936,7 @@
- interface TerminalSelectionActions
- interface TerminalSelection
- `apps/web/src/hooks/terminal/useTerminalSocket.ts`
- function useTerminalSocket: ({...}, sessionId, paneId, fit, getSize, setSize, }) => TerminalSocket
- function useTerminalSocket: ({...}, sessionId, paneId, description, parentAgent, fit, getSize, setSize, }) => TerminalSocket
- interface TerminalSocket
- type ConnState
- `apps/web/src/hooks/useActivePane.ts`
@@ -719,7 +960,8 @@
- interface ThroughputSample
- `apps/web/src/hooks/useCoderUserEvents.ts` — function useCoderUserEvents: () => void
- `apps/web/src/hooks/useDiffPreferences.ts` — function useDiffPreferences: () => void, interface DiffPreferences
- `apps/web/src/hooks/useGitDiff.ts` — function useGitDiff: (projectId) => void
- `apps/web/src/hooks/useDraftPersistence.ts` — function useDraftPersistence: (chatId) => DraftPersistenceResult, interface DraftPersistenceResult
- `apps/web/src/hooks/useGitDiff.ts` — function useGitDiff: (projectId, hideWhitespace) => void
- `apps/web/src/hooks/useLongPress.ts` — function useLongPress: (callback) => void
- `apps/web/src/hooks/useProjectGit.ts` — function useProjectGit: (projectId) => GitMeta | null
- `apps/web/src/hooks/useProviderSnapshot.ts` — function refreshProviderSnapshot: (cwd?) => Promise<ProviderSnapshotEntry[]>, function useProviderSnapshot: (cwd?) => ProviderSnapshotEntry[] | null
@@ -732,6 +974,7 @@
- `apps/web/src/hooks/useSessions.ts` — function useSessions: (projectId) => void
- `apps/web/src/hooks/useSidebar.ts` — function useSidebar: () => void
- `apps/web/src/hooks/useSkills.ts` — function useSkills: () => void
- `apps/web/src/hooks/useTerminals.ts` — function useTerminals: () => TerminalRegistration[]
- `apps/web/src/hooks/useUserEvents.ts` — function useUserEvents: () => void
- `apps/web/src/hooks/useViewport.ts` — function useViewport: () => ViewportSnapshot, interface ViewportSnapshot
- `apps/web/src/hooks/useWorkspacePanes.ts`
@@ -794,7 +1037,16 @@
- interface ThemeMeta
- type ThemeId
- _...5 more_
- `apps/web/src/lib/tool-utils.ts`
- function isMcpTool: (name) => boolean
- function extractServerName: (name) => string | null
- function extractToolName: (name) => string | null
- const BUILT_IN_TOOLS
- `apps/web/src/lib/utils.ts` — function cn: (...inputs) => void
- `apps/web/src/stores/useDiffCommentStore.ts`
- function useDiffComments: (sessionId, mode) => void
- interface DiffComment
- interface DiffCommentTarget
- `apps/web/src/utils/diff-layout.ts`
- function parseDiff: (diffBody) => ParsedDiffFile[]
- function buildSplitRows: (file) => SplitRow[]

View File

@@ -7,6 +7,7 @@
- turn-guard — `apps/coder/src/services/backends/turn-guard.ts`
- get_middleware — `apps/server/src/services/tools/codecontext/get_middleware.ts`
- authoring — `conductor/src/flows/authoring.ts`
- spec — `openspec/changes/add-behavioral-engine/specs/audit-middleware/spec.md`
## custom
- write_guard.test — `apps/coder/src/services/__tests__/write_guard.test.ts`

View File

@@ -3,6 +3,7 @@
## CRUD Resources
- **`/api/battles`** GET | POST | GET/:id → Battle
- **`/api/plans`** GET | POST | GET/:id | PATCH/:id → Plan
- **`/api/runs`** GET | POST | GET/:id → Run
- **`/api/tasks`** GET | POST | GET/:id → Task
- **`/api/chats/:id/messages`** GET | POST | GET/:id | DELETE/:id → Message
@@ -14,11 +15,16 @@
### fastify
- `GET` `/api/term/health` params()
- `GET` `/api/term/sessions/:sid/panes/:pid/search` params(sid, pid) [auth]
- `GET` `/api/term/sessions` params() [auth]
- `POST` `/api/term/sessions/:sid/panes/:pid/start` params(sid, pid) [auth]
- `POST` `/api/term/sessions/:sid/panes/:pid/kill` params(sid, pid) [auth]
- `GET` `/ws/term/sessions/:sid/panes/:pid` params(sid, pid) [auth]
- `GET` `/api/health` params() [auth, db, queue, ai]
- `GET` `/api/sessions/:sessionId/agent-sessions` params(sessionId) [auth, db]
- `GET` `/api/analytics/summary` params() [auth, db]
- `GET` `/api/analytics/sessions` params() [auth, db]
- `GET` `/api/analytics/token-breakdown` params() [auth, db]
- `POST` `/api/battles/generate-prompt` params() [auth, db]
- `POST` `/api/battles/:id/stop` params(id) [auth, db]
- `GET` `/api/battles/:id/analysis` params(id) [auth, db]
@@ -42,6 +48,7 @@
- `POST` `/api/pending/:id/apply` params(id) [auth, db, queue]
- `POST` `/api/pending/:id/reject` params(id) [auth, db, queue]
- `POST` `/api/pending/:id/rewind` params(id) [auth, db, queue]
- `GET` `/api/plans/active` params() [db]
- `GET` `/api/providers/snapshot` params() [db, cache]
- `GET` `/api/providers/config` params() [db, cache]
- `PATCH` `/api/providers/config` params() [db, cache]
@@ -59,19 +66,22 @@
- `GET` `/api/ws/sessions/:sessionId` params(sessionId) [auth, db]
- `GET` `/api/ws/user` params() [auth, db]
- `GET` `/api/projects/:id/agents` params(id) [db, cache]
- `GET` `/api/analytics/context` params() [auth, db]
- `POST` `/api/chats/:id/messages/:msg_id/artifacts/download` params(id, msg_id) [auth, db]
- `GET` `/api/chats/:id/messages/:msg_id/html_artifact` params(id, msg_id) [auth, db]
- `GET` `/api/projects/:project_id/artifacts/:filename` params(project_id, filename) [auth, db]
- `GET` `/api/sessions/:id/chats` params(id) [auth, db]
- `POST` `/api/sessions/:id/chats` params(id) [auth, db]
- `PATCH` `/api/chats/:id` params(id) [auth, db]
- `POST` `/api/sessions/:id/chats/archive-all` params(id) [auth, db]
- `GET` `/api/sessions/:id/chats/open-count` params(id) [auth, db]
- `POST` `/api/chats/:id/archive` params(id) [auth, db]
- `POST` `/api/chats/:id/unarchive` params(id) [auth, db]
- `DELETE` `/api/chats/:id` params(id) [auth, db]
- `POST` `/api/chats/:id/fork` params(id) [auth, db]
- `POST` `/api/chats/:id/discard_stale` params(id) [auth, db]
- `GET` `/api/sessions/:id/chats` params(id) [auth, db, queue]
- `POST` `/api/sessions/:id/chats` params(id) [auth, db, queue]
- `PATCH` `/api/chats/:id` params(id) [auth, db, queue]
- `POST` `/api/sessions/:id/chats/archive-all` params(id) [auth, db, queue]
- `GET` `/api/sessions/:id/chats/open-count` params(id) [auth, db, queue]
- `POST` `/api/chats/:id/archive` params(id) [auth, db, queue]
- `POST` `/api/chats/:id/unarchive` params(id) [auth, db, queue]
- `DELETE` `/api/chats/:id` params(id) [auth, db, queue]
- `POST` `/api/chats/:id/fork` params(id) [auth, db, queue]
- `POST` `/api/chats/:id/discard_stale` params(id) [auth, db, queue]
- `GET` `/api/chats/:id/export` params(id) [auth, db, queue]
- `POST` `/api/chats/:id/compare` params(id) [auth, db, queue]
- `GET` `/api/coder/ws/sessions/:sessionId` params(sessionId) [auth]
- `ALL` `/api/coder/*` params() [auth]
- `GET` `/api/settings/inference` params() [cache]
@@ -83,7 +93,9 @@
- `POST` `/api/chats/:id/continue` params(id) [auth, db, queue]
- `POST` `/api/chats/:id/force_send` params(id) [auth, db, queue]
- `POST` `/api/chats/:id/grant_read_access` params(id) [auth, db, queue]
- `GET` `/api/models` params()
- `POST` `/api/chats/:id/mcp-approve` params(id) [auth, db, queue]
- `POST` `/api/chats/:id/messages/:message_id/feedback` params(id, message_id) [auth, db, queue]
- `GET` `/api/models` params() [auth]
- `POST` `/api/projects/create` params() [auth, db]
- `POST` `/api/projects/:id/archive` params(id) [auth, db]
- `POST` `/api/projects/:id/unarchive` params(id) [auth, db]
@@ -111,6 +123,7 @@
- `GET` `/api/skills` params() [auth, db, queue]
- `POST` `/api/chats/:id/skill_invoke` params(id) [auth, db, queue]
- `GET` `/api/tools/cost_stats` params() [auth, db]
- `GET` `/api/chats/:id/traces` params(id) [db]
- `GET` `/api/ws/sessions/:id` params(id) [auth, db]
### go-net-http

View File

@@ -118,6 +118,25 @@
- model: text (required)
- verdict: text
### flow_step_events
- id: uuid (pk)
- run_id: uuid (required, fk)
- step_id: varchar (required, fk)
- event: varchar (required)
- payload: jsonb
### plans
- id: uuid (pk)
- project_id: uuid (required, fk)
- title: text (required)
- description: text
- status: text (required)
- flow_run_id: uuid (fk)
- progress_pct: integer (required)
- items_total: integer (required)
- items_completed: integer (required)
- metadata: jsonb
### projects
- id: uuid (pk)
- name: text (required)
@@ -139,6 +158,8 @@
- content: text (required)
- status: text (required)
- last_seq: integer (required)
- cache_tokens: integer
- reasoning_tokens: integer
### message_parts
- id: uuid (pk)
@@ -155,3 +176,42 @@
- session_id: uuid (required, fk)
- name: text
- status: text (required)
### tool_traces
- id: uuid (pk)
- session_id: uuid (required, fk)
- chat_id: uuid (required, fk)
- message_id: uuid (fk)
- turn_number: integer (required)
- tool_name: text (required)
- tool_input: jsonb (required)
- tool_output: text
- started_at: timestamp(tz) (required)
- finished_at: timestamp(tz)
- latency_ms: integer
- tokens_used: integer
- cache_tokens: integer
- reasoning_tokens: integer
- error: text
- outcome: text
### tool_trace_states
- id: uuid (pk)
- session_id: uuid (required, fk)
- chat_id: uuid (required, fk)
- message_id: uuid (fk)
- turn_number: integer (required)
- tool_name: text (required)
- tool_input: jsonb (required)
- started_at: timestamp(tz) (required)
### agent_snapshots
- id: uuid (pk)
- session_id: uuid (required, fk)
- chat_id: uuid (required, fk)
- model: text (required)
- agent: text
- mode: text
- turn_number: integer (required)
- messages: jsonb (required)
- tool_states: jsonb (required)

View File

@@ -20,6 +20,12 @@ SEARXNG_URL=http://100.114.205.53:8888
# with FAST_MODEL when unset.
# TASK_MODEL_URL=http://100.90.172.55:7995
# DeepSeek API key. When set, models with IDs starting with 'deepseek-'
# (e.g. deepseek-chat, deepseek-reasoner, deepseek-v4-flash) route through
# DeepSeek's API instead of llama-swap. Requires a DeepSeek Platform API key.
# DEEPSEEK_API_KEY=sk-...
# DEEPSEEK_BASE_URL=https://api.deepseek.com
# v1.13.15-tools: BOOCODE_TOOLS narrows the tool whitelist sent to the LLM.
# Unset (default) → all tools (~21k schema). Useful primarily for single-purpose
# sessions where the model only needs read-only filesystem access.

10
.gitignore vendored
View File

@@ -21,3 +21,13 @@ data/*
!data/coder-providers.example.json
codecontext/fork.tar.gz
/Arena
# Auto-generated & scratch artifacts
.impeccable/
.omo/
bun.lock
DESIGN.md
PRODUCT.md
# codesight auto-generated analysis cache
apps/web/.codesight/

View File

@@ -0,0 +1,55 @@
# Dynamic Workflow Engine — Design
## Architecture
```
User writes workflow JS file:
.boocode/workflows/my-flow.js
Workflow Runtime (apps/server)
├── isolated-vm sandbox (or node:vm)
├── API surface: agent(), parallel(), pipeline(), phase(), budget()
├── Tool bridge → BooCode's existing tool set
├── Workflow manager (concurrency, lifecycle)
├── Resumability cache (SHA-256 of agent spec)
└── Catalog (built-in workflows: deep-research, review-code)
Workflow execution:
1. User triggers workflow (slash command or Orchestrator panel)
2. File discovery finds .boocode/workflows/<name>.js
3. Sandbox compiles and executes the script
4. agent() calls go through tool bridge → existing inference pipeline
5. parallel() spawns concurrent agent calls (max 3 default)
6. Results stream via existing WS frames
7. Completed agents cached by hash for resume
API Surface (Claude Code compatible):
agent(prompt, { label?, schema?, model?, capabilities?, max_tool_calls? })
parallel([() => agent(...), () => agent(...)])
pipeline(items, ...stages)
phase(title)
log(message)
budget.total / budget.spent() / budget.remaining()
args
workflow(name, args?) — one level of nesting
```
## Implementation Plan
### Phase 1: Core Runtime (this session)
- Sandbox using Node's `vm` module (no extra deps)
- `agent()` function that creates a task and waits for completion
- Workflow file discovery
- Basic workflow manager
### Phase 2: Advanced Primitives
- `parallel()` with concurrency limits
- `pipeline()` streaming
- `budget()` token tracking
- Workflow resumability cache
### Phase 3: UI + Polish
- Integration with Orchestrator panel
- Built-in workflow catalog
- Workflow editor
- Error recovery

View File

@@ -0,0 +1,239 @@
# Paseo-like Orchestrator — Implementation Plan
> **Goal:** Transform BooCode into a Paseo-style thin-client orchestration layer with observability, dynamic workflows, resumability, background subagents, multi-modal, and cache shape telemetry.
>
> **Architecture:** Durable agent execution engine beneath thin chat/coder frontends. Trace system as foundation, workflow engine as the structural addition, everything else layered on top.
>
> **Inspired by:** Paseo (agent lifecycle, worktree isolation), Whale (workflow engine, cache telemetry), OpenCode (session resume), Claude Code (workflow script format).
---
## TL;DR
> **Quick Summary**: Build a durable orchestration layer with trace observability, dynamic JS workflows, session persistence, background subagents, and multi-modal support over 5 phases.
>
> **Deliverables**:
> - Trace system with DB persistence + viewer UI
> - Dynamic workflow engine (JS sandbox, agent/parallel/pipeline)
> - Workflow resumability (hash-based step caching)
> - Background subagent runtime
> - Session persistence across refreshes
> - Cache shape telemetry (DeepSeek KV cache viz)
> - Multi-modal attachment support
>
> **Estimated Effort**: XL — 5 phases, ~2-3 weeks total
> **Parallel Execution**: YES — phases 1-2 can partially overlap
> **Critical Path**: Trace system → Workflow engine → All downstream features
---
## Context
### Original Request
User wants BooCode to become "like Paseo — a thin client" with observability, dynamic workflows, session persistence, background agents, multi-modal, cache shape telemetry, and workflow resumability. They invoked skills across model evaluation, long context, SGLang, LangChain, LangSmith, agentic eval, agent harness construction, agent governance, and chat SDKs — indicating broad ambition for a production-quality AI coding platform.
### Key Decisions
- **Trace system first**: Foundation for all debugging and optimization
- **isolated-vm for workflow sandbox**: Node-native, no external deps
- **DB-backed sessions**: Postgres for trace store + session state
- **Existing WS frames + new `tool_trace` frame**: Live streaming to frontend
- **Phase ordering**: Foundation (trace) → UX (persistence) → Power (workflows) → Polish (background/multi-modal/cache)
---
## Phases
### Phase 1: Trace System + Observability
**Est. effort**: 3-4 days
Core observability infrastructure. Every tool call gets timed, logged, and persisted.
**Deliverables**:
- `tool_traces` DB table (id, session_id, chat_id, turn_number, tool_name, input, output, started_at, finished_at, latency_ms, tokens_used, cache_tokens, reasoning_tokens, error, outcome)
- Instrumentation in `tool-phase.ts` wrapping `executeToolCall` with start/end timing
- `tool_trace` WS frame type for live streaming to frontend
- GET `/api/chats/:id/traces` endpoint (paginated)
- Trace viewer pane (collapsible tree, timing bars, expand/collapse per call)
**Files to create**: 5-7 files across server + web + contracts
**Dependencies**: None — standalone feature
---
### Phase 2: Session Persistence + Resume
**Est. effort**: 2-3 days
Agent state survives browser refresh. Active sessions can be resumed.
**Deliverables**:
- Serialize active agent state to DB on each turn boundary
- Restore state on WS reconnect (existing `snapshot` frame enhanced)
- Agent session timeline view (history of all turns in a session)
- Coder pane rehydrates from persisted state
**Files to modify**: ws.ts, useSessionStream.ts, session store, dispatcher
**Dependencies**: None — standalone, but benefits from Phase 1 trace data
---
### Phase 3: Dynamic Workflow Engine
**Est. effort**: 5-7 days
JS sandbox for multi-agent orchestration. Claude Code compatible.
**Deliverables**:
- `isolated-vm` sandbox (or Node `vm` module with restricted context)
- Workflow API: `agent()`, `parallel()`, `pipeline()`, `phase()`, `budget()`, `log()`, `args`
- Workflow file discovery (`.boocode/workflows/*.js` → project, `~/.boocode/workflows/*.js` → global)
- Built-in workflow catalog (deep-research, multi-review, etc.)
- Workflow manager with concurrency limits, token budgets
- Integration with existing Orchestrator panel for UI
**Files to create**: 10-15 files (workflow runtime, scheduler, tool bridge, manager, catalog)
**Dependencies**: Phase 1 traces feed into workflow observability
**Workflow Resumability** (within Phase 3):
- SHA-256 hash of agent spec (prompt + options)
- Cache completed results by hash
- On re-run, skip cached agents, only execute new/changed ones
- In-memory cache for current session, optional DB persistence
**Est. effort**: 1-2 days within Phase 3
---
### Phase 4: Background Subagents
**Est. effort**: 2-3 days
Non-blocking subagent execution. `spawn_subagent` returns immediately, results collected later.
**Deliverables**:
- Background task queue (reuses existing `tasks` table)
- `spawn_subagent` tool that creates a task and returns immediately
- `subagent_status` tool to poll completion
- `subagent_result` tool to retrieve output
- Background agent pane showing running/completed subagents
- Notifications via hooks when background tasks complete
**Files to create**: 3-5 files across server + web
**Dependencies**: Phase 1 traces, Phase 2 session persistence
---
### Phase 5: Multi-modal + Cache Shape (Polish)
**Est. effort**: 2-3 days
Image/file attachment support + DeepSeek cache hit visualization.
**Deliverables (Multi-modal)**:
- Image/file attachment storage (tmpfs, referenced in message)
- Forward image content through DeepSeek API's multimodal support
- Render attached images in message bubble
- Model can "see" screenshots, diagrams, UI mocks
**Deliverables (Cache Shape)**:
- Extract `prompt_cache_hit_tokens` from DeepSeek provider metadata
- Build cache segment visualization (system prompt, tool schema, conversation)
- Per-turn cache hit rate in trace viewer
- Cumulative cache stats in session view
**Files to create**: 3-5 files
**Dependencies**: Phase 1 traces (for cache shape), existing DeepSeek integration
---
## Execution Strategy
### Parallel Execution Waves
```
Wave 1 (Start Immediately):
├── Phase 1: Trace system backend (tool_traces table + instrumentation) [deep]
├── Phase 1: Trace viewer frontend [visual-engineering]
└── Phase 2: Session persistence backbone [deep]
Wave 2 (After Wave 1):
├── Phase 3: Workflow engine sandbox + API surface [deep]
├── Phase 3: Workflow file discovery + manager [unspecified-high]
├── Phase 3: Workflow resumability cache [quick]
└── Phase 4: Background subagent queue + tools [unspecified-high]
Wave 3 (After Wave 2):
├── Phase 4: Background agent pane + notifications [visual-engineering]
├── Phase 5: Multi-modal attachment pipeline [deep]
└── Phase 5: Cache shape telemetry UI [visual-engineering]
Wave FINAL:
├── F1: Plan compliance audit (oracle)
├── F2: Code quality review (unspecified-high)
├── F3: Integration QA (unspecified-high)
└── F4: Scope fidelity check (deep)
```
---
## TODOs
> Phase 1: Trace System + Observability
- [ ] 1. Create tool_traces DB table + migration
- [ ] 2. Add tool_trace WS frame + contracts schema
- [ ] 3. Instrument tool-phase.ts with start/end timing
- [ ] 4. Add GET /api/chats/:id/traces endpoint
- [ ] 5. Build trace viewer frontend component
> Phase 2: Session Persistence + Resume
- [ ] 6. Serialize agent state to DB on turn boundaries
- [ ] 7. Restore state on WS reconnect
- [ ] 8. Agent session timeline view
> Phase 3: Dynamic Workflow Engine
- [ ] 9. Create isolated-vm workflow sandbox
- [ ] 10. Implement agent/parallel/pipeline primitives
- [ ] 11. Workflow file discovery system
- [ ] 12. Workflow manager + built-in catalog
- [ ] 13. Workflow resumability (hash-based cache)
- [ ] 14. Workflow UI integration with Orchestrator panel
> Phase 4: Background Subagents
- [ ] 15. Background task queue + spawn_subagent tool
- [ ] 16. subagent_status + subagent_result tools
- [ ] 17. Background agent pane
> Phase 5: Multi-modal + Cache Shape
- [ ] 18. Multi-modal attachment pipeline
- [ ] 19. Image render in message bubble
- [ ] 20. Cache shape telemetry data pipeline
- [ ] 21. Cache shape visualization in trace viewer
---
## Success Criteria
- Tool trace viewer shows every call with timing bars and token costs
- Browser refresh preserves agent session state
- Workflow scripts run in isolated sandbox with agent/parallel/pipeline
- Re-running a workflow skips cached agents (hash-based)
- Background subagents run independently, results collected later
- Model can see attached images in chat
- Cache hit rate visible per-turn and cumulative

View File

@@ -1,4 +1,4 @@
# BooChat
# BooChat — v2.7.17 (2026-06-08)
## Capabilities
@@ -9,6 +9,9 @@
- `ask_user_input` (interactive option chips)
- Opt-in per chat: `web_search`, `web_fetch` (SearXNG-backed, SSRF-guarded)
## Guidance resolution order
When multiple sources conflict: inline file guidance (this file) → per-session `system_prompt` → agent definition → model default. Last wins on samplers, first wins on refusals.
## You cannot
- Write, edit, or delete files
@@ -44,6 +47,11 @@
Always-true rules (process discipline, refusals, behavior contracts) live here in `BOOCHAT.md` — and in `BOOCODER.md` / `CLAUDE.md` per their scopes — where they are 100% present in every turn. On-demand recipes (specific procedures, scaffolds, checklists) live in `/data/skills/` and invoke roughly 6% of the time in clean multi-turn flow (Codeminer42 measurement, 2026). Don't file workflow rules as skills — they silently misfire. See Anthropic agent-skills best-practices (platform.claude.com/docs/en/agents-and-tools/agent-skills/best-practices) for the canonical conventions.
## Cross-file invariants
- **Tool capability lists**: `BOOCHAT.md:5-10` (read-only tools) must stay in sync with `apps/server/src/services/tools/registry.ts` `ALL_TOOLS`. If a tool is added to the registry but not listed here, models won't know to reach for it.
- **Capability refusals**: `BOOCHAT.md:12-17` ("You cannot") mirrors the path/secret/url guards in `apps/server/src/services/{path_guard,secret_guard,url_guard}.ts`. Adding a new guard type should update this refusal list.
## Verification discipline
- When assessing implementation status, verify against the running container (`curl /api/health`) and latest git commit (`git log --oneline -3`), not just source file contents. Source files can be mid-edit. The deployed state is the truth.

View File

@@ -1,4 +1,4 @@
# BooCoder — Container Guidance
# BooCoder — Container Guidance — v2.7.x (last meaningful update: 2026-06)
You are BooCoder, a write-capable coding agent. You can read AND modify files within the project scope.
@@ -19,6 +19,10 @@ You are BooCoder, a write-capable coding agent. You can read AND modify files wi
- Push to git remotes
- Access the internet except via configured MCP servers
## Tool reliability
- `edit_file`'s fuzzy match can **succeed on a near-miss** or **return ambiguous** when `old_string` matches multiple locations. Always verify the queued diff before calling `apply_pending` — the diff preview is authoritative, the tool's "success" return is not.
- The external agent's worktree diff only shows changes since the **last turn**, not since the project baseline. The DiffPanel merges these, but if you call `git diff` directly, you'll get incomplete results.
## Pending changes discipline
Every file modification queues in `pending_changes` before touching disk. The user sees a diff preview and approves/rejects each change. Never bypass this queue — it is the safety boundary between inference and the filesystem.

View File

@@ -2,6 +2,18 @@
All notable changes per release tag. Most recent on top, ordered by tag creation date (which matches the git history). Tag names follow `vMAJOR.MINOR.PATCH-slug` — the slug describes what shipped, so the tag name alone is enough to recall the batch.
## v2.8.20-paseo-orchestrator-ph3-5 — 2026-06-08
Completes the Paseo-like Orchestrator with phases 35. Phase 3 ships a Dynamic Workflow Engine built on Node's `vm` sandbox — Claude Code compatible JavaScript workflows with `agent()`, `parallel()`, `pipeline()`, `phase()`, and `budget()` primitives. Includes a built-in workflow catalog (`deep-research`, `review-code`, `find-issues`) with SHA-256 hash-based resumability cache that skips completed steps on re-run. Phase 4 adds background subagents — `spawn_subagent` returns immediately, `subagent_status` and `subagent_result` tools let the model poll and collect results. Phase 5 adds a cache shape telemetry badge to the trace viewer (colored bar + hit rate percentage) and a multi-modal attachment stub. Also ships inline diff snippets in the chat stream after write tool calls, and the `run_command` tool with auto-fix loop that detects build failures after edits and injects errors for self-correction.
## v2.8.19-paseo-orchestrator-ph1-2 — 2026-06-08
Ships the trace system and session persistence backbone. Every tool call is now timed via `tool_traces` DB table with latency, token counts, cache/reasoning breakdowns, and WS frames streamed live to a new trace viewer pane. Agent sessions survive browser refresh — `agent_snapshots` table persists state on turn boundaries and restores on WebSocket reconnect. A session timeline view shows agent turn history with scroll-to and restore. New frontend components: `TraceViewer` (collapsible panel with timing bars) and `SessionTimeline` (vertical timeline).
## v2.8.18-deepseek-whale-lift — 2026-06-08
Integrates DeepSeek API directly into BooChat and BooCoder via `@ai-sdk/deepseek`, replacing the generic `openai-compatible` wrapper. DeepSeek V4 models (`deepseek-v4-flash`, `deepseek-v4-pro`) with configurable thinking effort levels appear in both chat and coder pane model pickers. Full token tracking — cache hit tokens and reasoning tokens — flow from the API through new DB columns and WS frames into the UI message stats line. Lifts three high-value features from the Whale codebase: a schema-based tool input repair system that coerces types and unwraps markdown autolinks before Zod validation, a shell-based lifecycle hooks system (PreToolUse, PostToolUse, Stop, PreCompact, PostCompact) with JSON stdin/stdout contract, and per-MCP-server permissions (allow/ask/deny) gating tool execution.
## v2.8.0-fork-lifts — 2026-06-07
Completes the eight fork-lift integrations from `/opt/forks` into BooCode: boocontext sidecar upgrade, LSP code intelligence, DCP clean-room pruning, institutional memory, subagent protocol enhancements, plugin hook host, inference reliability (tool-shim + loop detectors), and TokenScope token breakdown. Backfills edit safety guards (truncation + dropped imports) and the TokenScope analyzer/persist module. Closes the fork-lifts-mit epic.

View File

@@ -1,5 +1,13 @@
# CLAUDE.md
<!-- Last meaningful update: 2026-06-08 (v2.8.20-paseo-orchestrator-ph3-5) -->
## You cannot
- Write, edit, or delete files (BooChat only — use BooCoder for writes)
- Run shell commands (use booterm terminal panes)
- Make commits, push, or pull (Sam reviews and commits manually)
- `git add -A` (stage only files you changed)
This file provides guidance to Claude Code (claude.ai/code) when working with code in this repository.
**Cursor agents:** start with `docs/ARCHITECTURE.md` (diagram); this file is the deep engineering reference. `data/AGENTS.md` is the agent *registry*, not navigation (the root navigation `AGENTS.md` was removed).
@@ -51,6 +59,9 @@ Detailed engineering notes live in per-app `CLAUDE.md` files, **auto-loaded when
Cross-app contracts (WS-frame & provider-type parity, sentinels) and everything below stay here.
### Guidance resolution order
When multiple sources conflict: `CLAUDE.md` (repo root) → `BOOCHAT.md` / `BOOCODER.md` (per-surface) → per-app `CLAUDE.md` (auto-loaded by file context) → `data/AGENTS.md` (agent preamble beats per-agent body) → session `system_prompt` → user prompt. Last-encountered wins on samplers; refusals cascade downward (you cannot do what any layer forbids).
### Data flow for chat
1. User sends message → POST `/api/sessions/:id/messages` creates user + assistant (status=streaming) rows

View File

@@ -7,6 +7,8 @@ const ConfigSchema = z.object({
DATABASE_URL: z.string().url(),
LOG_LEVEL: z.string().default('info'),
TMUX_CONF_PATH: z.string().default('/etc/booterm/tmux.conf'),
PTY_IDLE_TIMEOUT_SECONDS: z.coerce.number().int().min(0).default(0),
PTY_ABSOLUTE_TIMEOUT_SECONDS: z.coerce.number().int().min(0).default(0),
});
type Config = z.infer<typeof ConfigSchema>;

View File

@@ -14,12 +14,13 @@ interface SessionInfo {
id: string;
project_id: string;
project_path: string;
name: string | null;
}
export async function getSessionInfo(sessionId: string): Promise<SessionInfo | null> {
if (!pool) throw new Error('db pool not initialized');
const res = await pool.query<SessionInfo>(
`SELECT s.id, s.project_id, p.path AS project_path
`SELECT s.id, s.project_id, p.path AS project_path, s.name
FROM sessions s
JOIN projects p ON p.id = s.project_id
WHERE s.id = $1`,

View File

@@ -5,6 +5,7 @@ import { getPool, closeDb } from './db.js';
import { registerHealthRoutes } from './routes/health.js';
import { registerTerminalRoutes } from './routes/terminals.js';
import { registerSessionRoutes } from './routes/sessions.js';
import { registerSearchRoutes } from './routes/search.js';
import { registerWsAttachRoute } from './ws/attach.js';
async function main(): Promise<void> {
@@ -35,6 +36,7 @@ async function main(): Promise<void> {
registerHealthRoutes(app);
registerTerminalRoutes(app, config.TMUX_CONF_PATH);
registerSessionRoutes(app);
registerSearchRoutes(app, config.TMUX_CONF_PATH);
registerWsAttachRoute(app, config.TMUX_CONF_PATH);
const shutdown = async (signal: string) => {

View File

@@ -1,5 +1,6 @@
import { spawn } from 'node:child_process';
import type { FastifyBaseLogger } from 'fastify';
import * as registry from './registry.js';
const ID_RE = /^[a-zA-Z0-9_-]{1,64}$/;
@@ -162,3 +163,36 @@ export async function capturePane(
if (res.code !== 0) return '';
return res.stdout.replace(/(?:\r?\n)+$/, '');
}
/**
* Sweep the registry for expired sessions and kill the underlying tmux sessions.
* Logs each kill with the expiry reason (idle timeout vs absolute timeout).
* Returns the list of paneIds that were killed.
*/
export async function sweepExpired(
tmuxConfPath: string,
log: FastifyBaseLogger,
): Promise<string[]> {
const expired = registry.getTimedOutSessions();
const killed: string[] = [];
for (const meta of expired) {
const reason =
meta.idleExpiresAt &&
(!meta.absoluteExpiresAt || meta.idleExpiresAt.getTime() <= meta.absoluteExpiresAt.getTime())
? 'idle timeout'
: 'absolute timeout';
log.info({ paneId: meta.paneId, reason }, 'sweeping expired PTY session');
const sessionName = tmuxSessionName(meta.paneId);
try {
const ok = await killSession(tmuxConfPath, sessionName);
if (!ok) {
log.warn({ paneId: meta.paneId, sessionName }, 'killSession returned false during sweep');
}
} catch (err) {
log.warn({ paneId: meta.paneId, err }, 'killSession threw during sweep');
}
registry.unregister(meta.paneId);
killed.push(meta.paneId);
}
return killed;
}

View File

@@ -3,17 +3,30 @@ export interface SessionMeta {
sessionId: string;
projectPath: string;
title?: string;
description?: string;
parentAgent?: string;
createdAt: Date;
lastActivityAt: Date;
timeoutSeconds?: number;
idleExpiresAt?: Date;
absoluteExpiresAt?: Date;
}
const sessions = new Map<string, SessionMeta>();
export interface RegisterOpts {
timeoutSeconds?: number;
absoluteTimeoutSeconds?: number;
description?: string;
parentAgent?: string;
}
export function register(
sessionId: string,
paneId: string,
projectPath: string,
title?: string,
opts?: RegisterOpts,
): void {
const now = new Date();
const existing = sessions.get(paneId);
@@ -21,18 +34,42 @@ export function register(
existing.lastActivityAt = now;
return;
}
const idleExpiresAt = opts?.timeoutSeconds && opts.timeoutSeconds > 0
? new Date(now.getTime() + opts.timeoutSeconds * 1000)
: undefined;
const absoluteExpiresAt = opts?.absoluteTimeoutSeconds && opts.absoluteTimeoutSeconds > 0
? new Date(now.getTime() + opts.absoluteTimeoutSeconds * 1000)
: undefined;
sessions.set(paneId, {
paneId,
sessionId,
projectPath,
title,
description: opts?.description,
parentAgent: opts?.parentAgent,
createdAt: now,
lastActivityAt: now,
timeoutSeconds: opts?.timeoutSeconds,
idleExpiresAt,
absoluteExpiresAt,
});
}
export function unregister(paneId: string): void {
sessions.delete(paneId);
ringBuffers.delete(paneId);
}
/**
* Bump the lastActivityAt timestamp for a pane.
* Called on every PTY data write so the idle-timeout sweep knows when a session
* was last active.
*/
export function touchActivity(paneId: string): void {
const meta = sessions.get(paneId);
if (meta) {
meta.lastActivityAt = new Date();
}
}
export function list(): SessionMeta[] {
@@ -42,3 +79,162 @@ export function list(): SessionMeta[] {
export function get(paneId: string): SessionMeta | undefined {
return sessions.get(paneId);
}
// ── Pending metadata (POST /start → WS attach handoff) ──────────────────────
//
// The POST /start route stores optional description/parentAgent here; the WS
// attach handler consumes it when calling register(). This avoids coupling the
// HTTP route to the WS lifecycle while keeping the handoff single-process and
// ephemeral (no DB writes).
const pendingMetadata = new Map<string, { description?: string; parentAgent?: string }>();
export function setPendingMetadata(
paneId: string,
meta: { description?: string; parentAgent?: string },
): void {
pendingMetadata.set(paneId, meta);
}
export function consumePendingMetadata(
paneId: string,
): { description?: string; parentAgent?: string } | undefined {
const meta = pendingMetadata.get(paneId);
if (meta) pendingMetadata.delete(paneId);
return meta;
}
// ── Ring buffer for PTY output search ──────────────────────────────────────
export interface SearchMatch {
line: number;
content: string;
contextBefore: string[];
contextAfter: string[];
}
const ringBuffers = new Map<string, string[]>();
/**
* Append raw PTY data to the ring buffer for a given pane.
* Splits incoming data on newlines and pushes each line into the buffer,
* trimming to `maxLines` (default 5000) from the tail.
*/
export function appendOutput(
paneId: string,
data: string,
maxLines: number = 5000,
): void {
let buf = ringBuffers.get(paneId);
if (!buf) {
buf = [];
ringBuffers.set(paneId, buf);
}
// Split on newlines — each chunk may contain multiple complete lines and
// potentially a trailing partial line (which we store as-is; the next chunk
// will either complete it or be another partial).
const lines = data.split('\n');
// The first element of `lines` may be a continuation of the last partial
// line from the previous append. If the buffer is non-empty and the last
// stored entry is a partial (no trailing newline previously), glue them.
// We detect "partial" by checking whether `data` ended with '\n' — if it
// did, the last element after split is '' (empty) which we drop.
const endedWithNewline = data.endsWith('\n');
if (endedWithNewline) {
// The final empty-string element is discarded.
lines.pop();
}
if (buf.length > 0 && lines.length > 0) {
// Concatenate the last partial line in the buffer with the first split
// segment. This avoids splitting ANSI sequences or text across chunks.
buf[buf.length - 1] = (buf[buf.length - 1] ?? '') + (lines[0] ?? '');
lines.shift();
}
for (const line of lines) {
buf.push(line);
}
// Trim from head if over maxLines
if (buf.length > maxLines) {
buf = buf.slice(buf.length - maxLines);
ringBuffers.set(paneId, buf);
}
}
/**
* Search the ring buffer for a pane using a regex pattern.
* Returns matches with optional context lines before and after each match.
*/
export function searchRingBuffer(
paneId: string,
pattern: string,
opts?: { limit?: number; context?: number },
): SearchMatch[] {
const buf = ringBuffers.get(paneId);
if (!buf || buf.length === 0) return [];
const limit = opts?.limit ?? 50;
const context = opts?.context ?? 0;
let re: RegExp;
try {
re = new RegExp(pattern, 'u');
} catch {
return []; // invalid regex — caller should validate, but be defensive
}
const results: SearchMatch[] = [];
for (let i = 0; i < buf.length; i++) {
if (results.length >= limit) break;
if (re.test(buf[i]!)) {
const contextBefore: string[] = [];
const contextAfter: string[] = [];
for (let c = 1; c <= context; c++) {
const ci = i - c;
if (ci >= 0) contextBefore.unshift(buf[ci]!);
}
for (let c = 1; c <= context; c++) {
const ci = i + c;
if (ci < buf.length) contextAfter.push(buf[ci]!);
}
results.push({
line: i + 1, // 1-based line number for display
content: buf[i]!,
contextBefore,
contextAfter,
});
}
}
return results;
}
/**
* Remove the ring buffer for a pane. Called on session kill / pane close.
*/
export function clearBuffer(paneId: string): void {
ringBuffers.delete(paneId);
}
/**
* Return all sessions whose idle-expiry or absolute-expiry has passed.
* A session with no timeout configured is never included.
* Called by the sweepExpired interval in manager.ts.
*/
export function getTimedOutSessions(): SessionMeta[] {
const now = Date.now();
const result: SessionMeta[] = [];
for (const meta of sessions.values()) {
const idleHit = meta.idleExpiresAt && now >= meta.idleExpiresAt.getTime();
const absoluteHit = meta.absoluteExpiresAt && now >= meta.absoluteExpiresAt.getTime();
if (idleHit || absoluteHit) {
result.push(meta);
}
}
return result;
}

View File

@@ -0,0 +1,167 @@
import type { FastifyInstance } from 'fastify';
import { z } from 'zod';
import { sanitizeId, tmuxSessionName, capturePane } from '../pty/manager.js';
import { searchRingBuffer, clearBuffer } from '../pty/registry.js';
const ParamsSchema = z.object({
sid: z.string(),
pid: z.string(),
});
const MAX_PATTERN_LENGTH = 200;
// Zod-refined string: reject empty and overly-long patterns to prevent ReDoS
const PatternQuerySchema = z
.string()
.min(1, 'pattern is required')
.max(MAX_PATTERN_LENGTH, `pattern must not exceed ${MAX_PATTERN_LENGTH} characters`);
const QuerySchema = z.object({
pattern: PatternQuerySchema,
limit: z.coerce.number().int().min(1).max(500).default(50),
context: z.coerce.number().int().min(0).max(50).default(0),
});
interface SearchMatch {
line: number;
content: string;
contextBefore: string[];
contextAfter: string[];
}
interface SearchResponse {
matches: SearchMatch[];
total: number;
truncated: boolean;
source: 'ring' | 'capture';
}
/**
* Search a captured pane buffer using a regex. This is the fallback path
* when the ring buffer doesn't have enough matches.
*/
function grepBuffer(
text: string,
pattern: string,
limit: number,
context: number,
): SearchMatch[] {
let re: RegExp;
try {
re = new RegExp(pattern, 'u');
} catch {
return [];
}
const lines = text.split('\n');
const results: SearchMatch[] = [];
for (let i = 0; i < lines.length; i++) {
if (results.length >= limit) break;
if (re.test(lines[i]!)) {
const contextBefore: string[] = [];
const contextAfter: string[] = [];
for (let c = 1; c <= context; c++) {
const ci = i - c;
if (ci >= 0) contextBefore.unshift(lines[ci]!);
}
for (let c = 1; c <= context; c++) {
const ci = i + c;
if (ci < lines.length) contextAfter.push(lines[ci]!);
}
results.push({
line: i + 1,
content: lines[i]!,
contextBefore,
contextAfter,
});
}
}
return results;
}
export function registerSearchRoutes(app: FastifyInstance, tmuxConfPath: string): void {
app.get<{
Params: { sid: string; pid: string };
Querystring: { pattern?: string; limit?: string; context?: string };
}>(
'/api/term/sessions/:sid/panes/:pid/search',
async (req, reply) => {
const p = ParamsSchema.safeParse(req.params);
if (!p.success) return reply.code(400).send({ error: 'bad_params' });
const sid = sanitizeId(p.data.sid);
const pid = sanitizeId(p.data.pid);
if (!sid || !pid) return reply.code(400).send({ error: 'bad_id_format' });
const q = QuerySchema.safeParse(req.query);
if (!q.success) {
return reply.code(400).send({
error: 'bad_query',
details: q.error.flatten().fieldErrors,
});
}
const { pattern, limit, context } = q.data;
// ── Path 1: ring buffer search (fast, no tmux interaction) ──
const ringMatches = searchRingBuffer(pid, pattern, { limit, context });
if (ringMatches.length >= limit) {
return reply.code(200).send({
matches: ringMatches,
total: ringMatches.length,
truncated: ringMatches.length >= limit,
source: 'ring' as const,
});
}
// ── Path 2: capture-pane + grep fallback (10s timeout) ──
const sessionName = tmuxSessionName(pid);
let capture: string;
try {
capture = await withTimeout(
capturePane(tmuxConfPath, sessionName, 5000),
10_000,
);
} catch (err) {
req.log.warn({ err, pid }, 'capture-pane timed out or failed');
return reply.code(200).send({
matches: ringMatches,
total: ringMatches.length,
truncated: false,
source: 'ring' as const,
});
}
if (!capture) {
// tmux pane may no longer exist — return whatever ring had
return reply.code(200).send({
matches: ringMatches,
total: ringMatches.length,
truncated: false,
source: 'ring' as const,
});
}
const captureMatches = grepBuffer(capture, pattern, limit, context);
return reply.code(200).send({
matches: captureMatches,
total: captureMatches.length,
truncated: captureMatches.length >= limit,
source: 'capture' as const,
});
},
);
}
function withTimeout<T>(promise: Promise<T>, ms: number): Promise<T> {
return Promise.race([
promise,
new Promise<never>((_, reject) =>
setTimeout(() => reject(new Error('timeout')), ms),
),
]);
}

View File

@@ -10,6 +10,8 @@ export function registerSessionRoutes(app: FastifyInstance): void {
sessionId: s.sessionId,
projectPath: s.projectPath,
title: s.title ?? null,
description: s.description ?? null,
parentAgent: s.parentAgent ?? null,
createdAt: s.createdAt.toISOString(),
lastActivityAt: s.lastActivityAt.toISOString(),
})),

View File

@@ -8,6 +8,7 @@ import {
killSession,
hasSession,
} from '../pty/manager.js';
import { setPendingMetadata } from '../pty/registry.js';
const ParamsSchema = z.object({ sid: z.string(), pid: z.string() });
// v1.10.8c: optional cols/rows on /start so the per-pane tmux session is
@@ -17,6 +18,8 @@ const StartBodySchema = z
.object({
cols: z.coerce.number().int().min(1).max(2000).optional(),
rows: z.coerce.number().int().min(1).max(2000).optional(),
description: z.string().max(500).optional(),
parentAgent: z.string().max(100).optional(),
})
.partial()
.optional();
@@ -29,7 +32,7 @@ export function registerTerminalRoutes(app: FastifyInstance, tmuxConfPath: strin
// errors as HTTP responses (vs WS 1011 close codes).
app.post<{
Params: { sid: string; pid: string };
Body: { cols?: number; rows?: number } | undefined;
Body: { cols?: number; rows?: number; description?: string; parentAgent?: string } | undefined;
}>(
'/api/term/sessions/:sid/panes/:pid/start',
async (req, reply) => {
@@ -43,6 +46,14 @@ export function registerTerminalRoutes(app: FastifyInstance, tmuxConfPath: strin
const cols = b.success ? b.data?.cols : undefined;
const rows = b.success ? b.data?.rows : undefined;
// Store optional metadata for the WS attach handler to consume
if (b.success && b.data) {
const { description, parentAgent } = b.data;
if (description || parentAgent) {
setPendingMetadata(pid, { description, parentAgent });
}
}
const session = await getSessionInfo(sid);
if (!session) return reply.code(404).send({ error: 'unknown_session' });

View File

@@ -9,9 +9,14 @@ import {
} from '../pty/manager.js';
import { attachPty } from '../pty/pty.js';
import { getUser } from '../auth.js';
import { register, unregister } from '../pty/registry.js';
import { register, unregister, appendOutput, touchActivity, consumePendingMetadata } from '../pty/registry.js';
export function registerWsAttachRoute(app: FastifyInstance, tmuxConfPath: string): void {
export function registerWsAttachRoute(
app: FastifyInstance,
tmuxConfPath: string,
idleTimeoutSeconds?: number,
absoluteTimeoutSeconds?: number,
): void {
app.get<{
Params: { sid: string; pid: string };
Querystring: { cols?: string; rows?: string };
@@ -58,7 +63,25 @@ export function registerWsAttachRoute(app: FastifyInstance, tmuxConfPath: string
return;
}
register(sid, pid, session.project_path);
const pendingMeta = consumePendingMetadata(pid);
const regOpts: {
timeoutSeconds?: number;
absoluteTimeoutSeconds?: number;
description?: string;
parentAgent?: string;
} = {};
if (idleTimeoutSeconds && idleTimeoutSeconds > 0) regOpts.timeoutSeconds = idleTimeoutSeconds;
if (absoluteTimeoutSeconds && absoluteTimeoutSeconds > 0) regOpts.absoluteTimeoutSeconds = absoluteTimeoutSeconds;
if (pendingMeta) {
if (pendingMeta.description) regOpts.description = pendingMeta.description;
if (pendingMeta.parentAgent) regOpts.parentAgent = pendingMeta.parentAgent;
}
const hasRegOpts =
regOpts.timeoutSeconds !== undefined ||
regOpts.absoluteTimeoutSeconds !== undefined ||
regOpts.description !== undefined ||
regOpts.parentAgent !== undefined;
register(sid, pid, session.project_path, session.name ?? undefined, hasRegOpts ? regOpts : undefined);
let handle: IPty;
try {
@@ -106,6 +129,10 @@ export function registerWsAttachRoute(app: FastifyInstance, tmuxConfPath: string
} catch (err) {
req.log.warn({ err }, 'ws send failed');
}
// Feed the ring buffer for pattern-based search
appendOutput(pid, data);
// Bump activity timestamp for idle-timeout tracking
touchActivity(pid);
};
handle.onData(onData);

View File

@@ -36,12 +36,44 @@ export interface StepContext {
* Falls back to a default in render functions when absent.
*/
readonly model?: string;
/**
* Inter-agent messaging within the same flow run.
* `publish` broadcasts on the user WS channel and delivers to in-process
* subscribers via the broker. `subscribe` registers a handler scoped to the
* run and channel; returns an unsubscribe function.
* Undefined in contexts without a run id (manifest-only contexts).
*/
readonly messaging?: {
publish(channel: string, message: unknown): void;
subscribe(channel: string, handler: (msg: unknown) => void): () => void;
};
}
export type StepKind = 'agent' | 'code' | 'approval';
export type StepKind = 'agent' | 'code' | 'approval' | 'switch' | 'do_while';
/**
* One branch of a SWITCH step. The first case whose condition evaluates to true
* is selected; all other branches' stepIds are excluded from execution.
*/
export interface SwitchCase {
/** Human-readable label for this branch (reported in switch output). */
label: string;
/** Pure guard — called with the current step context to decide this branch. */
condition: (ctx: StepContext) => boolean;
/** stepIds belonging to this branch. */
stepIds: string[];
}
export type TriggerRule = 'all_success' | 'one_success' | 'all_done';
/** Possible statuses for a flow step (persisted in flow_steps.status). */
export type StepStatus = 'pending' | 'running' | 'completed' | 'failed' | 'skipped' | 'cancelled' | 'timed_out';
/** Retry policy for a step that times out. */
export interface RetryConfig {
maxRetries: number;
}
export interface Step {
/** unique id within the flow; other steps depend on it by this id */
id: string;
@@ -55,10 +87,25 @@ export interface Step {
/**
* For kind:'agent', returns the worker PROMPT (task + any prior outputs).
* For kind:'code', returns the step RESULT directly (the fold/transform).
* For kind:'switch', unused (the runner evaluates cases internally).
*/
run: (ctx: StepContext) => string | Promise<string>;
/** optional guard — when it returns false the step is skipped (e.g. no repo) */
when?: (ctx: StepContext) => boolean;
/** max retries on timeout (0 or unset = no retry) */
maxRetries?: number;
/** batch group id; steps sharing the same batch are gated by batchConfig.maxConcurrent */
batch?: string;
/** for kind:'switch' — ordered list of branches evaluated in declaration order */
cases?: SwitchCase[];
/** for kind:'switch' — fallback step ids when no case matches */
defaultBranch?: string[];
/** for kind:'do_while' — step IDs in the loop body (re-evaluated each iteration) */
loopBody?: string[];
/** for kind:'do_while' — guard evaluated each iteration; terminates when false */
loopCondition?: (ctx: StepContext) => boolean;
/** for kind:'do_while' — cap on total iterations (default 100) */
loopMaxIterations?: number;
}
export interface Flow {
@@ -69,6 +116,8 @@ export interface Flow {
render: (ctx: StepContext) => string;
/** optional output filename for the artifact, derived from input */
output?: (ctx: StepContext) => string;
/** batch parallelism control — gates concurrent dispatch of steps sharing the same batch id */
batchConfig?: { maxConcurrent: number; timeoutMs?: number; joinRule?: TriggerRule };
}
export interface RunResult {

View File

@@ -50,6 +50,11 @@ const ConfigSchema = z.object({
// only reaped after it's been untouched this long (avoids sweeping a dir mid
// ensureSessionWorktree create). 1h default.
ORPHAN_WORKTREE_GRACE_MS: z.coerce.number().int().positive().default(3_600_000),
DEEPSEEK_API_KEY: z.string().optional(),
DEEPSEEK_BASE_URL: z.string().url().default('https://api.deepseek.com'),
// v2.9.x: flow step timeout (default 5 min). When a 'running' step exceeds
// this duration, it is marked 'timed_out' and may be retried.
FLOW_STEP_TIMEOUT_MS: z.coerce.number().int().positive().default(300_000),
});
export type Config = z.infer<typeof ConfigSchema>;

View File

@@ -29,7 +29,9 @@ import { registerProviderRoutes } from './routes/providers.js';
import { registerWorktreeSafetyRoutes } from './routes/worktree-safety.js';
import { registerLifecycleRoutes } from './routes/lifecycle.js';
import { registerAnalyticsRoutes } from './routes/analytics.js';
import { registerPlanRoutes } from './routes/plans.js';
import { registerWebSocket } from './routes/ws.js';
import { updatePlanFromRun } from './services/plan-store.js';
// Phase 4: dispatcher + agent probe
import { createDispatcher } from './services/dispatcher.js';
// Orchestrator (Phase 2): DB-backed flow-runner; advances on the dispatcher's
@@ -229,8 +231,16 @@ async function main() {
// Orchestrator (Phase 2): the flow-runner reacts to the dispatcher's
// onTaskTerminal hook to advance flow_runs. Created before the dispatcher so its
// terminal callback can be wired in.
const flowRunner = createFlowRunner({ sql, broker, log: app.log, config });
// terminal callback can be wired in. onRunTerminal updates linked plans.
const flowRunner = createFlowRunner({
sql, broker, log: app.log, config,
onRunTerminal: (runId, status) => {
updatePlanFromRun(sql, runId, status).catch((err) => {
app.log.error({ err: err instanceof Error ? err.message : String(err), runId },
'plans: updatePlanFromRun failed');
});
},
});
// Arena SEAM (a): build the local-model set from the live llama-swap model list.
// Both bare IDs ('qwen3.6-35b') and prefixed IDs ('llama-swap/qwen3.6-35b') are
@@ -384,6 +394,7 @@ async function main() {
registerWorktreeSafetyRoutes(app, sql);
registerLifecycleRoutes(app, sql);
registerAnalyticsRoutes(app, sql);
registerPlanRoutes(app, sql);
registerWebSocket(app, sql, broker);
// Graceful shutdown

View File

@@ -0,0 +1,134 @@
/**
* Boulder state — plan routes.
*
* GET /api/plans?project_id= — list plans for a project
* GET /api/plans/active?project_id= — list active (in-flight) plans
* POST /api/plans — create a new plan
* PATCH /api/plans/:id — update plan progress / status
*/
import type { FastifyInstance } from 'fastify';
import { z } from 'zod';
import type { Sql } from '../db.js';
import {
createPlan,
getPlan,
listPlans,
listActivePlans,
updatePlan,
} from '../services/plan-store.js';
const CreatePlanBody = z.object({
project_id: z.string().uuid(),
title: z.string().min(1).max(500),
description: z.string().max(10_000).optional(),
flow_run_id: z.string().uuid().optional(),
metadata: z.record(z.unknown()).optional(),
});
const ListPlansQuery = z.object({
project_id: z.string().uuid(),
});
const UpdatePlanBody = z.object({
title: z.string().min(1).max(500).optional(),
description: z.string().max(10_000).nullable().optional(),
status: z.enum(['active', 'completed', 'cancelled', 'failed']).optional(),
progress_pct: z.number().int().min(0).max(100).optional(),
items_total: z.number().int().min(0).optional(),
items_completed: z.number().int().min(0).optional(),
metadata: z.record(z.unknown()).nullable().optional(),
});
const PlanIdParam = z.string().uuid();
export function registerPlanRoutes(app: FastifyInstance, sql: Sql): void {
// GET /api/plans?project_id= — all plans for a project
app.get('/api/plans', async (req, reply) => {
const parsed = ListPlansQuery.safeParse(req.query);
if (!parsed.success) {
reply.code(400);
return { error: 'invalid query', details: parsed.error.flatten() };
}
const plans = await listPlans(sql, parsed.data.project_id);
return { plans };
});
// GET /api/plans/active?project_id= — active plans only
app.get('/api/plans/active', async (req, reply) => {
const parsed = ListPlansQuery.safeParse(req.query);
if (!parsed.success) {
reply.code(400);
return { error: 'invalid query', details: parsed.error.flatten() };
}
const plans = await listActivePlans(sql, parsed.data.project_id);
return { plans };
});
// POST /api/plans — create a new plan
app.post('/api/plans', async (req, reply) => {
const parsed = CreatePlanBody.safeParse(req.body);
if (!parsed.success) {
reply.code(400);
return { error: 'invalid body', details: parsed.error.flatten() };
}
const { project_id, title, description, flow_run_id, metadata } = parsed.data;
const plan = await createPlan(sql, {
projectId: project_id,
title,
description,
flowRunId: flow_run_id,
metadata,
});
reply.code(201);
return { plan };
});
// GET /api/plans/:id — single plan
app.get<{ Params: { id: string } }>('/api/plans/:id', async (req, reply) => {
const parsedId = PlanIdParam.safeParse(req.params.id);
if (!parsedId.success) {
reply.code(400);
return { error: 'invalid id' };
}
const plan = await getPlan(sql, parsedId.data);
if (!plan) {
reply.code(404);
return { error: 'plan not found' };
}
return { plan };
});
// PATCH /api/plans/:id — update plan
app.patch<{ Params: { id: string } }>('/api/plans/:id', async (req, reply) => {
const parsedId = PlanIdParam.safeParse(req.params.id);
if (!parsedId.success) {
reply.code(400);
return { error: 'invalid id' };
}
const parsed = UpdatePlanBody.safeParse(req.body);
if (!parsed.success) {
reply.code(400);
return { error: 'invalid body', details: parsed.error.flatten() };
}
const { title, description, status, progress_pct, items_total, items_completed, metadata } = parsed.data;
const plan = await updatePlan(sql, parsedId.data, {
title,
description: description === null ? null : description,
status,
progressPct: progress_pct,
itemsTotal: items_total,
itemsCompleted: items_completed,
metadata: metadata === null ? null : metadata,
});
if (!plan) {
reply.code(404);
return { error: 'plan not found' };
}
return { plan };
});
}

View File

@@ -266,7 +266,7 @@ CREATE INDEX IF NOT EXISTS claude_session_entries_key_idx ON claude_session_entr
-- replaces it with the three-value list).
ALTER TABLE agent_sessions DROP CONSTRAINT IF EXISTS agent_sessions_backend_chk;
ALTER TABLE agent_sessions ADD CONSTRAINT agent_sessions_backend_chk
CHECK (backend IN ('opencode_server', 'acp_warm', 'claude_sdk'));
CHECK (backend IN ('opencode_server', 'acp_warm', 'claude_sdk', 'paseo'));
-- LISTEN/NOTIFY fast path: every tasks INSERT (from any call site — routes,
-- new_task tool, MCP server) fires pg_notify('tasks_new') in the same
@@ -340,11 +340,12 @@ CREATE INDEX IF NOT EXISTS flow_steps_task_id_idx ON flow_steps(task_id);
-- edits above are no-ops on the existing DB (CREATE TABLE IF NOT EXISTS skips an
-- existing table) — widen via the repo's DROP-IF-EXISTS → guarded-ADD discipline.
-- Pure ADD of a new allowed value, so no row UPDATE is needed (no value renamed).
-- v2.9.x: widen status CHECKs to include 'timed_out' for Task State Machine.
ALTER TABLE flow_runs DROP CONSTRAINT IF EXISTS flow_runs_status_chk;
DO $$ BEGIN
IF NOT EXISTS (SELECT 1 FROM pg_constraint WHERE conname = 'flow_runs_status_chk') THEN
ALTER TABLE flow_runs ADD CONSTRAINT flow_runs_status_chk
CHECK (status IN ('running', 'completed', 'failed', 'cancelled'));
CHECK (status IN ('running', 'completed', 'failed', 'cancelled', 'timed_out'));
END IF;
END $$;
@@ -352,10 +353,14 @@ ALTER TABLE flow_steps DROP CONSTRAINT IF EXISTS flow_steps_status_chk;
DO $$ BEGIN
IF NOT EXISTS (SELECT 1 FROM pg_constraint WHERE conname = 'flow_steps_status_chk') THEN
ALTER TABLE flow_steps ADD CONSTRAINT flow_steps_status_chk
CHECK (status IN ('pending', 'running', 'completed', 'failed', 'skipped', 'cancelled'));
CHECK (status IN ('pending', 'running', 'completed', 'failed', 'skipped', 'cancelled', 'timed_out'));
END IF;
END $$;
-- Task State Machine: retry columns for flow_steps.
ALTER TABLE flow_steps ADD COLUMN IF NOT EXISTS retry_count INTEGER NOT NULL DEFAULT 0;
ALTER TABLE flow_steps ADD COLUMN IF NOT EXISTS max_retries INTEGER;
-- Arena: battles + contestants + cross_examinations.
-- project_id carries no FK (matches tasks.project_id + flow_runs.project_id convention).
-- winner_contestant_id FK is deferred (forward reference): added via guarded ALTER below.
@@ -438,3 +443,31 @@ CREATE TABLE IF NOT EXISTS flow_step_events (
created_at TIMESTAMPTZ NOT NULL DEFAULT clock_timestamp()
);
CREATE INDEX IF NOT EXISTS flow_step_events_run_idx ON flow_step_events(run_id);
-- v2.9.0: Boulder state — cross-session plan persistence with auto-resumption.
-- project_id carries no FK (matches tasks/fow_runs convention).
-- flow_run_id links the plan to an in-flight orchestrator run for auto-tracking.
CREATE TABLE IF NOT EXISTS plans (
id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
project_id UUID NOT NULL,
title TEXT NOT NULL,
description TEXT,
status TEXT NOT NULL DEFAULT 'active',
flow_run_id UUID REFERENCES flow_runs(id) ON DELETE SET NULL,
progress_pct INTEGER NOT NULL DEFAULT 0,
items_total INTEGER NOT NULL DEFAULT 0,
items_completed INTEGER NOT NULL DEFAULT 0,
metadata JSONB,
created_at TIMESTAMPTZ NOT NULL DEFAULT clock_timestamp(),
updated_at TIMESTAMPTZ NOT NULL DEFAULT clock_timestamp(),
CONSTRAINT plans_status_chk CHECK (status IN ('active', 'completed', 'cancelled', 'failed')),
CONSTRAINT plans_progress_chk CHECK (progress_pct >= 0 AND progress_pct <= 100),
CONSTRAINT plans_items_chk CHECK (items_total >= 0 AND items_completed >= 0 AND items_completed <= items_total)
);
-- Plan queries by project and status.
CREATE INDEX IF NOT EXISTS plans_project_status_idx ON plans(project_id, status);
-- Fast lookup of the plan owning a flow run (for onRunTerminal updates).
CREATE INDEX IF NOT EXISTS plans_flow_run_id_idx ON plans(flow_run_id);
-- Plans sorted by recency (for "resume from last" surface).
CREATE INDEX IF NOT EXISTS plans_project_created_idx ON plans(project_id, created_at DESC);

View File

@@ -0,0 +1,90 @@
import { describe, it, expect } from 'vitest';
import { findConflicts } from '../collision-detector.js';
import type { ConflictEntry, ConflictIndexData } from '../collision-detector.js';
function entry(worktreeId: string, agent: string, start?: number, end?: number): ConflictEntry {
return {
worktreeId,
agent,
lineRange: start !== undefined && end !== undefined ? { start, end } : undefined,
status: 'pending' as const,
timestamp: 1000,
};
}
function index(entries: Array<[string, ConflictEntry[]]>): ConflictIndexData {
return new Map(entries.map(([path, es]) => [path, new Set(es)] as const));
}
describe('findConflicts', () => {
it('returns empty when no files in index', () => {
const result = findConflicts(['src/a.ts'], 'wt-1', new Map(), new Map());
expect(result).toEqual([]);
});
it('returns empty when only own worktree has the file', () => {
const idx = index([['src/a.ts', [entry('wt-1', 'agent-a', 1, 10)]]]);
const result = findConflicts(['src/a.ts'], 'wt-1', new Map(), idx);
expect(result).toEqual([]);
});
it('detects same_file conflict from another worktree', () => {
const idx = index([['src/a.ts', [entry('wt-2', 'agent-b', 5, 15)]]]);
const result = findConflicts(['src/a.ts'], 'wt-1', new Map(), idx);
expect(result).toHaveLength(1);
expect(result[0]!.filePath).toBe('src/a.ts');
expect(result[0]!.worktrees).toEqual(['wt-2']);
expect(result[0]!.agents).toEqual(['agent-b']);
});
it('reports same_line severity when ranges overlap', () => {
const idx = index([['src/a.ts', [entry('wt-2', 'agent-b', 10, 20)]]]);
const ranges = new Map([['src/a.ts', { start: 15, end: 25 }]]);
const result = findConflicts(['src/a.ts'], 'wt-1', ranges, idx);
expect(result[0]!.severity).toBe('same_line');
});
it('reports different_area severity when ranges are far apart', () => {
const idx = index([['src/a.ts', [entry('wt-2', 'agent-b', 1, 10)]]]);
const ranges = new Map([['src/a.ts', { start: 100, end: 200 }]]);
const result = findConflicts(['src/a.ts'], 'wt-1', ranges, idx);
expect(result[0]!.severity).toBe('different_area');
});
it('reports adjacent_line severity when ranges are 3 lines apart', () => {
const idx = index([['src/a.ts', [entry('wt-2', 'agent-b', 10, 15)]]]);
const ranges = new Map([['src/a.ts', { start: 19, end: 25 }]]);
const result = findConflicts(['src/a.ts'], 'wt-1', ranges, idx);
expect(result[0]!.severity).toBe('adjacent_line');
});
it('returns entry for each conflicting file', () => {
const idx = index([
['src/a.ts', [entry('wt-2', 'agent-b', 1, 10)]],
['src/b.ts', [entry('wt-3', 'agent-c', 1, 10)]],
]);
const result = findConflicts(['src/a.ts', 'src/b.ts', 'src/c.ts'], 'wt-1', new Map(), idx);
expect(result).toHaveLength(2);
expect(result.map((v) => v.filePath).sort()).toEqual(['src/a.ts', 'src/b.ts']);
});
it('excludes entries from the same worktree', () => {
const idx = index([['src/a.ts', [entry('wt-1', 'agent-a', 1, 10), entry('wt-2', 'agent-b', 5, 15)]]]);
const result = findConflicts(['src/a.ts'], 'wt-1', new Map(), idx);
expect(result).toHaveLength(1);
expect(result[0]!.worktrees).toEqual(['wt-2']);
});
it('deduplicates worktree IDs in verdict', () => {
const idx = index([['src/a.ts', [entry('wt-2', 'agent-b', 1, 5), entry('wt-2', 'agent-b', 10, 15)]]]);
const result = findConflicts(['src/a.ts'], 'wt-1', new Map(), idx);
expect(result[0]!.worktrees).toEqual(['wt-2']);
});
it('reports same_line when no lineRange on either side (create/delete conflates)', () => {
const idx = index([['src/a.ts', [entry('wt-2', 'agent-b')]]]);
const result = findConflicts(['src/a.ts'], 'wt-1', new Map(), idx);
expect(result).toHaveLength(1);
expect(result[0]!.severity).toBe('different_area');
});
});

View File

@@ -0,0 +1,146 @@
import { describe, it, expect, beforeEach } from 'vitest';
import { ConflictIndex } from '../conflict-index.js';
describe('ConflictIndex', () => {
let idx: ConflictIndex;
beforeEach(() => {
idx = new ConflictIndex();
});
describe('registerChange', () => {
it('adds an entry for a file path', () => {
idx.registerChange('src/a.ts', 'wt-1', 'agent-a', { start: 1, end: 10 });
const entries = idx.getEntriesFor('src/a.ts');
expect(entries.size).toBe(1);
const entry = [...entries][0]!;
expect(entry.worktreeId).toBe('wt-1');
expect(entry.agent).toBe('agent-a');
expect(entry.lineRange).toEqual({ start: 1, end: 10 });
expect(entry.status).toBe('pending');
expect(entry.timestamp).toBeGreaterThan(0);
});
it('supports multiple entries for the same file path', () => {
idx.registerChange('src/a.ts', 'wt-1', 'agent-a', { start: 1, end: 10 });
idx.registerChange('src/a.ts', 'wt-2', 'agent-b', { start: 20, end: 30 });
expect(idx.getEntriesFor('src/a.ts').size).toBe(2);
});
it('allows a worktree to have multiple entries (several edits to same file)', () => {
idx.registerChange('src/a.ts', 'wt-1', 'agent-a', { start: 1, end: 10 });
idx.registerChange('src/a.ts', 'wt-1', 'agent-a', { start: 20, end: 30 });
// Duplicate entries with same fields — the Set dedupes by ref,
// so a second identical call is still a distinct object (allowed).
expect(idx.getEntriesFor('src/a.ts').size).toBe(2);
});
it('separates files into distinct keys', () => {
idx.registerChange('src/a.ts', 'wt-1', 'agent-a');
idx.registerChange('src/b.ts', 'wt-2', 'agent-b');
expect(idx.getEntriesFor('src/a.ts').size).toBe(1);
expect(idx.getEntriesFor('src/b.ts').size).toBe(1);
});
});
describe('removeWorktree', () => {
it('removes all entries for a given worktree', () => {
idx.registerChange('src/a.ts', 'wt-1', 'agent-a');
idx.registerChange('src/a.ts', 'wt-2', 'agent-b');
idx.registerChange('src/b.ts', 'wt-1', 'agent-a');
idx.removeWorktree('wt-1');
expect(idx.getEntriesFor('src/a.ts').size).toBe(1);
expect([...idx.getEntriesFor('src/a.ts')][0]!.worktreeId).toBe('wt-2');
expect(idx.getEntriesFor('src/b.ts').size).toBe(0);
});
it('is a no-op when worktree has no entries', () => {
idx.registerChange('src/a.ts', 'wt-1', 'agent-a');
idx.removeWorktree('wt-ghost');
expect(idx.getEntriesFor('src/a.ts').size).toBe(1);
});
it('cleans up file key when last entry is removed', () => {
idx.registerChange('src/a.ts', 'wt-1', 'agent-a');
idx.removeWorktree('wt-1');
// After removal the key should be gone
expect(idx.snapshot().has('src/a.ts')).toBe(false);
});
});
describe('sweepStale', () => {
it('removes entries older than maxAgeMs', async () => {
idx.registerChange('src/a.ts', 'wt-1', 'agent-a');
idx.registerChange('src/b.ts', 'wt-2', 'agent-b');
// Wait a tick so timestamps diverge
await new Promise((r) => setTimeout(r, 10));
idx.registerChange('src/c.ts', 'wt-3', 'agent-c');
const removed = idx.sweepStale(5); // 5ms cutoff — entries from before the await are stale
expect(removed).toBeGreaterThanOrEqual(1);
});
it('removes file key when all entries swept', async () => {
idx.registerChange('src/a.ts', 'wt-1', 'agent-a');
// Wait so timestamp is definitely older than cutoff
await new Promise((r) => setTimeout(r, 10));
const removed = idx.sweepStale(5);
expect(removed).toBe(1);
expect(idx.snapshot().has('src/a.ts')).toBe(false);
});
it('returns 0 when no entries are stale', () => {
idx.registerChange('src/a.ts', 'wt-1', 'agent-a');
const removed = idx.sweepStale(86_400_000); // 24h
expect(removed).toBe(0);
});
});
describe('getConflictsFor', () => {
it('returns conflicts between worktrees', () => {
idx.registerChange('src/a.ts', 'wt-1', 'agent-a', { start: 1, end: 10 });
idx.registerChange('src/a.ts', 'wt-2', 'agent-b', { start: 5, end: 15 });
const conflicts = idx.getConflictsFor('src/a.ts');
expect(conflicts).toHaveLength(1);
expect(conflicts[0]!.filePath).toBe('src/a.ts');
// getConflictsFor doesn't know the caller's line range,
// so severity defaults to 'different_area'
expect(conflicts[0]!.severity).toBe('different_area');
});
it('returns empty for files with only one worktree', () => {
idx.registerChange('src/a.ts', 'wt-1', 'agent-a');
expect(idx.getConflictsFor('src/a.ts')).toEqual([]);
});
it('returns empty for files not in index', () => {
expect(idx.getConflictsFor('src/never-touched.ts')).toEqual([]);
});
});
describe('query', () => {
it('delegates to findConflicts with proper data', () => {
idx.registerChange('src/a.ts', 'wt-2', 'agent-b', { start: 5, end: 15 });
const ranges = new Map([['src/a.ts', { start: 10, end: 20 }]]);
const result = idx.query(['src/a.ts'], 'wt-1', ranges);
expect(result).toHaveLength(1);
expect(result[0]!.severity).toBe('same_line');
});
it('returns empty when no conflicts', () => {
idx.registerChange('src/a.ts', 'wt-1', 'agent-a', { start: 1, end: 10 });
const result = idx.query(['src/a.ts'], 'wt-1', new Map());
expect(result).toEqual([]);
});
});
describe('snapshot', () => {
it('returns a copy of the internal map', () => {
idx.registerChange('src/a.ts', 'wt-1', 'agent-a');
const snap = idx.snapshot();
expect(snap.has('src/a.ts')).toBe(true);
// Mutating the snapshot doesn't affect the original
idx.removeWorktree('wt-1');
expect(snap.has('src/a.ts')).toBe(true);
});
});
});

View File

@@ -1,16 +1,20 @@
import { describe, it, expect } from 'vitest';
import type { Flow, Step, StepContext } from '../../conductor/types.js';
import {
buildBatchState,
getReadyInBatch,
manifestSteps,
readySteps,
partitionReady,
readySteps,
isRunComplete,
isStuck,
reconcileResumeStep,
reconcileRun,
resolveSwitch,
shouldFailOnMissingAgent,
type SchedulerState,
} from '../flow-runner-decisions.js';
import type { StepContext } from '../../conductor/types.js';
/**
* The DB-driven flow-runner replaces the Phase-1 in-memory wave scheduler
@@ -52,6 +56,8 @@ const emptyState = (over: Partial<SchedulerState> = {}): SchedulerState => ({
skipped: new Set(),
inFlight: new Set(),
excluded: new Set(),
timedOut: new Set(),
switchResults: new Map(),
...over,
});
@@ -237,6 +243,442 @@ describe('isRunComplete / isStuck', () => {
});
});
// ─── SWITCH branching (v2.9) ─────────────────────────────────────────────────
describe('resolveSwitch', () => {
const baseCtx: StepContext = { input: { question: 'q', band: 'small' }, results: {} };
it('selects the first matching case and excludes other branches', () => {
const step: Step = {
id: 'router',
kind: 'switch',
run: () => '',
cases: [
{ label: 'a', condition: () => false, stepIds: ['a1', 'a2'] },
{ label: 'b', condition: () => true, stepIds: ['b1', 'b2'] },
{ label: 'c', condition: () => true, stepIds: ['c1', 'c2'] },
],
};
const result = resolveSwitch(step, baseCtx);
expect(result.chosenCase).toBe('b');
expect(result.excluded).toEqual(['a1', 'a2', 'c1', 'c2']);
});
it('falls back to defaultBranch when no case matches', () => {
const step: Step = {
id: 'router',
kind: 'switch',
run: () => '',
cases: [
{ label: 'x', condition: () => false, stepIds: ['x1'] },
{ label: 'y', condition: () => false, stepIds: ['y1'] },
],
defaultBranch: ['z1', 'z2'],
};
const result = resolveSwitch(step, baseCtx);
expect(result.chosenCase).toBeNull();
// Only case branch steps are excluded; default steps are not.
expect(result.excluded).toEqual(['x1', 'y1']);
});
it('excludes all branch steps when no case matches and no default', () => {
const step: Step = {
id: 'router',
kind: 'switch',
run: () => '',
cases: [
{ label: 'p', condition: () => false, stepIds: ['p1'] },
{ label: 'q', condition: () => false, stepIds: ['q1', 'q2'] },
],
};
const result = resolveSwitch(step, baseCtx);
expect(result.chosenCase).toBeNull();
expect(result.excluded).toEqual(['p1', 'q1', 'q2']);
});
it('excludes defaultBranch when a case matched', () => {
const step: Step = {
id: 'router',
kind: 'switch',
run: () => '',
cases: [
{ label: 'hit', condition: () => true, stepIds: ['h1'] },
{ label: 'miss', condition: () => false, stepIds: ['m1'] },
],
defaultBranch: ['d1'],
};
const result = resolveSwitch(step, baseCtx);
expect(result.chosenCase).toBe('hit');
expect(result.excluded).toEqual(['m1', 'd1']);
});
it('returns empty excluded for a degenerate switch with no cases and no default', () => {
const step: Step = {
id: 'noop',
kind: 'switch',
run: () => '',
};
const result = resolveSwitch(step, baseCtx);
expect(result.chosenCase).toBeNull();
expect(result.excluded).toEqual([]);
});
it('uses ctx.results in condition evaluation', () => {
const step: Step = {
id: 'router',
kind: 'switch',
run: () => '',
cases: [
{ label: 'has', condition: (ctx) => ctx.results['prev'] === 'yes', stepIds: ['yes-branch'] },
{ label: 'no', condition: () => true, stepIds: ['no-branch'] },
],
};
const ctxWithResult: StepContext = { input: { question: 'q', band: 'small' }, results: { prev: 'yes' } };
const result = resolveSwitch(step, ctxWithResult);
expect(result.chosenCase).toBe('has');
expect(result.excluded).toEqual(['no-branch']);
});
});
describe('readySteps with switch-excluded steps', () => {
// Flow: switch router → branch-a/branch-b → fold
function switchFlow(): Flow {
const steps: Step[] = [
{
id: 'switch', kind: 'switch', run: () => '',
cases: [
{ label: 'a', condition: () => true, stepIds: ['branch-a'] },
{ label: 'b', condition: () => false, stepIds: ['branch-b'] },
],
},
{ id: 'branch-a', kind: 'agent', agent: 'x', deps: ['switch'], run: () => 'p' },
{ id: 'branch-b', kind: 'agent', agent: 'y', deps: ['switch'], run: () => 'q' },
{ id: 'fold', kind: 'code', deps: ['branch-a', 'branch-b'], run: () => 'r' },
];
return { name: 'switch-demo', description: '', steps, render: () => '' };
}
it('excludes non-selected branch steps and treats them as satisfied deps', () => {
const flow = switchFlow();
// switch completed, branch-b excluded by switch (branch-a selected)
const switchResult = new Map<string, { chosenCase: string | null; excluded: Set<string> }>([
['switch', { chosenCase: 'a', excluded: new Set(['branch-b']) }],
]);
const state: SchedulerState = {
done: new Set(['switch']),
skipped: new Set(),
inFlight: new Set(),
excluded: new Set(),
timedOut: new Set(),
switchResults: switchResult,
};
const ready = readySteps(flow, state).map((s) => s.id);
// branch-a is ready (dep switch is done), branch-b is excluded
expect(ready).toContain('branch-a');
expect(ready).not.toContain('branch-b');
});
it('fold unblocks once selected branch completes (excluded branch satisfied)', () => {
const flow = switchFlow();
const switchResult = new Map<string, { chosenCase: string | null; excluded: Set<string> }>([
['switch', { chosenCase: 'a', excluded: new Set(['branch-b']) }],
]);
const state: SchedulerState = {
done: new Set(['switch', 'branch-a']),
skipped: new Set(),
inFlight: new Set(),
excluded: new Set(),
timedOut: new Set(),
switchResults: switchResult,
};
const ready = readySteps(flow, state).map((s) => s.id);
// fold's deps: branch-a done, branch-b excluded (via switch) → satisfied
expect(ready).toContain('fold');
});
it('fold stays blocked until selected branch completes, even with excluded dep', () => {
const flow = switchFlow();
const switchResult = new Map<string, { chosenCase: string | null; excluded: Set<string> }>([
['switch', { chosenCase: 'a', excluded: new Set(['branch-b']) }],
]);
const state: SchedulerState = {
done: new Set(['switch']),
skipped: new Set(),
inFlight: new Set(['branch-a']),
excluded: new Set(),
timedOut: new Set(),
switchResults: switchResult,
};
const ready = readySteps(flow, state).map((s) => s.id);
// branch-a in flight, branch-b excluded — only branch-a offered
expect(ready).not.toContain('fold');
});
it('isRunComplete returns true when switch-excluded steps are the only unsettled', () => {
const flow = switchFlow();
// All non-excluded steps done; branch-b is excluded via switch
const switchResult = new Map<string, { chosenCase: string | null; excluded: Set<string> }>([
['switch', { chosenCase: 'a', excluded: new Set(['branch-b']) }],
]);
const state: SchedulerState = {
done: new Set(['switch', 'branch-a', 'fold']),
skipped: new Set(),
inFlight: new Set(),
excluded: new Set(),
timedOut: new Set(),
switchResults: switchResult,
};
expect(isRunComplete(flow, state)).toBe(true);
expect(isStuck(flow, state)).toBe(false);
});
it('combines static excluded with switch-excluded', () => {
const flow = switchFlow();
// band gating excludes branch-b at launch, AND switch also excludes it
const switchResult = new Map<string, { chosenCase: string | null; excluded: Set<string> }>([
['switch', { chosenCase: 'a', excluded: new Set(['branch-b']) }],
]);
const state: SchedulerState = {
done: new Set(['switch', 'branch-a']),
skipped: new Set(),
inFlight: new Set(),
excluded: new Set(['branch-b']),
timedOut: new Set(),
switchResults: switchResult,
};
// branch-b excluded both ways; fold sees branch-a done, branch-b excluded
const ready = readySteps(flow, state).map((s) => s.id);
expect(ready).toContain('fold');
});
});
// ─── Batch parallelism (v2.8.22) ─────────────────────────────────────────────
describe('buildBatchState', () => {
it('returns empty map when flow has no batchConfig', () => {
const flow: Flow = {
name: 'no-batch',
description: '',
steps: [
{ id: 'a', kind: 'agent', agent: 'x', run: () => 'p' },
{ id: 'b', kind: 'code', deps: ['a'], run: () => 'r' },
],
render: () => '',
};
const bs = buildBatchState(flow, new Set());
expect(bs.size).toBe(0);
});
it('maps each batch group to its running set and config', () => {
const flow: Flow = {
name: 'batched',
description: '',
steps: [
{ id: 'a1', kind: 'agent', agent: 'x', batch: 'review', run: () => 'p' },
{ id: 'a2', kind: 'agent', agent: 'y', batch: 'review', run: () => 'q' },
{ id: 'b1', kind: 'agent', agent: 'z', batch: 'check', run: () => 'r' },
{ id: 'fold', kind: 'code', deps: ['a1', 'a2', 'b1'], run: () => 's' },
],
render: () => '',
batchConfig: { maxConcurrent: 2 },
};
// a1 is in flight → review batch has 1 running, check has 0.
const bs = buildBatchState(flow, new Set(['a1']));
expect(bs.size).toBe(2);
const review = bs.get('review');
expect(review).toBeDefined();
expect([...review!.running]).toEqual(['a1']);
expect(review!.maxConcurrent).toBe(2);
expect(review!.joinRule).toBe('all_success');
const check = bs.get('check');
expect(check).toBeDefined();
expect(check!.running.size).toBe(0);
expect(check!.maxConcurrent).toBe(2);
});
it('uses joinRule from batchConfig when provided', () => {
const flow: Flow = {
name: 'join',
description: '',
steps: [
{ id: 'x', kind: 'agent', agent: 'a', batch: 'g1', run: () => 'p' },
],
render: () => '',
batchConfig: { maxConcurrent: 1, joinRule: 'one_success' },
};
const bs = buildBatchState(flow, new Set());
expect(bs.get('g1')!.joinRule).toBe('one_success');
});
it('ignores steps without a batch field', () => {
const flow: Flow = {
name: 'mixed',
description: '',
steps: [
{ id: 'a', kind: 'agent', agent: 'x', run: () => 'p' },
{ id: 'b', kind: 'agent', agent: 'y', batch: 'g1', run: () => 'q' },
],
render: () => '',
batchConfig: { maxConcurrent: 3 },
};
const bs = buildBatchState(flow, new Set(['a', 'b']));
// a is inFlight but has no batch — it does not create an entry
expect(bs.size).toBe(1);
expect(bs.has('g1')).toBe(true);
expect(bs.get('g1')!.running.has('b')).toBe(true);
// a is not in any batch entry
for (const entry of bs.values()) {
expect(entry.running.has('a')).toBe(false);
}
});
});
describe('getReadyInBatch', () => {
function makeBatchState(
overrides?: Map<string, { running: Set<string>; maxConcurrent: number; joinRule: TriggerRule }>,
): Map<string, { running: Set<string>; maxConcurrent: number; joinRule: TriggerRule }> {
return overrides ?? new Map();
}
it('passes all steps through when batchState is empty', () => {
const steps: Step[] = [
{ id: 'a', kind: 'agent', agent: 'x', run: () => 'p' },
{ id: 'b', kind: 'agent', agent: 'y', batch: 'g1', run: () => 'q' },
];
const state: SchedulerState = {
done: new Set(),
skipped: new Set(),
inFlight: new Set(),
excluded: new Set(),
timedOut: new Set(),
switchResults: new Map(),
batchState: makeBatchState(),
};
const result = getReadyInBatch(steps, state, {} as Flow);
expect(result.map((s) => s.id)).toEqual(['a', 'b']);
});
it('passes non-batched steps through regardless of batch capacity', () => {
const batchState = new Map();
batchState.set('g1', { running: new Set(['a']), maxConcurrent: 1, joinRule: 'all_success' });
const steps: Step[] = [
{ id: 'nobatch', kind: 'agent', agent: 'z', run: () => 'r' },
{ id: 'batched', kind: 'agent', agent: 'x', batch: 'g1', run: () => 'p' },
];
const state: SchedulerState = {
done: new Set(),
skipped: new Set(),
inFlight: new Set(['a']),
excluded: new Set(),
timedOut: new Set(),
switchResults: new Map(),
batchState,
};
const result = getReadyInBatch(steps, state, {} as Flow);
// nobatch passes, batched is at maxConcurrent=1 with a already running → blocked
expect(result.map((s) => s.id)).toEqual(['nobatch']);
});
it('allows batch steps up to maxConcurrent', () => {
const batchState = new Map();
batchState.set('g1', { running: new Set(), maxConcurrent: 2, joinRule: 'all_success' });
const steps: Step[] = [
{ id: 's1', kind: 'agent', agent: 'x', batch: 'g1', run: () => 'p' },
{ id: 's2', kind: 'agent', agent: 'y', batch: 'g1', run: () => 'q' },
{ id: 's3', kind: 'agent', agent: 'z', batch: 'g1', run: () => 'r' },
];
const state: SchedulerState = {
done: new Set(),
skipped: new Set(),
inFlight: new Set(),
excluded: new Set(),
timedOut: new Set(),
switchResults: new Map(),
batchState,
};
// All 0 running, maxConcurrent=2 → all 3 pass through (readySteps would return them,
// but the flow-runner dispatches them one-by-one in the agent dispatch loop; getReadyInBatch
// is called each tick to allow up to maxConcurrent. Since batch is empty on this tick,
// all are allowed — the runner's dispatch loop will put 2 in flight, then next tick blocks.)
const result = getReadyInBatch(steps, state, {} as Flow);
expect(result.map((s) => s.id)).toEqual(['s1', 's2', 's3']);
});
it('blocks batch steps when at capacity', () => {
const batchState = new Map();
batchState.set('g1', { running: new Set(['a', 'b']), maxConcurrent: 2, joinRule: 'all_success' });
const steps: Step[] = [
{ id: 'c', kind: 'agent', agent: 'x', batch: 'g1', run: () => 'p' },
{ id: 'd', kind: 'agent', agent: 'y', batch: 'g1', run: () => 'q' },
];
const state: SchedulerState = {
done: new Set(),
skipped: new Set(),
inFlight: new Set(['a', 'b']),
excluded: new Set(),
timedOut: new Set(),
switchResults: new Map(),
batchState,
};
// Both batches at capacity → everything filtered out
expect(getReadyInBatch(steps, state, {} as Flow)).toEqual([]);
});
it('handles multiple independent batch groups', () => {
const batchState = new Map();
batchState.set('g1', { running: new Set(['a']), maxConcurrent: 1, joinRule: 'all_success' });
batchState.set('g2', { running: new Set(), maxConcurrent: 5, joinRule: 'all_success' });
const steps: Step[] = [
{ id: 'b', kind: 'agent', agent: 'x', batch: 'g1', run: () => 'p' }, // g1 at capacity → blocked
{ id: 'c', kind: 'agent', agent: 'y', batch: 'g2', run: () => 'q' }, // g2 has room → passes
{ id: 'd', kind: 'agent', agent: 'z', batch: 'g2', run: () => 'r' }, // g2 has room → passes
];
const state: SchedulerState = {
done: new Set(),
skipped: new Set(),
inFlight: new Set(['a']),
excluded: new Set(),
timedOut: new Set(),
switchResults: new Map(),
batchState,
};
expect(getReadyInBatch(steps, state, {} as Flow).map((s) => s.id)).toEqual(['c', 'd']);
});
it('lets a step pass when its batch group is known but has no running steps yet', () => {
const batchState = new Map();
batchState.set('g1', { running: new Set(), maxConcurrent: 2, joinRule: 'all_success' });
const steps: Step[] = [
{ id: 'first', kind: 'agent', agent: 'x', batch: 'g1', run: () => 'p' },
];
const state: SchedulerState = {
done: new Set(),
skipped: new Set(),
inFlight: new Set(),
excluded: new Set(),
timedOut: new Set(),
switchResults: new Map(),
batchState,
};
expect(getReadyInBatch(steps, state, {} as Flow).map((s) => s.id)).toEqual(['first']);
});
it('handles empty step list gracefully', () => {
const state: SchedulerState = {
done: new Set(),
skipped: new Set(),
inFlight: new Set(),
excluded: new Set(),
timedOut: new Set(),
switchResults: new Map(),
batchState: makeBatchState(),
};
expect(getReadyInBatch([], state, {} as Flow)).toEqual([]);
});
});
// ─── Resume reconciliation (D-9) ─────────────────────────────────────────────
describe('reconcileResumeStep', () => {

View File

@@ -0,0 +1,195 @@
import { describe, it, expect, vi } from 'vitest';
import { PaseoClient, PaseoClientError } from '../paseo-client.js';
/**
* Create a PaseoClient whose runCli method is replaced with a mock.
* The mock is returned as the second tuple element so tests can
* control and inspect it directly.
*/
function makeClient(config?: { paseoBin?: string; cliHost?: string }): {
client: PaseoClient;
mockRunCli: ReturnType<typeof vi.fn>;
} {
const client = new PaseoClient(config);
const mockRunCli = vi.fn();
(client as any).runCli = mockRunCli;
return { client, mockRunCli };
}
describe('PaseoClient', () => {
describe('listAgents', () => {
it('returns parsed agent list from paseo ls --json', async () => {
const agents = [
{ id: 'abc-123', shortId: 'abc', name: 'Agent 1', provider: 'opencode', status: 'running' },
{ id: 'def-456', shortId: 'def', name: 'Agent 2', provider: 'claude', status: 'idle' },
];
const { client, mockRunCli } = makeClient();
mockRunCli.mockResolvedValue(JSON.stringify(agents));
const result = await client.listAgents();
expect(mockRunCli).toHaveBeenCalledWith(['ls', '--json']);
expect(result).toEqual(agents);
});
it('throws PaseoClientError on non-JSON output', async () => {
const { client, mockRunCli } = makeClient();
mockRunCli.mockResolvedValue('not json');
await expect(client.listAgents()).rejects.toThrow(PaseoClientError);
await expect(client.listAgents()).rejects.toThrow(/invalid JSON/);
});
it('propagates runCli rejection as-is', async () => {
const { client, mockRunCli } = makeClient();
const err = new PaseoClientError('ls failed: connection refused', 'ls', 1, 'connection refused');
mockRunCli.mockRejectedValue(err);
await expect(client.listAgents()).rejects.toThrow(PaseoClientError);
await expect(client.listAgents()).rejects.toThrow(/ls failed/);
});
});
describe('getAgentStatus', () => {
it('returns parsed agent detail from paseo inspect --json', async () => {
const detail = {
Id: 'abc-123', Name: 'Agent 1', Provider: 'opencode',
Status: 'idle', Archived: false,
CreatedAt: '2026-01-01T00:00:00Z', UpdatedAt: '2026-01-01T01:00:00Z',
};
const { client, mockRunCli } = makeClient();
mockRunCli.mockResolvedValue(JSON.stringify(detail));
const result = await client.getAgentStatus('abc-123');
expect(mockRunCli).toHaveBeenCalledWith(['inspect', '--json', 'abc-123']);
expect(result.Id).toBe('abc-123');
expect(result.Status).toBe('idle');
});
});
describe('health', () => {
it('returns ok when paseo ls succeeds', async () => {
const { client, mockRunCli } = makeClient();
mockRunCli.mockResolvedValue('[]');
const result = await client.health();
expect(result).toEqual({ status: 'ok' });
});
it('returns error when runCli throws', async () => {
const { client, mockRunCli } = makeClient();
mockRunCli.mockRejectedValue(new Error('connection refused'));
const result = await client.health();
expect(result).toEqual({ status: 'error' });
});
});
describe('importAgent', () => {
it('calls paseo import with provider and labels', async () => {
const agentResult = { Id: 'new-789', Name: 'Imported', Provider: 'opencode', Status: 'idle' };
const { client, mockRunCli } = makeClient();
mockRunCli.mockResolvedValue(JSON.stringify(agentResult));
const result = await client.importAgent('ses-001', 'opencode', {
origin: 'boocode',
project: 'proj-1',
});
expect(mockRunCli).toHaveBeenCalledWith([
'import', '--json',
'--provider', 'opencode',
'--label', 'origin=boocode',
'--label', 'project=proj-1',
'ses-001',
]);
expect(result.Id).toBe('new-789');
});
it('works without labels', async () => {
const { client, mockRunCli } = makeClient();
mockRunCli.mockResolvedValue(JSON.stringify({ Id: 'new-789' }));
const result = await client.importAgent('ses-001', 'claude');
expect(mockRunCli).toHaveBeenCalledWith([
'import', '--json',
'--provider', 'claude',
'ses-001',
]);
expect(result.Id).toBe('new-789');
});
});
describe('archiveAgent', () => {
it('calls paseo archive --json', async () => {
const { client, mockRunCli } = makeClient();
mockRunCli.mockResolvedValue('{}');
await client.archiveAgent('abc-123');
expect(mockRunCli).toHaveBeenCalledWith(['archive', '--json', 'abc-123']);
});
});
describe('sendPrompt', () => {
it('sends prompt and parses JSON result', async () => {
const sendResult = { text: 'Hello!', ok: true };
const { client, mockRunCli } = makeClient();
mockRunCli.mockResolvedValue(JSON.stringify(sendResult));
const result = await client.sendPrompt('abc-123', 'Hello');
expect(mockRunCli).toHaveBeenCalledWith(['send', '--json', 'abc-123', 'Hello'], undefined);
expect(result).toEqual(sendResult);
});
it('falls back to plain text on non-JSON output', async () => {
const { client, mockRunCli } = makeClient();
mockRunCli.mockResolvedValue('plain text response');
const result = await client.sendPrompt('abc-123', 'Hi');
expect(result).toEqual({ text: 'plain text response', ok: true });
});
it('supports --no-wait flag', async () => {
const { client, mockRunCli } = makeClient();
mockRunCli.mockResolvedValue('{}');
await client.sendPrompt('abc-123', 'Hi', { noWait: true });
expect(mockRunCli).toHaveBeenCalledWith([
'send', '--json', '--no-wait',
'abc-123', 'Hi',
], undefined);
});
});
describe('stopAgent', () => {
it('calls paseo stop', async () => {
const { client, mockRunCli } = makeClient();
mockRunCli.mockResolvedValue('');
await client.stopAgent('abc-123');
expect(mockRunCli).toHaveBeenCalledWith(['stop', 'abc-123']);
});
});
describe('cliHost config', () => {
it('includes --host flag in args when cliHost is set', async () => {
const { client, mockRunCli } = makeClient({ cliHost: 'tcp://localhost:6767?ssl=true' });
mockRunCli.mockResolvedValue('[]');
await client.listAgents();
expect(mockRunCli).toHaveBeenCalledWith([
'ls', '--json', '--host', 'tcp://localhost:6767?ssl=true',
]);
});
});
});

View File

@@ -0,0 +1,16 @@
import { describe, it, expect } from 'vitest';
import { planStatusFromRun } from '../plan-store.js';
describe('planStatusFromRun', () => {
it('maps completed to completed', () => {
expect(planStatusFromRun('completed')).toBe('completed');
});
it('maps failed to failed', () => {
expect(planStatusFromRun('failed')).toBe('failed');
});
it('maps cancelled to cancelled', () => {
expect(planStatusFromRun('cancelled')).toBe('cancelled');
});
});

View File

@@ -13,7 +13,7 @@ import type { AcpToolSnapshot } from './acp-tool-snapshot.js';
import type { AgentCommand } from './provider-types.js';
/** Backend transport kind. Mirrors `agent_sessions.backend` CHECK in schema.sql. */
export type AgentBackendKind = 'opencode_server' | 'acp_warm' | 'claude_sdk';
export type AgentBackendKind = 'opencode_server' | 'acp_warm' | 'claude_sdk' | 'paseo';
/**
* Normalized, transport-agnostic events a backend emits during a turn (§2).

View File

@@ -0,0 +1,254 @@
/**
* v2.10 — PaseoBackend: Paseo agent integration for the agent-pool.
*
* Wraps the Paseo CLI daemon as an AgentBackend. Each Paseo agent maps to one
* (chat_id, agent) pair and is persisted via `paseo import` (which registers
* an agent with the Paseo daemon). Prompts are sent via `paseo send`, and
* the session is cleaned up via `paseo archive`.
*
* Paseo is a meta-agent hub — it wraps provider sessions (opencode, claude,
* acp, etc.). The `provider` option in `EnsureSessionOpts` selects which
* provider Paseo delegates to.
*
* Backend kind: 'paseo' (must be added to agent_sessions_backend_chk).
*
* Spec: openspec/changes/v2-10-paseo-integration/design.md.
*/
import type { FastifyBaseLogger } from 'fastify';
import type { Sql } from '../../db.js';
import { PaseoClient, type PaseoSendResult } from '../paseo-client.js';
import type {
AgentBackend,
AgentSessionHandle,
EnsureSessionOpts,
PromptCtx,
TurnResult,
} from '../agent-backend.js';
/** Default provider to use when Paseo wraps a generic agent. */
const DEFAULT_PASEO_PROVIDER = 'opencode';
export interface PaseoBackendDeps {
sql: Sql;
log: FastifyBaseLogger;
/** The (chat, agent) this backend serves — its pool identity + DB key. */
chatId: string;
/** Agent name (e.g. 'opencode', 'claude', 'paseo'). */
agent: string;
/** Resolved PaseoClient instance. */
client: PaseoClient;
/** Provider string to pass to `paseo import --provider`. */
provider: string;
}
export class PaseoBackend implements AgentBackend {
readonly backend = 'paseo' as const;
private readonly sql: Sql;
private readonly log: FastifyBaseLogger;
private readonly chatId: string;
private readonly agent: string;
private readonly client: PaseoClient;
private readonly provider: string;
/** Map of BooCode sessionId → Paseo agent ID. */
private readonly agentIds = new Map<string, string>();
/** True between prompt() start and settle. */
private busy = false;
private up = false;
constructor(deps: PaseoBackendDeps) {
this.sql = deps.sql;
this.log = deps.log;
this.chatId = deps.chatId;
this.agent = deps.agent;
this.client = deps.client;
this.provider = deps.provider || DEFAULT_PASEO_PROVIDER;
}
/** §2: liveness for the health endpoint + dispatcher fallback decision. */
health(): 'up' | 'down' {
return this.up ? 'up' : 'down';
}
/** Phase 3: busy iff a turn is in flight (pool never evicts a busy backend). */
isBusy(): boolean {
return this.busy;
}
// ─── ensureSession: create/import a Paseo agent ─────────────────────────────
async ensureSession(sessionId: string, opts: EnsureSessionOpts): Promise<AgentSessionHandle> {
// Check if we already have a Paseo agent ID for this session.
let paseoId = this.agentIds.get(sessionId);
if (!paseoId) {
// Resolve existing agent_session_id from DB (e.g. after a restart).
const [row] = await this.sql<{ agent_session_id: string | null }[]>`
SELECT agent_session_id FROM agent_sessions
WHERE chat_id = ${opts.chatId} AND agent = ${opts.agent} AND backend = 'paseo'
`;
if (row?.agent_session_id) {
paseoId = row.agent_session_id;
this.agentIds.set(sessionId, paseoId);
}
}
if (!paseoId) {
// Import a new Paseo agent. Use the session UUID as the provider session id.
const labels: Record<string, string> = {
origin: 'boocode',
project: opts.projectId,
chat: opts.chatId,
worktree: opts.worktreeId,
agent: this.agent,
};
try {
const agent = await this.client.importAgent(sessionId, this.provider, labels);
paseoId = agent.Id;
this.agentIds.set(sessionId, paseoId);
this.log.info(
{ paseoId, agent: this.agent, chatId: this.chatId },
'paseo: imported agent',
);
} catch (err) {
this.log.error(
{ err: String(err), agent: this.agent, chatId: this.chatId },
'paseo: importAgent failed',
);
throw err;
}
}
// Upsert the agent_sessions row.
await this.sql`
INSERT INTO agent_sessions
(chat_id, session_id, worktree_id, agent, backend, agent_session_id, server_port, status, last_active_at)
VALUES
(${opts.chatId}, ${sessionId}, ${opts.worktreeId}, ${opts.agent}, 'paseo', ${paseoId}, NULL, 'active', clock_timestamp())
ON CONFLICT (chat_id, agent) DO UPDATE SET
session_id = EXCLUDED.session_id,
worktree_id = EXCLUDED.worktree_id,
backend = 'paseo',
agent_session_id = COALESCE(EXCLUDED.agent_session_id, agent_sessions.agent_session_id),
server_port = NULL,
status = 'active',
last_active_at = clock_timestamp()
`.catch((err) => {
this.log.warn(
{ err: String(err), chatId: opts.chatId, agent: opts.agent },
'paseo: agent_sessions upsert failed (non-fatal)',
);
});
this.up = true;
return {
sessionId,
agent: opts.agent,
backend: 'paseo',
chatId: opts.chatId,
worktreeId: opts.worktreeId,
agentSessionId: paseoId,
serverPort: null,
};
}
// ─── prompt: send a message to the Paseo agent ─────────────────────────────
async prompt(handle: AgentSessionHandle, input: string, ctx: PromptCtx): Promise<TurnResult> {
const paseoId = handle.agentSessionId;
if (!paseoId) {
return { ok: false, error: 'paseo: no agent session id in handle' };
}
this.busy = true;
try {
// Use streamSend for real-time text output via onEvent.
const result: PaseoSendResult = await this.client.streamSend(
paseoId,
input,
(event) => {
ctx.onEvent(event);
},
ctx.signal,
);
// Update last_active_at.
await this.sql`
UPDATE agent_sessions
SET last_active_at = clock_timestamp()
WHERE chat_id = ${handle.chatId} AND agent = ${handle.agent}
`.catch(() => { /* non-fatal */ });
if (result.error) {
return { ok: false, error: result.error };
}
return { ok: true };
} catch (err) {
const msg = err instanceof Error ? err.message : String(err);
// Check if abortion
if (ctx.signal.aborted) {
return { ok: false, error: 'cancelled' };
}
return { ok: false, error: `paseo: ${msg}` };
} finally {
this.busy = false;
}
}
// ─── closeSession: archive the Paseo agent ─────────────────────────────────
async closeSession(handle: AgentSessionHandle): Promise<void> {
const paseoId = handle.agentSessionId;
if (!paseoId) return;
try {
await this.client.archiveAgent(paseoId);
this.log.info({ paseoId, agent: handle.agent }, 'paseo: archived agent');
} catch (err) {
this.log.warn(
{ err: String(err), paseoId, agent: handle.agent },
'paseo: archiveAgent failed (non-fatal)',
);
}
this.agentIds.delete(handle.sessionId);
// Update DB row.
await this.sql`
UPDATE agent_sessions
SET status = 'closed', last_active_at = clock_timestamp()
WHERE chat_id = ${handle.chatId} AND agent = ${handle.agent}
`.catch(() => { /* non-fatal */ });
}
// ─── dispose: archive all tracked agents ───────────────────────────────────
async dispose(): Promise<void> {
const ids = [...this.agentIds.values()];
this.agentIds.clear();
for (const paseoId of ids) {
try {
await this.client.archiveAgent(paseoId);
} catch {
// Best-effort cleanup during shutdown.
}
}
this.up = false;
}
/** Phase 3: periodic health tick — probes the Paseo daemon. */
async tickHealth(_now?: number): Promise<void> {
try {
const h = await this.client.health();
this.up = h.status === 'ok';
} catch {
this.up = false;
}
}
}

View File

@@ -0,0 +1,115 @@
// v2.8 Collision detection — pure functions that find file overlaps between
// worktrees/agents editing the same files concurrently. Advisory only; writes
// are never blocked, but the collision info surfaces in the UI and logs.
//
// Severity levels:
// same_line — the same file, exact same line region
// adjacent_line — the same file, lines touch or are within 5 lines
// different_area — the same file, distant lines
//
// Pure functions, no side effects. Testable in isolation.
export type ConflictSeverity = 'same_line' | 'adjacent_line' | 'different_area';
export interface ConflictVerdict {
filePath: string;
worktrees: string[];
severity: ConflictSeverity;
agents: string[];
}
/**
* Registry entry for a single file change recorded by a worktree.
* Stored in the ConflictIndex Map value for each file path.
*/
export interface ConflictEntry {
worktreeId: string;
agent: string;
/**
* Approximate line range touched by the change. undefined when the change
* creates or deletes the file (full-file collision vs. same-line).
*/
lineRange?: { start: number; end: number };
status: 'pending' | 'applied' | 'reverted';
timestamp: number;
}
/**
* Shape of the conflict index consumed by findConflicts.
* File path → set of entries from different worktrees/agents.
*/
export type ConflictIndexData = ReadonlyMap<string, ReadonlySet<ConflictEntry>>;
/**
* Find file overlaps between `changedFiles` and the conflict index, excluding
* the caller's own worktree.
*
* Returns one ConflictVerdict per file that has entries from other worktrees.
* Severity is the highest found (same_line > adjacent_line > different_area).
*/
export function findConflicts(
changedFiles: string[],
worktreeId: string,
/** Approximate line range for the proposed changes, keyed by file path */
changedRanges: Map<string, { start: number; end: number }>,
conflictIndex: ConflictIndexData,
): ConflictVerdict[] {
const verdicts: ConflictVerdict[] = [];
for (const filePath of changedFiles) {
const entries = conflictIndex.get(filePath);
if (!entries || entries.size === 0) continue;
// Filter to entries from OTHER worktrees
const otherEntries = [...entries].filter((e) => e.worktreeId !== worktreeId);
if (otherEntries.length === 0) continue;
const myRange = changedRanges.get(filePath);
let severity: ConflictSeverity = 'different_area';
for (const entry of otherEntries) {
if (!myRange || !entry.lineRange) {
// Full-file changes (create/delete) always hit at least different_area
continue;
}
const sev = lineOverlapSeverity(myRange, entry.lineRange);
if (sev === 'same_line') {
severity = 'same_line';
break; // Can't get higher than this
}
if (sev === 'adjacent_line' && severity === 'different_area') {
severity = 'adjacent_line';
}
}
const worktrees = [...new Set(otherEntries.map((e) => e.worktreeId))];
const agents = [...new Set(otherEntries.map((e) => e.agent))];
verdicts.push({ filePath, worktrees, severity, agents });
}
return verdicts;
}
const ADJACENT_LINE_THRESHOLD = 5;
/**
* Determine severity of overlap between two line ranges.
*/
function lineOverlapSeverity(
a: { start: number; end: number },
b: { start: number; end: number },
): ConflictSeverity {
// Same_line: ranges intersect
if (a.start <= b.end && b.start <= a.end) {
return 'same_line';
}
// Adjacent: ranges are within ADJACENT_LINE_THRESHOLD lines of each other
const gap = a.start > b.end ? a.start - b.end : b.start - a.end;
if (gap <= ADJACENT_LINE_THRESHOLD) {
return 'adjacent_line';
}
return 'different_area';
}

View File

@@ -0,0 +1,151 @@
// v2.8 In-memory conflict index — tracks which worktrees/agents are editing
// which files so the collision detector can find overlaps.
//
// Singleton exported as `conflictIndex`; imported by pending_changes.ts to
// register changes at queue time and unregister on worktree teardown.
//
// NOT persisted — survives only as long as the BooCoder process. Postgres
// is the durable record (pending_changes table); this is the hot in-memory
// probe for concurrent edit warnings.
import type { ConflictEntry, ConflictVerdict } from './collision-detector.js';
import { findConflicts } from './collision-detector.js';
export class ConflictIndex {
/**
* filePath → Set of ConflictEntry from various worktrees.
* A single worktree may have multiple entries for the same file
* (several pending edits to the same file in one session).
*/
#map = new Map<string, Set<ConflictEntry>>();
// ---- mutation -------------------------------------------------------
/**
* Register that `worktreeId` (agent) is touching `filePath`.
* Creates an entry in the index so subsequent callers see it as a conflict.
*/
registerChange(
filePath: string,
worktreeId: string,
agent: string,
lineRange?: { start: number; end: number },
): void {
let entries = this.#map.get(filePath);
if (!entries) {
entries = new Set();
this.#map.set(filePath, entries);
}
entries.add({
worktreeId,
agent,
lineRange,
status: 'pending' as const,
timestamp: Date.now(),
});
}
/**
* Remove all entries for a given worktree. Called on worktree teardown
* so stale entries don't trigger false warnings.
*/
removeWorktree(worktreeId: string): void {
for (const [filePath, entries] of this.#map) {
const before = entries.size;
for (const entry of entries) {
if (entry.worktreeId === worktreeId) {
entries.delete(entry);
}
}
if (entries.size === 0) {
this.#map.delete(filePath);
}
}
}
/**
* Remove entries older than `maxAgeMs`. Useful as a periodic cleanup
* when worktree teardown was missed (crash, unclean exit).
*/
sweepStale(maxAgeMs: number): number {
const cutoff = Date.now() - maxAgeMs;
let removed = 0;
for (const [filePath, entries] of this.#map) {
for (const entry of entries) {
if (entry.timestamp < cutoff) {
entries.delete(entry);
removed++;
}
}
if (entries.size === 0) {
this.#map.delete(filePath);
}
}
return removed;
}
// ---- query ----------------------------------------------------------
/**
* Query the raw ConflictEntry set for a file path. Returns empty set
* when there are no entries (never mutated the file).
*/
getEntriesFor(filePath: string): ReadonlySet<ConflictEntry> {
return this.#map.get(filePath) ?? new Set();
}
/**
* Get all conflict verdicts for a given file path — which other
* worktrees are touching it. Returns empty when only one worktree
* has entries (no actual conflict).
*/
getConflictsFor(filePath: string): ConflictVerdict[] {
const entries = this.#map.get(filePath);
if (!entries || entries.size === 0) return [];
// Determine distinct worktree IDs. If only one, no conflict.
const worktreeIds = new Set<string>();
for (const e of entries) worktreeIds.add(e.worktreeId);
if (worktreeIds.size <= 1) return [];
// Use the first worktree as the "caller" so findConflicts excludes
// its entries and returns only entries from OTHER worktrees.
const caller = [...worktreeIds][0]!;
return findConflicts(
[filePath],
caller,
new Map(),
this.#toIndexData(),
);
}
/**
* Get conflicts for a set of file changes from a specific worktree.
* Delegates to the pure findConflicts function.
*/
query(
changedFiles: string[],
worktreeId: string,
changedRanges: Map<string, { start: number; end: number }>,
): ConflictVerdict[] {
return findConflicts(changedFiles, worktreeId, changedRanges, this.#toIndexData());
}
/**
* Snapshot the current map for testing/inspection.
*/
snapshot(): Map<string, ReadonlySet<ConflictEntry>> {
return new Map(this.#map);
}
// ---- private --------------------------------------------------------
#toIndexData(): ReadonlyMap<string, ReadonlySet<ConflictEntry>> {
return this.#map as ReadonlyMap<string, ReadonlySet<ConflictEntry>>;
}
}
// Singleton — the whole BooCoder process shares one conflict index.
export const conflictIndex = new ConflictIndex();

View File

@@ -33,11 +33,52 @@ export interface SchedulerState {
readonly inFlight: ReadonlySet<string>;
/** step ids pre-skipped at launch (band/when gating) — never given a row */
readonly excluded: ReadonlySet<string>;
/** step ids that timed out (terminal — no retries remaining or not retriable) */
readonly timedOut: ReadonlySet<string>;
/**
* Per-batch running sets, populated by buildBatchState from the flow definition
* and the current inFlight set. Only read by getReadyInBatch; never mutated by
* decision functions (the caller maintains it across ticks).
*/
readonly batchState?: Map<string, { running: Set<string>; maxConcurrent: number; joinRule: TriggerRule }>;
/**
* Per-switch-step routing results. Populated when a SWITCH step completes.
* Step ids in any result's `excluded` set are treated as excluded for the
* remainder of the run — they won't execute and won't block dependents.
*/
readonly switchResults: ReadonlyMap<string, { chosenCase: string | null; excluded: ReadonlySet<string> }>;
/** Per-DO_WHILE iteration count; presence in the map indicates an active loop */
readonly loopIterations: ReadonlyMap<string, number>;
}
/** A dependency is satisfied once it is done, skipped, or excluded. */
/** A dependency is satisfied once it is done, skipped, excluded, or timed out.
* Dependencies on a running DO_WHILE step are also satisfied so body steps
* execute during an active loop iteration. */
function isSatisfied(state: SchedulerState, id: string): boolean {
return state.done.has(id) || state.skipped.has(id) || state.excluded.has(id);
const effectiveExcluded = getEffectiveExcluded(state);
if (state.done.has(id) || state.skipped.has(id) || effectiveExcluded.has(id) || state.timedOut.has(id)) {
return true;
}
// A dependency on a running DO_WHILE step is satisfied (body runs during the loop).
if (state.loopIterations.has(id) && state.inFlight.has(id)) return true;
return false;
}
/**
* The union of the static `excluded` set and every switch result's excluded
* step ids. Steps excluded by a SWITCH evaluation act exactly like launch-time
* excluded steps: they never run and they don't block dependents.
*/
function getEffectiveExcluded(state: SchedulerState): ReadonlySet<string> {
// Fast path: no switch results → static excluded only.
if (state.switchResults.size === 0) return state.excluded;
const combined = new Set(state.excluded);
for (const result of state.switchResults.values()) {
for (const id of result.excluded) {
combined.add(id);
}
}
return combined;
}
/**
@@ -56,13 +97,14 @@ export function manifestSteps(flow: Flow, launchCtx: StepContext): Step[] {
* Faithful to `conductor/flow.ts:27-36`. Pure.
*/
export function readySteps(flow: Flow, state: SchedulerState): Step[] {
const effectiveExcluded = getEffectiveExcluded(state);
return flow.steps.filter(
(s) =>
!state.done.has(s.id) &&
!state.skipped.has(s.id) &&
!state.inFlight.has(s.id) &&
!state.excluded.has(s.id) &&
((s.deps ?? []).length === 0 || evaluateTriggerRule(s.deps ?? [], state.done, state.skipped, state.excluded, s.trigger_rule)),
!effectiveExcluded.has(s.id) &&
((s.deps ?? []).length === 0 || evaluateTriggerRule(s.deps ?? [], state.done, state.skipped, effectiveExcluded, s.trigger_rule)),
);
}
@@ -102,6 +144,57 @@ export function isStuck(flow: Flow, state: SchedulerState): boolean {
);
}
// ─── Batch parallelism (v2.8.22) ─────────────────────────────────────────────
/**
* Build the batchState Map from the flow definition and the current inFlight set.
* Only steps with a `batch` field are tracked. Empty map when `flow.batchConfig`
* is absent or no steps belong to a batch. Pure — no IO.
*/
export function buildBatchState(
flow: Flow,
inFlight: ReadonlySet<string>,
): Map<string, { running: Set<string>; maxConcurrent: number; joinRule: TriggerRule }> {
const result = new Map<string, { running: Set<string>; maxConcurrent: number; joinRule: TriggerRule }>();
if (!flow.batchConfig) return result;
// Collect every unique batch group referenced by the flow's steps.
const groups = new Set<string>();
for (const s of flow.steps) {
if (s.batch) groups.add(s.batch);
}
const { maxConcurrent, joinRule } = flow.batchConfig;
for (const batch of groups) {
const running = new Set<string>(
flow.steps.filter((s) => s.batch === batch && inFlight.has(s.id)).map((s) => s.id),
);
result.set(batch, { running, maxConcurrent, joinRule: joinRule ?? 'all_success' });
}
return result;
}
/**
* Gate a ready step list by batch parallelism limits. Steps without a `batch`
* field always pass through. Steps belonging to a batch are only included if
* that batch's currently-running count is below its `maxConcurrent` cap.
*
* This is ADDITIVE to the existing wave scheduler: pure dep-based readiness
* is computed first (readySteps), then this function applies the batch ceiling.
* Steps excluded here remain pending and will be picked up on the next tick
* when a running batch step completes.
*/
export function getReadyInBatch(ready: readonly Step[], state: SchedulerState, _flow: Flow): Step[] {
const batchState = state.batchState;
if (!batchState || batchState.size === 0) return [...ready];
return ready.filter((s) => {
if (!s.batch) return true;
const bs = batchState.get(s.batch);
if (!bs) return true;
return bs.running.size < bs.maxConcurrent;
});
}
// ─── Resume reconciliation (D-9) ─────────────────────────────────────────────
/**
@@ -118,25 +211,50 @@ export function isStuck(flow: Flow, state: SchedulerState): boolean {
* - 'mark-cancelled': task was cancelled before the callback ran; propagate so
* advance() cancels the run.
*/
/**
* True when the step definition allows retries on timeout.
* Pure — no IO.
*/
export function isRetriable(step: { maxRetries?: number }): boolean {
return (step.maxRetries ?? 0) > 0;
}
/**
* True when the step has retries remaining.
* Pure — no IO.
*/
export function shouldRetry(maxRetries: number | undefined | null, retryCount: number): boolean {
return retryCount < (maxRetries ?? 0);
}
export type ResumeAction =
| 'keep'
| 're-dispatch'
| 'mark-done'
| 'mark-failed'
| 'mark-cancelled';
| 'mark-cancelled'
| 'retry';
/**
* Decide what to do with ONE flow step during startup resume (D-9). Pure.
*
* @param status - flow_steps.status
* @param taskId - flow_steps.task_id (null for code steps or unstarted agent steps)
* @param taskState - tasks.state for taskId, or null if the task row is absent
* @param status - flow_steps.status
* @param taskId - flow_steps.task_id (null for code steps or unstarted agent steps)
* @param taskState - tasks.state for taskId, or null if the task row is absent
* @param retryCount - flow_steps.retry_count (default 0)
* @param maxRetries - flow_steps.max_retries (null = no retry)
*/
export function reconcileResumeStep(
status: string,
taskId: string | null,
taskState: string | null,
retryCount?: number,
maxRetries?: number | null,
): ResumeAction {
if (status === 'timed_out') {
if (shouldRetry(maxRetries, retryCount ?? 0)) return 'retry';
return 'mark-failed';
}
if (status !== 'running') return 'keep';
// Running step: decide by its task's current state.
if (!taskId || taskState === null) return 're-dispatch'; // task gone or never created
@@ -167,6 +285,60 @@ export function shouldFailOnMissingAgent(agent: string, modeId: string | null):
return agent === 'qwen' && modeId === 'plan';
}
/**
* Evaluate a SWITCH step: iterate cases in declaration order and return the
* label of the first matching case plus every step id that belongs to a
* non-selected branch. When no case matches, the defaultBranch (if present)
* is the effective choice. If there is no default, all branch steps are
* excluded and the switch returns `chosenCase: null`.
*
* Pure — no IO. The caller adds the returned `excluded` ids to the scheduler
* state's switchResults so downstream decision functions see them as excluded.
*/
export function resolveSwitch(
step: Step,
ctx: StepContext,
): { chosenCase: string | null; excluded: string[] } {
const cases = step.cases;
if (!cases || cases.length === 0) {
// Degenerate switch — nothing to evaluate.
return { chosenCase: null, excluded: [] };
}
// Evaluate conditions in order.
for (const c of cases) {
if (c.condition(ctx)) {
// This case matches — exclude all OTHER branches.
const excluded: string[] = [];
for (const other of cases) {
if (other.label !== c.label) {
excluded.push(...other.stepIds);
}
}
// The default branch is also excluded when a case matched.
if (step.defaultBranch) excluded.push(...step.defaultBranch);
return { chosenCase: c.label, excluded };
}
}
// No case matched — use default branch if present.
if (step.defaultBranch) {
// Default is the chosen branch: exclude all explicit case branches.
const excluded: string[] = [];
for (const c of cases) {
excluded.push(...c.stepIds);
}
return { chosenCase: null, excluded };
}
// No case matched and no default — exclude everything.
const excluded: string[] = [];
for (const c of cases) {
excluded.push(...c.stepIds);
}
return { chosenCase: null, excluded };
}
/**
* Evaluate a trigger rule against dependency results.
* - all_success: every dep must be done (not skipped/failed)
@@ -198,7 +370,7 @@ export function evaluateTriggerRule(
* decision per step. Pure — no IO.
*/
export function reconcileRun(
steps: ReadonlyArray<{ stepId: string; taskId: string | null; status: string }>,
steps: ReadonlyArray<{ stepId: string; taskId: string | null; status: string; retryCount?: number; maxRetries?: number | null }>,
taskStates: ReadonlyMap<string, string>,
): StepResumeDecision[] {
return steps.map((step) => ({
@@ -207,6 +379,22 @@ export function reconcileRun(
step.status,
step.taskId,
step.taskId ? (taskStates.get(step.taskId) ?? null) : null,
step.retryCount,
step.maxRetries,
),
}));
}
/**
* True when a DO_WHILE loop should stop: the condition returned false or the
* iteration cap was reached. Pure — no IO.
*
* @param step - the DO_WHILE step definition
* @param ctx - current step context (input + accumulated results)
* @param iterations - number of completed iterations so far
*/
export function isLoopTerminated(step: Step, ctx: StepContext, iterations: number): boolean {
if (iterations >= (step.loopMaxIterations ?? 100)) return true;
if (step.loopCondition) return !step.loopCondition(ctx);
return false;
}

View File

@@ -32,7 +32,7 @@
* already emits. (Phase 8 wires the OrchestratorPane's subscription to both.)
*/
import type { Sql } from '../db.js';
import type { Broker } from '@boocode/server/broker';
import type { Broker, Frame, Listener } from '@boocode/server/broker';
import type { WsFrame } from '@boocode/contracts/ws-frames';
import type { FastifyBaseLogger } from 'fastify';
import type { Config } from '../config.js';
@@ -40,11 +40,15 @@ import { getFlow } from '../conductor/flows/index.js';
import { loadPersona } from '../conductor/persona-loader.js';
import type { Band, DispatchFn, Flow, FlowInput, Step, StepContext } from '../conductor/types.js';
import {
buildBatchState,
getReadyInBatch,
isLoopTerminated,
isRunComplete,
manifestSteps,
partitionReady,
readySteps,
reconcileRun,
resolveSwitch,
type SchedulerState,
type StepResumeDecision,
} from './flow-runner-decisions.js';
@@ -89,15 +93,20 @@ interface Deps {
broker: Broker;
log: FastifyBaseLogger;
config: Config;
/** Fired when a flow run reaches a terminal state (for plan-store integration). */
onRunTerminal?: (runId: string, status: 'completed' | 'failed' | 'cancelled') => void;
}
interface FlowStepRow {
step_id: string;
kind: 'agent' | 'code';
kind: 'agent' | 'code' | 'switch' | 'do_while';
agent: string | null;
status: string;
chat_id: string | null;
output: string | null;
updated_at: string | null;
retry_count: number | null;
max_retries: number | null;
}
export function createFlowRunner(deps: Deps): FlowRunner {
@@ -110,6 +119,10 @@ export function createFlowRunner(deps: Deps): FlowRunner {
// taskId → resolver map. These tasks have NO flow_steps row; handleTaskTerminal
// resolves them here instead of advancing a run.
const subDispatchWaiters = new Map<string, (output: string) => void>();
/** Per-DO_WHILE step iteration count; persists across advance() calls. */
const loopIterations = new Map<string, number>();
/** Per-run messaging subscriptions; cleaned up when the run terminates. */
const messagingCleanups = new Map<string, Set<() => void>>();
function publishUser(frame: Record<string, unknown>): void {
broker.publishUserFrame('default', frame as unknown as WsFrame);
@@ -126,8 +139,42 @@ export function createFlowRunner(deps: Deps): FlowRunner {
results: Record<string, string>,
model: string,
dispatch?: DispatchFn,
runId?: string,
stepId?: string,
): StepContext {
return { input, results, model, dispatch };
let messaging: StepContext['messaging'] = undefined;
if (runId) {
if (!messagingCleanups.has(runId)) {
messagingCleanups.set(runId, new Set());
}
const subs = messagingCleanups.get(runId)!;
messaging = {
publish(channel: string, message: unknown) {
const content = typeof message === 'string' ? message : JSON.stringify(message);
const topic = `run:${runId}:${channel}`;
const frame = {
type: 'agent_message' as const,
run_id: runId,
sender_step_id: stepId ?? '',
content,
...(channel ? { channel } : {}),
};
broker.publishUserFrame('default', frame as unknown as WsFrame);
broker.publish(topic, frame as unknown as Frame);
},
subscribe(channel: string, handler: (msg: unknown) => void) {
const topic = `run:${runId}:${channel}`;
const listener: Listener = (f) => { handler(f); };
const unsub = broker.subscribe(topic, listener);
subs.add(unsub);
return () => {
unsub();
subs.delete(unsub);
};
},
};
}
return { input, results, model, dispatch, messaging };
}
/** Latest assistant message text for a chat — the FULL worker output (≤50k as
@@ -261,7 +308,8 @@ export function createFlowRunner(deps: Deps): FlowRunner {
const dispatch: DispatchFn = (agent, task) => dispatchSubAgent(run.project_id, model, agent, task);
const rows = await sql<FlowStepRow[]>`
SELECT step_id, kind, agent, status, chat_id, output FROM flow_steps WHERE run_id = ${runId}
SELECT step_id, kind, agent, status, chat_id, output, updated_at, retry_count, max_retries
FROM flow_steps WHERE run_id = ${runId}
`;
// Re-derive the excluded set (band/when pre-skips) from the flow def + input —
@@ -273,6 +321,9 @@ export function createFlowRunner(deps: Deps): FlowRunner {
const done = new Set<string>();
const skipped = new Set<string>();
const inFlight = new Set<string>();
const timedOut = new Set<string>();
/** Per-switch routing results — maps switch step id → resolved branch details */
const switchExcluded = new Map<string, { chosenCase: string | null; excluded: Set<string> }>();
const results: Record<string, string> = {};
for (const r of rows) {
switch (r.status) {
@@ -286,6 +337,9 @@ export function createFlowRunner(deps: Deps): FlowRunner {
case 'running':
inFlight.add(r.step_id);
break;
case 'timed_out':
timedOut.add(r.step_id);
break;
case 'failed':
// A failed worker makes the deterministic report untrustworthy — fail the
// whole run (matches the Phase-1 CLI, which throws on a dispatch failure).
@@ -298,19 +352,120 @@ export function createFlowRunner(deps: Deps): FlowRunner {
}
}
// ─── Timeout detection ───────────────────────────────────────────────────────
// Check running steps. If a step has been 'running' longer than
// FLOW_STEP_TIMEOUT_MS, mark it timed_out or re-dispatch if retriable.
// Build a context here so the timeout retry path can re-dispatch the step.
const timeoutCtx = buildCtx(input, results, model, dispatch);
const timeoutMs = config.FLOW_STEP_TIMEOUT_MS;
const nowDate = new Date();
let detectedTimedOut = false;
for (const r of rows) {
if (r.status !== 'running') continue;
if (!r.updated_at) continue;
const elapsed = nowDate.getTime() - new Date(r.updated_at).getTime();
if (elapsed <= timeoutMs) continue;
// Step has exceeded the timeout
detectedTimedOut = true;
const retryCount = r.retry_count ?? 0;
const maxRetries = r.max_retries ?? 0;
if (maxRetries > 0 && retryCount < maxRetries) {
// Retriable: re-dispatch the step with an incremented retry_count
const step = flow.steps.find((s) => s.id === r.step_id);
if (!step || step.kind !== 'agent') {
// Non-agent steps can't be retried via dispatch
inFlight.delete(r.step_id);
await failRun(runId, flow, input, model,
`step '${r.step_id}' timed out (non-retriable kind)`, r.step_id);
return;
}
inFlight.delete(r.step_id);
await sql`
UPDATE flow_steps
SET retry_count = ${retryCount + 1}, updated_at = clock_timestamp()
WHERE run_id = ${runId} AND step_id = ${r.step_id} AND status = 'running'
`;
await dispatchAgentStep(runId, run.project_id, model, step, timeoutCtx);
inFlight.add(r.step_id);
log.warn({ runId, stepId: r.step_id, retry: retryCount + 1, maxRetries },
'flow-runner: step timed out, retrying');
} else {
// Not retriable — mark as timed_out, fail the run
inFlight.delete(r.step_id);
await sql`
UPDATE flow_steps SET status = 'timed_out', updated_at = clock_timestamp()
WHERE run_id = ${runId} AND step_id = ${r.step_id} AND status = 'running'
`;
timedOut.add(r.step_id);
publishStep(runId, r.step_id, 'timed_out');
await failRun(runId, flow, input, model,
`step '${r.step_id}' timed out`, r.step_id);
return;
}
}
// If we modified any steps, re-query so the state sets reflect the latest DB.
if (detectedTimedOut) {
// Continue with the in-memory state we already adjusted above (inFlight/timedOut
// were mutated directly). No re-query needed.
}
// Drain ready skips + code steps (synchronous), re-evaluating after each batch,
// then dispatch the full ready agent wave and wait for their terminal callbacks.
for (;;) {
const state: SchedulerState = { done, skipped, inFlight, excluded };
// Build per-batch state from the current inFlight set for batch parallelism gating.
const batchState = buildBatchState(flow, inFlight);
const state: SchedulerState = { done, skipped, inFlight, excluded, timedOut, batchState, switchResults: switchExcluded, loopIterations };
if (isRunComplete(flow, state)) {
await finishRun(runId, flow, input, results, model, dispatch);
return;
}
const ready = readySteps(flow, state);
const ready = getReadyInBatch(readySteps(flow, state), state, flow);
if (ready.length === 0) {
if (inFlight.size > 0) return; // agents in flight will re-enter via the hook
// Before declaring stuck, check for running DO_WHILE steps whose body
// is fully done — triggers the next loop iteration or terminates.
if (inFlight.size > 0) {
let doWhileReEval = false;
for (const s of flow.steps) {
if (s.kind !== 'do_while' || !s.loopBody || s.loopBody.length === 0) continue;
if (!inFlight.has(s.id)) continue;
if (!s.loopBody.every((bId) => done.has(bId))) continue;
doWhileReEval = true;
const iterations = loopIterations.get(s.id) ?? 0;
const dwCtx = buildCtx(input, results, model, dispatch);
if (isLoopTerminated(s, dwCtx, iterations)) {
await markStep(runId, s.id, 'completed');
done.add(s.id);
results[s.id] = '';
inFlight.delete(s.id);
publishStep(runId, s.id, 'completed');
} else {
await sql`
UPDATE flow_steps SET status = 'running', updated_at = clock_timestamp()
WHERE run_id = ${runId} AND step_id = ${s.id}
`;
inFlight.add(s.id);
loopIterations.set(s.id, iterations + 1);
for (const bodyId of s.loopBody) {
done.delete(bodyId);
delete results[bodyId];
await sql`
UPDATE flow_steps
SET status = 'pending', output = NULL, updated_at = clock_timestamp()
WHERE run_id = ${runId} AND step_id = ${bodyId}
`;
}
publishStep(runId, s.id, 'running');
}
break; // one DO_WHILE at a time
}
if (doWhileReEval) continue;
return; // genuine inFlight agents with no ready steps
}
await failRun(runId, flow, input, model, 'unsatisfiable dependencies / cycle');
return;
}
@@ -327,6 +482,74 @@ export function createFlowRunner(deps: Deps): FlowRunner {
continue; // re-evaluate — a skip can settle a fan-in step's deps
}
// SWITCH steps run synchronously — evaluate conditions, update the excluded
// set in SchedulerState, and mark themselves complete. Non-selected branch
// step ids are excluded from ever running.
const switchReady = toRun.filter((s) => s.kind === 'switch');
if (switchReady.length > 0) {
for (const s of switchReady) {
let result: { chosenCase: string | null; excluded: string[] };
try {
result = resolveSwitch(s, buildCtx(input, results, model, dispatch));
} catch (err) {
await failRun(runId, flow, input, model, `switch step '${s.id}' threw: ${errMsg(err)}`, s.id);
return;
}
switchExcluded.set(s.id, {
chosenCase: result.chosenCase,
excluded: new Set(result.excluded),
});
const outputText = result.chosenCase ? `branch:${result.chosenCase}` : '';
await markStep(runId, s.id, 'completed', outputText);
results[s.id] = outputText;
done.add(s.id);
}
continue; // re-evaluate — excluded steps may unblock dependents
}
// DO_WHILE steps: first-activation only (ready to run for the first time).
// Re-evaluation of running DO_WHILE steps whose body is complete is handled
// in the `ready.length === 0` block above (Path 1) — this avoids duplicate
// SQL updates and competing state mutations.
const doWhileReady = toRun.filter((s) => s.kind === 'do_while');
if (doWhileReady.length > 0) {
for (const s of doWhileReady) {
const iterations = loopIterations.get(s.id) ?? 0;
const dwCtx = buildCtx(input, results, model, dispatch);
if (isLoopTerminated(s, dwCtx, iterations)) {
// Loop done — mark DO_WHILE completed. Body steps stay in their
// current state (already done from the last iteration).
await markStep(runId, s.id, 'completed');
done.add(s.id);
results[s.id] = '';
inFlight.delete(s.id);
publishStep(runId, s.id, 'completed');
} else {
// Start or continue the loop.
await sql`
UPDATE flow_steps SET status = 'running', updated_at = clock_timestamp()
WHERE run_id = ${runId} AND step_id = ${s.id}
`;
inFlight.add(s.id);
loopIterations.set(s.id, iterations + 1);
// On re-iteration, reset body steps from 'completed' back to 'pending'.
if (iterations > 0 && s.loopBody) {
for (const bodyId of s.loopBody) {
done.delete(bodyId);
delete results[bodyId];
await sql`
UPDATE flow_steps
SET status = 'pending', output = NULL, updated_at = clock_timestamp()
WHERE run_id = ${runId} AND step_id = ${bodyId}
`;
}
}
publishStep(runId, s.id, 'running');
}
}
continue; // re-evaluate — body steps may be newly pending
}
const codeReady = toRun.filter((s) => s.kind === 'code');
if (codeReady.length > 0) {
for (const s of codeReady) {
@@ -334,7 +557,7 @@ export function createFlowRunner(deps: Deps): FlowRunner {
try {
// Code steps run IN-PROCESS (fold / synthesis-fold / code-review verify).
// verify uses ctx.dispatch → dispatchSubAgent (read-only qwen workers).
out = await s.run(buildCtx(input, results, model, dispatch));
out = await s.run(buildCtx(input, results, model, dispatch, runId, s.id));
} catch (err) {
await failRun(runId, flow, input, model, `code step '${s.id}' threw: ${errMsg(err)}`, s.id);
return;
@@ -457,6 +680,14 @@ export function createFlowRunner(deps: Deps): FlowRunner {
await appendStepEvent(sql, runId, stepId, status, output ? { outputLength: output.length } : undefined);
}
function cleanupMessaging(runId: string): void {
const cleanups = messagingCleanups.get(runId);
if (cleanups) {
for (const fn of cleanups) fn();
messagingCleanups.delete(runId);
}
}
// ─── run completion ─────────────────────────────────────────────────────────
async function finishRun(
@@ -478,11 +709,16 @@ export function createFlowRunner(deps: Deps): FlowRunner {
UPDATE flow_runs SET status = 'completed', report = ${report}, updated_at = clock_timestamp()
WHERE id = ${runId} AND status = 'running'
`;
if (updated.count === 0) return; // already terminal (e.g. cancelled) — don't publish
if (updated.count === 0) {
cleanupMessaging(runId);
return; // already terminal (e.g. cancelled) — don't publish
}
deps.onRunTerminal?.(runId, 'completed');
publishStep(runId, lastAgentStepId(flow, input, model), 'completed', {
run_status: 'completed',
report,
});
cleanupMessaging(runId);
}
async function failRun(
@@ -498,10 +734,12 @@ export function createFlowRunner(deps: Deps): FlowRunner {
WHERE id = ${runId} AND status = 'running'
`;
if (updated.count === 0) return;
deps.onRunTerminal?.(runId, 'failed');
const stepId = failedStepId ?? (flow ? lastAgentStepId(flow, input, model) : 'run');
log.warn({ runId, error }, 'flow-runner: run failed');
await appendStepEvent(sql, runId, stepId, 'failed', { error });
publishStep(runId, stepId, 'failed', { run_status: 'failed' });
cleanupMessaging(runId);
}
async function cancelRun(runId: string): Promise<void> {
@@ -512,6 +750,7 @@ export function createFlowRunner(deps: Deps): FlowRunner {
WHERE id = ${runId} AND status = 'running'
`;
if (updated.count === 0) return; // idempotent — already terminal
deps.onRunTerminal?.(runId, 'cancelled');
// Any remaining pending steps are unreachable; mark + publish them so the
// pane can show them as cancelled rather than stuck in pending.
const pending = await sql<{ step_id: string; kind: string }[]>`
@@ -528,6 +767,7 @@ export function createFlowRunner(deps: Deps): FlowRunner {
}
}
log.info({ runId }, 'flow-runner: run cancelled');
cleanupMessaging(runId);
}
/** The terminal agent step in roster order — a valid roster step_id to carry the
@@ -540,7 +780,7 @@ export function createFlowRunner(deps: Deps): FlowRunner {
function publishStep(
runId: string,
stepId: string,
status: 'running' | 'completed' | 'failed' | 'skipped' | 'cancelled' | 'blocked',
status: 'running' | 'completed' | 'failed' | 'skipped' | 'cancelled' | 'blocked' | 'timed_out',
extra?: { run_status?: 'running' | 'completed' | 'failed' | 'cancelled'; report?: string },
): void {
publishUser({
@@ -678,6 +918,38 @@ export function createFlowRunner(deps: Deps): FlowRunner {
log.info({ runId, stepId: step.step_id, taskId: task!.id }, 'flow-runner: step re-dispatched on resume');
break;
}
case 'retry': {
// Like re-dispatch but increments retry_count and sets status to 'running'.
if (!step.input) {
await sql`
UPDATE flow_steps
SET status = 'failed', error = 'retry: no stored prompt',
updated_at = clock_timestamp()
WHERE run_id = ${runId} AND step_id = ${step.step_id}
`;
break;
}
const chatIdR = step.chat_id;
const [chatR] = chatIdR
? await sql<{ session_id: string }[]>`SELECT session_id FROM chats WHERE id = ${chatIdR}`
: [];
const sessionIdR = chatR?.session_id ?? null;
const [taskR] = await sql<{ id: string }[]>`
INSERT INTO tasks (project_id, input, agent, model, mode_id, session_id, chat_id)
VALUES (${projectId}, ${step.input}, 'qwen', ${model}, 'plan', ${sessionIdR}, ${chatIdR})
RETURNING id
`;
await sql`
UPDATE flow_steps
SET task_id = ${taskR!.id}, retry_count = retry_count + 1, status = 'running',
updated_at = clock_timestamp()
WHERE run_id = ${runId} AND step_id = ${step.step_id}
`;
log.info({ runId, stepId: step.step_id, taskId: taskR!.id },
'flow-runner: step retried on resume');
break;
}
}
}
@@ -692,7 +964,9 @@ export function createFlowRunner(deps: Deps): FlowRunner {
status: string;
chat_id: string | null;
input: string | null;
}[]>`SELECT step_id, task_id, status, chat_id, input FROM flow_steps WHERE run_id = ${run.id}`;
retry_count: number | null;
max_retries: number | null;
}[]>`SELECT step_id, task_id, status, chat_id, input, retry_count, max_retries FROM flow_steps WHERE run_id = ${run.id}`;
// Load task states for all referenced tasks in one query.
const taskIds = rows.map((r) => r.task_id).filter((id): id is string => id !== null);
@@ -705,7 +979,13 @@ export function createFlowRunner(deps: Deps): FlowRunner {
}
const decisions = reconcileRun(
rows.map((r) => ({ stepId: r.step_id, taskId: r.task_id, status: r.status })),
rows.map((r) => ({
stepId: r.step_id,
taskId: r.task_id,
status: r.status,
retryCount: r.retry_count ?? undefined,
maxRetries: r.max_retries,
})),
taskStates,
);
@@ -742,17 +1022,18 @@ export function createFlowRunner(deps: Deps): FlowRunner {
WHERE id = ${runId} AND status = 'running'
`;
if (updated.count === 0) return { cancelled: false, taskIds: [] };
deps.onRunTerminal?.(runId, 'cancelled');
// Mark all non-terminal steps cancelled and collect in-flight task_ids.
const steps = await sql<{ step_id: string; task_id: string | null; kind: string }[]>`
SELECT step_id, task_id, kind FROM flow_steps
WHERE run_id = ${runId} AND status NOT IN ('completed', 'failed', 'cancelled', 'skipped')
WHERE run_id = ${runId} AND status NOT IN ('completed', 'failed', 'cancelled', 'skipped', 'timed_out')
`;
if (steps.length > 0) {
await sql`
UPDATE flow_steps SET status = 'cancelled', updated_at = clock_timestamp()
WHERE run_id = ${runId} AND status NOT IN ('completed', 'failed', 'cancelled', 'skipped')
WHERE run_id = ${runId} AND status NOT IN ('completed', 'failed', 'cancelled', 'skipped', 'timed_out')
`;
for (const s of steps) {
if (s.kind === 'agent') publishStep(runId, s.step_id, 'cancelled', { run_status: 'cancelled' });
@@ -772,6 +1053,7 @@ export function createFlowRunner(deps: Deps): FlowRunner {
.map((s) => s.task_id);
log.info({ runId }, 'flow-runner: run cancelled by request');
cleanupMessaging(runId);
return { cancelled: true, taskIds };
}

View File

@@ -0,0 +1,341 @@
/**
* v2.10 — PaseoClient: thin CLI-based client for the Paseo daemon.
*
* Paseo is a multi-agent hub daemon running at a configurable address
* (default Unix socket / localhost:6767). This client wraps the `paseo` CLI
* via child_process spawn for all operations (the daemon does not expose a
* separate REST API for write operations). Read operations (listAgents,
* getAgentStatus) use `paseo ls --json` / `paseo inspect --json`; write
* operations (import, archive, send) use the corresponding subcommands.
*
* Spec: openspec/changes/v2-10-paseo-integration/design.md.
*/
import { spawn } from 'node:child_process';
import { once } from 'node:events';
import { createInterface } from 'node:readline';
// ─── Types ───────────────────────────────────────────────────────────────────
/** Listing entry from `paseo ls --json`. Fields are lowercase. */
export interface PaseoAgentListItem {
id: string;
shortId: string;
name: string;
provider: string;
status: string;
cwd?: string;
created?: string;
thinking?: string;
}
/** Detailed agent info from `paseo inspect --json`. Fields are PascalCase. */
export interface PaseoAgentDetail {
Id: string;
Name: string;
Provider: string;
Model?: string;
Status: string;
Thinking?: string;
Archived: boolean;
ArchivedAt?: string | null;
Cwd?: string;
CreatedAt: string;
UpdatedAt: string;
Mode?: string;
AvailableModes?: Array<{ id: string; label: string }>;
Capabilities?: {
Streaming?: boolean;
Persistence?: boolean;
DynamicModes?: boolean;
McpServers?: boolean;
};
Labels?: Record<string, string>;
Worktree?: string | null;
ParentAgentId?: string | null;
}
/** Result of `paseo send --json`. */
export interface PaseoSendResult {
/** The agent's textual response. */
text?: string;
/** Structured output if the agent produced any. */
output?: unknown;
/** Error message if the turn failed. */
error?: string;
/** True if the turn completed successfully. */
ok?: boolean;
}
export interface PaseoClientConfig {
/** Path to the paseo binary. Default: auto-resolved from PATH. */
paseoBin: string;
/**
* Explicit `--host <host>` value for CLI calls.
* Format: `host:port` or `tcp://host:port?ssl=true&password=secret`.
* Omit to use the CLI default (Unix socket, fallback localhost:6767).
*/
cliHost?: string;
}
const DEFAULT_PASEO_BIN = 'paseo';
// ─── Client ──────────────────────────────────────────────────────────────────
export class PaseoClientError extends Error {
constructor(
message: string,
public readonly command: string,
public readonly exitCode: number | null,
public readonly stderr: string,
) {
super(message);
this.name = 'PaseoClientError';
}
}
export class PaseoClient {
/** @internal visible for testing */
readonly bin: string;
private readonly hostArgs: string[];
constructor(config?: Partial<PaseoClientConfig>) {
this.bin = config?.paseoBin ?? DEFAULT_PASEO_BIN;
this.hostArgs = config?.cliHost ? ['--host', config.cliHost] : [];
}
// ─── Read operations (CLI `ls --json`, `inspect --json`) ──────────────────
/** List all non-archived agents. */
async listAgents(): Promise<PaseoAgentListItem[]> {
const raw = await this.runJson(['ls', '--json', ...this.hostArgs]);
return raw as PaseoAgentListItem[];
}
/** Get detailed status for a single agent by ID or prefix. */
async getAgentStatus(agentId: string): Promise<PaseoAgentDetail> {
const raw = await this.runJson(['inspect', '--json', agentId, ...this.hostArgs]);
return raw as PaseoAgentDetail;
}
/**
* Quick liveness check — runs `paseo ls --json --limit 1` and returns success.
* The daemon is healthy if the CLI exits 0.
*/
async health(): Promise<{ status: string }> {
try {
await this.runCli(['ls', '--json', '--limit', '1', ...this.hostArgs]);
return { status: 'ok' };
} catch {
return { status: 'error' };
}
}
// ─── Write operations (CLI subcommands) ───────────────────────────────────
/**
* Import a provider session as a Paseo agent.
* Uses `paseo import <sessionId> --provider <provider> [--label k=v]`.
*/
async importAgent(
sessionId: string,
provider: string,
labels?: Record<string, string>,
): Promise<PaseoAgentDetail> {
const args: string[] = ['import', '--json', ...this.hostArgs];
if (provider) {
args.push('--provider', provider);
}
if (labels) {
for (const [k, v] of Object.entries(labels)) {
args.push('--label', `${k}=${v}`);
}
}
args.push(sessionId);
const raw = await this.runJson(args);
return raw as PaseoAgentDetail;
}
/** Archive (soft-delete) a Paseo agent by ID or prefix. */
async archiveAgent(agentId: string): Promise<void> {
await this.runCli(['archive', '--json', ...this.hostArgs, agentId]);
}
/**
* Send a prompt to an existing agent.
*
* By default waits for the agent to complete the turn (streams text events
* via the optional `onEvent` callback) and returns the structured result.
* Pass `noWait: true` to fire-and-forget.
*/
async sendPrompt(
agentId: string,
prompt: string,
options?: {
noWait?: boolean;
onEvent?: (event: { type: 'text' | 'reasoning'; text: string }) => void;
signal?: AbortSignal;
},
): Promise<PaseoSendResult> {
const args: string[] = ['send', '--json', ...this.hostArgs];
if (options?.noWait) {
args.push('--no-wait');
}
args.push(agentId, prompt);
// With --json and no --no-wait, the output is JSON after completion.
// For streaming, we read stderr without --json for real-time text.
const raw = await this.runCli(args, options?.signal);
try {
return JSON.parse(raw) as PaseoSendResult;
} catch {
return { text: raw, ok: true };
}
}
/**
* Stream-send: runs `paseo send` WITHOUT `--json`, forward text/reasoning
* lines to onEvent in real time. Use when the caller wants to stream agent
* output as it arrives rather than wait for the full JSON result.
*/
async streamSend(
agentId: string,
prompt: string,
onEvent: (event: { type: 'text' | 'reasoning'; text: string }) => void,
signal?: AbortSignal,
): Promise<PaseoSendResult> {
return new Promise<PaseoSendResult>((resolve, reject) => {
const args = ['send', ...this.hostArgs, agentId, prompt];
const child = spawn(this.bin, args, {
stdio: ['ignore', 'pipe', 'pipe'],
signal,
});
let stdout = '';
let stderr = '';
if (child.stdout) {
const rl = createInterface({ input: child.stdout });
rl.on('line', (line: string) => {
stdout += line + '\n';
// Forward as text event for real-time display
onEvent({ type: 'text', text: line + '\n' });
});
}
if (child.stderr) {
child.stderr.on('data', (chunk: Buffer) => {
stderr += chunk.toString();
});
}
once(child, 'close').then((raw) => {
const exitCode = (raw[0] as number | null) ?? 0;
if (exitCode !== 0) {
reject(
new PaseoClientError(
`paseo send failed (exit ${exitCode}): ${stderr.trim()}`,
'send',
exitCode,
stderr,
),
);
return;
}
resolve({ text: stdout, ok: true });
});
child.on('error', reject);
});
}
/** Interrupt/stop a running agent. */
async stopAgent(agentId: string): Promise<void> {
await this.runCli(['stop', ...this.hostArgs, agentId]);
}
// ─── Private helpers ───────────────────────────────────────────────────────
/**
* Run a CLI command and return stdout as a string.
* Throws PaseoClientError on non-zero exit.
*/
private async runCli(
args: string[],
signal?: AbortSignal,
): Promise<string> {
return new Promise<string>((resolve, reject) => {
const child = spawn(this.bin, args, {
stdio: ['ignore', 'pipe', 'pipe'],
signal,
});
let stdout = '';
let stderr = '';
if (child.stdout) {
child.stdout.on('data', (chunk: Buffer) => {
stdout += chunk.toString();
});
}
if (child.stderr) {
child.stderr.on('data', (chunk: Buffer) => {
stderr += chunk.toString();
});
}
child.on('error', (err: Error) => {
// If signal aborted, treat as cancellation not error
if (signal?.aborted) {
resolve('');
return;
}
reject(err);
});
once(child, 'close').then((raw) => {
const exitCode = (raw[0] as number | null) ?? 0;
if (signal?.aborted) {
resolve('');
return;
}
if (exitCode !== 0) {
const msg = stderr.trim() || `exit code ${exitCode}`;
reject(
new PaseoClientError(
`paseo ${args[0] ?? '?'} failed: ${msg}`,
args[0] ?? '?',
exitCode,
stderr,
),
);
return;
}
resolve(stdout);
});
});
}
/**
* Run a CLI command and parse stdout as JSON.
* Throws PaseoClientError on non-zero exit or parse failure.
*/
private async runJson(args: string[]): Promise<unknown> {
const stdout = await this.runCli(args);
try {
return JSON.parse(stdout);
} catch (err) {
throw new PaseoClientError(
`paseo ${args[0] ?? '?'} returned invalid JSON: ${(stdout || '<empty>').slice(0, 200)}`,
args[0] ?? '?',
0,
stdout,
);
}
}
}

View File

@@ -4,6 +4,8 @@ import { randomBytes } from 'node:crypto';
import type { Sql } from '../db.js';
import { resolveWritePath } from './write_guard.js';
import { locateMatch } from './fuzzy-match.js';
import { conflictIndex } from './conflict-index.js';
import { findConflicts } from './collision-detector.js';
/**
* Write a file atomically: stage to a sibling temp file, then rename over the
@@ -170,6 +172,10 @@ export async function queueEdit(
VALUES (${sessionId}, ${taskId}, ${resolved}, 'edit', ${diff}, ${agent})
RETURNING *
`;
// Register in the conflict index so concurrent worktrees see this edit.
conflictIndex.registerChange(resolved, sessionId, agent ?? 'unknown');
return row!;
}
@@ -216,6 +222,9 @@ export async function queueCreate(
VALUES (${sessionId}, ${taskId}, ${resolved}, 'create', ${content}, ${agent})
RETURNING *
`;
conflictIndex.registerChange(resolved, sessionId, agent ?? 'unknown');
return row!;
}
@@ -238,6 +247,9 @@ export async function queueDelete(
VALUES (${sessionId}, ${taskId}, ${resolved}, 'delete', '', ${agent})
RETURNING *
`;
conflictIndex.registerChange(resolved, sessionId, agent ?? 'unknown');
return row!;
}
@@ -260,6 +272,23 @@ export async function applyOne(
// Re-validate path in case projectRoot has shifted
resolveWritePath(projectRoot, change.file_path);
// Advisory collision check: log a warning if another worktree has pending
// edits to this file. Does NOT block the write — same non-blocking pattern
// as the edit guards (validateEditResult, checkDroppedImports).
{
const conflicts = conflictIndex.query(
[change.file_path],
change.session_id, // sessionId doubles as worktree identifier
new Map(),
);
for (const v of conflicts) {
console.log(
`[collision] ${v.filePath} — conflict with worktrees [${v.worktrees.join(', ')}] ` +
`agents [${v.agents.join(', ')}] severity=${v.severity}`,
);
}
}
switch (change.operation) {
case 'create': {
await mkdir(dirname(change.file_path), { recursive: true });

View File

@@ -0,0 +1,184 @@
/**
* Boulder state — cross-session plan persistence for BooCode.
*
* Plans live above flow_runs: a plan tracks a user's work goal and can link to
* a flow run for automatic progress tracking. When the linked flow run reaches
* a terminal state (completed/failed/cancelled), the plan is auto-updated.
*
* Auto-resumption: on startup, plans with a linked in-flight flow_run are
* surfaced via the GET endpoint so the UI can show a resume prompt. The
* flow-runner's initResume() re-advances the actual run; this store surfaces
* the plan-level view.
*/
import type { Sql } from '../db.js';
export interface Plan {
id: string;
project_id: string;
title: string;
description: string | null;
status: string;
flow_run_id: string | null;
progress_pct: number;
items_total: number;
items_completed: number;
metadata: Record<string, unknown> | null;
created_at: Date;
updated_at: Date;
}
export interface CreatePlanOpts {
projectId: string;
title: string;
description?: string;
flowRunId?: string;
metadata?: Record<string, unknown>;
}
export interface UpdatePlanOpts {
title?: string;
description?: string | null;
status?: 'active' | 'completed' | 'cancelled' | 'failed';
progressPct?: number;
itemsTotal?: number;
itemsCompleted?: number;
metadata?: Record<string, unknown> | null;
}
export function createPlan(sql: Sql, opts: CreatePlanOpts): Promise<Plan> {
return sql`
INSERT INTO plans (project_id, title, description, flow_run_id, metadata)
VALUES (
${opts.projectId},
${opts.title},
${opts.description ?? null},
${opts.flowRunId ?? null},
${opts.metadata ? sql.json(opts.metadata as never) : null}
)
RETURNING *
`.then((rows) => rows[0] as unknown as Plan);
}
export function getPlan(sql: Sql, planId: string): Promise<Plan | null> {
return sql`
SELECT * FROM plans WHERE id = ${planId}
`.then((rows) => (rows[0] as unknown as Plan) ?? null);
}
export function listPlans(sql: Sql, projectId: string): Promise<Plan[]> {
return sql`
SELECT * FROM plans
WHERE project_id = ${projectId}
ORDER BY created_at DESC
LIMIT 100
` as Promise<Plan[]>;
}
export function listActivePlans(sql: Sql, projectId: string): Promise<Plan[]> {
return sql`
SELECT * FROM plans
WHERE project_id = ${projectId} AND status = 'active'
ORDER BY created_at DESC
` as Promise<Plan[]>;
}
export async function updatePlan(
sql: Sql,
planId: string,
opts: UpdatePlanOpts,
): Promise<Plan | null> {
const sets: string[] = [];
const values: unknown[] = [];
if (opts.title !== undefined) {
sets.push(`title = $${values.length + 1}`);
values.push(opts.title);
}
if (opts.description !== undefined) {
sets.push(`description = $${values.length + 1}`);
values.push(opts.description);
}
if (opts.status !== undefined) {
sets.push(`status = $${values.length + 1}`);
values.push(opts.status);
}
if (opts.progressPct !== undefined) {
sets.push(`progress_pct = $${values.length + 1}`);
values.push(opts.progressPct);
}
if (opts.itemsTotal !== undefined) {
sets.push(`items_total = $${values.length + 1}`);
values.push(opts.itemsTotal);
}
if (opts.itemsCompleted !== undefined) {
sets.push(`items_completed = $${values.length + 1}`);
values.push(opts.itemsCompleted);
}
if (opts.metadata !== undefined) {
sets.push(`metadata = $${values.length + 1}::jsonb`);
values.push(opts.metadata !== null ? JSON.stringify(opts.metadata) : null);
}
if (sets.length === 0) return getPlan(sql, planId);
sets.push(`updated_at = clock_timestamp()`);
const query = `
UPDATE plans SET ${sets.join(', ')}
WHERE id = $${values.length + 1}
RETURNING *
`;
values.push(planId);
const result = await sql.unsafe(query, values as never[]);
return (result[0] as unknown as Plan) ?? null;
}
/**
* Called when a flow run reaches a terminal state. Updates the linked plan's
* status based on the run outcome:
* - completed → plan completed
* - failed → plan failed
* - cancelled → plan cancelled
* Returns true when a plan was updated, false when no plan is linked to the run.
*/
export async function updatePlanFromRun(
sql: Sql,
runId: string,
runStatus: 'completed' | 'failed' | 'cancelled',
): Promise<boolean> {
const planStatus = planStatusFromRun(runStatus);
const updated = await sql`
UPDATE plans
SET status = ${planStatus}, progress_pct = 100,
items_completed = items_total, updated_at = clock_timestamp()
WHERE flow_run_id = ${runId} AND status = 'active'
`;
return updated.count > 0;
}
/** Map a flow-run terminal status to its corresponding plan status. Pure. */
export function planStatusFromRun(runStatus: 'completed' | 'failed' | 'cancelled'): string {
return runStatus === 'completed' ? 'completed' : runStatus;
}
/**
* Find any active plan linked to a running flow run — used by the startup
* resume path to surface plans that have in-flight orchestrator runs.
*/
export async function findPlanWithRunningRun(
sql: Sql,
projectId: string,
): Promise<(Plan & { run_status: string }) | null> {
const [row] = await sql`
SELECT p.*, fr.status AS run_status
FROM plans p
JOIN flow_runs fr ON fr.id = p.flow_run_id
WHERE p.project_id = ${projectId}
AND p.status = 'active'
AND fr.status = 'running'
ORDER BY p.created_at DESC
LIMIT 1
`;
return (row as unknown as Plan & { run_status: string }) ?? null;
}

View File

@@ -29,6 +29,22 @@ interface AgentRow {
last_probed_at: string | Date | null;
}
export async function fetchDeepSeekModels(config: Config): Promise<ProviderModel[]> {
if (!config.DEEPSEEK_API_KEY) return [];
try {
const baseURL = (config.DEEPSEEK_BASE_URL ?? 'https://api.deepseek.com').replace(/\/+$/, '');
const res = await fetch(`${baseURL}/v1/models`, {
headers: { Authorization: `Bearer ${config.DEEPSEEK_API_KEY}` },
signal: AbortSignal.timeout(5_000),
});
if (!res.ok) return [];
const parsed = (await res.json()) as { data?: Array<{ id: string }> };
return (parsed.data ?? []).map((m) => ({ id: m.id, label: m.id }));
} catch {
return [];
}
}
export async function fetchLlamaSwapModels(config: Config): Promise<ProviderModel[]> {
try {
const res = await fetch(`${config.LLAMA_SWAP_URL}/v1/models`);
@@ -256,7 +272,13 @@ export async function getProviderSnapshot(
}
const build = async (): Promise<ProviderSnapshotEntry[]> => {
const llamaModels = await fetchLlamaSwapModels(config);
const [llamaModels, deepseekModels] = await Promise.all([
fetchLlamaSwapModels(config),
fetchDeepSeekModels(config),
]);
// Merge DeepSeek models into the llama-swap model pool so the boocode
// provider (which sources from llama-swap) also includes DeepSeek models.
const mergedModels = mergeModels(llamaModels, deepseekModels);
const agents = await sql<AgentRow[]>`
SELECT name, install_path, supports_acp, models, commands, label, transport, last_probed_at FROM available_agents
`;
@@ -265,7 +287,7 @@ export async function getProviderSnapshot(
const entries = await Promise.all(
[...getResolvedRegistry().values()].map((resolved) =>
buildProviderEntry(resolved, agentMap.get(resolved.id), llamaModels, resolvedCwd, ttlMs, force),
buildProviderEntry(resolved, agentMap.get(resolved.id), mergedModels, resolvedCwd, ttlMs, force),
),
);

View File

@@ -1,7 +1,12 @@
# apps/server — BooChat backend (deep reference)
# apps/server — BooChat backend (deep reference) — v2.7.x (last meaningful update: 2026-06)
> Per-app engineering notes for `apps/server/src/`. Cross-cutting commands, database, environment, workflow, and cross-app contracts (WS-frame / provider-type parity, sentinels) live in the **root `CLAUDE.md`**. This file auto-loads when you read/edit files under `apps/server/`.
## These gotchas are load-bearing — do not remove or refactor without understanding why
- Do NOT remove the abort-signal pinning comment in `stream-phase.ts``fullStream` exits cleanly on abort without throwing; the post-iteration `if (signal?.aborted)` check is the only thing that distinguishes cancelled from complete.
- Do NOT remove `includeUsage: true` from `provider.ts` — the adapter defaults it false; without it, token counts are always NULL.
- Do NOT add raw `broker.publish()`/`publishUser()` calls — always use `publishFrame`/`publishUserFrame` which Zod-validate against `WsFrameSchema`.
## Stack
- **Fastify** with `@fastify/websocket` and `@fastify/static` (serves the built frontend).

View File

@@ -77,8 +77,9 @@
"test": "vitest run"
},
"dependencies": {
"@boocode/contracts": "workspace:*",
"@ai-sdk/deepseek": "^2.0.35",
"@ai-sdk/openai-compatible": "^2.0.47",
"@boocode/contracts": "workspace:*",
"@fastify/static": "^7.0.4",
"@fastify/websocket": "^10.0.1",
"@modelcontextprotocol/sdk": "^1.29.0",

View File

@@ -26,6 +26,14 @@ const ConfigSchema = z.object({
FAST_MODEL: z.string().optional(),
TASK_MODEL_URL: z.string().url().optional(),
LLAMA_SIDECAR_URL: z.string().url().optional(),
// vDeepSeek: DeepSeek API key for direct API access. When set, models
// with IDs starting with 'deepseek-' route through DeepSeek's API instead
// of llama-swap. Defaults to empty (DeepSeek routing disabled).
DEEPSEEK_API_KEY: z.string().optional(),
// Optional base URL override for DeepSeek API. Defaults to api.deepseek.com.
DEEPSEEK_BASE_URL: z.string().url().default('https://api.deepseek.com'),
// vWhale hooks: path to hooks JSON config file. Missing file = no hooks.
HOOKS_CONFIG_PATH: z.string().default('/data/hooks.json'),
});
export type Config = z.infer<typeof ConfigSchema>;

View File

@@ -18,11 +18,14 @@ import { registerCoderProxy } from './routes/coder-proxy.js';
import { registerModelRoutes } from './routes/models.js';
import { registerAgentRoutes } from './routes/agents.js';
import { registerSkillsRoutes } from './routes/skills.js';
import { registerTraceRoutes } from './routes/traces.js';
import { registerToolsRoutes } from './routes/tools.js';
import { registerAnalyticsRoutes } from './routes/analytics.js';
import { registerInferenceSettingsRoutes } from './routes/inference-settings.js';
import { createInferenceRunner } from './services/inference/index.js';
import { createInferenceRunner, runInferenceWithModel } from './services/inference/index.js';
import { createBroker } from './services/broker.js';
import { setBackgroundInferenceEnqueuer } from './services/background-task.js';
import { listSkills } from './services/skills.js';
import * as compaction from './services/compaction.js';
import { configureModelContext } from './services/model-context.js';
@@ -31,6 +34,7 @@ import { loadMcpConfig } from './services/mcp-config.js';
import { initialize as initMcp, getTools as getMcpTools, shutdown as shutdownMcp } from './services/mcp-client.js';
import { appendMcpTools } from './services/tools.js';
import { refreshToolNames, getAgentsForProject } from './services/agents.js';
import { loadHooksConfig, createHookRunner } from './services/hooks.js';
async function main() {
const config = loadConfig();
@@ -122,7 +126,35 @@ async function main() {
registerModelRoutes(app, config);
registerAgentRoutes(app, sql);
registerSidebarRoutes(app, sql);
registerChatRoutes(app, sql, broker);
registerChatRoutes(app, sql, broker, config, {
enqueueCompare: (sessionId, chatId, assistantMessageId, modelOverride, compareGroupId) => {
// Reuse the inference runner's context pattern for compare mode.
// Each compare run gets its own AbortController; cancellation keyed by
// chatId (cancels ALL parallel runs in that compare group).
const compareCtx: import('./services/inference/types.js').InferenceContext = {
sql,
config,
log: app.log,
publish: (sid, frame) => {
broker.publishFrame(sid, frame as unknown as import('@boocode/contracts/ws-frames').WsFrame);
},
publishUser: (frame) => {
broker.publishUserFrame('default', frame as unknown as import('@boocode/contracts/ws-frames').WsFrame);
},
broker,
hooks: hasHooks ? hookRunner : undefined,
};
compareCtx.publishUser({ type: 'chat_status', chat_id: chatId, status: 'streaming', at: new Date().toISOString() });
void runInferenceWithModel(compareCtx, sessionId, chatId, assistantMessageId, modelOverride, compareGroupId).catch(
(err: Error) => app.log.error({ err, chatId, modelOverride }, 'compare inference failed'),
);
},
cancelInference: async (_sessionId, chatId) => {
return inference.cancel(_sessionId, chatId);
},
hasActiveInference: (chatId) => inference.hasActive(chatId),
});
registerTraceRoutes(app, sql);
registerToolsRoutes(app, sql);
registerAnalyticsRoutes(app, sql);
registerInferenceSettingsRoutes(app);
@@ -136,11 +168,17 @@ async function main() {
app.log.warn({ err }, 'skills boot walk failed');
}
// vWhale hooks: load hook config and create runner. Missing file = no hooks.
loadHooksConfig(config.HOOKS_CONFIG_PATH);
const hookRunner = createHookRunner();
const hasHooks = Object.keys(loadHooksConfig(config.HOOKS_CONFIG_PATH).hooks).length > 0;
const inference = createInferenceRunner(
{
sql,
config,
log: app.log,
hooks: hasHooks ? hookRunner : undefined,
publish: (sessionId, frame) => {
// v1.13.11-b: route through the typed publishFrame so the broker's
// Zod gate validates every inference frame before delivery.
@@ -156,6 +194,13 @@ async function main() {
broker.publishUserFrame(user, frame as unknown as import('@boocode/contracts/ws-frames').WsFrame);
}
);
// v2.x: wire the background subagent task system to the inference runner.
// Tools (spawn_subagent) dispatch fire-and-forget inference via this
// module-level reference — no import cycle through the tool registry.
setBackgroundInferenceEnqueuer((sessionId, chatId, assistantId, user) => {
inference.enqueue(sessionId, chatId, assistantId, user);
});
registerMessageRoutes(app, sql, config, broker, {
enqueueInference: (sessionId, chatId, assistantId, user) => {
inference.enqueue(sessionId, chatId, assistantId, user);
@@ -166,7 +211,7 @@ async function main() {
// bubble up so the route can reply 500 — manual /compact failures
// should be loud (the user just clicked a button).
runCompaction: (chatId) =>
compaction.process({ sql, config, log: app.log, broker, chatId }),
compaction.process({ sql, config, log: app.log, broker, chatId, hooks: hasHooks ? hookRunner : undefined }),
cancelInference: async (sessionId, chatId) => {
return inference.cancel(sessionId, chatId);
},

View File

@@ -1,18 +1,33 @@
import type { FastifyInstance } from 'fastify';
import { z } from 'zod';
import crypto from 'node:crypto';
import type { Sql } from '../db.js';
import type { Config } from '../config.js';
import type { Broker } from '../services/broker.js';
import type { Chat, Message } from '../types/api.js';
import { getModelContext } from '../services/model-context.js';
import { notifyCoderClose } from '../services/coder-notify.js';
import { MESSAGE_COLUMNS } from '../services/message-columns.js';
import { formatJson, formatMarkdown } from '../services/export-formatter.js';
export interface CompareHandlers {
enqueueCompare: (
sessionId: string,
chatId: string,
assistantMessageId: string,
modelOverride: string,
compareGroupId: string,
) => void;
cancelInference: (sessionId: string, chatId: string) => Promise<boolean>;
hasActiveInference: (chatId: string) => boolean;
}
const CreateBody = z.object({
name: z.string().min(1).max(200).optional(),
});
const PatchBody = z.object({
name: z.string().min(1).max(200),
name: z.string().min(1).max(200).optional(),
model: z.string().min(1).optional(),
});
const ForkBody = z.object({
@@ -26,10 +41,17 @@ const DiscardStaleBody = z.object({
const STALE_MIN_AGE_SECONDS = 60;
const CompareBody = z.object({
message: z.string().min(1).max(64_000),
models: z.array(z.string().min(1)).min(2).max(3),
});
export function registerChatRoutes(
app: FastifyInstance,
sql: Sql,
broker: Broker
broker: Broker,
config?: Config,
compareHandlers?: CompareHandlers,
): void {
app.get<{ Params: { id: string }; Querystring: { status?: string } }>(
'/api/sessions/:id/chats',
@@ -122,12 +144,15 @@ export function registerChatRoutes(
reply.code(400);
return { error: 'invalid body', details: parsed.error.flatten() };
}
const { name, model } = parsed.data;
const sets: Array<ReturnType<typeof sql>> = [sql`updated_at = clock_timestamp()`];
if (name !== undefined) sets.push(sql`name = ${name}`);
if (model !== undefined) sets.push(sql`model = ${model}`);
const rows = await sql<Chat[]>`
UPDATE chats
SET name = ${parsed.data.name},
updated_at = clock_timestamp()
SET ${(sql as any).join(sets, sql`, `)}
WHERE id = ${req.params.id}
RETURNING id, session_id, name, status, created_at, updated_at
RETURNING id, session_id, name, model, status, created_at, updated_at
`;
if (rows.length === 0) {
reply.code(404);
@@ -448,4 +473,128 @@ export function registerChatRoutes(
return rows;
}
);
app.get<{ Params: { id: string }; Querystring: { format?: string } }>(
'/api/chats/:id/export',
async (req, reply) => {
const format = req.query.format ?? 'json';
if (format !== 'json' && format !== 'markdown') {
reply.code(400);
return { error: 'format must be json or markdown' };
}
const chat = await sql<Chat[]>`SELECT * FROM chats WHERE id = ${req.params.id}`;
if (chat.length === 0) {
reply.code(404);
return { error: 'chat not found' };
}
const messages = await sql<Message[]>`
SELECT ${sql.unsafe(MESSAGE_COLUMNS)}
FROM messages_with_parts
WHERE chat_id = ${req.params.id}
ORDER BY created_at ASC, id ASC
`;
if (format === 'markdown') {
reply.header('Content-Type', 'text/markdown');
return formatMarkdown(chat[0]!, messages, chat[0]!.model);
}
reply.header('Content-Type', 'application/json');
return formatJson(chat[0]!, messages, chat[0]!.model);
}
);
// v2.8-compare: send the same message to N models and stream back parallel
// responses. Creates N assistant messages (one per model) and launches N
// parallel inference runs with model overrides. Each publishes frames
// scoped to the shared compare_group_id so the frontend can group them.
if (config && compareHandlers) {
app.post<{ Params: { id: string } }>(
'/api/chats/:id/compare',
async (req, reply) => {
const parsed = CompareBody.safeParse(req.body);
if (!parsed.success) {
reply.code(400);
return { error: 'invalid body', details: parsed.error.flatten() };
}
const { message, models } = parsed.data;
// Check for active inference first.
if (compareHandlers.hasActiveInference(req.params.id)) {
reply.code(409);
return { error: 'chat is currently streaming; stop it first' };
}
const chatRows = await sql<Chat[]>`
SELECT id, session_id FROM chats WHERE id = ${req.params.id} AND status = 'open'
`;
if (chatRows.length === 0) {
reply.code(404);
return { error: 'chat not found' };
}
const chat = chatRows[0]!;
const sessionId = chat.session_id;
const compareGroupId = crypto.randomUUID();
// Insert user message + N assistant messages in a single transaction.
const result = await sql.begin(async (tx) => {
const [userMsg] = await tx<{ id: string }[]>`
INSERT INTO messages (session_id, chat_id, role, content, status, created_at, metadata)
VALUES (${sessionId}, ${chat.id}, 'user', ${message}, 'complete', clock_timestamp(), NULL)
RETURNING id
`;
const responses: Array<{ model: string; assistant_message_id: string }> = [];
for (const model of models) {
const [asst] = await tx<{ id: string }[]>`
INSERT INTO messages (session_id, chat_id, role, content, status, created_at, metadata)
VALUES (
${sessionId}, ${chat.id}, 'assistant', '', 'streaming', clock_timestamp(),
${tx.json({ compare_group_id: compareGroupId, model } as never)}
)
RETURNING id
`;
responses.push({ model, assistant_message_id: asst!.id });
}
await tx`UPDATE sessions SET updated_at = clock_timestamp() WHERE id = ${sessionId}`;
await tx`UPDATE chats SET updated_at = clock_timestamp() WHERE id = ${chat.id}`;
return { user_message_id: userMsg!.id, responses };
});
// Publish user message frames.
broker.publishFrame(sessionId, {
type: 'message_started',
message_id: result.user_message_id,
chat_id: chat.id,
role: 'user',
});
broker.publishFrame(sessionId, {
type: 'delta',
message_id: result.user_message_id,
chat_id: chat.id,
content: message,
});
broker.publishFrame(sessionId, {
type: 'message_complete',
message_id: result.user_message_id,
chat_id: chat.id,
});
// Enqueue N parallel inference runs with model overrides.
for (const resp of result.responses) {
compareHandlers.enqueueCompare(
sessionId, chat.id, resp.assistant_message_id, resp.model, compareGroupId,
);
}
reply.code(202);
return { compare_group_id: compareGroupId, ...result };
},
);
}
}

View File

@@ -3,12 +3,13 @@ import { z } from 'zod';
import type { Sql } from '../db.js';
import type { Config } from '../config.js';
import type { Broker } from '../services/broker.js';
import type { Chat, Message, Session, ToolCall } from '../types/api.js';
import type { Chat, Message, MessageMetadata, Session, ToolCall } from '../types/api.js';
// v1.13.17-cross-repo-reads: grant_read_access resolves the grant root at
// decision time (not at request time) so concurrent project changes don't
// stale-bind the resolution.
import { resolveGrantRoot } from '../services/grant_resolver.js';
import { MESSAGE_COLUMNS } from '../services/message-columns.js';
import { setServerPermission, getServerName } from '../services/mcp-client.js';
// Shared lookup for the answer_user_input + grant_read_access pause-resume
// endpoints. Finds the originating assistant tool_call by id in message_parts,
@@ -846,4 +847,117 @@ export function registerMessageRoutes(
};
},
);
// v1.15.0-mcp-permission: approve/deny MCP tool calls for 'ask' state servers.
const McpApproveBody = z.object({
tool_call_id: z.string().min(1),
permission: z.enum(['allow_once', 'allow_always', 'deny']),
});
app.post<{ Params: { id: string } }>(
'/api/chats/:id/mcp-approve',
async (req, reply) => {
const parsed = McpApproveBody.safeParse(req.body);
if (!parsed.success) {
reply.code(400);
return { error: 'invalid body', details: parsed.error.flatten() };
}
const { tool_call_id, permission } = parsed.data;
const chatRows = await sql<{ id: string }[]>`
SELECT id FROM chats WHERE id = ${req.params.id} AND status = 'open'
`;
if (chatRows.length === 0) {
reply.code(404);
return { error: 'chat_not_found' };
}
// Look up the tool call to get the prefixed tool name
const callerRows = await sql<{
payload: { name: string };
}[]>`
SELECT p.payload
FROM message_parts p
JOIN messages m ON m.id = p.message_id
WHERE m.chat_id = ${req.params.id}
AND m.role = 'assistant'
AND p.kind = 'tool_call'
AND p.payload->>'id' = ${tool_call_id}
ORDER BY m.created_at DESC
LIMIT 1
`;
const callerRow = callerRows[0];
if (!callerRow) {
reply.code(404);
return { error: 'tool_call_not_found' };
}
const toolName = callerRow.payload.name;
const serverName = getServerName(toolName);
if (!serverName) {
reply.code(400);
return { error: 'not_an_mcp_tool', detail: `tool '${toolName}' is not from an MCP server` };
}
if (permission === 'allow_always' || permission === 'allow_once') {
setServerPermission(serverName, 'allow');
} else if (permission === 'deny') {
setServerPermission(serverName, 'deny');
}
return { ok: true };
},
);
const FeedbackBody = z.object({
value: z.enum(['up', 'down']),
});
app.post<{ Params: { id: string; message_id: string } }>(
'/api/chats/:id/messages/:message_id/feedback',
async (req, reply) => {
const parsed = FeedbackBody.safeParse(req.body);
if (!parsed.success) {
reply.code(400);
return { error: 'invalid body', details: parsed.error.flatten() };
}
const { id: chatId, message_id: messageId } = req.params;
const { value } = parsed.data;
const msg = await sql<{ id: string; role: string; metadata: MessageMetadata | null }[]>`
SELECT id, role, metadata FROM messages WHERE id = ${messageId} AND chat_id = ${chatId}
`;
if (msg.length === 0) {
reply.code(404);
return { error: 'message not found' };
}
// Only allow feedback on assistant messages.
if (msg[0]!.role !== 'assistant') {
reply.code(400);
return { error: 'only assistant messages can receive feedback' };
}
// Check if feedback already exists
const existingMeta = msg[0]!.metadata;
if (existingMeta && existingMeta.kind === 'feedback') {
reply.code(409);
return { error: 'feedback already recorded' };
}
const feedbackMeta: MessageMetadata = {
kind: 'feedback',
value,
chat_id: chatId,
};
await sql`
UPDATE messages
SET metadata = ${sql.json(feedbackMeta as never)}, updated_at = clock_timestamp()
WHERE id = ${messageId}
`;
return { ok: true };
},
);
}

View File

@@ -2,26 +2,55 @@ import type { FastifyInstance } from 'fastify';
import type { Config } from '../config.js';
import type { ModelInfo } from '../types/api.js';
interface LlamaSwapModelsResponse {
interface ApiModelsResponse {
data?: ModelInfo[];
}
const DEEPSEEK_STATIC_MODELS: ModelInfo[] = [
{ id: 'deepseek-v4-flash', object: 'model', created: 0, owned_by: 'deepseek' },
{ id: 'deepseek-v4-pro', object: 'model', created: 0, owned_by: 'deepseek' },
];
export function registerModelRoutes(app: FastifyInstance, config: Config): void {
app.get('/api/models', async (_req, reply) => {
const models: ModelInfo[] = [];
// 1. Fetch llama-swap models
try {
const res = await fetch(`${config.LLAMA_SWAP_URL}/v1/models`);
if (!res.ok) {
reply.code(502);
return { error: `llama-swap returned ${res.status}` };
if (res.ok) {
const parsed = (await res.json()) as ApiModelsResponse;
if (parsed.data) models.push(...parsed.data);
}
const parsed = (await res.json()) as LlamaSwapModelsResponse;
return parsed.data ?? [];
} catch (err) {
reply.code(502);
return {
error: 'failed to reach llama-swap',
details: err instanceof Error ? err.message : String(err),
};
} catch {
// llama-swap unreachable — proceed with whatever we have
}
// 2. If DeepSeek is configured, fetch live models from their API
if (config.DEEPSEEK_API_KEY) {
try {
const baseURL = (config.DEEPSEEK_BASE_URL ?? 'https://api.deepseek.com').replace(/\/+$/, '');
const res = await fetch(`${baseURL}/v1/models`, {
headers: { Authorization: `Bearer ${config.DEEPSEEK_API_KEY}` },
signal: AbortSignal.timeout(5_000),
});
if (res.ok) {
const parsed = (await res.json()) as ApiModelsResponse;
if (parsed.data) models.push(...parsed.data);
} else {
// API call failed — fall back to static model list
models.push(...DEEPSEEK_STATIC_MODELS);
}
} catch {
// Network error — fall back to static model list
models.push(...DEEPSEEK_STATIC_MODELS);
}
}
if (models.length === 0) {
reply.code(502);
return { error: 'no models available from any provider' };
}
return models;
});
}

View File

@@ -145,7 +145,7 @@ export function registerSessionRoutes(
}
const status = req.query.status === 'archived' ? 'archived' : 'open';
const rows = await sql<Session[]>`
SELECT id, project_id, name, model, system_prompt, status, created_at, updated_at, agent_id, web_search_enabled, workspace_panes, allowed_read_paths
SELECT id, project_id, name, model, system_prompt, status, created_at, updated_at, agent_id, web_search_enabled, workspace_panes, allowed_read_paths, state_graph_enabled
FROM sessions
WHERE project_id = ${req.params.id} AND status = ${status}
ORDER BY updated_at DESC
@@ -213,7 +213,7 @@ export function registerSessionRoutes(
app.get<{ Params: { id: string } }>('/api/sessions/:id', async (req, reply) => {
const rows = await sql<Session[]>`
SELECT id, project_id, name, model, system_prompt, status, created_at, updated_at, agent_id, web_search_enabled, workspace_panes, allowed_read_paths
SELECT id, project_id, name, model, system_prompt, status, created_at, updated_at, agent_id, web_search_enabled, workspace_panes, allowed_read_paths, state_graph_enabled
FROM sessions WHERE id = ${req.params.id}
`;
if (rows.length === 0) {
@@ -349,10 +349,10 @@ export function registerSessionRoutes(
const rows = await sql<Session[]>`
UPDATE sessions
SET workspace_panes = ${sql.json(envelope as never)},
updated_at = clock_timestamp()
updated_at = clock_timestamp()
WHERE id = ${req.params.id}
RETURNING id, project_id, name, model, system_prompt, status, created_at, updated_at,
agent_id, web_search_enabled, workspace_panes, allowed_read_paths
agent_id, web_search_enabled, workspace_panes, allowed_read_paths, state_graph_enabled
`;
if (rows.length === 0) {
reply.code(404);

View File

@@ -0,0 +1,38 @@
import type { FastifyInstance } from 'fastify';
import type { Sql } from '../db.js';
import type { ToolTrace } from '../services/tool-traces.js';
export function registerTraceRoutes(app: FastifyInstance, sql: Sql): void {
app.get<{ Params: { id: string }; Querystring: { limit?: string; offset?: string } }>(
'/api/chats/:id/traces',
async (req, reply) => {
const chat = await sql`SELECT id FROM chats WHERE id = ${req.params.id}`;
if (chat.length === 0) {
reply.code(404);
return { error: 'chat not found' };
}
const limit = Math.min(Math.max(Number(req.query.limit) || 50, 1), 200);
const offset = Math.max(Number(req.query.offset) || 0, 0);
const rows = await sql<ToolTrace[]>`
SELECT * FROM tool_traces
WHERE chat_id = ${req.params.id}
ORDER BY started_at ASC
LIMIT ${limit}
OFFSET ${offset}
`;
const [countRow] = await sql<{ count: number }[]>`
SELECT count(*)::int AS count FROM tool_traces WHERE chat_id = ${req.params.id}
`;
return {
data: rows,
total: countRow?.count ?? 0,
limit,
offset,
};
},
);
}

View File

@@ -3,6 +3,7 @@ import type { Sql } from '../db.js';
import type { Broker } from '../services/broker.js';
import type { Message } from '../types/api.js';
import { MESSAGE_COLUMNS } from '../services/message-columns.js';
import { loadAgentSnapshot } from '../services/session-snapshots.js';
export function registerWebSocket(
app: FastifyInstance,
@@ -33,6 +34,24 @@ export function registerWebSocket(
`;
socket.send(JSON.stringify({ type: 'snapshot', messages }));
// v2.7.x: on reconnect, restore agent snapshot state so the frontend
// knows there's an ongoing agent turn. Best-effort per chat; most
// sessions won't have any snapshots.
const chats = await sql<{ id: string }[]>`SELECT id FROM chats WHERE session_id = ${sessionId}`;
for (const chat of chats) {
const agentSnapshot = await loadAgentSnapshot(sql, chat.id).catch(() => null);
if (agentSnapshot) {
socket.send(JSON.stringify({
type: 'agent_snapshot',
chat_id: chat.id,
agent: agentSnapshot.agent,
model: agentSnapshot.model,
mode: agentSnapshot.mode,
turn_number: agentSnapshot.turn_number,
}));
}
}
const unsubscribe = broker.subscribe(sessionId, (frame) => {
if (socket.readyState !== socket.OPEN) return;
try {

View File

@@ -32,11 +32,18 @@ CREATE TABLE IF NOT EXISTS messages (
content TEXT NOT NULL DEFAULT '',
status TEXT NOT NULL DEFAULT 'complete',
last_seq INT NOT NULL DEFAULT 0,
cache_tokens INTEGER,
reasoning_tokens INTEGER,
created_at TIMESTAMPTZ NOT NULL DEFAULT clock_timestamp()
);
CREATE INDEX IF NOT EXISTS idx_messages_session ON messages(session_id, created_at);
-- vDeepSeek: add cache/reasoning token columns early so messages_with_parts
-- view (defined below) can reference them. IF NOT EXISTS guards re-runs.
ALTER TABLE messages ADD COLUMN IF NOT EXISTS cache_tokens INTEGER;
ALTER TABLE messages ADD COLUMN IF NOT EXISTS reasoning_tokens INTEGER;
-- v1.13.0: granular message parts table. v1.13.20: legacy tool_calls/
-- tool_results columns dropped; message_parts is now the sole source of
-- truth for tool calls, tool results, and reasoning. ON DELETE CASCADE
@@ -126,8 +133,8 @@ SELECT
FROM message_parts p
WHERE p.message_id = m.id AND p.kind = 'reasoning' AND p.hidden_at IS NULL) AS reasoning_parts,
-- NEW columns MUST be appended at the end: CREATE OR REPLACE VIEW can't
-- reorder/rename existing columns (42P16). m.model added last.
m.model
-- reorder/rename existing columns (42P16). cache_tokens and reasoning_tokens added last.
m.model, m.cache_tokens, m.reasoning_tokens
FROM messages m;
-- v1.13.20: drop legacy tool_calls/tool_results columns. Reads have routed
@@ -227,6 +234,7 @@ ALTER TABLE sessions ADD COLUMN IF NOT EXISTS workspace_panes JSONB NOT NULL DEF
ALTER TABLE sessions ADD COLUMN IF NOT EXISTS status TEXT NOT NULL DEFAULT 'open';
-- v1.2: chats table
-- per-chat-model-switching v2.x: ALTER below adds the model override column.
CREATE TABLE IF NOT EXISTS chats (
id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
session_id UUID NOT NULL REFERENCES sessions(id) ON DELETE CASCADE,
@@ -237,6 +245,9 @@ CREATE TABLE IF NOT EXISTS chats (
);
CREATE INDEX IF NOT EXISTS idx_chats_session_status ON chats (session_id, status, updated_at DESC);
-- v2.7.x: per-chat model override. NULL = inherit from session.model.
ALTER TABLE chats ADD COLUMN IF NOT EXISTS model TEXT;
-- v1.2: messages.chat_id + messages.kind
ALTER TABLE messages ADD COLUMN IF NOT EXISTS chat_id UUID REFERENCES chats(id) ON DELETE CASCADE;
ALTER TABLE messages ADD COLUMN IF NOT EXISTS kind TEXT NOT NULL DEFAULT 'message';
@@ -313,6 +324,9 @@ BEGIN
END IF;
END $$;
-- per-chat-model-switching: per-chat model override. NULL = inherit from session model.
ALTER TABLE chats ADD COLUMN IF NOT EXISTS model TEXT;
-- v1.x-batch9: per-session agent reference. Agent definitions are not stored in
-- the DB; they live in builtins (services/agents.ts) and a per-project AGENTS.md.
-- agent_id is the slugified agent name. NULL means "use BooCode defaults".
@@ -348,6 +362,11 @@ INSERT INTO settings (key, value) VALUES ('theme_mode', '"dark"') ON CONFLICT (k
ALTER TABLE projects ADD COLUMN IF NOT EXISTS default_system_prompt TEXT NOT NULL DEFAULT '';
ALTER TABLE projects ADD COLUMN IF NOT EXISTS default_web_search_enabled BOOLEAN NOT NULL DEFAULT false;
ALTER TABLE sessions ADD COLUMN IF NOT EXISTS web_search_enabled BOOLEAN;
-- v[state-graph]: optional declarative state-graph engine flag. Default OFF
-- (existing procedural while loop). When ON, runAssistantTurn routes
-- through runGraph in state-graph.ts for node-based execution.
ALTER TABLE sessions ADD COLUMN IF NOT EXISTS state_graph_enabled BOOLEAN NOT NULL DEFAULT FALSE;
ALTER TABLE sessions DROP COLUMN IF EXISTS tags;
-- v1.11: anchored rolling compaction.
@@ -407,3 +426,55 @@ END $$;
-- Remove the v2.0.5 arena_id column (replaced by the new Arena feature).
ALTER TABLE tasks DROP COLUMN IF EXISTS arena_id;
-- v2.x-tool-traces: per-call tool execution records for observability.
CREATE TABLE IF NOT EXISTS tool_traces (
id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
session_id UUID NOT NULL REFERENCES sessions(id) ON DELETE CASCADE,
chat_id UUID NOT NULL REFERENCES chats(id) ON DELETE CASCADE,
message_id UUID REFERENCES messages(id) ON DELETE SET NULL,
turn_number INTEGER NOT NULL,
tool_name TEXT NOT NULL,
tool_input JSONB NOT NULL,
tool_output TEXT,
started_at TIMESTAMPTZ NOT NULL DEFAULT clock_timestamp(),
finished_at TIMESTAMPTZ,
latency_ms INTEGER,
tokens_used INTEGER,
cache_tokens INTEGER,
reasoning_tokens INTEGER,
error TEXT,
outcome TEXT,
created_at TIMESTAMPTZ NOT NULL DEFAULT clock_timestamp()
);
CREATE INDEX IF NOT EXISTS idx_tool_traces_chat ON tool_traces(chat_id, created_at);
-- v2.x-tool-traces: active tool call state for in-flight instrumentation.
CREATE TABLE IF NOT EXISTS tool_trace_states (
id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
session_id UUID NOT NULL REFERENCES sessions(id) ON DELETE CASCADE,
chat_id UUID NOT NULL REFERENCES chats(id) ON DELETE CASCADE,
message_id UUID REFERENCES messages(id) ON DELETE SET NULL,
turn_number INTEGER NOT NULL,
tool_name TEXT NOT NULL,
tool_input JSONB NOT NULL,
started_at TIMESTAMPTZ NOT NULL DEFAULT clock_timestamp()
);
-- agent_snapshots: persistent agent session state for cross-refresh resume.
CREATE TABLE IF NOT EXISTS agent_snapshots (
id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
session_id UUID NOT NULL REFERENCES sessions(id) ON DELETE CASCADE,
chat_id UUID NOT NULL REFERENCES chats(id) ON DELETE CASCADE,
model TEXT NOT NULL,
agent TEXT,
mode TEXT,
turn_number INTEGER NOT NULL DEFAULT 0,
messages JSONB NOT NULL DEFAULT '[]'::jsonb,
tool_states JSONB NOT NULL DEFAULT '[]'::jsonb,
created_at TIMESTAMPTZ NOT NULL DEFAULT clock_timestamp(),
updated_at TIMESTAMPTZ NOT NULL DEFAULT clock_timestamp()
);
CREATE INDEX IF NOT EXISTS idx_agent_snapshots_chat ON agent_snapshots(chat_id);
CREATE UNIQUE INDEX IF NOT EXISTS idx_agent_snapshots_chat_unique ON agent_snapshots(chat_id);

View File

@@ -106,6 +106,8 @@ interface ParsedFrontmatter {
// allowed" — the model responds text-only.
steps?: number;
llama_extra_args?: string[];
// vDeepSeek: thinking effort for DeepSeek V4 models.
reasoning_effort?: string;
}
// P5: table-driven validation for the "soft-range" numeric frontmatter fields.
@@ -386,6 +388,7 @@ function parseAgentSection(section: RawSection): Omit<Agent, 'source'> {
max_tool_calls: typeof fm.max_tool_calls === 'number' ? fm.max_tool_calls : null,
steps: typeof fm.steps === 'number' ? fm.steps : null,
llama_extra_args: Array.isArray(fm.llama_extra_args) ? fm.llama_extra_args : null,
reasoning_effort: typeof fm.reasoning_effort === 'string' ? (fm.reasoning_effort as Agent['reasoning_effort']) : null,
};
}

View File

@@ -0,0 +1,260 @@
// v2.x: Background subagent task service.
// Creates and tracks background tasks that run as independent inference
// sessions. The spawner creates a session+chat, inserts messages, and
// dispatches inference asynchronously. Callers poll status and retrieve
// results via the companion tools (background-subagent-tools.ts).
//
// Module-level inference enqueuer: set at server startup so tools can
// dispatch background inference without importing the runner directly.
import type { Sql } from '../db.js';
import type { FastifyBaseLogger } from 'fastify';
export interface BackgroundTask {
id: string;
session_id: string;
chat_id: string;
agent: string | null;
model: string;
input: string;
status: 'pending' | 'running' | 'completed' | 'failed' | 'cancelled';
output_summary: string | null;
created_at: string;
finished_at: string | null;
}
// Module-level reference to the inference enqueuer, set at server startup.
let _enqueueInference:
| ((sessionId: string, chatId: string, assistantMessageId: string, user: string) => void)
| null = null;
export function setBackgroundInferenceEnqueuer(
enqueue: (
sessionId: string,
chatId: string,
assistantMessageId: string,
user: string,
) => void,
): void {
_enqueueInference = enqueue;
}
function mapTaskState(state: string): BackgroundTask['status'] {
switch (state) {
case 'pending':
return 'pending';
case 'running':
return 'running';
case 'completed':
return 'completed';
case 'failed':
return 'failed';
case 'blocked':
return 'pending'; // blocked is internal — surface as pending
case 'cancelled':
return 'cancelled';
default:
return 'pending';
}
}
// Spawn a background subagent task: create session + chat + messages + tasks
// row, then fire-and-forget the inference. Returns immediately with the task
// metadata — inference runs asynchronously.
export async function spawnBackgroundTask(
sql: Sql,
log: FastifyBaseLogger,
projectId: string,
input: string,
model: string,
agent?: string,
label?: string,
): Promise<BackgroundTask> {
const sessionName =
label != null && label.length > 0
? `Subagent: ${label}`
: `Background: ${input.slice(0, 50)}${input.length > 50 ? '...' : ''}`;
const result = await sql.begin(async (tx) => {
// 1. Create session for the background task
const [sess] = await tx<{ id: string }[]>`
INSERT INTO sessions (project_id, name, model, system_prompt)
VALUES (${projectId}, ${sessionName}, ${model}, '')
RETURNING id
`;
const sessionId = sess!.id;
// 2. Create chat in that session
const [ch] = await tx<{ id: string }[]>`
INSERT INTO chats (session_id, name, status)
VALUES (${sessionId}, ${label ?? null}, 'open')
RETURNING id
`;
const chatId = ch!.id;
// 3. Insert user message with the task input
await tx`
INSERT INTO messages (session_id, chat_id, role, content, status, created_at)
VALUES (${sessionId}, ${chatId}, 'user', ${input}, 'complete', clock_timestamp())
`;
// 4. Insert streaming assistant message (inference fills it)
const [assistantRow] = await tx<{ id: string }[]>`
INSERT INTO messages (session_id, chat_id, role, content, status, created_at)
VALUES (${sessionId}, ${chatId}, 'assistant', '', 'streaming', clock_timestamp())
RETURNING id
`;
const assistantMessageId = assistantRow!.id;
// 5. Insert tasks row for tracking
const [task] = await tx<{ id: string; created_at: string }[]>`
INSERT INTO tasks (project_id, session_id, state, input, agent, model)
VALUES (${projectId}, ${sessionId}, 'running', ${input}, ${agent ?? null}, ${model})
RETURNING id, created_at
`;
return { sessionId, chatId, assistantMessageId, task: task! };
});
// After the transaction commits, fire-and-forget inference dispatch.
if (_enqueueInference) {
try {
_enqueueInference(result.sessionId, result.chatId, result.assistantMessageId, 'default');
} catch (err) {
log.warn(
{ err, taskId: result.task.id },
'background inference enqueue failed',
);
}
}
log.info(
{
taskId: result.task.id,
sessionId: result.sessionId,
chatId: result.chatId,
model,
agent,
},
'spawned background subagent task',
);
return {
id: result.task.id,
session_id: result.sessionId,
chat_id: result.chatId,
agent: agent ?? null,
model,
input,
status: 'running',
output_summary: null,
created_at: result.task.created_at,
finished_at: null,
};
}
// Look up a background task by its tasks.id. Includes the status from the
// tasks table and the chat_id from the linked chat.
export async function getBackgroundTaskStatus(
sql: Sql,
taskId: string,
): Promise<BackgroundTask | null> {
const rows = await sql<
{
id: string;
session_id: string;
state: string;
input: string;
agent: string | null;
model: string | null;
output_summary: string | null;
created_at: string;
ended_at: string | null;
}[]
>`
SELECT id, session_id, state, input, agent, model, output_summary, created_at, ended_at
FROM tasks
WHERE id = ${taskId}
`;
if (rows.length === 0) return null;
const r = rows[0]!;
// Find the chat_id from the session (background sessions have exactly one chat).
const chatRows = await sql<{ id: string }[]>`
SELECT id FROM chats WHERE session_id = ${r.session_id} LIMIT 2
`;
return {
id: r.id,
session_id: r.session_id,
chat_id: chatRows[0]?.id ?? '',
agent: r.agent,
model: r.model ?? '',
input: r.input,
status: mapTaskState(r.state),
output_summary: r.output_summary,
created_at: r.created_at,
finished_at: r.ended_at,
};
}
// Retrieve the full output and token usage from a completed background task.
// Returns null if the task has no completed assistant message.
export async function getBackgroundTaskResult(
sql: Sql,
taskId: string,
chatId: string,
): Promise<{
output: string;
token_usage: { prompt: number; completion: number } | null;
} | null> {
// Verify the task exists and chatId belongs to it.
const taskRows = await sql<{ session_id: string }[]>`
SELECT session_id FROM tasks WHERE id = ${taskId}
`;
if (taskRows.length === 0) return null;
// Read the last complete assistant message (the one with content).
const msgRows = await sql<
{
content: string;
tokens_used: number | null;
ctx_used: number | null;
}[]
>`
SELECT content, tokens_used, ctx_used
FROM messages
WHERE chat_id = ${chatId}
AND role = 'assistant'
AND status = 'complete'
AND content <> ''
ORDER BY created_at DESC
LIMIT 1
`;
if (msgRows.length === 0) return null;
const m = msgRows[0]!;
return {
output: m.content,
token_usage:
m.tokens_used != null || m.ctx_used != null
? { prompt: m.ctx_used ?? 0, completion: m.tokens_used ?? 0 }
: null,
};
}
// Cancel a pending or running background task. Returns true if a row was
// actually updated (the task existed and was in a cancellable state).
export async function cancelBackgroundTask(
sql: Sql,
taskId: string,
): Promise<boolean> {
const rows = await sql<{ id: string }[]>`
UPDATE tasks
SET state = 'cancelled', ended_at = clock_timestamp()
WHERE id = ${taskId}
AND state IN ('pending', 'running')
RETURNING id
`;
return rows.length > 0;
}

View File

@@ -0,0 +1,110 @@
/**
* v2.7.18: shared MCP client wrapper for the boocontext sidecar.
*
* Calls into the existing multi-server MCP client infrastructure
* (services/mcp-client.ts) which connects to boocontext as a stdio
* MCP process defined in data/mcp.json (server name "boocontext",
* command: `node /opt/forks/boocontext/dist/standalone.js`).
*
* The boocontext MCP server is initialized once at app boot in
* index.ts via initMcp() and the actual MCP tool call routing is
* handled by mcp-client.ts:callTool() — this module is a thin
* convenience wrapper that prepends the "boocontext_" server prefix,
* normalises the response, and applies inline truncation matching
* the same pattern as codecontext_client.ts.
*
* Usage:
* import { callBoocontext } from './services/boocontext_client.js';
* const resp = await callBoocontext({
* toolName: 'codesight_get_summary',
* args: { directory: '/opt/boocode' },
* });
*/
import { callTool } from './mcp-client.js';
import { truncateIfNeeded } from './truncate.js';
// ---- Exported types ----
export interface BoocontextRequest {
/** Unprefixed tool name as defined on the boocontext MCP server
* (e.g. "codesight_scan", "boocontext_overview", "codesight_get_summary"). */
toolName: string;
/** Arguments to pass to the tool. */
args: Record<string, unknown>;
}
export interface BoocontextResponse {
/** The tool output text. */
result: string;
/** Whether the result was truncated to fit the inline limit. */
truncated: boolean;
/** Opaque id pointing at the full pre-slice content on tmpfs, set when
* truncated=true and storage succeeded. */
outputPath?: string;
}
// ---- Constants ----
/** Must match the server name in data/mcp.json. */
const BOOCONTEXT_SERVER_NAME = 'boocontext';
/** Inline truncation limit, matching codecontext_client.ts. */
const TRUNCATION_LIMIT = 32_000;
// ---- Public API ----
/**
* Call a boocontext MCP tool by its unprefixed name.
*
* Prepends the "boocontext_" server prefix, delegates to the
* multi-server MCP client's callTool(), and normalises the response
* into a BoocontextResponse with inline truncation.
*
* @param req The tool name and arguments.
* @param log Optional Fastify-compatible logger (for debug traces).
* @returns The tool result, possibly truncated.
* @throws If the boocontext server is not connected or the tool
* returns an MCP-level error.
*/
export async function callBoocontext(
req: BoocontextRequest,
log?: { debug?: (obj: object, msg: string) => void; warn?: (obj: object, msg: string) => void },
): Promise<BoocontextResponse> {
const prefixedName = `${BOOCONTEXT_SERVER_NAME}_${req.toolName}`;
log?.debug?.({ tool: prefixedName }, 'boocontext: calling tool');
const raw = await callTool(prefixedName, req.args);
// callTool returns { error: true, output: string } on failure (both
// for MCP-level isError and for network/protocol exceptions).
if (typeof raw === 'object' && raw !== null && (raw as Record<string, unknown>).error === true) {
const errOutput = (raw as Record<string, unknown>).output ?? 'Unknown MCP error';
throw new Error(`boocontext error: ${String(errOutput)}`);
}
const result = typeof raw === 'string' ? raw : JSON.stringify(raw);
// Inline truncation at 32 kB, matching codecontext_client.ts.
// The model gets a clear hint about how to narrow the next call
// rather than a silent cut.
if (result.length > TRUNCATION_LIMIT) {
const truncated = result.slice(0, TRUNCATION_LIMIT);
const omitted = result.length - TRUNCATION_LIMIT;
const slicedWithMarker =
`${truncated}\n\n[truncated, ${omitted} chars omitted; narrow with additional filters]`;
const wrapped = await truncateIfNeeded({
fullContent: result,
slicedContent: slicedWithMarker,
wasTruncated: true,
});
return {
result: wrapped.content,
truncated: wrapped.truncated,
...(wrapped.outputPath ? { outputPath: wrapped.outputPath } : {}),
};
}
return { result, truncated: false };
}

View File

@@ -1,3 +1,10 @@
// DEPRECATED (Phase 4, Domain 2, v2.8.14): This HTTP client routes through
// the Go codecontext sidecar (http://codecontext:8080). Superseded by the
// boocontext MCP server. New callers should use boocontext MCP tool wrappers
// directly. Keep this file for backward compatibility — the 16 existing
// codecontext tool wrappers (under tools/codecontext/) still call through
// callCodecontext(). Remove after full migration.
//
// v1.12 Track B.2: shared HTTP client for the codecontext sidecar. The 8
// per-tool wrappers under tools/codecontext/ all funnel through callCodecontext
// — they're thin adapters that supply toolName + args + projectPath. The
@@ -19,6 +26,7 @@
import { access, copyFile, realpath } from 'node:fs/promises';
import { isAbsolute, join, resolve, sep } from 'node:path';
import { truncateIfNeeded } from './truncate.js';
import { callBoocontext } from './boocontext_client.js';
// v1.13.12 fix: codecontext crashes on empty source files (upstream issue #37)
// when it can't ignore them. The .codecontextignore.template ships with the
@@ -112,6 +120,16 @@ export async function callCodecontext(
req: CodecontextRequest,
fetcher: typeof fetch = fetch,
): Promise<CodecontextResponse> {
// Phase 4: try boocontext MCP first. Falls back to the HTTP sidecar if the
// MCP server is not available or the tool doesn't exist there.
try {
return await callBoocontext({ toolName: req.toolName, args: req.args });
} catch (err) {
console.warn(
`[codecontext_client] boocontext MCP unavailable for "${req.toolName}", falling back to HTTP sidecar: ${err instanceof Error ? err.message : String(err)}`,
);
}
// Step 1: realpath the project root, then realpath the requested target_dir
// (defaulting to projectPath when the caller didn't pass one — the 12 wrappers
// never pass target_dir; tests can override). A non-existent target_dir

View File

@@ -24,6 +24,8 @@ import { SUMMARY_TEMPLATE } from './compaction-prompt.js';
import * as modelContextLookup from './model-context.js';
import { SENTINEL_KINDS } from './inference/sentinels.js';
import type { OpenAiMessage } from './inference/payload.js';
import { resolveModelEndpoint } from './inference/provider.js';
import type { HookRunner } from './hooks.js';
// v1.13.9: ratio-only overflow trigger. Fires compaction at 85% of ctx_max
// (opencode session/overflow.ts pattern). Replaces the v1.11.0-era
@@ -346,20 +348,22 @@ interface CompletionResult {
completionTokens: number;
}
async function callLlamaSwap(
async function callLlm(
config: Config,
model: string,
messages: OpenAiMessage[],
log: FastifyBaseLogger,
): Promise<CompletionResult> {
const res = await fetch(`${config.LLAMA_SWAP_URL}/v1/chat/completions`, {
const { url, headers, model: resolvedModel } = resolveModelEndpoint(config, model);
const res = await fetch(`${url}/v1/chat/completions`, {
method: 'POST',
headers: { 'Content-Type': 'application/json' },
body: JSON.stringify({ model, messages, stream: false }),
headers,
body: JSON.stringify({ model: resolvedModel, messages, stream: false }),
});
if (!res.ok) {
const text = await res.text().catch(() => '');
throw new Error(`llama-swap returned ${res.status}: ${text.slice(0, 200)}`);
const prefix = model.startsWith('deepseek-') ? 'deepseek' : 'llama-swap';
throw new Error(`${prefix} returned ${res.status}: ${text.slice(0, 200)}`);
}
const json = (await res.json()) as {
choices?: Array<{ message?: { content?: string } }>;
@@ -383,6 +387,8 @@ export interface ProcessInput {
log: FastifyBaseLogger;
broker: Broker;
chatId: string;
/** vWhale: lifecycle hooks runner. Undefined when no hooks configured. */
hooks?: HookRunner;
}
// Runs one round of anchored rolling compaction on `chatId`. No-ops cleanly
@@ -497,6 +503,17 @@ export async function process(input: ProcessInput): Promise<void> {
at: new Date().toISOString(),
});
// vWhale: PreCompact hook (best-effort, non-blocking).
const msgBefore = messages.length;
if (input.hooks) {
input.hooks.run('PreCompact', {
event: 'PreCompact',
session_id: sessionId,
chat_id: chatId,
messages_before: msgBefore,
}).catch(() => {});
}
// try/finally so the dot ALWAYS drops back to idle, even if the LLM call
// throws or a downstream DB write fails. The succeeded flag gates the
// 'compacted' frame + final log: we only signal completion to the UI when
@@ -506,7 +523,7 @@ export async function process(input: ProcessInput): Promise<void> {
let result: CompletionResult | undefined;
try {
// 7. Single completion (no tools). Throws on llama-swap failure.
result = await callLlamaSwap(config, session.model, payload, log);
result = await callLlm(config, session.model, payload, log);
// 7b. v1.11.3: fetch the model's true context window from llama-swap's
// /upstream/<model>/props (the streaming completion doesn't carry it).
@@ -558,6 +575,18 @@ export async function process(input: ProcessInput): Promise<void> {
`;
succeeded = true;
// vWhale: PostCompact hook (best-effort, non-blocking).
if (input.hooks) {
input.hooks.run('PostCompact', {
event: 'PostCompact',
session_id: sessionId,
chat_id: chatId,
messages_before: msgBefore,
messages_after: sel.head.length,
summary: (result?.content ?? '').slice(0, 500),
}).catch(() => {});
}
} finally {
// Always restore the dot. Status='idle' (not 'error') even on failure —
// the caller logs/re-surfaces the error separately; the dot doesn't

View File

@@ -0,0 +1,93 @@
import type { Chat, Message } from '../types/api.js';
interface ExportMessage {
role: string;
content: string;
model: string | null;
created_at: string;
tokens_used: number | null;
status: string;
kind: string;
tool_calls: Record<string, unknown>[] | null;
}
interface ExportJson {
chat: {
id: string;
name: string | null;
model: string | null;
created_at: string;
};
messages: ExportMessage[];
}
export function formatJson(
chat: Chat,
messages: Message[],
model: string | null,
): string {
const data: ExportJson = {
chat: {
id: chat.id,
name: chat.name,
model,
created_at: chat.created_at,
},
messages: messages.map((m) => ({
role: m.role,
content: m.content,
model: m.model ?? null,
created_at: m.created_at,
tokens_used: m.tokens_used,
status: m.status,
kind: m.kind,
tool_calls: m.tool_calls as Record<string, unknown>[] | null,
})),
};
return JSON.stringify(data, null, 2);
}
export function formatMarkdown(
chat: Chat,
messages: Message[],
model: string | null,
): string {
const parts: string[] = [];
parts.push(`# ${chat.name ?? 'Untitled Chat'}`);
parts.push(`Model: ${model ?? 'unknown'}`);
parts.push('');
parts.push('---');
parts.push('');
for (const msg of messages) {
// Skip system/sentinel messages for a cleaner transcript
if (msg.role === 'system') continue;
const label =
msg.role === 'user'
? 'User'
: msg.role === 'assistant'
? 'Assistant'
: 'Tool';
parts.push(`## ${label}`);
parts.push('');
if (msg.content) {
parts.push(msg.content);
parts.push('');
}
if (msg.tool_calls && msg.tool_calls.length > 0) {
for (const tc of msg.tool_calls) {
parts.push(`> \`${tc.name}\``);
parts.push('');
parts.push('```json');
parts.push(JSON.stringify(tc.args, null, 2));
parts.push('```');
parts.push('');
}
}
}
return parts.join('\n');
}

View File

@@ -0,0 +1,299 @@
/**
* vWhale: lifecycle hook runner. Hooks are shell commands that fire at key
* points in the inference pipeline. Each hook receives a JSON payload on
* stdin and can return JSON on stdout to influence behavior.
*
* Inspired by Whale's hook system with 11 lifecycle events. BooCode
* implements the most relevant subset: PreToolUse, PostToolUse,
* UserPromptSubmit, Stop, PreCompact, PostCompact.
*
* Config: JSON file at HOOKS_CONFIG_PATH (default /data/hooks.json).
* Format:
* ```json
* {
* "hooks": {
* "PreToolUse": [
* { "match": "shell_run", "command": "python3 /data/hooks/check_shell.py", "timeout": 30 }
* ],
* "Stop": [
* { "command": "node /data/hooks/log_turn.mjs" }
* ]
* }
* }
* ```
*/
import { spawn } from 'node:child_process';
import { readFileSync, existsSync } from 'node:fs';
import type { FastifyBaseLogger } from 'fastify';
// ─── Events ───────────────────────────────────────────────────────────────
export type HookEvent =
| 'PreToolUse'
| 'PostToolUse'
| 'UserPromptSubmit'
| 'Stop'
| 'PreCompact'
| 'PostCompact';
const ALL_EVENTS: HookEvent[] = [
'PreToolUse',
'PostToolUse',
'UserPromptSubmit',
'Stop',
'PreCompact',
'PostCompact',
];
// ─── Config ────────────────────────────────────────────────────────────────
export interface HookConfig {
/** Glob or exact tool name to match (PreToolUse/PostToolUse only). Omit or '*' for all. */
match?: string;
/** Shell command to run. Receives JSON payload on stdin. */
command: string;
/** Timeout in seconds (default 30). */
timeout?: number;
}
export interface HooksConfig {
hooks: Partial<Record<HookEvent, HookConfig[]>>;
}
// ─── Payloads ──────────────────────────────────────────────────────────────
export interface PreToolUsePayload {
event: 'PreToolUse';
session_id: string;
tool_name: string;
tool_args: Record<string, unknown>;
}
export interface PostToolUsePayload {
event: 'PostToolUse';
session_id: string;
tool_name: string;
tool_args: Record<string, unknown>;
tool_result: unknown;
tool_error?: string;
}
export interface UserPromptSubmitPayload {
event: 'UserPromptSubmit';
session_id: string;
chat_id: string;
prompt: string;
}
export interface StopPayload {
event: 'Stop';
session_id: string;
chat_id: string;
last_assistant_text: string;
turn: number;
}
export interface PreCompactPayload {
event: 'PreCompact';
session_id: string;
chat_id: string;
messages_before: number;
}
export interface PostCompactPayload {
event: 'PostCompact';
session_id: string;
chat_id: string;
messages_before: number;
messages_after: number;
summary: string;
}
export type HookPayload =
| PreToolUsePayload
| PostToolUsePayload
| UserPromptSubmitPayload
| StopPayload
| PreCompactPayload
| PostCompactPayload;
// ─── Response ──────────────────────────────────────────────────────────────
export type HookDecision = 'pass' | 'warn' | 'block';
export interface HookResponse {
decision?: HookDecision;
reason?: string;
/** When present, replaces the original tool args / user prompt. */
updated_input?: Record<string, unknown> | string;
/** Injected into the model's context for the next turn. */
additional_context?: string;
}
// ─── Runner ────────────────────────────────────────────────────────────────
export interface HookRunner {
/** Run all hooks for the given event. Returns the effective response. */
run(event: HookEvent, payload: HookPayload, log?: FastifyBaseLogger): Promise<HookResponse>;
}
let hooksConfig: HooksConfig | null = null;
let hooksPath: string | null = null;
/** Load hooks config from disk. Missing file = no hooks. Never throws. */
export function loadHooksConfig(path: string): HooksConfig {
hooksPath = path;
if (!existsSync(path)) {
hooksConfig = { hooks: {} };
return hooksConfig;
}
try {
const raw = readFileSync(path, 'utf8');
const parsed = JSON.parse(raw) as HooksConfig;
hooksConfig = {
hooks: { ...parsed.hooks },
};
// Validate event names
for (const event of Object.keys(hooksConfig.hooks)) {
if (!ALL_EVENTS.includes(event as HookEvent)) {
console.warn(`hooks: unknown event '${event}' in ${path} — ignoring`);
delete hooksConfig.hooks[event as HookEvent];
}
}
} catch (err) {
console.error(`hooks: failed to load ${path}`, err);
hooksConfig = { hooks: {} };
}
return hooksConfig;
}
/** Reload the config file (call after a PATCH). */
export function reloadHooksConfig(): HooksConfig {
if (hooksPath) return loadHooksConfig(hooksPath);
hooksConfig = { hooks: {} };
return hooksConfig;
}
function getConfig(): HooksConfig {
return hooksConfig ?? { hooks: {} };
}
/** Create a HookRunner for the current config. */
export function createHookRunner(): HookRunner {
return {
async run(event, payload, log): Promise<HookResponse> {
const configs = getConfig().hooks[event];
if (!configs || configs.length === 0) return { decision: 'pass' };
// Pre-filter by match pattern for tool events
const toolName = 'tool_name' in payload ? (payload as PreToolUsePayload).tool_name : undefined;
let effective: HookResponse = { decision: 'pass' };
for (const cfg of configs) {
// Skip if match doesn't apply
if (toolName && cfg.match && cfg.match !== '*' && cfg.match !== toolName) continue;
const result = await runSingleHook(cfg, payload, log);
// Merge decisions: block > warn > pass
if (result.decision === 'block') {
effective = { ...result, decision: 'block' };
break; // block is terminal
}
if (result.decision === 'warn' && effective.decision !== 'block') {
effective = { ...result, decision: 'warn' };
}
// Merge additional_context and updated_input
if (result.additional_context) {
effective.additional_context = effective.additional_context
? effective.additional_context + '\n' + result.additional_context
: result.additional_context;
}
if (result.updated_input && !effective.updated_input) {
effective.updated_input = result.updated_input;
}
}
return effective;
},
};
}
async function runSingleHook(
cfg: HookConfig,
payload: HookPayload,
log?: FastifyBaseLogger,
): Promise<HookResponse> {
const timeoutMs = (cfg.timeout ?? 30) * 1000;
return new Promise((resolve) => {
const child = spawn('sh', ['-c', cfg.command], {
stdio: ['pipe', 'pipe', 'pipe'],
timeout: timeoutMs,
env: { ...process.env },
});
const stdout: Buffer[] = [];
const stderr: Buffer[] = [];
child.stdout.on('data', (chunk: Buffer) => stdout.push(chunk));
child.stderr.on('data', (chunk: Buffer) => stderr.push(chunk));
let settled = false;
const timer = setTimeout(() => {
if (!settled) {
settled = true;
child.kill('SIGTERM');
log?.warn({ event: payload.event, command: cfg.command }, 'hooks: timeout');
resolve({ decision: 'warn', reason: 'hook timed out' });
}
}, timeoutMs);
child.on('error', (err) => {
if (!settled) {
settled = true;
clearTimeout(timer);
log?.warn({ err, event: payload.event }, 'hooks: spawn error');
resolve({ decision: 'warn', reason: `hook failed: ${err.message}` });
}
});
child.on('close', (code) => {
if (settled) return;
settled = true;
clearTimeout(timer);
const out = Buffer.concat(stdout).toString('utf8').trim();
const errOut = Buffer.concat(stderr).toString('utf8').trim();
if (code !== 0 && !out) {
log?.warn({ event: payload.event, code, stderr: errOut.slice(0, 200) }, 'hooks: non-zero exit');
resolve({ decision: 'warn', reason: `hook exited ${code}` });
return;
}
// Parse stdout as JSON response
if (out) {
try {
const parsed = JSON.parse(out) as HookResponse;
resolve(parsed);
return;
} catch {
// Not JSON — treat as pass with stdout as context
if (out.length > 0) {
resolve({ decision: 'pass', additional_context: out });
return;
}
}
}
resolve({ decision: 'pass' });
});
// Write payload to stdin
const json = JSON.stringify(payload);
child.stdin.write(json);
child.stdin.end();
});
}

View File

@@ -0,0 +1,132 @@
/**
* Compact unified-diff generator for write-tool results.
*
* Produces a minimal unified diff string (---/+++ header + +/- lines) from
* old/new text pairs so the frontend can render an inline diff snippet
* without pulling in a full diff library.
*/
// Write-tool names that can produce file diffs.
export const WRITE_TOOL_NAMES = new Set([
'edit_file',
'create_file',
'delete_file',
'apply_pending',
]);
/**
* Compute a compact unified diff from old → new text.
*
* @param oldStr The original text (empty for creates)
* @param newStr The replacement text (empty for deletes)
* @param filePath Display path for the file header
* @returns A unified-diff string, or empty string if old === new
*/
export function computeDiff(oldStr: string, newStr: string, filePath: string): string {
if (oldStr === newStr) return '';
const oldLines = oldStr.split('\n');
const newLines = newStr.split('\n');
// For empty old → new file (create), show all lines as additions
if (oldStr.length === 0 && newStr.length > 0) {
const header = `--- /dev/null\n+++ b/${filePath}\n`;
const body = newLines.map((line) => `+${line}`).join('\n');
return header + body;
}
// For old → empty (delete), show all lines as removals
if (newStr.length === 0 && oldStr.length > 0) {
const header = `--- a/${filePath}\n+++ /dev/null\n`;
const body = oldLines.map((line) => `-${line}`).join('\n');
return header + body;
}
// Simple line-by-line diff for edit: collect changed lines with context.
// Uses a straightforward algorithm: find the first differing line and the
// last differing line, then output the block with +/- markers.
const header = `--- a/${filePath}\n+++ b/${filePath}\n`;
const maxLen = Math.max(oldLines.length, newLines.length);
let firstDiff = -1;
let lastDiff = -1;
for (let i = 0; i < maxLen; i++) {
const a = i < oldLines.length ? oldLines[i] : undefined;
const b = i < newLines.length ? newLines[i] : undefined;
if (a !== b) {
if (firstDiff === -1) firstDiff = i;
lastDiff = i;
}
}
if (firstDiff === -1) return '';
// Add context lines around the changed block (up to 2 lines each side)
const contextBefore = 2;
const contextAfter = 2;
const start = Math.max(0, firstDiff - contextBefore);
const end = Math.min(maxLen - 1, lastDiff + contextAfter);
// Build the unified diff hunk
const hunkLines: string[] = [];
const hunkOldStart = start + 1; // 1-indexed
const hunkNewStart = start + 1;
const hunkOldLen = end - start + 1;
const hunkNewLen = end - start + 1;
for (let i = start; i <= end; i++) {
const oldLine = i < oldLines.length ? oldLines[i] : undefined;
const newLine = i < newLines.length ? newLines[i] : undefined;
if (oldLine === newLine) {
hunkLines.push(` ${oldLine ?? ''}`);
} else {
if (oldLine !== undefined) {
hunkLines.push(`-${oldLine}`);
}
if (newLine !== undefined) {
hunkLines.push(`+${newLine}`);
}
}
}
const hunkHeader = `@@ -${hunkOldStart},${hunkOldLen} +${hunkNewStart},${hunkNewLen} @@\n`;
return header + hunkHeader + hunkLines.join('\n');
}
/**
* Check whether a tool name corresponds to a file-modifying write tool
* that should produce a diff in its tool result.
*/
export function isWriteTool(name: string): boolean {
return WRITE_TOOL_NAMES.has(name);
}
/**
* Extract a diff string from tool call args for write tools.
* Returns empty string if the tool doesn't produce diffs or args are missing.
*/
export function diffFromToolArgs(name: string, args: Record<string, unknown>, filePath?: string): string {
switch (name) {
case 'edit_file': {
const oldStr = String(args.old_string ?? '');
const newStr = String(args.new_string ?? '');
const path = filePath ?? String(args.file_path ?? 'file');
return computeDiff(oldStr, newStr, path);
}
case 'create_file': {
const content = String(args.content ?? '');
const path = filePath ?? String(args.file_path ?? 'file');
return computeDiff('', content, path);
}
case 'delete_file':
// No content available at queue time — actual content is read at apply time.
return '';
case 'apply_pending':
// Meta-tool — individual changes produce their own diffs.
return '';
default:
return '';
}
}

View File

@@ -74,6 +74,7 @@ export async function handleAbortOrError(
type: 'message_complete',
message_id: assistantMessageId,
chat_id: chatId,
...(args.compareGroupId ? { compare_group_id: args.compareGroupId } : {}),
});
ctx.log.info({ sessionId, chatId, assistantMessageId }, 'inference cancelled');
} else {
@@ -90,6 +91,7 @@ export async function handleAbortOrError(
chat_id: chatId,
error: errMsg,
reason: 'llm_provider_error',
...(args.compareGroupId ? { compare_group_id: args.compareGroupId } : {}),
});
ctx.log.error({ err, sessionId, assistantMessageId }, 'inference failed');
}
@@ -122,7 +124,10 @@ export async function finalizeStreamedRow(
completionTokens: number | null;
promptTokens: number | null;
startedAt: string | null;
cacheTokens?: number | null;
reasoningTokens?: number | null;
beforeComplete?: () => Promise<void>;
compareGroupId?: string;
},
): Promise<void> {
// v1.11.3: see executeToolPhase for the rationale.
@@ -137,6 +142,8 @@ export async function finalizeStreamedRow(
tokens_used = ${opts.completionTokens},
ctx_used = ${opts.promptTokens},
ctx_max = ${nCtx},
cache_tokens = ${opts.cacheTokens ?? null},
reasoning_tokens = ${opts.reasoningTokens ?? null},
finished_at = clock_timestamp()
WHERE id = ${opts.messageId}
RETURNING tokens_used, ctx_used, ctx_max, finished_at
@@ -149,9 +156,12 @@ export async function finalizeStreamedRow(
tokens_used: updated?.tokens_used ?? null,
ctx_used: updated?.ctx_used ?? null,
ctx_max: updated?.ctx_max ?? null,
cache_tokens: opts.cacheTokens ?? null,
reasoning_tokens: opts.reasoningTokens ?? null,
started_at: opts.startedAt,
finished_at: updated?.finished_at ?? null,
model: opts.model,
...(opts.compareGroupId ? { compare_group_id: opts.compareGroupId } : {}),
});
}
@@ -176,6 +186,7 @@ export async function finalizeEmpty(
type: 'message_complete',
message_id: assistantMessageId,
chat_id: chatId,
...(args.compareGroupId ? { compare_group_id: args.compareGroupId } : {}),
});
}
@@ -188,7 +199,7 @@ export async function finalizeCompletion(
): Promise<void> {
const { sessionId, chatId, assistantMessageId } = args;
const content = stripToolMarkup(result.content, { final: true });
const { finishReason, promptTokens, completionTokens } = result;
const { finishReason, promptTokens, completionTokens, cacheReadTokens, reasoningTokens } = result;
// v1.11.3: see executeToolPhase for the rationale.
const mctx = await modelContext.getModelContext(session.model);
@@ -203,6 +214,8 @@ export async function finalizeCompletion(
tokens_used = ${completionTokens},
ctx_used = ${promptTokens},
ctx_max = ${nCtx},
cache_tokens = ${cacheReadTokens ?? null},
reasoning_tokens = ${reasoningTokens ?? null},
model = ${session.model},
finished_at = clock_timestamp()
WHERE id = ${assistantMessageId}
@@ -268,9 +281,12 @@ export async function finalizeCompletion(
tokens_used: updated?.tokens_used ?? null,
ctx_used: updated?.ctx_used ?? null,
ctx_max: updated?.ctx_max ?? null,
cache_tokens: cacheReadTokens ?? null,
reasoning_tokens: reasoningTokens ?? null,
started_at: startedAt,
finished_at: updated?.finished_at ?? null,
model: session.model,
...(args.compareGroupId ? { compare_group_id: args.compareGroupId } : {}),
});
ctx.log.info(
{

View File

@@ -8,6 +8,7 @@ export {
createInferenceRunner,
MAX_STEPS,
runInference,
runInferenceWithModel,
} from './turn.js';
// P5: the shared pipeline types moved from turn.ts to types.ts (breaking the
// hub-and-leaf near-cycle). Re-exported here so the public surface is unchanged.
@@ -21,3 +22,4 @@ export type {
export type { ToolPhaseResult } from './tool-phase.js';
export { detectDoomLoop, DOOM_LOOP_THRESHOLD } from './sentinels.js';
export { buildMessagesPayload } from './payload.js';
export { runGraph, type GraphNodeType, type GraphState, type GraphResult } from './state-graph.js';

View File

@@ -0,0 +1,56 @@
// vDeepSeek (stub): multi-modal (image) attachment support.
//
// When a message carries images, DeepSeek V4 models can process them
// natively via the @ai-sdk/deepseek provider. This module provides the
// helper types and functions to detect and convert image attachments.
//
// FULL INTEGRATION requires:
// 1. Storing image data alongside messages (message_parts with kind='image'
// or a dedicated attachments table with base64-encoded data).
// 2. Extending OpenAiMessage.content from `string | null` to
// `string | null | Array<{ type: 'text'; text: string } | { type: 'image'; image: string }>`
// in apps/server/src/services/inference/payload.ts.
// 3. Updating toModelMessages() in stream-phase-adapter.ts to emit AI SDK
// content arrays with image parts for multimodal user messages.
//
// None of the above is done yet — this file is a type scaffold.
import type { Message } from '../../types/api.js';
/** Shape of a decoded image attachment ready for the AI SDK. */
export interface ImageAttachment {
/** Base64-encoded image data (no data URI prefix — raw bytes). */
data: string;
/** MIME type (e.g. 'image/png', 'image/jpeg', 'image/webp'). */
mimeType: string;
}
/**
* Check if a user message has image content that can be forwarded to a
* multimodal model. Currently a stub — always returns false until the
* message-pipeline stores image attachments addressably.
*/
export function hasImageAttachments(_message: Message): boolean {
// TODO(vDeepSeek): scan message_parts for kind='image' or inspect
// message.content for inline data URIs (data:image/...).
return false;
}
/**
* Convert internal image attachments to the format expected by the AI SDK
* ModelMessage content array.
*
* The @ai-sdk/deepseek provider accepts images as:
* { type: 'image'; image: 'data:image/png;base64,...' }
*
* @param attachments — List of decoded image attachments.
* @returns AI SDK inline file parts suitable for ModelMessage.content.
*/
export function imageAttachmentsToParts(
attachments: ImageAttachment[],
): Array<{ type: 'image'; image: string }> {
return attachments.map((a) => ({
type: 'image' as const,
image: `data:${a.mimeType};base64,${a.data}`,
}));
}

View File

@@ -194,6 +194,14 @@ export async function buildMessagesPayload(
out.push(msg);
continue;
}
// TODO(vDeepSeek): when m has image attachments, use a content array
// with text + image parts (see multi-modal.ts:imageAttachmentsToParts).
// The AI SDK ModelMessage content shape supports:
// content: [
// { type: 'text', text: '...' },
// { type: 'image', image: 'data:image/png;base64,...' }
// ]
// The @ai-sdk/deepseek provider handles the image parts natively.
out.push({ role: 'user', content: m.content });
}
return out;
@@ -206,7 +214,7 @@ export async function loadContext(
): Promise<{ session: Session; project: Project; history: Message[] } | null> {
const sessionRows = await sql<Session[]>`
SELECT id, project_id, name, model, system_prompt, status, created_at, updated_at,
agent_id, web_search_enabled, allowed_read_paths
agent_id, web_search_enabled, allowed_read_paths, state_graph_enabled
FROM sessions WHERE id = ${sessionId}
`;
if (sessionRows.length === 0) return null;

View File

@@ -1,4 +1,5 @@
import { createOpenAICompatible } from '@ai-sdk/openai-compatible';
import { createDeepSeek } from '@ai-sdk/deepseek';
import type { LanguageModel } from 'ai';
// v1.13.1-A: AI SDK provider against llama-swap. baseURL is threaded from
@@ -11,6 +12,12 @@ import type { LanguageModel } from 'ai';
// llama-sidecar instead. A fresh provider is created per call (not cached)
// because the X-Agent-Flags header varies per agent. The llama-swap path
// stays cached since it has no per-request headers.
//
// vDeepSeek: when the model ID starts with 'deepseek-' and DEEPSEEK_API_KEY
// is set, route through the official @ai-sdk/deepseek provider (not
// openai-compatible) so DeepSeek-specific features work: providerMetadata
// with promptCacheHitTokens/promptCacheMissTokens, reasoning via
// LanguageModelV4Usage.outputTokens.reasoning, and thinking-mode options.
const swapCache = new Map<string, ReturnType<typeof createOpenAICompatible>>();
@@ -41,7 +48,28 @@ function sidecarProvider(
});
}
export type InferenceRoute = 'swap' | 'sidecar';
const DEEPSEEK_MODEL_PREFIX = 'deepseek-';
export function isDeepSeekModel(modelId: string): boolean {
return modelId.startsWith(DEEPSEEK_MODEL_PREFIX);
}
let deepseekProviderCache: ReturnType<typeof createDeepSeek> | null = null;
function getDeepSeekProvider(
apiKey: string,
baseURL: string,
): ReturnType<typeof createDeepSeek> {
if (!deepseekProviderCache) {
deepseekProviderCache = createDeepSeek({
apiKey,
baseURL,
});
}
return deepseekProviderCache;
}
export type InferenceRoute = 'swap' | 'sidecar' | 'deepseek';
export interface RoutingInfo {
route: InferenceRoute;
@@ -55,12 +83,21 @@ interface AgentLike {
interface ConfigLike {
LLAMA_SWAP_URL: string;
LLAMA_SIDECAR_URL?: string;
DEEPSEEK_API_KEY?: string;
DEEPSEEK_BASE_URL?: string;
}
export function resolveRoute(
agent: AgentLike | null,
config?: ConfigLike,
modelId?: string,
): RoutingInfo {
// vDeepSeek: if the model starts with deepseek- and DEEPSEEK_API_KEY is set,
// route through the DeepSeek provider. Checked first so DeepSeek models
// always bypass llama-swap/sidecar even when those are also configured.
if (modelId?.startsWith(DEEPSEEK_MODEL_PREFIX) && config?.DEEPSEEK_API_KEY) {
return { route: 'deepseek', flags: null };
}
// When llama_extra_args are explicitly set, route through sidecar with them.
const flags = agent?.llama_extra_args;
if (flags && flags.length > 0) {
@@ -80,7 +117,13 @@ export function upstreamModel(
modelId: string,
agent?: AgentLike | null,
): LanguageModel {
const { route, flags } = resolveRoute(agent ?? null, config);
const { route, flags } = resolveRoute(agent ?? null, config, modelId);
if (route === 'deepseek') {
return getDeepSeekProvider(
config.DEEPSEEK_API_KEY!,
config.DEEPSEEK_BASE_URL ?? 'https://api.deepseek.com',
).chat(modelId);
}
if (route === 'sidecar') {
const url = config.LLAMA_SIDECAR_URL;
if (!url) {
@@ -90,3 +133,30 @@ export function upstreamModel(
}
return getSwapProvider(config.LLAMA_SWAP_URL).chatModel(modelId);
}
/** Resolve the API endpoint for non-streaming calls (compaction, task-model).
* Returns the URL + model + optional auth header for direct fetch() usage. */
export function resolveModelEndpoint(
config: ConfigLike,
modelId: string,
): { url: string; model: string; headers: Record<string, string> } {
const baseHeaders: Record<string, string> = { 'Content-Type': 'application/json' };
if (modelId.startsWith(DEEPSEEK_MODEL_PREFIX) && config.DEEPSEEK_API_KEY) {
const baseURL = (config.DEEPSEEK_BASE_URL ?? 'https://api.deepseek.com').replace(/\/+$/, '');
return {
url: baseURL,
model: modelId,
headers: { ...baseHeaders, Authorization: `Bearer ${config.DEEPSEEK_API_KEY}` },
};
}
return {
url: config.LLAMA_SWAP_URL.replace(/\/+$/, ''),
model: modelId,
headers: baseHeaders,
};
}
/** Invalidate the cached DeepSeek provider (e.g. when env vars change at runtime). */
export function resetDeepSeekProvider(): void {
deepseekProviderCache = null;
}

View File

@@ -0,0 +1,531 @@
// P5: Optional declarative state graph engine for the inference turn loop.
//
// Replaces the procedural `while (stepNumber < effectiveCap)` in turn.ts
// with a node-based execution model. Default OFF via
// session.state_graph_enabled — zero behavior change when disabled.
//
// Nodes wrap EXISTING infrastructure (no new I/O patterns):
// PLAN → top-of-loop gate, compaction, loadContext, buildMessagesPayload,
// executeStreamPhase
// CALL_TOOL → executeToolPhase
// OBSERVE → process tool results, update loop locals
// REFLECT → decidePostToolAction, sentinel insertion, mistake tracker
// SYNTHESIZE → terminal (graph loop exits)
import type { Agent, Project, Session, ToolCall } from '../../types/api.js';
import { resolveProjectRoot } from '../path_guard.js';
import { rewriteSearchQuery } from '../task-search-rewrite.js';
import * as compaction from '../compaction.js';
import { decideStep, decidePostToolAction } from './step-decision.js';
import {
recordStep,
MISTAKE_RECOVERY_NOTE,
type MistakeState,
} from './mistake-tracker.js';
import {
buildMessagesPayload,
loadContext,
} from './payload.js';
import { toDcpMessages, transformMessages, fromDcpMessages } from './dcp/index.js';
import {
finalizeCompletion,
finalizeEmpty,
handleAbortOrError,
} from './error-handler.js';
import {
executeStreamPhase,
} from './stream-phase.js';
import { executeToolPhase, type ToolPhaseResult } from './tool-phase.js';
import type {
InferenceContext,
StreamPhaseState,
StreamResult,
TurnArgs,
} from './types.js';
import {
runCapHitSummary,
runDoomLoopSummary,
insertMistakeRecoverySentinel,
} from './sentinel-summaries.js';
import { execFile } from 'node:child_process';
import { readFileSync, existsSync } from 'node:fs';
import { join } from 'node:path';
const BUILD_TIMEOUT_MS = 60_000;
const BUILD_OUTPUT_CAP = 8_000;
async function detectAndRunBuild(
ctx: InferenceContext,
projectRoot: string,
sessionId: string,
chatId: string,
model: string,
existingNote: string | undefined,
): Promise<string | undefined> {
if (!model.startsWith('deepseek-')) return undefined;
const pkgPath = join(projectRoot, 'package.json');
if (!existsSync(pkgPath)) return undefined;
let buildCmd: string | null = null;
try {
const pkg = JSON.parse(readFileSync(pkgPath, 'utf8')) as { scripts?: Record<string, string> };
if (pkg.scripts?.build) buildCmd = 'build';
else if (pkg.scripts?.compile) buildCmd = 'compile';
else if (pkg.scripts?.typecheck) buildCmd = 'typecheck';
} catch {
return undefined;
}
if (!buildCmd) return undefined;
const hasPnpm = existsSync(join(projectRoot, 'pnpm-lock.yaml'));
const hasYarn = existsSync(join(projectRoot, 'yarn.lock'));
const pm = hasPnpm ? 'pnpm' : hasYarn ? 'yarn' : 'npm';
try {
const out = await new Promise<string>((resolve, reject) => {
execFile(pm, ['run', buildCmd!], { cwd: projectRoot, timeout: BUILD_TIMEOUT_MS, maxBuffer: BUILD_OUTPUT_CAP * 2 },
(err, stdout, stderr) => {
if (err && (err as NodeJS.ErrnoException).code === 'ENOENT') {
resolve('');
return;
}
const merged = (stdout + '\n' + stderr).trim();
resolve(merged.slice(0, BUILD_OUTPUT_CAP));
},
);
});
if (!out) return undefined;
ctx.log.info({ sessionId, chatId, buildCmd, outputLen: out.length }, 'auto-fix: build failed');
const combined = existingNote
? existingNote + '\n\n--- Build error ---\n' + out.slice(0, BUILD_OUTPUT_CAP - existingNote.length)
: '--- Build error ---\n' + out.slice(0, BUILD_OUTPUT_CAP);
return combined;
} catch {
return undefined;
}
}
// -- Types ----------------------------------------------------------------
export type GraphNodeType = 'PLAN' | 'CALL_TOOL' | 'OBSERVE' | 'REFLECT' | 'SYNTHESIZE';
export interface GraphState {
stepNumber: number;
toolsUsed: number;
recentToolCalls: ToolCall[];
assistantMessageId: string;
mistakeTracker: MistakeState;
pendingRecoveryNote?: string;
effectiveCap: number;
budget: number;
projectRoot: string;
iterSession?: Session;
iterProject?: Project;
streamResult?: StreamResult;
startedAt?: string | null;
toolPhaseResult?: ToolPhaseResult;
shouldStop: boolean;
}
interface GraphNode {
type: GraphNodeType;
edges: Array<{ to: GraphNodeType; condition: (state: GraphState) => boolean }>;
execute: (
ctx: InferenceContext,
args: TurnArgs,
state: GraphState,
agent: Agent | null,
) => Promise<void>;
}
export interface GraphResult {
stepNumber: number;
assistantMessageId: string;
toolsUsed: number;
recentToolCalls: ToolCall[];
mistakeTracker: MistakeState;
}
// -- Default graph --------------------------------------------------------
export function createDefaultGraph(): GraphNode[] {
return [
{
type: 'PLAN',
edges: [
{ to: 'CALL_TOOL', condition: (s) => !!s.streamResult && s.streamResult.toolCalls.length > 0 },
{ to: 'SYNTHESIZE', condition: () => true },
],
execute: planNode,
},
{
type: 'CALL_TOOL',
edges: [
{ to: 'OBSERVE', condition: () => true },
],
execute: callToolNode,
},
{
type: 'OBSERVE',
edges: [
{ to: 'REFLECT', condition: (s) => s.toolPhaseResult?.action === 'continue' },
{ to: 'SYNTHESIZE', condition: () => true },
],
execute: observeNode,
},
{
type: 'REFLECT',
edges: [
{ to: 'PLAN', condition: (s) => s.stepNumber < s.effectiveCap },
{ to: 'SYNTHESIZE', condition: () => true },
],
execute: reflectNode,
},
{
type: 'SYNTHESIZE',
edges: [],
execute: async () => {},
},
];
}
// -- Graph runner ---------------------------------------------------------
export async function runGraph(
ctx: InferenceContext,
args: TurnArgs,
extra: { effectiveCap: number; budget: number; agent: Agent | null; projectRoot: string },
): Promise<GraphResult> {
const { effectiveCap, budget, agent } = extra;
const state: GraphState = {
stepNumber: 0,
toolsUsed: args.toolsUsed,
recentToolCalls: args.recentToolCalls,
assistantMessageId: args.assistantMessageId,
mistakeTracker: args.mistakeTracker,
pendingRecoveryNote: args.pendingRecoveryNote,
effectiveCap,
budget,
projectRoot: extra.projectRoot,
shouldStop: false,
};
const graph = createDefaultGraph();
let currentNode: GraphNodeType = 'PLAN';
while (currentNode !== 'SYNTHESIZE' && !state.shouldStop) {
const node = graph.find((n) => n.type === currentNode)!;
await node.execute(ctx, args, state, agent);
if (state.shouldStop) break;
const nextEdge = node.edges.find((e) => e.condition(state));
if (!nextEdge) break;
currentNode = nextEdge.to;
}
return {
stepNumber: state.stepNumber,
assistantMessageId: state.assistantMessageId,
toolsUsed: state.toolsUsed,
recentToolCalls: state.recentToolCalls,
mistakeTracker: state.mistakeTracker,
};
}
// -- PLAN node ------------------------------------------------------------
// Top-of-loop gate → compaction → loadContext → DCP → buildPayload → stream
async function planNode(
ctx: InferenceContext,
args: TurnArgs,
state: GraphState,
agent: Agent | null,
): Promise<void> {
const { sessionId, chatId, signal } = args;
// 1. Top-of-loop gate: doom-loop, then budget (pure decisions)
const decision = decideStep({
recentToolCalls: state.recentToolCalls,
toolsUsed: state.toolsUsed,
budget: state.budget,
});
if (decision.kind === 'doom') {
const loaded = await loadContext(ctx.sql, sessionId, chatId);
if (loaded) {
const dlSession = args.modelOverride ? { ...loaded.session, model: args.modelOverride } : loaded.session;
const iterArgs: TurnArgs = {
sessionId, chatId, assistantMessageId: state.assistantMessageId,
toolsUsed: state.toolsUsed, recentToolCalls: state.recentToolCalls,
mistakeTracker: state.mistakeTracker, signal,
};
await runDoomLoopSummary(ctx, iterArgs, dlSession, loaded.project, loaded.history, agent, decision.loop);
}
state.shouldStop = true;
return;
}
if (decision.kind === 'budget') {
const loaded = await loadContext(ctx.sql, sessionId, chatId);
if (loaded) {
const bhSession = args.modelOverride ? { ...loaded.session, model: args.modelOverride } : loaded.session;
const iterArgs: TurnArgs = {
sessionId, chatId, assistantMessageId: state.assistantMessageId,
toolsUsed: state.toolsUsed, recentToolCalls: state.recentToolCalls,
mistakeTracker: state.mistakeTracker, signal,
};
await runCapHitSummary(ctx, iterArgs, bhSession, loaded.project, loaded.history, agent, state.budget);
}
state.shouldStop = true;
return;
}
// decision.kind === 'stream' → proceed.
// 2. Compaction check
const chatFlag = await ctx.sql<{ needs_compaction: boolean }[]>`
SELECT needs_compaction FROM chats WHERE id = ${chatId}
`;
if (chatFlag[0]?.needs_compaction) {
try {
await compaction.process({
sql: ctx.sql, config: ctx.config, log: ctx.log,
broker: ctx.broker, chatId, hooks: ctx.hooks,
});
} catch (err) {
ctx.log.warn({ err, chatId }, 'auto-compaction failed; clearing flag and proceeding');
await ctx.sql`UPDATE chats SET needs_compaction = false WHERE id = ${chatId}`;
}
}
// 3. Load context (must re-load each iteration — new messages)
const loaded = await loadContext(ctx.sql, sessionId, chatId);
if (!loaded) {
ctx.log.warn({ sessionId }, 'inference: session or project missing mid-loop');
state.shouldStop = true;
return;
}
let { session: iterSession, project: iterProject, history } = loaded;
if (args.modelOverride) {
iterSession = { ...iterSession, model: args.modelOverride };
}
state.iterSession = iterSession;
state.iterProject = iterProject;
const projectRoot = await resolveProjectRoot(iterProject.path);
state.projectRoot = projectRoot;
// 4. DCP transform
try {
const dcpMsgs = toDcpMessages(history);
const { messages: pruned, stats } = transformMessages(chatId, dcpMsgs);
if (stats.removedCount > 0) {
ctx.log.info({ chatId, ...stats }, 'dcp: transform removed messages');
history = fromDcpMessages(pruned) as typeof history;
}
} catch (err) {
ctx.log.warn({ err: err instanceof Error ? err.message : String(err), chatId }, 'dcp: transform skipped');
}
// 5. Log step boundary
ctx.log.info(
{ sessionId, chatId, step: state.stepNumber, assistantMessageId: state.assistantMessageId },
'step_start',
);
// 6. Build messages + stream phase
const messages = await buildMessagesPayload(iterSession, iterProject, history, agent, ctx.log);
const webToolsEnabled =
iterSession.web_search_enabled ?? iterProject.default_web_search_enabled ?? false;
if (state.stepNumber === 0 && webToolsEnabled && messages.length >= 2) {
const lastUserMsg = [...messages].reverse().find((m) => m.role === 'user');
if (lastUserMsg?.content) {
const hint = await rewriteSearchQuery(lastUserMsg.content);
if (hint && messages[0]?.role === 'system' && messages[0].content) {
messages[0].content += `\n\nThe user's search intent can be summarized as: "${hint}"`;
}
}
}
if (state.pendingRecoveryNote) {
messages.push({ role: 'system', content: state.pendingRecoveryNote });
state.pendingRecoveryNote = undefined;
}
// 7. Stream phase
const iterArgs: TurnArgs = {
sessionId, chatId, assistantMessageId: state.assistantMessageId,
toolsUsed: state.toolsUsed, recentToolCalls: state.recentToolCalls,
mistakeTracker: state.mistakeTracker, signal,
};
const streamState: StreamPhaseState = { accumulated: '', startedAt: null };
try {
const result = await executeStreamPhase(ctx, iterArgs, iterSession, messages, streamState, agent, webToolsEnabled);
state.streamResult = result;
state.startedAt = streamState.startedAt;
// Non-tool finish: Stop hook + finalize here (edge from PLAN → SYNTHESIZE
// will break the graph loop after this node returns).
if (result.toolCalls.length === 0) {
if (ctx.hooks) {
ctx.hooks.run('Stop', {
event: 'Stop',
session_id: sessionId,
chat_id: chatId,
last_assistant_text: result.content.slice(0, 500),
turn: state.stepNumber,
}).catch(() => {});
}
await finalizeCompletion(ctx, iterArgs, result, streamState.startedAt, iterSession);
}
} catch (err) {
await handleAbortOrError(ctx, iterArgs, streamState.accumulated, err);
state.shouldStop = true;
}
}
// -- CALL_TOOL node -------------------------------------------------------
// Executes the tool phase and stores the result for OBSERVE.
async function callToolNode(
ctx: InferenceContext,
args: TurnArgs,
state: GraphState,
agent: Agent | null,
): Promise<void> {
const { sessionId, chatId } = args;
const result = state.streamResult;
if (!result) {
ctx.log.warn({ sessionId }, 'state-graph: CALL_TOOL without stream result');
state.shouldStop = true;
return;
}
const session = state.iterSession;
if (!session) {
ctx.log.warn({ sessionId }, 'state-graph: CALL_TOOL without iterSession');
state.shouldStop = true;
return;
}
try {
state.toolPhaseResult = await executeToolPhase(
ctx, args, result, state.startedAt ?? null,
session, state.projectRoot, agent, state.stepNumber,
);
} catch (err) {
ctx.log.error({ err, sessionId, chatId, step: state.stepNumber }, 'tool phase threw unexpectedly');
state.shouldStop = true;
}
}
// -- OBSERVE node ---------------------------------------------------------
// Processes tool results: updates loop locals, mistake tracking, build errors.
async function observeNode(
ctx: InferenceContext,
args: TurnArgs,
state: GraphState,
_agent: Agent | null,
): Promise<void> {
const { sessionId, chatId } = args;
const tpr = state.toolPhaseResult;
if (!tpr) {
state.shouldStop = true;
return;
}
// Update loop locals (mirrors the existing while-loop post-tool logic)
state.toolsUsed += tpr.toolCallCount;
state.recentToolCalls = [...state.recentToolCalls, ...tpr.toolCalls];
state.stepNumber++;
// Fold tool outcomes into the mistake tracker
for (const o of tpr.outcomes) {
recordStep(state.mistakeTracker, o);
}
// Auto-fix: after write tools, attempt build and inject errors.
const WRITE_TOOLS = new Set(['edit_file', 'create_file', 'delete_file', 'apply_pending']);
const hasWriteTools = tpr.toolCalls.some((tc) => WRITE_TOOLS.has(tc.name));
if (hasWriteTools && state.iterSession) {
detectAndRunBuild(ctx, state.projectRoot, sessionId, chatId, state.iterSession.model, state.pendingRecoveryNote)
.then((buildError) => {
if (buildError) state.pendingRecoveryNote = buildError;
})
.catch(() => {});
}
}
// -- REFLECT node ---------------------------------------------------------
// Post-tool decision: decidePostToolAction, nudge/escalate/continue handling.
async function reflectNode(
ctx: InferenceContext,
args: TurnArgs,
state: GraphState,
_agent: Agent | null,
): Promise<void> {
const { sessionId, chatId, signal } = args;
const tpr = state.toolPhaseResult;
if (!tpr) {
state.shouldStop = true;
return;
}
const post = decidePostToolAction(tpr.action, state.mistakeTracker);
if (post === 'stop') {
state.shouldStop = true;
return;
}
if (post === 'nudge') {
state.pendingRecoveryNote = MISTAKE_RECOVERY_NOTE;
const failureKinds = [...state.mistakeTracker.run];
await insertMistakeRecoverySentinel(ctx, sessionId, chatId, {
failureKinds,
count: failureKinds.length,
escalated: false,
canContinue: true,
});
state.mistakeTracker.nudges += 1;
state.mistakeTracker.run = [];
ctx.log.info(
{ sessionId, chatId, step: state.stepNumber, nudges: state.mistakeTracker.nudges, failureKinds },
'mistake_recovery nudge',
);
// Continue to next PLAN node — edges check step < cap.
if (state.assistantMessageId !== tpr.nextAssistantId && tpr.nextAssistantId) {
state.assistantMessageId = tpr.nextAssistantId;
}
return;
}
if (post === 'escalate') {
const failureKinds = [...state.mistakeTracker.run];
if (tpr.nextAssistantId) {
state.assistantMessageId = tpr.nextAssistantId;
}
const escalateArgs: TurnArgs = {
sessionId, chatId, assistantMessageId: state.assistantMessageId,
toolsUsed: state.toolsUsed, recentToolCalls: state.recentToolCalls,
mistakeTracker: state.mistakeTracker, signal,
};
await finalizeEmpty(ctx, escalateArgs);
await insertMistakeRecoverySentinel(ctx, sessionId, chatId, {
failureKinds,
count: failureKinds.length,
escalated: true,
canContinue: true,
});
ctx.publishUser({ type: 'chat_status', chat_id: chatId, status: 'idle', at: new Date().toISOString() });
ctx.log.info(
{ sessionId, chatId, step: state.stepNumber, failureKinds },
'mistake_recovery escalate — stopping turn',
);
state.shouldStop = true;
return;
}
// 'continue' — advance to next assistant message.
if (tpr.nextAssistantId) {
state.assistantMessageId = tpr.nextAssistantId;
}
}

View File

@@ -13,7 +13,7 @@ import type { OpenAiMessage } from './payload.js';
import { extractToolCallBlocks } from './tool-call-parser.js';
import { classifyStreamError } from './stream-error-classifier.js';
import type { StreamResult } from './types.js';
import { upstreamModel } from './provider.js';
import { isDeepSeekModel, upstreamModel } from './provider.js';
import {
jsonSchema,
streamText,
@@ -51,6 +51,9 @@ export interface StreamOptions {
dry_base?: number | null;
dry_allowed_length?: number | null;
dry_penalty_last_n?: number | null;
// vDeepSeek: thinking/reasoning effort. Maps to DeepSeek's reasoning_effort
// API param for deepseek-v4-flash / deepseek-v4-pro models.
reasoning_effort?: 'off' | 'low' | 'medium' | 'high' | 'xhigh' | 'max';
}
// P5: the 10-field sampler-options literal that was copy-pasted at 4 sites
@@ -74,6 +77,7 @@ export function samplerOptsFromAgent(agent: Agent | null): SamplerOpts {
dry_base: agent?.dry_base ?? undefined,
dry_allowed_length: agent?.dry_allowed_length ?? undefined,
dry_penalty_last_n: agent?.dry_penalty_last_n ?? undefined,
reasoning_effort: agent?.reasoning_effort ?? undefined,
};
}
@@ -272,6 +276,19 @@ export async function streamCompletion(
// before this. They now go through the same extraBody path as the new params.
const samplerBody = buildSamplerProviderOptions(opts);
// vDeepSeek: build providerOptions.deepseek for DeepSeek V4 models.
let deepseekProviderOptions:
| { thinking: { type: 'enabled' | 'disabled' }; reasoningEffort?: 'low' | 'medium' | 'high' | 'xhigh' | 'max' }
| undefined;
if (isDeepSeekModel(model)) {
const dsEffort = opts.reasoning_effort;
const thinkingEnabled = dsEffort && dsEffort !== 'off';
deepseekProviderOptions = {
thinking: { type: thinkingEnabled ? 'enabled' : 'disabled' },
...(thinkingEnabled ? { reasoningEffort: dsEffort } : {}),
};
}
// F6: per-chunk stall deadline. If the model stops emitting chunks for
// STALL_TIMEOUT_MS the stallAc fires through AbortSignal.any; the post-loop
// abort check below then throws AbortError → handleAbortOrError writes
@@ -297,7 +314,14 @@ export async function streamCompletion(
...(typeof opts.temperature === 'number' ? { temperature: opts.temperature } : {}),
...(typeof opts.top_p === 'number' ? { topP: opts.top_p } : {}),
...(typeof opts.presence_penalty === 'number' ? { presencePenalty: opts.presence_penalty } : {}),
...(samplerBody ? { providerOptions: { openaiCompatible: samplerBody } } : {}),
...(samplerBody || deepseekProviderOptions
? {
providerOptions: {
...(samplerBody ? { openaiCompatible: samplerBody } : {}),
...(deepseekProviderOptions ? { deepseek: deepseekProviderOptions } : {}),
},
}
: {}),
abortSignal: effectiveSignal,
});
@@ -401,12 +425,26 @@ export async function streamCompletion(
// Usage lands as a promise on the result; awaiting after fullStream is
// drained is safe. AI SDK v6 names: `inputTokens` / `outputTokens`.
// Some providers (llama-swap via openai-compatible) return plain numbers;
// others (deepseek via @ai-sdk/deepseek) return {total, cacheRead, noCache, ...}.
let promptTokens: number | null = null;
let completionTokens: number | null = null;
let cacheReadTokens: number | null = null;
let reasoningTokens: number | null = null;
try {
const usage = await result.usage;
if (typeof usage.inputTokens === 'number') promptTokens = usage.inputTokens;
if (typeof usage.outputTokens === 'number') completionTokens = usage.outputTokens;
if (typeof usage.inputTokens === 'number') {
promptTokens = usage.inputTokens;
} else if (usage.inputTokens && typeof usage.inputTokens === 'object') {
promptTokens = (usage.inputTokens as Record<string, number | undefined>).total ?? null;
cacheReadTokens = (usage.inputTokens as Record<string, number | undefined>).cacheRead ?? null;
}
if (typeof usage.outputTokens === 'number') {
completionTokens = usage.outputTokens;
} else if (usage.outputTokens && typeof usage.outputTokens === 'object') {
completionTokens = (usage.outputTokens as Record<string, number | undefined>).total ?? null;
reasoningTokens = (usage.outputTokens as Record<string, number | undefined>).reasoning ?? null;
}
} catch {
// Some providers omit usage on partial streams; leave both null.
}
@@ -422,6 +460,13 @@ export async function streamCompletion(
);
}
if (cacheReadTokens !== null || reasoningTokens !== null) {
ctx.log.debug(
{ promptTokens, completionTokens, cacheReadTokens, reasoningTokens, model },
'streamCompletion: deepseek usage breakdown',
);
}
return {
finishReason,
content,
@@ -429,6 +474,10 @@ export async function streamCompletion(
promptTokens,
completionTokens,
reasoning: reasoningAccumulated,
// vDeepSeek: optional usage breakdown populated when the provider returns
// structured usage (cache hit tokens, reasoning tokens).
cacheReadTokens: cacheReadTokens ?? undefined,
reasoningTokens: reasoningTokens ?? undefined,
};
} finally {
// Clear the stall timer whether the stream completes normally, throws, or

View File

@@ -56,6 +56,7 @@ export async function executeStreamPhase(
message_id: assistantMessageId,
chat_id: chatId,
role: 'assistant',
...(args.compareGroupId ? { compare_group_id: args.compareGroupId } : {}),
});
const flusher = createContentFlusher(ctx.sql, assistantMessageId, () => state.accumulated);
@@ -119,6 +120,7 @@ export async function executeStreamPhase(
message_id: assistantMessageId,
chat_id: chatId,
content: delta,
...(args.compareGroupId ? { compare_group_id: args.compareGroupId } : {}),
});
ctx.log.debug({ sessionId, delta }, 'inference delta');
flusher.scheduleFlush();

View File

@@ -0,0 +1,75 @@
// Supervisor agent: routes user requests to the best agent via a cheap LLM
// classification call. Activated when session.agent_id === 'supervisor'.
import type { Agent } from '../../types/api.js';
import { taskModelCompletion } from '../task-model.js';
export interface SupervisorRoute {
agent_id: string;
confidence: number;
reasoning: string;
}
const SUPERVISOR_SYSTEM_PROMPT = `You are a router. Given the user's request and the available agents, choose the best agent to handle the request.
Rules:
- Match the request to the agent whose description and toolset best fits the task.
- For code review / bug finding requests → code-reviewer
- For debugging / diagnosing failures → debugger
- For refactoring / simplifying code → refactorer
- For architecture / design / planning → architect or planner
- For security audits → security-auditor
- For building prompts for other agents → prompt-builder
- For exploring / understanding unfamiliar code → recon
- For implementing / writing code changes → builder
- Respond with ONLY the agent id (e.g. "builder") or "none" if no agent fits.
- Do not include any other text, punctuation, or explanation.`;
const MAX_ROUTING_TOKENS = 30;
/**
* Given the user's latest message and available agents, classifies which agent
* should handle this turn. Returns null to fall through to default (no agent).
*/
export async function resolveSupervisorTurn(
latestUserMessage: string,
agents: Agent[],
fallbackModel?: string,
): Promise<SupervisorRoute | null> {
// Build agent listing — skip the supervisor itself to avoid self-routing.
const agentList = agents
.filter((a) => a.id !== 'supervisor')
.map((a) => `- ${a.id}: ${a.description} (${a.tools.length} tools)`)
.join('\n');
if (!agentList) {
return null;
}
const userPrompt = `Available agents:\n${agentList}\n\nUser request: ${latestUserMessage.slice(0, 2000)}`;
const response = await taskModelCompletion({
system: SUPERVISOR_SYSTEM_PROMPT,
user: userPrompt,
maxTokens: MAX_ROUTING_TOKENS,
temperature: 0.1,
fallbackModel,
});
const agentId = response.trim().toLowerCase();
if (!agentId || agentId === 'none') {
return null;
}
// Map back to a real agent to validate the id.
const matched = agents.find((a) => a.id === agentId);
if (!matched) {
return null;
}
return {
agent_id: matched.id,
confidence: 1,
reasoning: `supervisor routed to "${matched.name}" based on request classification`,
};
}

View File

@@ -0,0 +1,179 @@
/**
* vWhale: schema-based tool input repair. When the model emits tool call args
* that don't match the expected types (common with weaker models), apply
* heuristic repairs before falling through to the Zod parse.
*
* Inspired by Whale's RepairToolInputForSpec:
* - Coerce string "true"/"false" → boolean
* - Unwrap markdown autolinks in string fields: <file:///path> → /path
* - Wrap bare values in arrays when schema expects array
* - Convert "42.0" decimal string → "42" for integer fields
* - Recurse into objects to repair nested properties
*/
export interface ToolInputRepair {
field: string;
kind: string;
detail: string;
}
const MARKDOWN_AUTOLINK_RE = /^<(?:file|path):\/\/(.+?)>$/;
/**
* Attempt to repair tool call args against the tool's JSON Schema.
* Returns the (possibly modified) args plus a list of repairs applied.
*/
export function repairToolInput(
schema: Record<string, unknown> | undefined,
args: Record<string, unknown>,
): { repaired: Record<string, unknown>; repairs: ToolInputRepair[] } {
const repairs: ToolInputRepair[] = [];
if (!schema || typeof schema !== 'object') {
return { repaired: args, repairs };
}
const properties = (schema as Record<string, unknown>).properties as
Record<string, unknown> | undefined;
if (!properties) {
return { repaired: args, repairs };
}
const required = new Set<string>(
Array.isArray((schema as Record<string, unknown>).required)
? (schema as Record<string, unknown>).required as string[]
: [],
);
const repaired: Record<string, unknown> = {};
for (const [key, value] of Object.entries(args)) {
const propSchema = properties[key] as Record<string, unknown> | undefined;
if (propSchema && value !== null && value !== undefined) {
repaired[key] = repairValue(key, propSchema, value, repairs, required.has(key));
} else {
repaired[key] = value;
}
}
// Drop keys not in the schema (only for required fields that are missing)
// to avoid polluting the model with hallucinated params.
for (const key of Object.keys(repaired)) {
if (!(key in properties)) {
repairs.push({ field: key, kind: 'removed_unknown', detail: `Removed unknown parameter '${key}'` });
delete repaired[key];
}
}
return { repaired, repairs };
}
function repairValue(
field: string,
schema: Record<string, unknown>,
value: unknown,
repairs: ToolInputRepair[],
required: boolean,
): unknown {
const schemaType = schema.type;
const isArray = schemaType === 'array' || Array.isArray(schemaType)
? schemaType === 'array' || (Array.isArray(schemaType) && schemaType.includes('array'))
: false;
const isObject = schemaType === 'object';
const isBoolean = schemaType === 'boolean';
const isInteger = schemaType === 'integer' || schemaType === 'number';
const isString = schemaType === 'string';
// --- Array repair: wrap bare value or empty object ---
if (isArray) {
if (!Array.isArray(value)) {
if (typeof value === 'string') {
// Try parsing as JSON array first
try {
const parsed = JSON.parse(value);
if (Array.isArray(parsed)) {
repairs.push({ field, kind: 'parsed_json_array', detail: `Parsed string as JSON array for '${field}'` });
return parsed;
}
} catch { /* not JSON */ }
}
if (typeof value === 'object' && value !== null && Object.keys(value).length === 0) {
if (required) {
repairs.push({ field, kind: 'empty_object_to_array', detail: `Converted empty object to empty array for '${field}'` });
return [];
}
repairs.push({ field, kind: 'empty_object_to_undefined', detail: `Removed empty object for optional array '${field}'` });
return undefined;
}
repairs.push({ field, kind: 'wrapped_in_array', detail: `Wrapped bare value in array for '${field}'` });
return [value];
}
// Recurse into array items
const itemsSchema = schema.items as Record<string, unknown> | undefined;
if (itemsSchema) {
return value.map((item, i) => repairValue(`${field}[${i}]`, itemsSchema, item, repairs, required));
}
return value;
}
// --- Object repair: recurse into properties ---
if (isObject && typeof value === 'object' && value !== null && !Array.isArray(value)) {
const props = (schema.properties as Record<string, unknown>) ?? {};
const repaired: Record<string, unknown> = {};
for (const [k, v] of Object.entries(value as Record<string, unknown>)) {
const propSchema = props[k] as Record<string, unknown> | undefined;
if (propSchema) {
repaired[k] = repairValue(`${field}.${k}`, propSchema, v, repairs, required);
} else {
repaired[k] = v;
}
}
return repaired;
}
// --- String repair: unwrap markdown autolinks ---
if (isString && typeof value === 'string') {
const match = value.match(MARKDOWN_AUTOLINK_RE);
if (match) {
repairs.push({ field, kind: 'unwrapped_markdown_link', detail: `Unwrapped markdown autolink for '${field}': ${value}` });
return match[1];
}
return value;
}
// --- Boolean coercion ---
if (isBoolean && typeof value === 'string') {
const lower = value.toLowerCase();
if (lower === 'true') {
repairs.push({ field, kind: 'coerced_to_boolean', detail: `Coerced string '${value}' → true for '${field}'` });
return true;
}
if (lower === 'false') {
repairs.push({ field, kind: 'coerced_to_boolean', detail: `Coerced string '${value}' → false for '${field}'` });
return false;
}
return value;
}
// --- Integer coercion: "42.0" → 42 ---
if (isInteger && typeof value === 'string') {
const num = Number(value);
if (!Number.isNaN(num)) {
repairs.push({ field, kind: 'coerced_to_number', detail: `Coerced string '${value}' → ${num} for '${field}'` });
return num;
}
return value;
}
// --- Integer coercion: boolean → 0/1 ---
if (isInteger && typeof value === 'boolean') {
repairs.push({ field, kind: 'coerced_boolean_to_integer', detail: `Coerced boolean ${value}${value ? 1 : 0} for '${field}'` });
return value ? 1 : 0;
}
// --- Empty string to null for optional fields ---
if (value === '' && !required) {
repairs.push({ field, kind: 'empty_string_to_undefined', detail: `Converted empty string for optional '${field}'` });
return undefined;
}
return value;
}

View File

@@ -6,6 +6,7 @@ import type { ToolExecCtx } from '../tools.js';
import { matchToolGlob } from '../agents.js';
import { maybeFlagForCompaction } from './payload.js';
import { insertParts, partsFromAssistantMessage, partsFromToolMessage } from './parts.js';
import { getServerPermission } from '../mcp-client.js';
// v1.13.16: richer unknown-tool error so the model can self-correct when it
// drifts to a Claude Code tool name (e.g. read_file → suggest view_file).
// Applies to all unknown tool names, not just <invoke>-derived ones — at the
@@ -17,7 +18,10 @@ import { formatUnknownToolError } from './tool-suggestions.js';
// prompted about paths we couldn't grant anyway (e.g. /etc/passwd).
import { resolveGrantRoot } from '../grant_resolver.js';
import { stripToolMarkup } from './tool-call-parser.js';
import { repairToolInput } from './tool-input-repair.js';
import { diffFromToolArgs, isWriteTool } from './compute-diff.js';
import type { FailureKind } from './mistake-tracker.js';
import { insertToolTrace, updateToolTrace } from '../tool-traces.js';
import type {
InferenceContext,
StreamResult,
@@ -34,6 +38,8 @@ async function executeToolCall(
toolCall: ToolCall,
extraRoots: readonly string[],
toolCtx?: ToolExecCtx,
hooks?: import('../hooks.js').HookRunner,
sessionId?: string,
): Promise<{ output: unknown; truncated: boolean; error?: string; outcome: FailureKind | 'success' }> {
// v#12 MistakeTracker: every return path carries an `outcome` so the turn
// loop can detect a run of heterogeneous failures. The failure taxonomy
@@ -48,7 +54,61 @@ async function executeToolCall(
outcome: 'tool_not_found',
};
}
const parsed = tool.inputSchema.safeParse(toolCall.args);
// MCP permission gate — block deny/ask before any Zod parsing or execution
const mcpPerm = getServerPermission(toolCall.name);
if (mcpPerm === 'deny') {
return { output: null, truncated: false, error: `blocked: MCP server denied tool '${toolCall.name}'`, outcome: 'permission_denied' };
}
if (mcpPerm === 'ask') {
return { output: null, truncated: false, error: `requires approval: tool '${toolCall.name}' needs user approval`, outcome: 'permission_denied' };
}
// vWhale: schema-based tool input repair. If the Zod parse fails, attempt
// heuristic repairs (type coercion, markdown-link unwrapping, array wrapping)
// and retry. Logs repairs for debugging.
let args = toolCall.args;
let parsed = tool.inputSchema.safeParse(args);
if (!parsed.success) {
const schema = tool.jsonSchema?.function?.parameters;
if (schema) {
const { repaired: repairedArgs, repairs } = repairToolInput(
schema as Record<string, unknown>,
args as Record<string, unknown>,
);
if (repairs.length > 0) {
const retry = tool.inputSchema.safeParse(repairedArgs);
if (retry.success) {
args = repairedArgs;
parsed = retry;
}
}
}
}
// vWhale: PreToolUse hook — can block execution.
if (hooks && sessionId) {
const hookResult = await hooks.run('PreToolUse', {
event: 'PreToolUse',
session_id: sessionId,
tool_name: toolCall.name,
tool_args: args as Record<string, unknown>,
});
if (hookResult.decision === 'block') {
return {
output: null,
truncated: false,
error: `blocked by hook: ${hookResult.reason ?? 'PreToolUse denied'}`,
outcome: 'permission_denied',
};
}
// Apply updated_input if the hook rewrote the args
if (hookResult.updated_input && typeof hookResult.updated_input === 'object') {
const reParsed = tool.inputSchema.safeParse(hookResult.updated_input);
if (reParsed.success) {
args = hookResult.updated_input as Record<string, unknown>;
parsed = reParsed;
}
}
}
if (!parsed.success) {
// v1.12 Track B.2: enrich the zod-reject path so the model sees a
// one-line, tool-named hint ("tool 'search_symbols' rejected — query:
@@ -117,6 +177,7 @@ export async function executeToolPhase(
session: Session,
projectRoot: string,
agent?: Agent | null,
turnNumber?: number,
): Promise<ToolPhaseResult> {
const { sessionId, chatId, assistantMessageId } = args;
const content = stripToolMarkup(result.content, { final: true });
@@ -183,6 +244,8 @@ export async function executeToolPhase(
tokens_used: updated?.tokens_used ?? null,
ctx_used: updated?.ctx_used ?? null,
ctx_max: updated?.ctx_max ?? null,
cache_tokens: result.cacheReadTokens ?? null,
reasoning_tokens: result.reasoningTokens ?? null,
started_at: startedAt,
finished_at: updated?.finished_at ?? null,
model: session.model,
@@ -318,10 +381,64 @@ export async function executeToolPhase(
});
return;
}
const tres = await executeToolCall(projectRoot, tc, session.allowed_read_paths, {
sql: ctx.sql,
sessionId,
// tool_trace instrumentation - start
const traceId = crypto.randomUUID();
const traceStartTime = Date.now();
const startedAtIso = new Date().toISOString();
insertToolTrace(ctx.sql, {
session_id: sessionId,
chat_id: chatId,
message_id: assistantMessageId,
turn_number: turnNumber ?? 0,
tool_name: tc.name,
tool_input: tc.args as Record<string, unknown>,
}).catch(() => {});
ctx.publish(sessionId, {
type: 'tool_trace_start',
trace_id: traceId,
message_id: assistantMessageId,
chat_id: chatId,
tool_name: tc.name,
tool_input: tc.args as Record<string, unknown>,
started_at: startedAtIso,
});
const tres = await executeToolCall(
projectRoot, tc, session.allowed_read_paths,
{ sql: ctx.sql, sessionId },
ctx.hooks, sessionId,
);
// tool_trace instrumentation - finish
const finishedAtIso = new Date().toISOString();
const latencyMs = Date.now() - traceStartTime;
updateToolTrace(ctx.sql, traceId, {
finished_at: finishedAtIso,
...(tres.outcome === 'success' && tres.output != null ? { tool_output: JSON.stringify(tres.output) } : {}),
latency_ms: latencyMs,
outcome: tres.outcome,
...(tres.error ? { error: tres.error } : {}),
}).catch(() => {});
ctx.publish(sessionId, {
type: 'tool_trace_finish',
trace_id: traceId,
message_id: assistantMessageId,
chat_id: chatId,
tool_name: tc.name,
finished_at: finishedAtIso,
outcome: tres.outcome,
latency_ms: latencyMs,
...(tres.error ? { error: tres.error } : {}),
});
// vWhale: PostToolUse hook (best-effort, non-blocking).
if (ctx.hooks) {
ctx.hooks.run('PostToolUse', {
event: 'PostToolUse',
session_id: sessionId,
tool_name: tc.name,
tool_args: tc.args as Record<string, unknown>,
tool_result: tres.output,
tool_error: tres.error,
}).catch(() => {});
}
// v#12 MistakeTracker: record the real execution outcome (success or a
// FailureKind). This is the primary signal for heterogeneous-failure
// detection.
@@ -329,6 +446,16 @@ export async function executeToolPhase(
if (SYNTHESIS_TOOLS.has(tc.name)) {
synthEntries.push({ tc, output: tres.output, ...(tres.error ? { error: tres.error } : {}) });
}
// v2.8: compute a compact unified diff for successful write-tool results.
// The diff is derived from tool call args (old_string/new_string for
// edit_file, content for create_file) and included in the WS frame so
// the frontend can render a DiffSnippet inline. Not persisted to message_parts
// (the args alone are enough to reproduce it on reload if needed).
const toolDiff =
!tres.error && tres.outcome === 'success' && isWriteTool(tc.name)
? diffFromToolArgs(tc.name, tc.args as Record<string, unknown>)
: undefined;
const stored = {
tool_call_id: tc.id,
output: tres.output,
@@ -351,6 +478,7 @@ export async function executeToolPhase(
output: tres.output,
truncated: tres.truncated,
...(tres.error ? { error: tres.error } : {}),
...(toolDiff ? { diff: toolDiff } : {}),
});
})
);

View File

@@ -8,7 +8,7 @@ import type {
import { resolveProjectRoot } from '../path_guard.js';
import { maybeAutoNameChat } from '../auto_name.js';
import { rewriteSearchQuery } from '../task-search-rewrite.js';
import { getAgentById } from '../agents.js';
import { getAgentById, getAgentsForProject } from '../agents.js';
import * as compaction from '../compaction.js';
import { resolveTurnConfig } from './turn-config.js';
import { decideStep, decidePostToolAction } from './step-decision.js';
@@ -37,12 +37,85 @@ import type {
StreamResult,
TurnArgs,
} from './types.js';
import { saveAgentSnapshot } from '../session-snapshots.js';
// vWhale: auto-fix loop — after write tools, build the project and inject
// errors. Uses execFile (no shell) against the project root.
import { execFile } from 'node:child_process';
import { readFileSync, existsSync } from 'node:fs';
import { join } from 'node:path';
import {
runCapHitSummary,
runDoomLoopSummary,
runStepCapSummary,
insertMistakeRecoverySentinel,
} from './sentinel-summaries.js';
import { resolveSupervisorTurn } from './supervisor.js';
import { runGraph } from './state-graph.js';
// vWhale: auto-fix — detect build command from package.json, run it, return
// error text for injection into next iteration. Best-effort, never throws.
const BUILD_TIMEOUT_MS = 60_000;
const BUILD_OUTPUT_CAP = 8_000;
async function detectAndRunBuild(
ctx: InferenceContext,
projectRoot: string,
sessionId: string,
chatId: string,
model: string,
existingNote: string | undefined,
): Promise<string | undefined> {
// Only run for DeepSeek models (local Qwen models don't benefit from build loop).
if (!model.startsWith('deepseek-')) return undefined;
// Detect build command from package.json in project root.
const pkgPath = join(projectRoot, 'package.json');
if (!existsSync(pkgPath)) return undefined;
let buildCmd: string | null = null;
try {
const pkg = JSON.parse(readFileSync(pkgPath, 'utf8')) as { scripts?: Record<string, string> };
if (pkg.scripts?.build) buildCmd = 'build';
else if (pkg.scripts?.compile) buildCmd = 'compile';
else if (pkg.scripts?.typecheck) buildCmd = 'typecheck';
} catch {
return undefined;
}
if (!buildCmd) return undefined;
// Detect package manager.
const hasPnpm = existsSync(join(projectRoot, 'pnpm-lock.yaml'));
const hasYarn = existsSync(join(projectRoot, 'yarn.lock'));
const pm = hasPnpm ? 'pnpm' : hasYarn ? 'yarn' : 'npm';
// Run the build.
try {
const out = await new Promise<string>((resolve, reject) => {
execFile(pm, ['run', buildCmd!], { cwd: projectRoot, timeout: BUILD_TIMEOUT_MS, maxBuffer: BUILD_OUTPUT_CAP * 2 },
(err, stdout, stderr) => {
if (err && (err as NodeJS.ErrnoException).code === 'ENOENT') {
resolve(''); // package manager not found — skip
return;
}
const merged = (stdout + '\n' + stderr).trim();
resolve(merged.slice(0, BUILD_OUTPUT_CAP));
},
);
});
if (!out) return undefined; // build succeeded or no output
ctx.log.info({ sessionId, chatId, buildCmd, outputLen: out.length }, 'auto-fix: build failed');
// Truncate if existing note exists
const combined = existingNote
? existingNote + '\n\n--- Build error ---\n' + out.slice(0, BUILD_OUTPUT_CAP - existingNote.length)
: '--- Build error ---\n' + out.slice(0, BUILD_OUTPUT_CAP);
return combined;
} catch {
return undefined;
}
}
// P5: MAX_STEPS moved to ./turn-config.ts (with resolveTurnConfig). Re-exported
// here so the public surface (index.ts → './turn.js') is unchanged.
@@ -78,10 +151,39 @@ export async function runAssistantTurn(
ctx.log.warn({ sessionId }, 'inference: session or project missing');
return;
}
const { session, project } = initialLoaded;
const agent = session.agent_id
let { session, project, history: initialHistory } = initialLoaded;
if (args.modelOverride) {
session = { ...session, model: args.modelOverride };
}
let agent = session.agent_id
? await getAgentById(project.path, session.agent_id)
: null;
// vSupervisor: if the session is set to supervisor mode, resolve the real
// agent via a cheap classification call. Falls through to default (no agent)
// if routing returns null.
if (agent?.id === 'supervisor') {
const { agents: availableAgents } = await getAgentsForProject(project.path);
const latestUser = [...initialHistory].reverse().find((m) => m.role === 'user');
const userMessage = latestUser?.content ?? '';
if (userMessage) {
const route = await resolveSupervisorTurn(userMessage, availableAgents, session.model ?? undefined);
if (route) {
ctx.log.info(
{ sessionId, chatId, resolvedAgent: route.agent_id, reasoning: route.reasoning },
'supervisor: routed turn',
);
agent = await getAgentById(project.path, route.agent_id);
} else {
ctx.log.info({ sessionId, chatId }, 'supervisor: no agent matched, falling through to default');
agent = null;
}
} else {
ctx.log.info({ sessionId, chatId }, 'supervisor: no user message found, falling through to default');
agent = null;
}
}
// P5: pure per-turn config (budget + cap math + text-only flag).
const { effectiveCap, budget, isTextOnly } = resolveTurnConfig(agent);
@@ -91,7 +193,8 @@ export async function runAssistantTurn(
if (isTextOnly) {
const loaded = await loadContext(ctx.sql, sessionId, chatId);
if (loaded) {
await runTextOnlyTurn(ctx, args, loaded.session, loaded.project, loaded.history, agent);
const txtSession = args.modelOverride ? { ...loaded.session, model: args.modelOverride } : loaded.session;
await runTextOnlyTurn(ctx, args, txtSession, loaded.project, loaded.history, agent);
}
return;
}
@@ -107,206 +210,273 @@ export async function runAssistantTurn(
const mistakeTracker = args.mistakeTracker;
let pendingRecoveryNote: string | undefined = args.pendingRecoveryNote;
while (stepNumber < effectiveCap) {
// ---- top-of-loop gate: doom-loop, then budget (pure decision) ----
const decision = decideStep({ recentToolCalls, toolsUsed, budget });
if (decision.kind === 'doom') {
// Need fresh history for the summary.
const loaded = await loadContext(ctx.sql, sessionId, chatId);
if (loaded) {
const iterArgs: TurnArgs = { sessionId, chatId, assistantMessageId, toolsUsed, recentToolCalls, mistakeTracker, signal };
await runDoomLoopSummary(ctx, iterArgs, loaded.session, loaded.project, loaded.history, agent, decision.loop);
if (session.state_graph_enabled) {
// ---- optional state graph path ----
const gProjectRoot = await resolveProjectRoot(project.path);
const graphResult = await runGraph(ctx, args, { effectiveCap, budget, agent, projectRoot: gProjectRoot });
stepNumber = graphResult.stepNumber;
toolsUsed = graphResult.toolsUsed;
recentToolCalls = graphResult.recentToolCalls;
assistantMessageId = graphResult.assistantMessageId;
// mistakeTracker is the same object reference (mutated in place by the graph).
} else {
while (stepNumber < effectiveCap) {
// ---- top-of-loop gate: doom-loop, then budget (pure decision) ----
const decision = decideStep({ recentToolCalls, toolsUsed, budget });
if (decision.kind === 'doom') {
// Need fresh history for the summary.
const loaded = await loadContext(ctx.sql, sessionId, chatId);
if (loaded) {
const dlSession = args.modelOverride ? { ...loaded.session, model: args.modelOverride } : loaded.session;
const iterArgs: TurnArgs = { sessionId, chatId, assistantMessageId, toolsUsed, recentToolCalls, mistakeTracker, signal };
await runDoomLoopSummary(ctx, iterArgs, dlSession, loaded.project, loaded.history, agent, decision.loop);
}
break;
}
break;
}
if (decision.kind === 'budget') {
const loaded = await loadContext(ctx.sql, sessionId, chatId);
if (loaded) {
const iterArgs: TurnArgs = { sessionId, chatId, assistantMessageId, toolsUsed, recentToolCalls, mistakeTracker, signal };
await runCapHitSummary(ctx, iterArgs, loaded.session, loaded.project, loaded.history, agent, budget);
if (decision.kind === 'budget') {
const loaded = await loadContext(ctx.sql, sessionId, chatId);
if (loaded) {
const bhSession = args.modelOverride ? { ...loaded.session, model: args.modelOverride } : loaded.session;
const iterArgs: TurnArgs = { sessionId, chatId, assistantMessageId, toolsUsed, recentToolCalls, mistakeTracker, signal };
await runCapHitSummary(ctx, iterArgs, bhSession, loaded.project, loaded.history, agent, budget);
}
break;
}
break;
}
// decision.kind === 'stream' → proceed with compaction + stream + tools.
// decision.kind === 'stream' → proceed with compaction + stream + tools.
// ---- compaction check ----
// v1.11: if the prior turn flagged this chat for compaction, run it
// before loadContext so we read post-compaction history. Swallow
// failures and proceed with un-compacted history.
const chatFlag = await ctx.sql<{ needs_compaction: boolean }[]>`
SELECT needs_compaction FROM chats WHERE id = ${chatId}
`;
if (chatFlag[0]?.needs_compaction) {
try {
await compaction.process({
sql: ctx.sql,
config: ctx.config,
log: ctx.log,
broker: ctx.broker,
chatId,
});
} catch (err) {
ctx.log.warn({ err, chatId }, 'auto-compaction failed; clearing flag and proceeding');
await ctx.sql`UPDATE chats SET needs_compaction = false WHERE id = ${chatId}`;
}
}
// ---- load context (must re-load each iteration — new messages since last step) ----
const loaded = await loadContext(ctx.sql, sessionId, chatId);
if (!loaded) {
ctx.log.warn({ sessionId }, 'inference: session or project missing mid-loop');
break;
}
let { session: iterSession, project: iterProject, history } = loaded;
const projectRoot = await resolveProjectRoot(iterProject.path);
try {
const dcpMsgs = toDcpMessages(history);
const { messages: pruned, stats } = transformMessages(chatId, dcpMsgs);
if (stats.removedCount > 0) {
ctx.log.info({ chatId, ...stats }, 'dcp: transform removed messages');
history = fromDcpMessages(pruned) as typeof history;
}
} catch (err) {
ctx.log.warn({ err: err instanceof Error ? err.message : String(err), chatId }, 'dcp: transform skipped');
}
// v1.14.0: log step boundary for instrumentation. step_start parts are in
// the schema CHECK but not emitted here — writing to the assistant message
// before the stream phase creates a sequence-0 collision with
// partsFromAssistantMessage. A WS frame or structured log is sufficient
// since the frontend doesn't render step boundaries in v1.14.
ctx.log.info({ sessionId, chatId, step: stepNumber, assistantMessageId }, 'step_start');
// ---- build messages + stream phase ----
const messages = await buildMessagesPayload(iterSession, iterProject, history, agent, ctx.log);
const webToolsEnabled =
iterSession.web_search_enabled ?? iterProject.default_web_search_enabled ?? false;
if (stepNumber === 0 && webToolsEnabled && messages.length >= 2) {
const lastUserMsg = [...messages].reverse().find((m) => m.role === 'user');
if (lastUserMsg?.content) {
const hint = await rewriteSearchQuery(lastUserMsg.content);
if (hint && messages[0]?.role === 'system' && messages[0].content) {
messages[0].content += `\n\nThe user's search intent can be summarized as: "${hint}"`;
// ---- compaction check ----
// v1.11: if the prior turn flagged this chat for compaction, run it
// before loadContext so we read post-compaction history. Swallow
// failures and proceed with un-compacted history.
const chatFlag = await ctx.sql<{ needs_compaction: boolean }[]>`
SELECT needs_compaction FROM chats WHERE id = ${chatId}
`;
if (chatFlag[0]?.needs_compaction) {
try {
await compaction.process({
sql: ctx.sql,
config: ctx.config,
log: ctx.log,
broker: ctx.broker,
chatId,
hooks: ctx.hooks,
});
} catch (err) {
ctx.log.warn({ err, chatId }, 'auto-compaction failed; clearing flag and proceeding');
await ctx.sql`UPDATE chats SET needs_compaction = false WHERE id = ${chatId}`;
}
}
}
// v#12 MistakeTracker: if the prior iteration's nudge fired, append the
// transient recovery note to THIS payload (consumed exactly once, then
// cleared). Never persisted — same lifecycle as the cap-hit/doom-loop
// summary notes, which live only inside the in-memory messages array.
if (pendingRecoveryNote) {
messages.push({ role: 'system', content: pendingRecoveryNote });
pendingRecoveryNote = undefined;
}
// ---- load context (must re-load each iteration — new messages since last step) ----
const loaded = await loadContext(ctx.sql, sessionId, chatId);
if (!loaded) {
ctx.log.warn({ sessionId }, 'inference: session or project missing mid-loop');
break;
}
let { session: iterSession, project: iterProject, history } = loaded;
if (args.modelOverride) {
iterSession = { ...iterSession, model: args.modelOverride };
}
const projectRoot = await resolveProjectRoot(iterProject.path);
const iterArgs: TurnArgs = { sessionId, chatId, assistantMessageId, toolsUsed, recentToolCalls, mistakeTracker, signal };
const state: StreamPhaseState = { accumulated: '', startedAt: null };
let result: StreamResult;
try {
result = await executeStreamPhase(ctx, iterArgs, iterSession, messages, state, agent, webToolsEnabled);
} catch (err) {
await handleAbortOrError(ctx, iterArgs, state.accumulated, err);
break;
}
try {
const dcpMsgs = toDcpMessages(history);
const { messages: pruned, stats } = transformMessages(chatId, dcpMsgs);
if (stats.removedCount > 0) {
ctx.log.info({ chatId, ...stats }, 'dcp: transform removed messages');
history = fromDcpMessages(pruned) as typeof history;
}
} catch (err) {
ctx.log.warn({ err: err instanceof Error ? err.message : String(err), chatId }, 'dcp: transform skipped');
}
// ---- non-tool finish → finalize and exit ----
if (result.toolCalls.length === 0) {
await finalizeCompletion(ctx, iterArgs, result, state.startedAt, iterSession);
break;
}
// v1.14.0: log step boundary for instrumentation. step_start parts are in
// the schema CHECK but not emitted here — writing to the assistant message
// before the stream phase creates a sequence-0 collision with
// partsFromAssistantMessage. A WS frame or structured log is sufficient
// since the frontend doesn't render step boundaries in v1.14.
ctx.log.info({ sessionId, chatId, step: stepNumber, assistantMessageId }, 'step_start');
// ---- steps: 0 edge case ----
// effectiveCap check above guarantees we're inside the loop, but this
// guard handles the theoretical case where the model emits tool calls
// on step 0 when effectiveCap would have been 0 (impossible since the
// while condition prevents entry, but kept for safety). If effectiveCap
// is 1 and we're on step 0, tool calls ARE executed — steps counts
// iterations, not post-first-stream.
// ---- build messages + stream phase ----
const messages = await buildMessagesPayload(iterSession, iterProject, history, agent, ctx.log);
const webToolsEnabled =
iterSession.web_search_enabled ?? iterProject.default_web_search_enabled ?? false;
// ---- tool phase ----
let toolPhaseResult: ToolPhaseResult;
try {
toolPhaseResult = await executeToolPhase(ctx, iterArgs, result, state.startedAt, iterSession, projectRoot, agent);
} catch (err) {
// Tool phase errors are unexpected (individual tool failures are
// caught inside executeToolPhase). Log and break.
ctx.log.error({ err, sessionId, chatId, step: stepNumber }, 'tool phase threw unexpectedly');
break;
}
if (stepNumber === 0 && webToolsEnabled && messages.length >= 2) {
const lastUserMsg = [...messages].reverse().find((m) => m.role === 'user');
if (lastUserMsg?.content) {
const hint = await rewriteSearchQuery(lastUserMsg.content);
if (hint && messages[0]?.role === 'system' && messages[0].content) {
messages[0].content += `\n\nThe user's search intent can be summarized as: "${hint}"`;
}
}
}
// ---- update loop locals ----
toolsUsed += toolPhaseResult.toolCallCount;
recentToolCalls = [...recentToolCalls, ...toolPhaseResult.toolCalls];
stepNumber++;
// v#12 MistakeTracker: if the prior iteration's nudge fired, append the
// transient recovery note to THIS payload (consumed exactly once, then
// cleared). Never persisted — same lifecycle as the cap-hit/doom-loop
// summary notes, which live only inside the in-memory messages array.
if (pendingRecoveryNote) {
messages.push({ role: 'system', content: pendingRecoveryNote });
pendingRecoveryNote = undefined;
}
// v#12 MistakeTracker: fold this iteration's tool outcomes into the
// tracker, in order. recordStep mutates `mistakeTracker` in place (it is
// the same object referenced by args). A 'success' clears the streak.
for (const o of toolPhaseResult.outcomes) {
recordStep(mistakeTracker, o);
}
const iterArgs: TurnArgs = { sessionId, chatId, assistantMessageId, toolsUsed, recentToolCalls, mistakeTracker, signal };
const state: StreamPhaseState = { accumulated: '', startedAt: null };
let result: StreamResult;
try {
result = await executeStreamPhase(ctx, iterArgs, iterSession, messages, state, agent, webToolsEnabled);
} catch (err) {
await handleAbortOrError(ctx, iterArgs, state.accumulated, err);
break;
}
// v#12 MistakeTracker: post-tool decision (pure). 'stop' = the tool phase
// returned a non-'continue' action ('paused' for user input, or
// 'synthesis_done') — neither a nudge nor an escalate would change the
// control flow, so the mistake check is skipped. On 'continue' the
// heterogeneous-failure pattern gates nudge/escalate/continue. Complements
// the doom-loop gate above, which only catches *identical* repeats.
const post = decidePostToolAction(toolPhaseResult.action, mistakeTracker);
if (post === 'stop') {
break;
}
if (post === 'nudge') {
// Soft intervention: inject model-facing recovery guidance into the NEXT
// step's payload, drop a UI sentinel, bump nudges, reset the streak, and
// continue. The note is consumed (and cleared) at the top of the next
// iteration's payload build.
pendingRecoveryNote = MISTAKE_RECOVERY_NOTE;
const failureKinds = [...mistakeTracker.run];
await insertMistakeRecoverySentinel(ctx, sessionId, chatId, {
failureKinds,
count: failureKinds.length,
escalated: false,
canContinue: true,
});
mistakeTracker.nudges += 1;
mistakeTracker.run = [];
ctx.log.info(
{ sessionId, chatId, step: stepNumber, nudges: mistakeTracker.nudges, failureKinds },
'mistake_recovery nudge',
);
// ---- non-tool finish → finalize and exit ----
if (result.toolCalls.length === 0) {
// vWhale: Stop hook (best-effort, non-blocking).
if (ctx.hooks) {
ctx.hooks.run('Stop', {
event: 'Stop',
session_id: sessionId,
chat_id: chatId,
last_assistant_text: result.content.slice(0, 500),
turn: stepNumber,
}).catch(() => {});
}
await finalizeCompletion(ctx, iterArgs, result, state.startedAt, iterSession);
break;
}
// ---- steps: 0 edge case ----
// effectiveCap check above guarantees we're inside the loop, but this
// guard handles the theoretical case where the model emits tool calls
// on step 0 when effectiveCap would have been 0 (impossible since the
// while condition prevents entry, but kept for safety). If effectiveCap
// is 1 and we're on step 0, tool calls ARE executed — steps counts
// iterations, not post-first-stream.
// ---- tool phase ----
let toolPhaseResult: ToolPhaseResult;
try {
toolPhaseResult = await executeToolPhase(ctx, iterArgs, result, state.startedAt, iterSession, projectRoot, agent, stepNumber);
} catch (err) {
// Tool phase errors are unexpected (individual tool failures are
// caught inside executeToolPhase). Log and break.
ctx.log.error({ err, sessionId, chatId, step: stepNumber }, 'tool phase threw unexpectedly');
break;
}
// ---- update loop locals ----
toolsUsed += toolPhaseResult.toolCallCount;
recentToolCalls = [...recentToolCalls, ...toolPhaseResult.toolCalls];
stepNumber++;
// v#12 MistakeTracker: fold this iteration's tool outcomes into the
// tracker, in order. recordStep mutates `mistakeTracker` in place (it is
// the same object referenced by args). A 'success' clears the streak.
for (const o of toolPhaseResult.outcomes) {
recordStep(mistakeTracker, o);
}
// vWhale: auto-fix — after write tools, attempt build and inject errors.
const WRITE_TOOLS = new Set(['edit_file', 'create_file', 'delete_file', 'apply_pending']);
const hasWriteTools = toolPhaseResult.toolCalls.some((tc) => WRITE_TOOLS.has(tc.name));
if (hasWriteTools) {
detectAndRunBuild(ctx, projectRoot, sessionId, chatId, iterSession.model, pendingRecoveryNote)
.then((buildError) => {
if (buildError) pendingRecoveryNote = buildError;
})
.catch(() => {});
}
// v#12 MistakeTracker: post-tool decision (pure). 'stop' = the tool phase
// returned a non-'continue' action ('paused' for user input, or
// 'synthesis_done') — neither a nudge nor an escalate would change the
// control flow, so the mistake check is skipped. On 'continue' the
// heterogeneous-failure pattern gates nudge/escalate/continue. Complements
// the doom-loop gate above, which only catches *identical* repeats.
const post = decidePostToolAction(toolPhaseResult.action, mistakeTracker);
if (post === 'stop') {
break;
}
if (post === 'nudge') {
// Soft intervention: inject model-facing recovery guidance into the NEXT
// step's payload, drop a UI sentinel, bump nudges, reset the streak, and
// continue. The note is consumed (and cleared) at the top of the next
// iteration's payload build.
pendingRecoveryNote = MISTAKE_RECOVERY_NOTE;
const failureKinds = [...mistakeTracker.run];
await insertMistakeRecoverySentinel(ctx, sessionId, chatId, {
failureKinds,
count: failureKinds.length,
escalated: false,
canContinue: true,
});
mistakeTracker.nudges += 1;
mistakeTracker.run = [];
ctx.log.info(
{ sessionId, chatId, step: stepNumber, nudges: mistakeTracker.nudges, failureKinds },
'mistake_recovery nudge',
);
assistantMessageId = toolPhaseResult.nextAssistantId!;
continue;
}
if (post === 'escalate') {
// The nudge didn't break the failure run — stop the turn (cap-hit-style)
// to avoid burning the whole step budget on heterogeneous failures. The
// next assistant row is still 'streaming'; finalize it as an empty
// complete row so the slot doesn't dangle, then drop the escalate
// sentinel.
const failureKinds = [...mistakeTracker.run];
assistantMessageId = toolPhaseResult.nextAssistantId!;
const escalateArgs: TurnArgs = { sessionId, chatId, assistantMessageId, toolsUsed, recentToolCalls, mistakeTracker, signal };
await finalizeEmpty(ctx, escalateArgs);
await insertMistakeRecoverySentinel(ctx, sessionId, chatId, {
failureKinds,
count: failureKinds.length,
escalated: true,
canContinue: true,
});
ctx.publishUser({ type: 'chat_status', chat_id: chatId, status: 'idle', at: new Date().toISOString() });
ctx.log.info(
{ sessionId, chatId, step: stepNumber, failureKinds },
'mistake_recovery escalate — stopping turn',
);
break;
}
// 'continue' — advance to next assistant message.
assistantMessageId = toolPhaseResult.nextAssistantId!;
continue;
}
if (post === 'escalate') {
// The nudge didn't break the failure run — stop the turn (cap-hit-style)
// to avoid burning the whole step budget on heterogeneous failures. The
// next assistant row is still 'streaming'; finalize it as an empty
// complete row so the slot doesn't dangle, then drop the escalate
// sentinel.
const failureKinds = [...mistakeTracker.run];
assistantMessageId = toolPhaseResult.nextAssistantId!;
const escalateArgs: TurnArgs = { sessionId, chatId, assistantMessageId, toolsUsed, recentToolCalls, mistakeTracker, signal };
await finalizeEmpty(ctx, escalateArgs);
await insertMistakeRecoverySentinel(ctx, sessionId, chatId, {
failureKinds,
count: failureKinds.length,
escalated: true,
canContinue: true,
});
ctx.publishUser({ type: 'chat_status', chat_id: chatId, status: 'idle', at: new Date().toISOString() });
ctx.log.info(
{ sessionId, chatId, step: stepNumber, failureKinds },
'mistake_recovery escalate — stopping turn',
);
break;
}
}
// 'continue' — advance to next assistant message.
assistantMessageId = toolPhaseResult.nextAssistantId!;
// vWhale: Stop hook at post-loop exit (best-effort, non-blocking).
if (ctx.hooks) {
const loaded = await loadContext(ctx.sql, sessionId, chatId);
const lastAssistant = loaded?.history?.slice().reverse().find(
(m: import('../../types/api.js').Message) => m.role === 'assistant',
);
const content = lastAssistant?.content ?? '';
ctx.hooks.run('Stop', {
event: 'Stop',
session_id: sessionId,
chat_id: chatId,
last_assistant_text: content.slice(0, 500),
turn: stepNumber,
}).catch(() => {});
}
// ---- persist agent snapshot (best-effort, never blocks inference) ----
const snapLoaded = await loadContext(ctx.sql, sessionId, chatId).catch(() => null);
if (snapLoaded) {
await saveAgentSnapshot(ctx.sql, chatId, {
session_id: sessionId,
model: snapLoaded.session.model,
agent: agent?.name ?? null,
mode: null,
turn_number: stepNumber,
messages: snapLoaded.history.map((m) => ({ role: m.role, content: m.content })),
}).catch(() => {});
}
// ---- post-loop: step-cap sentinel ----
@@ -316,8 +486,9 @@ export async function runAssistantTurn(
if (stepNumber >= effectiveCap && effectiveCap < Infinity) {
const loaded = await loadContext(ctx.sql, sessionId, chatId);
if (loaded) {
const scSession = args.modelOverride ? { ...loaded.session, model: args.modelOverride } : loaded.session;
const capArgs: TurnArgs = { sessionId, chatId, assistantMessageId, toolsUsed, recentToolCalls, mistakeTracker, signal };
await runStepCapSummary(ctx, capArgs, loaded.session, loaded.project, loaded.history, agent, stepNumber, effectiveCap);
await runStepCapSummary(ctx, capArgs, scSession, loaded.project, loaded.history, agent, stepNumber, effectiveCap);
}
}
}
@@ -388,6 +559,31 @@ export async function runInference(
});
}
// v2.8-compare: run inference with a model override and compare group id.
// Used by the compare endpoint to run the same message through N models in
// parallel. Each call publishes frames scoped to its compare_group_id.
export async function runInferenceWithModel(
ctx: InferenceContext,
sessionId: string,
chatId: string,
assistantMessageId: string,
modelOverride: string,
compareGroupId: string,
signal?: AbortSignal,
): Promise<void> {
return runAssistantTurn(ctx, {
sessionId,
chatId,
assistantMessageId,
toolsUsed: 0,
recentToolCalls: [],
mistakeTracker: freshMistakeState(),
modelOverride,
compareGroupId,
signal,
});
}
// v1.8.2: cap-hit summary flow. Called instead of erroring when the loop
// hits its budget. Reuses the in-flight assistant message slot to stream a
// short wrap-up reply with the synthetic note prepended and tools disabled,

View File

@@ -19,6 +19,7 @@ import type {
UserStreamFrame,
} from '../../types/api.js';
import type { Broker } from '../broker.js';
import type { HookRunner } from '../hooks.js';
import type { MistakeState } from './mistake-tracker.js';
export interface StreamPhaseState {
@@ -45,10 +46,15 @@ export interface InferenceFrame {
| 'error'
| 'flow_run_started'
| 'flow_run_step_updated'
// tool trace frames
| 'tool_trace_start'
| 'tool_trace_finish'
// arena frames
| 'battle_started'
| 'contestant_updated'
| 'battle_updated';
| 'battle_updated'
// inter-agent message
| 'agent_message';
message_id?: string;
message_ids?: string[];
chat_id?: string;
@@ -77,8 +83,19 @@ export interface InferenceFrame {
started_at?: string | null;
finished_at?: string | null;
model?: string;
cache_tokens?: number | null;
reasoning_tokens?: number | null;
session_id?: string;
name?: string;
// tool trace frames
trace_id?: string;
tool_name?: string;
tool_input?: Record<string, unknown>;
tool_output?: string | null;
latency_ms?: number;
outcome?: string;
// agent snapshot restore
agent?: string | null;
// orchestrator frames ([D-6])
run_id?: string;
flow_name?: string;
@@ -88,6 +105,11 @@ export interface InferenceFrame {
status?: string;
run_status?: 'running' | 'completed' | 'failed' | 'cancelled';
report?: string;
// v2.8-compare: groups messages belonging to the same compare operation.
compare_group_id?: string;
// inter-agent message
sender_step_id?: string;
channel?: string;
// arena frames
battle_id?: string;
battle_type?: 'coding' | 'qa';
@@ -117,6 +139,9 @@ export interface InferenceContext {
// inference goes through `publish`); keeping a separate field avoids
// tempting other code paths into bypassing the session-id binding.
broker: Broker;
// vWhale: lifecycle hooks runner. Undefined when no hooks configured.
// Hook calls are best-effort — a failing hook never blocks inference.
hooks?: HookRunner;
}
export interface StreamResult {
@@ -128,6 +153,12 @@ export interface StreamResult {
// v1.13.1-C: reasoning text accumulated across reasoning-delta parts.
// Empty string when the model doesn't emit reasoning (most cases).
reasoning: string;
// vDeepSeek: optional cache-hit token count from DeepSeek's API.
// Only populated when using @ai-sdk/deepseek provider (not llama-swap).
cacheReadTokens?: number;
// vDeepSeek: optional reasoning token count from DeepSeek's API.
// Only populated when using @ai-sdk/deepseek provider (not llama-swap).
reasoningTokens?: number;
}
export interface TurnArgs {
@@ -153,5 +184,10 @@ export interface TurnArgs {
// Never persisted — mirrors how the cap-hit/doom-loop notes live only inside
// the summary call's messages array.
pendingRecoveryNote?: string;
// v2.8-compare: when set, overrides the session model for this single turn.
// Used by the compare endpoint to run the same message through N models.
modelOverride?: string;
// v2.8-compare: opaque group id that rides on every published frame.
compareGroupId?: string;
signal: AbortSignal | undefined;
}

View File

@@ -31,11 +31,14 @@ interface McpToolDef {
annotations?: McpToolAnnotations;
}
export type McpPermission = 'allow' | 'ask' | 'deny';
interface ServerState {
client: Client;
transport: StreamableHTTPClientTransport | StdioClientTransport;
tools: ToolDef<Record<string, unknown>>[];
type: 'streamableHttp' | 'stdio';
permission: McpPermission;
}
// ---- Module-level state ----
@@ -137,6 +140,27 @@ export async function callTool(
}
}
/** Return the permission level for a given MCP server. Defaults to 'allow' if unknown. */
export function getServerPermission(prefixedToolName: string): McpPermission {
const serverName = toolToServer.get(prefixedToolName);
if (!serverName) return 'allow';
const state = servers.get(serverName);
return state?.permission ?? 'allow';
}
/** Override the permission for a server. Used by the approval flow. */
export function setServerPermission(serverName: string, permission: McpPermission): void {
const state = servers.get(serverName);
if (state) {
state.permission = permission;
}
}
/** Get the server name from a prefixed tool name. Returns null if not an MCP tool. */
export function getServerName(prefixedToolName: string): string | null {
return toolToServer.get(prefixedToolName) ?? null;
}
/** Return all wrapped ToolDefs from all connected servers, flattened. */
export function getTools(): ToolDef<Record<string, unknown>>[] {
const all: ToolDef<Record<string, unknown>>[] = [];
@@ -214,7 +238,8 @@ async function connectServer(entry: McpServerEntry): Promise<void> {
toolToServer.set(wrapped.name, name);
}
servers.set(name, { client, transport, tools, type: config.type });
const permission = (config as { permission?: McpPermission }).permission ?? 'allow';
servers.set(name, { client, transport, tools, type: config.type, permission });
log!.info(
{ server: name, type: config.type, count: tools.length, names: tools.map((t) => t.name) },

View File

@@ -17,12 +17,15 @@ import type { FastifyBaseLogger } from 'fastify';
// ---- Zod schema ----
const McpPermissionSchema = z.enum(['allow', 'ask', 'deny']).default('allow');
const McpServerConfigSchema = z.discriminatedUnion('type', [
z.object({
type: z.literal('streamableHttp'),
url: z.string().url(),
headers: z.record(z.string()).optional(),
enabled: z.boolean().default(true),
permission: McpPermissionSchema,
}),
z.object({
type: z.literal('stdio'),
@@ -30,6 +33,7 @@ const McpServerConfigSchema = z.discriminatedUnion('type', [
args: z.array(z.string()).default([]),
env: z.record(z.string()).optional(),
enabled: z.boolean().default(true),
permission: McpPermissionSchema,
}),
]);

View File

@@ -7,10 +7,12 @@
export const MESSAGE_COLUMNS =
'id, session_id, chat_id, role, content, kind, tool_calls, tool_results, status, last_seq, ' +
'tokens_used, ctx_used, ctx_max, started_at, finished_at, created_at, metadata, ' +
'tokens_used, ctx_used, ctx_max, cache_tokens, reasoning_tokens, ' +
'started_at, finished_at, created_at, metadata, ' +
'summary, tail_start_id, compacted_at, model';
export const INFERENCE_MESSAGE_COLUMNS =
'id, session_id, chat_id, role, content, kind, tool_calls, tool_results, status, last_seq, ' +
'tokens_used, ctx_used, ctx_max, started_at, finished_at, created_at, metadata, ' +
'tokens_used, ctx_used, ctx_max, cache_tokens, reasoning_tokens, ' +
'started_at, finished_at, created_at, metadata, ' +
'reasoning_parts, model';

View File

@@ -37,7 +37,18 @@ export function configureModelContext(opts: { llamaSwapUrl: string }): void {
llamaSwapUrl = opts.llamaSwapUrl;
}
// vDeepSeek: DeepSeek models don't have a /upstream/<model>/props endpoint.
// Return a reasonable default context so compaction estimates work.
const DEEPSEEK_DEFAULT_N_CTX = 131_072;
const DEEPSEEK_MODEL_PREFIX = 'deepseek-';
export async function getModelContext(model: string): Promise<ModelContext | null> {
// vDeepSeek: DeepSeek models have no /upstream/<model>/props. Use a static
// default so compaction doesn't fall to the buffer-only path with tiny limits.
if (model.startsWith(DEEPSEEK_MODEL_PREFIX)) {
return { n_ctx: DEEPSEEK_DEFAULT_N_CTX };
}
// 1. Positive cache hit — no TTL check, model n_ctx is invariant.
const pos = positiveCache.get(model);
if (pos) return pos;

View File

@@ -0,0 +1,51 @@
import type { Sql } from '../db.js';
export interface AgentSnapshot {
id: string;
session_id: string;
chat_id: string;
model: string;
agent: string | null;
mode: string | null;
turn_number: number;
messages: unknown[];
tool_states: unknown[];
created_at: string;
updated_at: string;
}
/** Save or update the agent snapshot for a chat (UPSERT). */
export async function saveAgentSnapshot(sql: Sql, chatId: string, data: {
session_id: string;
model: string;
agent?: string | null;
mode?: string | null;
turn_number: number;
messages: unknown[];
tool_states?: unknown[];
}): Promise<void> {
await sql`
INSERT INTO agent_snapshots (session_id, chat_id, model, agent, mode, turn_number, messages, tool_states, updated_at)
VALUES (${data.session_id}, ${chatId}, ${data.model}, ${data.agent ?? null}, ${data.mode ?? null}, ${data.turn_number}, ${sql.json(data.messages as never)}, ${sql.json((data.tool_states ?? []) as never)}, clock_timestamp())
ON CONFLICT (chat_id)
DO UPDATE SET
model = EXCLUDED.model,
agent = EXCLUDED.agent,
mode = EXCLUDED.mode,
turn_number = EXCLUDED.turn_number,
messages = EXCLUDED.messages,
tool_states = EXCLUDED.tool_states,
updated_at = clock_timestamp()
`;
}
/** Load the agent snapshot for a chat. Returns null if no snapshot exists. */
export async function loadAgentSnapshot(sql: Sql, chatId: string): Promise<AgentSnapshot | null> {
const rows = await sql<AgentSnapshot[]>`SELECT * FROM agent_snapshots WHERE chat_id = ${chatId}`;
return rows[0] ?? null;
}
/** Delete the agent snapshot for a chat (call when session ends). */
export async function deleteAgentSnapshot(sql: Sql, chatId: string): Promise<void> {
await sql`DELETE FROM agent_snapshots WHERE chat_id = ${chatId}`;
}

View File

@@ -101,7 +101,7 @@ export interface PrefixFingerprint {
has_agent_system_prompt: boolean;
has_session_override: boolean;
has_project_override: boolean;
route: 'swap' | 'sidecar';
route: 'swap' | 'sidecar' | 'deepseek';
}
export interface PrefixDrift {
@@ -129,7 +129,7 @@ interface ObservedInputs {
has_agent_system_prompt: boolean;
has_session_override: boolean;
has_project_override: boolean;
route: 'swap' | 'sidecar';
route: 'swap' | 'sidecar' | 'deepseek';
}
interface ObserverEntry {

View File

@@ -0,0 +1,92 @@
import type { Sql } from '../db.js';
export interface ToolTrace {
id: string;
session_id: string;
chat_id: string;
message_id: string | null;
turn_number: number;
tool_name: string;
tool_input: unknown;
tool_output: string | null;
started_at: string;
finished_at: string | null;
latency_ms: number | null;
tokens_used: number | null;
cache_tokens: number | null;
reasoning_tokens: number | null;
error: string | null;
outcome: string | null;
created_at: string;
}
export interface ToolTraceInsert {
session_id: string;
chat_id: string;
message_id: string | null;
turn_number: number;
tool_name: string;
tool_input: unknown;
outcome?: string;
}
export interface ToolTraceUpdate {
finished_at?: string;
latency_ms?: number;
tool_output?: string;
tokens_used?: number;
cache_tokens?: number;
reasoning_tokens?: number;
error?: string;
outcome?: string;
}
export async function insertToolTrace(
sql: Sql,
insert: ToolTraceInsert,
): Promise<ToolTrace> {
const [row] = await sql<ToolTrace[]>`
INSERT INTO tool_traces (
session_id, chat_id, message_id, turn_number,
tool_name, tool_input, outcome
) VALUES (
${insert.session_id}, ${insert.chat_id}, ${insert.message_id},
${insert.turn_number}, ${insert.tool_name},
${sql.json(insert.tool_input as never)},
${insert.outcome ?? null}
)
RETURNING *
`;
if (!row) throw new Error('insertToolTrace returned no row');
return row;
}
export async function updateToolTrace(
sql: Sql,
id: string,
updates: ToolTraceUpdate,
): Promise<ToolTrace | null> {
const cols: string[] = [];
const vals: any[] = [];
if (updates.finished_at !== undefined) { cols.push('finished_at'); vals.push(updates.finished_at); }
if (updates.latency_ms !== undefined) { cols.push('latency_ms'); vals.push(updates.latency_ms); }
if (updates.tool_output !== undefined) { cols.push('tool_output'); vals.push(updates.tool_output); }
if (updates.tokens_used !== undefined) { cols.push('tokens_used'); vals.push(updates.tokens_used); }
if (updates.cache_tokens !== undefined) { cols.push('cache_tokens'); vals.push(updates.cache_tokens); }
if (updates.reasoning_tokens !== undefined) { cols.push('reasoning_tokens'); vals.push(updates.reasoning_tokens); }
if (updates.error !== undefined) { cols.push('error'); vals.push(updates.error); }
if (updates.outcome !== undefined) { cols.push('outcome'); vals.push(updates.outcome); }
if (cols.length === 0) {
const [row] = await sql<ToolTrace[]>`SELECT * FROM tool_traces WHERE id = ${id}`;
return row ?? null;
}
const setClause = cols.map((c, i) => `${c} = $${i + 1}`).join(', ');
const [row] = await sql.unsafe<ToolTrace[]>(
`UPDATE tool_traces SET ${setClause} WHERE id = $${cols.length + 1} RETURNING *`,
[...vals, id],
);
return row ?? null;
}

View File

@@ -0,0 +1,305 @@
// v2.x: Background subagent tools. Three tools that let the model spawn
// non-blocking subagent tasks, poll their status, and retrieve results.
//
// spawn_subagent — Create a background session+chat, dispatch inference,
// return immediately with a task_id.
// subagent_status — Poll the status of a previously spawned task.
// subagent_result — Retrieve the full output of a completed task.
//
// These tools reuse the existing sessions/chats/messages/tables and the
// inference pipeline — no new tables or services needed.
//
// Registered in tools.ts ALL_TOOLS. Lives in its own file so tests can
// import executors without dragging in the full tool registry.
//
// Follows the read_tab_by_number.ts pattern: a pure executor function plus
// a ToolDef wrapper. Type-only import from tools.ts to dodge runtime cycles.
import { z } from 'zod';
import type { Sql } from '../../db.js';
import type { ToolDef, ToolExecCtx } from '../tools.js';
import {
spawnBackgroundTask,
getBackgroundTaskStatus,
getBackgroundTaskResult,
} from '../background-task.js';
// ---------------------------------------------------------------------------
// spawn_subagent
// ---------------------------------------------------------------------------
export const SpawnSubagentInput = z.object({
input: z.string().min(1).describe('The task to execute in the background'),
model: z
.string()
.min(1)
.optional()
.describe('Model to use (defaults to session model)'),
agent: z
.string()
.min(1)
.optional()
.describe('Agent to use (defaults to boocode)'),
label: z
.string()
.max(100)
.optional()
.describe('Human-readable label for display'),
});
export type SpawnSubagentInputT = z.infer<typeof SpawnSubagentInput>;
export async function executeSpawnSubagent(
input: SpawnSubagentInputT,
sql: Sql,
sessionId: string,
): Promise<Record<string, unknown>> {
// Resolve project_id + model from the current session.
const sessRows = await sql<
{ project_id: string; model: string }[]
>`
SELECT project_id, model FROM sessions WHERE id = ${sessionId}
`;
if (sessRows.length === 0) {
return { error: 'current session not found' };
}
const projectId = sessRows[0]!.project_id;
const model = input.model ?? sessRows[0]!.model;
const task = await spawnBackgroundTask(
sql,
// We pass a minimal logger shim — the real logger is wired by the
// inference pipeline. This keeps the tool's execute signature clean.
{ info: () => {}, warn: () => {}, error: () => {} } as unknown as import('fastify').FastifyBaseLogger,
projectId,
input.input,
model,
input.agent,
input.label,
);
// Elapsed time since creation is negligible (task was just spawned).
return {
task_id: task.id,
status: task.status,
session_id: task.session_id,
chat_id: task.chat_id,
created_at: task.created_at,
};
}
export const spawnSubagent: ToolDef<SpawnSubagentInputT> = {
name: 'spawn_subagent',
description:
'Spawn a background subagent task. Creates a new session and chat, dispatches inference asynchronously, and returns immediately with a task_id. Use subagent_status to poll for completion and subagent_result to retrieve the full output. Non-blocking — the model continues while the subagent works in the background.',
inputSchema: SpawnSubagentInput,
jsonSchema: {
type: 'function',
function: {
name: 'spawn_subagent',
description:
'Spawn a background subagent task. Returns immediately with a task_id — poll with subagent_status.',
parameters: {
type: 'object',
properties: {
input: {
type: 'string',
description: 'The task to execute in the background',
},
model: {
type: 'string',
description: 'Model to use (defaults to session model)',
},
agent: {
type: 'string',
description: 'Agent to use (defaults to boocode)',
},
label: {
type: 'string',
maxLength: 100,
description: 'Human-readable label for display',
},
},
required: ['input'],
additionalProperties: false,
},
},
},
async execute(input, _projectRoot, _extraRoots, toolCtx?: ToolExecCtx) {
if (!toolCtx) {
return { error: 'spawn_subagent unavailable: no session context' };
}
try {
return await executeSpawnSubagent(input, toolCtx.sql, toolCtx.sessionId);
} catch (err) {
return {
error: `spawn_subagent failed: ${err instanceof Error ? err.message : String(err)}`,
};
}
},
};
// ---------------------------------------------------------------------------
// subagent_status
// ---------------------------------------------------------------------------
export const SubagentStatusInput = z.object({
task_id: z.string().uuid().describe('Task ID from spawn_subagent'),
});
export type SubagentStatusInputT = z.infer<typeof SubagentStatusInput>;
export async function executeSubagentStatus(
input: SubagentStatusInputT,
sql: Sql,
): Promise<Record<string, unknown>> {
const task = await getBackgroundTaskStatus(sql, input.task_id);
if (!task) {
return { error: 'task not found', task_id: input.task_id };
}
// Compute elapsed time from created_at (ISO string).
let elapsed_seconds: number | null = null;
try {
const created = new Date(task.created_at).getTime();
const finished = task.finished_at
? new Date(task.finished_at).getTime()
: Date.now();
elapsed_seconds = Math.round((finished - created) / 1000);
} catch {
elapsed_seconds = null;
}
return {
task_id: task.id,
status: task.status,
output_summary: task.output_summary,
finished_at: task.finished_at,
elapsed_seconds,
};
}
export const subagentStatus: ToolDef<SubagentStatusInputT> = {
name: 'subagent_status',
description:
'Poll the status of a background subagent task by task_id. Returns the current status (running/completed/failed/cancelled), an output summary if completed, and elapsed time. Useful after spawn_subagent to check if work is done.',
inputSchema: SubagentStatusInput,
jsonSchema: {
type: 'function',
function: {
name: 'subagent_status',
description:
'Poll the status of a background subagent task. Returns status, output summary, and elapsed time.',
parameters: {
type: 'object',
properties: {
task_id: {
type: 'string',
format: 'uuid',
description: 'Task ID from spawn_subagent',
},
},
required: ['task_id'],
additionalProperties: false,
},
},
},
async execute(input, _projectRoot, _extraRoots, toolCtx?: ToolExecCtx) {
if (!toolCtx) {
return { error: 'subagent_status unavailable: no session context' };
}
try {
return await executeSubagentStatus(input, toolCtx.sql);
} catch (err) {
return {
error: `subagent_status failed: ${err instanceof Error ? err.message : String(err)}`,
};
}
},
};
// ---------------------------------------------------------------------------
// subagent_result
// ---------------------------------------------------------------------------
export const SubagentResultInput = z.object({
task_id: z.string().uuid().describe('Task ID from spawn_subagent'),
});
export type SubagentResultInputT = z.infer<typeof SubagentResultInput>;
export async function executeSubagentResult(
input: SubagentResultInputT,
sql: Sql,
): Promise<Record<string, unknown>> {
const task = await getBackgroundTaskStatus(sql, input.task_id);
if (!task) {
return { error: 'task not found', task_id: input.task_id };
}
if (task.status !== 'completed') {
return {
task_id: task.id,
status: task.status,
error: `task is not yet completed (status: ${task.status})`,
};
}
if (!task.chat_id) {
return { error: 'task has no chat data', task_id: input.task_id };
}
const result = await getBackgroundTaskResult(sql, input.task_id, task.chat_id);
if (!result) {
return {
task_id: task.id,
status: task.status,
error: 'task completed but no output message found',
};
}
return {
task_id: task.id,
output: result.output,
token_usage: result.token_usage,
};
}
export const subagentResult: ToolDef<SubagentResultInputT> = {
name: 'subagent_result',
description:
'Retrieve the full output of a completed background subagent task by task_id. Returns the response text and token usage. The task must be in completed status — poll with subagent_status first.',
inputSchema: SubagentResultInput,
jsonSchema: {
type: 'function',
function: {
name: 'subagent_result',
description:
'Retrieve the full output of a completed background subagent task. Returns output text and token usage.',
parameters: {
type: 'object',
properties: {
task_id: {
type: 'string',
format: 'uuid',
description: 'Task ID from spawn_subagent',
},
},
required: ['task_id'],
additionalProperties: false,
},
},
},
async execute(input, _projectRoot, _extraRoots, toolCtx?: ToolExecCtx) {
if (!toolCtx) {
return { error: 'subagent_result unavailable: no session context' };
}
try {
return await executeSubagentResult(input, toolCtx.sql);
} catch (err) {
return {
error: `subagent_result failed: ${err instanceof Error ? err.message : String(err)}`,
};
}
},
};

View File

@@ -2,6 +2,12 @@ import { z } from 'zod';
import type { ToolDef } from '../types.js';
import { callCodecontext, type CodecontextResponse } from '../../codecontext_client.js';
// DEPRECATED (Phase 4, Domain 2, v2.8.14): This factory builds ToolDefs that
// route through the Go codecontext sidecar via callCodecontext(). Superseded
// by direct boocontext MCP tool wrappers. Keep functional for backward
// compatibility — old codecontext tools still use HTTP. New tools should use
// the boocontext MCP server instead of adding entries here.
//
// Shared factory for the 12 codecontext shim ToolDefs.
// Each shim provides name/schema/description/jsonParameters/mapArgs; the
// factory builds the ToolDef and returns both the ToolDef and the standalone

View File

@@ -0,0 +1,62 @@
import { z } from 'zod';
import type { ToolDef } from '../types.js';
import { callBoocontext } from '../../boocontext_client.js';
export const GetCodeHealthInput = z.object({
directory: z.string().optional().describe('Directory to analyze (defaults to project root)'),
file: z.string().optional().describe('Optional: specific file to analyze'),
});
export type GetCodeHealthInputT = z.infer<typeof GetCodeHealthInput>;
const DESCRIPTION =
'Code health analysis. Returns AF grades per file across 7 dimensions ' +
'(cohesion, coupling, complexity, documentation, duplication, unit size, test coverage). ' +
'Includes project health summary and refactoring candidates.';
/**
* Standalone execute function — calls the boocontext MCP server's
* boocontext_health tool and returns the raw report text.
*
* Structured for direct test access: accepts input + projectPath,
* no side effects beyond the MCP call.
*/
export async function executeGetCodeHealth(
input: GetCodeHealthInputT,
projectPath: string,
): Promise<string> {
const args: Record<string, unknown> = {};
if (input.directory) args['directory'] = input.directory;
if (input.file) args['file'] = input.file;
const resp = await callBoocontext({ toolName: 'boocontext_health', args });
return resp.result;
}
export const getCodeHealth: ToolDef<GetCodeHealthInputT> = {
name: 'get_code_health',
description: DESCRIPTION,
inputSchema: GetCodeHealthInput,
jsonSchema: {
type: 'function',
function: {
name: 'get_code_health',
description: DESCRIPTION,
parameters: {
type: 'object',
properties: {
directory: {
type: 'string',
description: 'Directory to analyze (defaults to project root)',
},
file: {
type: 'string',
description: 'Optional: specific file to analyze',
},
},
additionalProperties: false,
},
},
},
async execute(input, projectRoot) {
return executeGetCodeHealth(input, projectRoot);
},
};

View File

@@ -0,0 +1,228 @@
import { spawn } from 'node:child_process';
import { resolve } from 'node:path';
import { z } from 'zod';
import type { ToolDef } from '../types.js';
import type { CodecontextResponse } from '../../codecontext_client.js';
// ======================= MCP Client =======================
const BOOCONTEXT_PATH = resolve('/opt/forks/boocontext/dist/standalone.js');
const TOOL_CALL_TIMEOUT_MS = 60_000;
interface JsonRpcMessage {
jsonrpc: '2.0';
id?: number | string;
result?: {
content?: Array<{ type: string; text: string }>;
};
error?: { code?: number; message: string };
}
/**
* Single-shot MCP JSON-RPC client for boocontext.
* Spawns the process, sends initialize + tools/call over NDJSON, returns the
* text result from the content array. The boocontext MCP server auto-detects
* newline-delimited JSON transport when the first input lacks Content-Length
* headers, which is exactly what we send.
*/
async function callBoocontext(
toolName: string,
args: Record<string, unknown>,
): Promise<string> {
return new Promise<string>((resolvePromise, reject) => {
const child = spawn(process.execPath, [BOOCONTEXT_PATH], {
stdio: ['pipe', 'pipe', 'pipe'],
timeout: TOOL_CALL_TIMEOUT_MS,
});
let stdout = '';
let stderr = '';
let resolved = false;
function finalize(err?: Error, result?: string): void {
if (resolved) return;
resolved = true;
if (err) reject(err);
else resolvePromise(result!);
child.kill();
}
child.stdout!.on('data', (chunk: Buffer) => {
stdout += chunk.toString();
});
child.stderr!.on('data', (chunk: Buffer) => {
stderr += chunk.toString();
});
child.on('error', (err: Error) => {
finalize(new Error(`boocontext spawn error: ${err.message}`));
});
child.on('close', (code: number | null) => {
if (resolved) return;
// Parse newline-delimited JSON responses from stdout
const lines = stdout.split('\n').filter((l) => l.trim().length > 0);
let toolText: string | undefined;
let toolError: string | undefined;
for (const line of lines) {
try {
const msg = JSON.parse(line) as JsonRpcMessage;
if (msg.id === 2) {
if (msg.error) {
toolError = msg.error.message ?? 'boocontext tool call failed';
} else if (msg.result?.content?.[0]?.text !== undefined) {
toolText = msg.result.content[0].text;
}
}
} catch {
// skip malformed JSON lines
}
}
if (toolError) {
finalize(new Error(toolError));
} else if (toolText !== undefined) {
finalize(undefined, toolText);
} else {
const errSuffix =
stderr.length > 0 ? ` stderr: ${stderr.slice(0, 500)}` : '';
finalize(
new Error(`boocontext MCP call failed (exit ${code})${errSuffix}`),
);
}
});
// Step 1: initialize — establishes MCP protocol version + capabilities
child.stdin!.write(
JSON.stringify({
jsonrpc: '2.0',
id: 1,
method: 'initialize',
params: {
protocolVersion: '2024-11-05',
capabilities: {},
clientInfo: { name: 'boocode-server', version: '1.0.0' },
},
}) + '\n',
);
// Step 2: tools/call — invoke the named boocontext tool
child.stdin!.write(
JSON.stringify({
jsonrpc: '2.0',
id: 2,
method: 'tools/call',
params: { name: toolName, arguments: args },
}) + '\n',
);
child.stdin!.end();
// Safety timeout — prevent hung processes
setTimeout(() => {
finalize(
new Error(
`boocontext call timed out after ${TOOL_CALL_TIMEOUT_MS}ms`,
),
);
}, TOOL_CALL_TIMEOUT_MS);
});
}
// ======================= Tool Definition =======================
const TRUNCATION_LIMIT = 32_000;
export const GetCodeImpactInput = z.object({
symbol: z.string().min(1).describe('Symbol name for TSA trace_impact'),
file: z.string().optional().describe('File path for codesight blast_radius'),
directory: z
.string()
.optional()
.describe('Directory (defaults to project root)'),
depth: z
.number()
.int()
.min(1)
.max(5)
.optional()
.describe('Max blast-radius traversal depth (default 1)'),
});
export type GetCodeImpactInputT = z.infer<typeof GetCodeImpactInput>;
const DESCRIPTION =
'Impact analysis. Merges symbol-level call trace with file-level blast radius. ' +
'Use before making changes to understand change propagation. ' +
'Single call replaces separate get_symbol_info + get_blast_radius steps.';
/**
* Standalone execute function — calls the boocontext MCP `boocontext_impact`
* tool via a short-lived child process, then wraps the result in the standard
* CodecontextResponse shape with inline truncation at 32 KB.
*/
export async function executeGetCodeImpact(
input: GetCodeImpactInputT,
projectPath: string,
): Promise<CodecontextResponse> {
const args: Record<string, unknown> = {
symbol: input.symbol,
directory: input.directory ?? projectPath,
};
if (input.file) args['file'] = input.file;
const text = await callBoocontext('boocontext_impact', args);
// Inline truncation matching codecontext_client.ts patterns (32 KB ceiling).
if (text.length > TRUNCATION_LIMIT) {
const sliced = text.slice(0, TRUNCATION_LIMIT);
const omitted = text.length - TRUNCATION_LIMIT;
return {
result: `${sliced}\n\n[truncated, ${omitted} chars omitted; narrow with symbol or file parameters]`,
truncated: true,
};
}
return { result: text, truncated: false };
}
export const getCodeImpact: ToolDef<GetCodeImpactInputT> = {
name: 'get_code_impact',
description: DESCRIPTION,
inputSchema: GetCodeImpactInput,
jsonSchema: {
type: 'function',
function: {
name: 'get_code_impact',
description: DESCRIPTION,
parameters: {
type: 'object',
properties: {
symbol: {
type: 'string',
description: 'Symbol name for TSA trace_impact',
},
file: {
type: 'string',
description: 'File path for codesight blast_radius',
},
directory: {
type: 'string',
description: 'Directory (defaults to project root)',
},
depth: {
type: 'number',
description: 'Max blast-radius traversal depth (default 1)',
},
},
required: ['symbol'],
additionalProperties: false,
},
},
},
execute(input, projectRoot) {
return executeGetCodeImpact(input, projectRoot);
},
};

View File

@@ -0,0 +1,192 @@
import { spawn } from 'node:child_process';
import { z } from 'zod';
import type { ToolDef } from '../types.js';
export const GetCodeMapInput = z.object({
directory: z.string().optional().describe('Directory to scan (defaults to project root)'),
compress: z.boolean().optional().describe('Apply DCP compression if payload exceeds threshold (default: true)'),
});
export type GetCodeMapInputT = z.infer<typeof GetCodeMapInput>;
const DESCRIPTION =
'DCP-compressed codebase context map. Returns filenames, sizes, import relationships in a compressed format. ' +
'Use compress=false for full detail, compress=true (default) for token-efficient overview.';
const BOOCONTEXT_PATH = '/opt/forks/boocontext/dist/standalone.js';
const TOOL_TIMEOUT_MS = 30_000;
const MAX_RESULT_BYTES = 32_768;
export interface CodeMapResponse {
result: string;
truncated: boolean;
}
/**
* Calls the boocontext MCP server over stdio JSON-RPC to invoke
* the boocontext_map tool. Spawns the standalone binary, sends
* initialize + tools/call, collects NDJSON responses, and kills
* the child process.
*/
function callBoocontextMap(args: Record<string, unknown>): Promise<CodeMapResponse> {
return new Promise((resolve, reject) => {
const child = spawn('node', [BOOCONTEXT_PATH], {
stdio: ['pipe', 'pipe', 'pipe'],
});
let stdoutBuf = '';
const lines: string[] = [];
let timedOut = false;
let resolved = false;
const timer = setTimeout(() => {
timedOut = true;
child.kill('SIGKILL');
reject(new Error(`boocontext MCP call timed out after ${TOOL_TIMEOUT_MS}ms`));
}, TOOL_TIMEOUT_MS);
function tryParse(): void {
if (resolved || timedOut) return;
// Accumulate complete NDJSON lines
const parts = stdoutBuf.split('\n');
stdoutBuf = parts.pop()! ?? '';
for (const p of parts) {
const t = p.trim();
if (t) lines.push(t);
}
// Need at least 2 responses: initialize + tools/call
if (lines.length < 2) return;
resolved = true;
clearTimeout(timer);
child.kill();
try {
const callResponse = JSON.parse(lines[1]!);
if (callResponse.error) {
reject(new Error(`MCP error: ${callResponse.error.message}`));
return;
}
const content = callResponse.result?.content;
if (!content?.[0]?.text) {
reject(new Error('Unexpected MCP response shape — missing content[0].text'));
return;
}
// content[0].text is JSON-stringified VerdictEnvelope from boocontext
const envelope = JSON.parse(content[0].text as string);
const details = envelope.details;
let result: string;
if (details && typeof details === 'object' && 'data' in details) {
// DcpEnvelope shape: { compressed, originalLength, compressedLength, data }
if (details.compressed) {
// Return the full DcpEnvelope as JSON so the LLM can pass it
// transparently to a decompression step
result = JSON.stringify(details);
} else {
// Uncompressed — data is the raw output
result = details.data;
}
} else {
result = JSON.stringify(details ?? envelope);
}
const truncated = Buffer.byteLength(result, 'utf-8') > MAX_RESULT_BYTES;
if (truncated) {
result = result.substring(0, MAX_RESULT_BYTES);
}
resolve({ result, truncated });
} catch (e: any) {
reject(new Error(`Failed to parse boocontext response: ${e.message}`));
}
}
child.stdout!.on('data', (chunk: Buffer) => {
if (timedOut) return;
stdoutBuf += chunk.toString('utf-8');
tryParse();
});
child.stderr!.on('data', (_chunk: Buffer) => {
// Captured but not surfaced — logged only on parse failure
});
child.on('error', (err: Error) => {
clearTimeout(timer);
if (!resolved) {
resolved = true;
reject(new Error(`boocontext spawn failed: ${err.message}`));
}
});
child.on('close', () => {
clearTimeout(timer);
if (!resolved && !timedOut) {
tryParse();
if (!resolved) {
resolved = true;
reject(new Error('boocontext process closed without producing a valid response'));
}
}
});
// Step 1: initialize
child.stdin!.write(
JSON.stringify({ jsonrpc: '2.0', id: 1, method: 'initialize' }) + '\n',
);
// Step 2: tools/call for boocontext_map
child.stdin!.write(
JSON.stringify({
jsonrpc: '2.0',
id: 2,
method: 'tools/call',
params: { name: 'boocontext_map', arguments: args },
}) + '\n',
);
});
}
export const getCodeMap: ToolDef<GetCodeMapInputT> = {
name: 'get_code_map',
description: DESCRIPTION,
inputSchema: GetCodeMapInput,
jsonSchema: {
type: 'function',
function: {
name: 'get_code_map',
description: DESCRIPTION,
parameters: {
type: 'object',
properties: {
directory: { type: 'string', description: 'Directory to scan (defaults to project root)' },
compress: {
type: 'boolean',
description: 'Apply DCP compression if payload exceeds threshold (default: true)',
},
},
additionalProperties: false,
},
},
},
async execute(input, projectRoot): Promise<CodeMapResponse> {
return callBoocontextMap({
directory: input.directory ?? projectRoot,
compress: input.compress ?? true,
});
},
};
export async function executeGetCodeMap(
input: GetCodeMapInputT,
projectRoot: string,
): Promise<CodeMapResponse> {
return callBoocontextMap({
directory: input.directory ?? projectRoot,
compress: input.compress ?? true,
});
}

View File

@@ -3,6 +3,7 @@ import { makeCodecontextTool } from './factory.js';
export const GetCodebaseOverviewInput = z.object({
include_stats: z.boolean().optional(),
compress: z.boolean().optional().describe('Apply DCP compression for large projects (>50 files)'),
});
export type GetCodebaseOverviewInputT = z.infer<typeof GetCodebaseOverviewInput>;
@@ -24,10 +25,18 @@ const { toolDef: getCodebaseOverview, execute: executeGetCodebaseOverview } =
type: 'boolean',
description: 'Include file count, symbol count, language stats. Defaults to true.',
},
compress: {
type: 'boolean',
description: 'Apply DCP compression for large projects (>50 files)',
},
},
additionalProperties: false,
},
mapArgs: (input) => ({ include_stats: input.include_stats ?? true }),
mapArgs: (input) => {
const args: Record<string, unknown> = { include_stats: input.include_stats ?? true };
if (input.compress) args['compress'] = true;
return args;
},
});
export { getCodebaseOverview, executeGetCodebaseOverview };

View File

@@ -0,0 +1,262 @@
import { z } from 'zod';
import { spawn } from 'node:child_process';
import type { ToolDef } from '../types.js';
import type { CodecontextResponse } from '../../codecontext_client.js';
const BOOCONTEXT_PATH = '/opt/forks/boocontext/dist/standalone.js';
const TRUNCATION_LIMIT = 32_000;
export const GetTypeInfoInput = z.object({
file: z.string().min(1).describe('File path to resolve types in'),
symbol: z.string().optional().describe('Symbol name to resolve (supports regex)'),
directory: z.string().optional().describe('Project directory for type resolution context'),
});
export type GetTypeInfoInputT = z.infer<typeof GetTypeInfoInput>;
const DESCRIPTION =
'TypeScript type recovery. Returns type signatures, interface definitions, ' +
'generic constraints, and JSDoc for symbols in a file. Uses type-inject MCP server.';
// ---- JSON-RPC-over-stdio MCP caller for boocontext --------------------------
async function callBoocontext(
toolName: string,
args: Record<string, unknown>,
): Promise<CodecontextResponse> {
const child = spawn(process.execPath, [BOOCONTEXT_PATH], {
stdio: ['pipe', 'pipe', 'pipe'],
timeout: 60_000,
});
let stderrBuf = '';
child.stderr!.on('data', (chunk: Buffer) => {
stderrBuf += chunk.toString('utf-8');
});
let killed = false;
const killChild = () => {
if (killed) return;
killed = true;
child.kill();
};
try {
// Read one complete JSON-RPC response from stdout (handles both
// Content-Length framed and newline-delimited transport).
async function readResponse(timeoutMs = 30_000): Promise<unknown> {
return new Promise((resolve, reject) => {
const timer = setTimeout(() => {
cleanup();
reject(new Error('Timeout reading boocontext response'));
}, timeoutMs);
let buf = '';
const cleanup = () => {
clearTimeout(timer);
child.stdout!.removeListener('data', onData);
child.stdout!.removeListener('end', onEnd);
child.stdout!.removeListener('error', onError);
};
const onData = (chunk: Buffer) => {
buf += chunk.toString('utf-8');
const msg = tryExtractMessage(buf);
if (msg !== null) {
cleanup();
resolve(msg);
return;
}
if (buf.length > 1_024 * 1_024) {
cleanup();
reject(new Error('Boocontext response exceeded 1 MB'));
}
};
const onEnd = () => {
cleanup();
if (buf.trim()) {
try {
resolve(JSON.parse(buf.trim()));
} catch {
reject(new Error('Boocontext stream ended with incomplete data'));
}
} else {
reject(new Error('Boocontext stream ended unexpectedly'));
}
};
const onError = (err: Error) => {
cleanup();
reject(err);
};
child.stdout!.on('data', onData);
child.stdout!.on('end', onEnd);
child.stdout!.on('error', onError);
});
}
// Wait for the process to be fully spawned.
await new Promise<void>((resolve, reject) => {
child.on('error', reject);
child.on('spawn', () => resolve());
});
// Step 1 — MCP initialize
let reqId = 0;
reqId++;
child.stdin!.write(
JSON.stringify({ jsonrpc: '2.0', id: reqId, method: 'initialize' }) + '\n',
);
const initResp = await readResponse() as { error?: { message: string } };
if (initResp.error) {
throw new Error(`Boocontext init failed: ${initResp.error.message}`);
}
// Step 2 — tools/call
reqId++;
child.stdin!.write(
JSON.stringify({
jsonrpc: '2.0',
id: reqId,
method: 'tools/call',
params: { name: toolName, arguments: args },
}) + '\n',
);
const callResp = await readResponse() as {
error?: { message: string };
result?: { content?: Array<{ type: string; text: string }> };
};
if (callResp.error) {
throw new Error(`Boocontext tool call failed: ${callResp.error.message}`);
}
// Extract text from the MCP tool result shape:
// { content: [{ type: "text", text: "…" }] }
const content = callResp.result?.content;
let text: string;
if (Array.isArray(content) && content.length > 0 && content[0]!.type === 'text') {
text = content[0]!.text;
} else {
text = JSON.stringify(callResp.result);
}
// Inline truncation at 32 KB.
if (text.length > TRUNCATION_LIMIT) {
const omitted = text.length - TRUNCATION_LIMIT;
return {
result:
text.slice(0, TRUNCATION_LIMIT) +
`\n\n[truncated, ${omitted} chars omitted; narrow with file or symbol filter]`,
truncated: true,
};
}
return { result: text, truncated: false };
} finally {
killChild();
// Give the process a moment to release resources.
await new Promise<void>((resolve) => {
const timer = setTimeout(resolve, 2_000);
child.on('exit', () => {
clearTimeout(timer);
resolve();
});
});
}
}
/**
* Attempt to extract one complete JSON-RPC message from the head of a
* buffer. Handles both Content-Length framed and newline-delimited
* formats. Returns `null` when more data is needed.
*/
function tryExtractMessage(buf: string): unknown | null {
// --- Content-Length framed ---
const headerEnd = buf.indexOf('\r\n\r\n');
if (headerEnd !== -1) {
const header = buf.substring(0, headerEnd);
const lengthMatch = header.match(/Content-Length:\s*(\d+)/i);
if (lengthMatch) {
const contentLength = parseInt(lengthMatch[1]!, 10);
const bodyStart = headerEnd + 4;
if (buf.length >= bodyStart + contentLength) {
const jsonStr = buf.substring(bodyStart, bodyStart + contentLength);
return JSON.parse(jsonStr);
}
return null; // need more data
}
// Has \r\n\r\n but no Content-Length — junk segment; skip and retry.
return tryExtractMessage(buf.substring(headerEnd + 4));
}
// --- Newline-delimited ---
const nlIndex = buf.indexOf('\n');
if (nlIndex !== -1) {
const line = buf.substring(0, nlIndex).trim();
if (line && line.startsWith('{')) {
return JSON.parse(line);
}
// Non-JSON line (e.g. stderr echo), skip and continue.
return tryExtractMessage(buf.substring(nlIndex + 1));
}
return null; // need more data
}
// ---- ToolDef ----------------------------------------------------------------
export const getTypeInfo: ToolDef<GetTypeInfoInputT> = {
name: 'get_type_info',
description: DESCRIPTION,
inputSchema: GetTypeInfoInput,
jsonSchema: {
type: 'function',
function: {
name: 'get_type_info',
description: DESCRIPTION,
parameters: {
type: 'object',
properties: {
file: { type: 'string', description: 'File path to resolve types in' },
symbol: {
type: 'string',
description: 'Symbol name to resolve (supports regex)',
},
directory: {
type: 'string',
description: 'Project directory for type resolution context',
},
},
required: ['file'],
additionalProperties: false,
},
},
},
async execute(input): Promise<CodecontextResponse> {
const args: Record<string, unknown> = { file: input.file };
if (input.symbol) args['symbol'] = input.symbol;
return callBoocontext('boocontext_types', args);
},
};
/**
* Standalone execute function matching the `execute` shape returned by
* `makeCodecontextTool` — useful for direct callers and tests.
*
* Note: unlike the HTTP-backed codecontext tools this does NOT accept a
* `fetcher` override because it communicates over stdio rather than HTTP.
*/
export async function executeGetTypeInfo(
input: GetTypeInfoInputT,
_projectPath?: string,
): Promise<CodecontextResponse> {
const args: Record<string, unknown> = { file: input.file };
if (input.symbol) args['symbol'] = input.symbol;
return callBoocontext('boocontext_types', args);
}

View File

@@ -0,0 +1,61 @@
import { z } from 'zod';
import type { ToolDef } from '../types.js';
import { callBoocontext } from '../../boocontext_client.js';
export const GetWikiArticleInput = z.object({
article: z.string().min(1).describe('Article name (e.g. "auth", "database", "routes")'),
directory: z.string().optional().describe('Project directory'),
});
export type GetWikiArticleInputT = z.infer<typeof GetWikiArticleInput>;
const DESCRIPTION =
'Returns a persistent codebase wiki article by name (auth, database, routes, etc.). ' +
'Generated on first request and cached to disk. Avoids running expensive full-scan tools for targeted documentation.';
/**
* Standalone execute function — calls the boocontext MCP server's
* codesight_get_wiki_article tool and returns the article text.
*
* Structured for direct test access: accepts input + projectPath,
* no side effects beyond the MCP call.
*/
export async function executeGetWikiArticle(
input: GetWikiArticleInputT,
projectPath: string,
): Promise<string> {
const args: Record<string, unknown> = { article: input.article };
if (input.directory) args['directory'] = input.directory!;
const resp = await callBoocontext({ toolName: 'codesight_get_wiki_article', args });
return resp.result;
}
export const getWikiArticle: ToolDef<GetWikiArticleInputT> = {
name: 'get_wiki_article',
description: DESCRIPTION,
inputSchema: GetWikiArticleInput,
jsonSchema: {
type: 'function',
function: {
name: 'get_wiki_article',
description: DESCRIPTION,
parameters: {
type: 'object',
properties: {
article: {
type: 'string',
description: 'Article name (e.g. "auth", "database", "routes")',
},
directory: {
type: 'string',
description: 'Project directory',
},
},
required: ['article'],
additionalProperties: false,
},
},
},
async execute(input, projectRoot) {
return executeGetWikiArticle(input, projectRoot);
},
};

View File

@@ -13,3 +13,9 @@ export { getBlastRadius } from './get_blast_radius.js';
export { getHotFiles } from './get_hot_files.js';
export { getRoutes } from './get_routes.js';
export { getMiddleware } from './get_middleware.js';
// v2.8.14-domain2-phase1: boocontext-backed tools.
export { getCodeHealth } from './get_code_health.js';
export { getCodeImpact } from './get_code_impact.js';
export { getTypeInfo } from './get_type_info.js';
export { getCodeMap } from './get_code_map.js';
export { getWikiArticle } from './get_wiki_article.js';

View File

@@ -0,0 +1,132 @@
/**
* vWhale: run_command tool. Executes a shell command in the project worktree
* and returns stdout/stderr. Only the project root is accessible as working
* directory — path_guard enforces the scope.
*
* Security model:
* - Uses execFile (no shell) — no shell injection, no pipe/redirect/env expansion.
* - args passed as array, never a string.
* - 30s timeout default, configure per-call.
* - 32KB output cap with truncation (same pattern as web_fetch.ts).
* - Working directory restricted to project root via path_guard.
* - No background processes allowed (waits for completion).
*/
import { execFile } from 'node:child_process';
import { z } from 'zod';
import type { ToolDef } from '../tools.js';
const RunCommandInput = z.object({
command: z.string().min(1).max(256),
args: z.array(z.string()).default([]),
description: z.string().max(256).optional(),
timeout_ms: z.number().int().positive().max(120_000).optional(),
});
export type RunCommandInputT = z.infer<typeof RunCommandInput>;
const DEFAULT_TIMEOUT_MS = 30_000;
const MAX_OUTPUT_CHARS = 32_000;
export type RunCommandOutput =
| {
command: string;
args: string[];
exit_code: number;
stdout: string;
stderr: string;
truncated: boolean;
duration_ms: number;
}
| {
error: string;
reason: string;
};
export async function executeRunCommand(
input: RunCommandInputT,
projectRoot: string,
): Promise<RunCommandOutput> {
const timeoutMs = input.timeout_ms ?? DEFAULT_TIMEOUT_MS;
const startTime = Date.now();
return new Promise((resolve) => {
const child = execFile(
input.command,
input.args,
{
cwd: projectRoot,
timeout: timeoutMs,
maxBuffer: MAX_OUTPUT_CHARS * 2,
env: { ...process.env },
},
(err, stdout, stderr) => {
const durationMs = Date.now() - startTime;
// Truncate output if needed
const truncated = stdout.length + stderr.length > MAX_OUTPUT_CHARS;
const cappedStdout = truncated ? stdout.slice(0, MAX_OUTPUT_CHARS) : stdout;
const cappedStderr = truncated ? stderr.slice(0, Math.max(MAX_OUTPUT_CHARS - cappedStdout.length, 0)) : stderr;
const exitCode = err?.code === 'ENOENT' ? -1 : (err as Error & { code?: number })?.code ?? 0;
resolve({
command: input.command,
args: input.args,
exit_code: typeof exitCode === 'number' ? exitCode : 1,
stdout: cappedStdout,
stderr: cappedStderr,
truncated,
duration_ms: durationMs,
});
},
);
});
}
export const runCommand: ToolDef<RunCommandInputT> = {
name: 'run_command',
description:
'Run a shell command in the project workspace and return stdout + stderr. ' +
'The command runs in the project root directory. ' +
'Use for: building, testing, linting, git operations, running scripts. ' +
'Output is capped at 32KB. Timeout defaults to 30s (max 120s). ' +
'Security: args are passed as array (no shell injection). No background processes.',
inputSchema: RunCommandInput as unknown as z.ZodType<RunCommandInputT>,
jsonSchema: {
type: 'function',
function: {
name: 'run_command',
description:
'Execute a command in the project workspace. ' +
'Use for builds, tests, linting, git commands, and scripts. ' +
'The process runs with a 30s timeout and 32KB output cap.',
parameters: {
type: 'object',
properties: {
command: {
type: 'string',
description: 'Command to execute (e.g. pnpm, npm, npx, node, git, ls, cat).',
},
args: {
type: 'array',
items: { type: 'string' },
description: 'Arguments as array (e.g. ["run", "build"]). Never embedded in a shell string.',
},
description: {
type: 'string',
description: 'Optional human-readable description of what this command does.',
},
timeout_ms: {
type: 'integer',
description: 'Timeout in milliseconds. Default 30000, max 120000.',
},
},
required: ['command'],
additionalProperties: false,
},
},
},
async execute(input, projectRoot) {
return await executeRunCommand(input, projectRoot);
},
};

View File

@@ -0,0 +1,160 @@
import { z } from 'zod';
import { existsSync } from 'node:fs';
import { writeFile, unlink } from 'node:fs/promises';
import { join } from 'node:path';
import type { ToolDef } from '../tools/types.js';
import { ensureMemoryScaffold, getMemoryRoot } from '../memory/paths.js';
import { writeEntry, readTopicFiles } from '../memory/store.js';
const ManageMemoryInput = z.object({
topic: z.enum(['project', 'user', 'reference']).describe('Memory topic category'),
title: z.string().min(1).max(200).describe('Entry title (used as identifier for update/delete)'),
content: z.string().optional().describe('Memory content body (required for create/update)'),
tags: z.array(z.string()).optional().describe('Optional tags for search'),
action: z.enum(['create', 'update', 'delete']).describe('Action to perform'),
});
type InputT = z.infer<typeof ManageMemoryInput>;
function titleToFilename(title: string): string {
return (
title
.toLowerCase()
.replace(/[^a-z0-9]+/g, '-')
.replace(/(^-|-$)/g, '') + '.md'
);
}
/**
* Try to update the CoreTier SQLite database in addition to the file store.
* This is best-effort — CoreTier is optional (file store is primary).
*/
async function syncCoreTier(
_root: string,
_topic: string,
_title: string,
_content: string,
_tags: string[],
): Promise<void> {
// CoreTier SQLite backend is not available in this build — file store only.
}
export const manageMemoryTool: ToolDef<InputT> = {
name: 'manage_memory',
description:
'Create, update, or delete memory entries in .boocode/memory/ for cross-session recall. ' +
'Use to persist project conventions, user preferences, and architectural decisions. ' +
'Actions: create (write new entry), update (modify existing entry), delete (remove entry).',
inputSchema: ManageMemoryInput,
jsonSchema: {
type: 'function',
function: {
name: 'manage_memory',
description: 'Manage memory entries — create, update, or delete',
parameters: {
type: 'object',
properties: {
topic: {
type: 'string',
enum: ['project', 'user', 'reference'],
description: 'Memory topic category',
},
title: { type: 'string', description: 'Entry title (identifier for update/delete)' },
content: {
type: 'string',
description: 'Memory content body (required for create/update)',
},
tags: {
type: 'array',
items: { type: 'string' },
description: 'Optional tags for search',
},
action: {
type: 'string',
enum: ['create', 'update', 'delete'],
description: 'Action to perform',
},
},
required: ['topic', 'title', 'action'],
},
},
},
async execute(input: InputT, projectRoot: string): Promise<unknown> {
const root = getMemoryRoot(projectRoot);
await ensureMemoryScaffold(root);
const filename = titleToFilename(input.title);
if (input.action === 'create') {
if (!input.content) {
return { error: 'Content is required for create action.' };
}
await writeEntry(root, input.topic, input.title, input.content, input.tags ?? []);
await syncCoreTier(root, input.topic, input.title, input.content, input.tags ?? []);
return {
result: `Memory entry "${input.title}" created in .boocode/memory/${input.topic}/`,
};
}
if (input.action === 'update') {
if (!input.content) {
return { error: 'Content is required for update action.' };
}
// Resolve target file path — try computed filename first, then heading match
let targetPath = join(root, input.topic, filename);
if (!existsSync(targetPath)) {
const files = await readTopicFiles(root, input.topic);
const matched = [...files.keys()].find((name) => {
const content = files.get(name);
return content?.trimStart().startsWith(`## ${input.topic}: ${input.title}`);
});
if (matched) {
targetPath = join(root, input.topic, matched);
} else {
return {
error: `Memory entry "${input.title}" not found in .boocode/memory/${input.topic}/`,
};
}
}
const tagLine =
(input.tags ?? []).length > 0
? `> tags: ${(input.tags ?? []).join(', ')}\n\n`
: '\n';
const entry = `## ${input.topic}: ${input.title}\n${tagLine}${input.content}\n`;
await writeFile(targetPath, entry, 'utf8');
await syncCoreTier(root, input.topic, input.title, input.content, input.tags ?? []);
return {
result: `Memory entry "${input.title}" updated in .boocode/memory/${input.topic}/`,
};
}
if (input.action === 'delete') {
// Resolve target file path
let targetPath = join(root, input.topic, filename);
if (!existsSync(targetPath)) {
const files = await readTopicFiles(root, input.topic);
const matched = [...files.keys()].find((name) => {
const content = files.get(name);
return content?.trimStart().startsWith(`## ${input.topic}: ${input.title}`);
});
if (matched) {
targetPath = join(root, input.topic, matched);
} else {
return {
error: `Memory entry "${input.title}" not found in .boocode/memory/${input.topic}/`,
};
}
}
await unlink(targetPath);
return {
result: `Memory entry "${input.title}" deleted from .boocode/memory/${input.topic}/`,
};
}
return { error: `Unknown action: ${input.action}` };
},
};

View File

@@ -19,6 +19,11 @@ import {
getHotFiles,
getRoutes,
getMiddleware,
getCodeHealth,
getCodeImpact,
getTypeInfo,
getCodeMap,
getWikiArticle,
} from './codecontext/index.js';
// v1.13.17-cross-repo-reads: cross-repo read grant request tool. Paired
// with the pause-on-pending-grant branch in inference/tool-phase.ts and the
@@ -27,6 +32,21 @@ import { requestReadAccess } from '../request_read_access.js';
// v2.6.x: read-only tool that reads a tab's transcript by its session-scoped
// tab number. Needs DB/session context (ToolExecCtx 4th arg).
import { readTabByNumber } from '../read_tab_by_number.js';
// v2.x: memory management tools. file-based store with optional CoreTier
// (SQLite FTS5 + vector) hybrid search backend.
import { extractMemoryTool } from './extract_memory.js';
import { manageMemoryTool } from './manage_memory.js';
import { searchMemoryTool } from './search_memory.js';
// vWhale: command execution tool. Spawns processes in the project worktree
// with timeout and output cap. No shell — args are passed as array.
import { runCommand } from './execute-command.js';
// v2.x: background subagent tools. Non-blocking subagent execution with
// spawn/poll/collect lifecycle. Reuses existing sessions/chats/messages/tasks.
import {
spawnSubagent,
subagentStatus,
subagentResult,
} from './background-subagent-tools.js';
// v1.13.3: alpha-sorted by tool.name at module load. llama.cpp's prompt
// cache hits on byte-identical prefixes; the tool list lives near the top
@@ -75,6 +95,27 @@ export let ALL_TOOLS: ToolDef<unknown>[] = [
// v2.6.x: read a tab's transcript by its session-scoped tab number.
// Read-only; uses the ToolExecCtx 4th arg for DB/session access.
readTabByNumber as ToolDef<unknown>,
// v2.8.14-domain2-phase1: boocontext-backed tools. Backed by the boocontext
// MCP server. All read-only. Health, impact, types, map analysis.
getCodeHealth as ToolDef<unknown>,
getCodeImpact as ToolDef<unknown>,
getTypeInfo as ToolDef<unknown>,
getCodeMap as ToolDef<unknown>,
// v2.8.14-domain2-phase3: wiki mode + token-efficient scanning.
getWikiArticle as ToolDef<unknown>,
// v2.x: memory management tools. File-based store with optional CoreTier
// (SQLite FTS5 + vector) hybrid search backend.
extractMemoryTool as ToolDef<unknown>,
manageMemoryTool as ToolDef<unknown>,
searchMemoryTool as ToolDef<unknown>,
// vWhale: command execution. Spawns processes in the project worktree.
// Read-write; use with guard: restricted to project root via path_guard,
// no shell injection (execFile, not exec).
runCommand as ToolDef<unknown>,
// v2.x: background subagent tools. Non-blocking spawn/poll/collect lifecycle.
spawnSubagent as ToolDef<unknown>,
subagentStatus as ToolDef<unknown>,
subagentResult as ToolDef<unknown>,
].sort((a, b) => a.name.localeCompare(b.name));
export let TOOLS_BY_NAME: Record<string, ToolDef<unknown>> = Object.fromEntries(

View File

@@ -0,0 +1,376 @@
// v2.8.0: Workflow catalog — built-in workflow definitions that ship with
// BooCode. Each workflow is a metadata object with name, description, and a
// factory function that returns the workflow script source code.
//
// Built-in workflows are merged into the discovery list alongside file-based
// workflows from .boocode/workflows/. They take precedence over user-defined
// workflows with the same name.
import { createHash } from 'node:crypto';
// ---------------------------------------------------------------------------
// Types
// ---------------------------------------------------------------------------
/**
* A built-in workflow definition shipped with BooCode.
*/
export interface BuiltinWorkflow {
/** Unique workflow name (used to invoke via `WorkflowManager`). */
name: string;
/** Human-readable description of what this workflow does. */
description: string;
/** Optional ordered phases for UI progress display. */
phases?: Array<{ title: string; detail?: string }>;
/**
* Generate the workflow script source code for this workflow.
* The returned string must be valid JS that exports `meta` and a `default`
* async function matching the `WorkflowScript` shape.
*
* @param args - Optional arguments provided when the workflow is started.
*/
generateScript: (args?: Record<string, unknown>) => string;
}
// ---------------------------------------------------------------------------
// Script templates (shared helpers)
// ---------------------------------------------------------------------------
/**
* Stable JSON serialisation for generating deterministic cache keys from
* structured arguments. Keys are sorted so the same data always produces
* the same string regardless of property insertion order.
*/
function stableJson(value: unknown): string {
if (value === null) return 'null';
if (typeof value !== 'object') return JSON.stringify(value);
if (Array.isArray(value)) {
return `[${value.map(stableJson).join(',')}]`;
}
const keys = Object.keys(value as Record<string, unknown>).sort();
const pairs = keys.map((k) => `${JSON.stringify(k)}:${stableJson((value as Record<string, unknown>)[k])}`);
return `{${pairs.join(',')}}`;
}
/**
* Compute a deterministic SHA-256 fingerprint for a combined spec + args
* payload. Used by the resumability cache to detect unchanged agent tasks.
*
* Exported for testing.
*/
export function fingerprintAgentTask(
prompt: string,
spec: Record<string, unknown>,
args: string,
): string {
return createHash('sha256')
.update(stableJson({ prompt, spec, args }))
.digest('hex');
}
// ---------------------------------------------------------------------------
// Built-in workflow definitions
// ---------------------------------------------------------------------------
function generateDeepResearchScript(_args?: Record<string, unknown>): string {
return `
export const meta = {
name: 'deep-research',
description: 'Multi-phase deep research: scope, search, fetch, verify, synthesise.',
phases: [
{ title: 'Scope', detail: 'Define the research question and search criteria' },
{ title: 'Search', detail: 'Query web sources in parallel' },
{ title: 'Fetch', detail: 'Retrieve full content from top sources' },
{ title: 'Verify', detail: 'Cross-reference and validate findings' },
{ title: 'Synthesise', detail: 'Produce a final structured report' },
],
};
export default async function main(args) {
const query = args?.query ?? 'No query provided';
log('deep-research: starting with query: ' + query);
// Phase 1: Scope
phase('Scope');
const scope = await agent(
'Analyse this research query and produce a search plan with 3-5 key sub-questions: ' + query,
{ label: 'scope-analysis', phase: 'scope' },
);
log('Scope completed');
// Phase 2: Search
phase('Search');
const searchResults = await agent(
'Based on the scope, search for authoritative sources. Return a list of 3-5 URLs with brief annotations.',
{ label: 'web-search', phase: 'search' },
);
log('Search completed');
// Phase 3: Fetch
phase('Fetch');
const fetchedContent = await agent(
'Extract and summarise the key information from these sources: ' + JSON.stringify(searchResults),
{ label: 'content-fetch', phase: 'fetch' },
);
log('Fetch completed');
// Phase 4: Verify
phase('Verify');
const verified = await agent(
'Cross-reference the fetched information. Note any contradictions, gaps, or weak sources: ' + JSON.stringify(fetchedContent),
{ label: 'verification', phase: 'verify' },
);
log('Verify completed');
// Phase 5: Synthesise
phase('Synthesise');
const report = await agent(
'Synthesise the verified information into a structured report with findings, sources, and confidence levels: ' + JSON.stringify(verified),
{ label: 'synthesis', phase: 'synthesise' },
);
log('deep-research: completed');
return {
ok: true,
output: report,
phases: { scope, searchResults, fetchedContent, verified, report },
};
}
`.trim();
}
function generateReviewCodeScript(_args?: Record<string, unknown>): string {
return `
export const meta = {
name: 'review-code',
description: 'Multi-perspective code review: correctness, security, performance, then synthesise.',
phases: [
{ title: 'Correctness', detail: 'Check logic, edge cases, and correctness' },
{ title: 'Security', detail: 'Analyse for vulnerabilities and unsafe patterns' },
{ title: 'Performance', detail: 'Identify performance bottlenecks and optimisation opportunities' },
{ title: 'Synthesise', detail: 'Merge perspectives into a unified review report' },
],
};
export default async function main(args) {
const target = args?.target ?? args?.path ?? '';
log('review-code: starting review of: ' + (target || '(no target specified)'));
const context = await agent(
'Read the code at ' + (target || 'the provided context') + ' and produce a summary of its structure and purpose.',
{ label: 'read-context', phase: 'context' },
);
// Phase 1: Correctness
phase('Correctness');
const correctness = await agent(
'Review this code for correctness. Check logical errors, edge cases, type safety, and concurrency issues:\\n' + JSON.stringify(context),
{ label: 'correctness-review', phase: 'correctness' },
);
// Phase 2: Security
phase('Security');
const security = await agent(
'Review this code for security vulnerabilities. Check for injection, auth bypasses, unsafe deserialisation, secret exposure:\\n' + JSON.stringify(context),
{ label: 'security-review', phase: 'security' },
);
// Phase 3: Performance
phase('Performance');
const performance = await agent(
'Review this code for performance issues. Check algorithmic complexity, unnecessary allocations, I/O patterns, caching opportunities:\\n' + JSON.stringify(context),
{ label: 'performance-review', phase: 'performance' },
);
// Phase 4: Synthesise
phase('Synthesise');
const report = await agent(
'Merge these three review perspectives into one structured report with severity-ranked findings:\\n' +
'--- Correctness ---\\n' + JSON.stringify(correctness) + '\\n' +
'--- Security ---\\n' + JSON.stringify(security) + '\\n' +
'--- Performance ---\\n' + JSON.stringify(performance),
{ label: 'synthesis', phase: 'synthesise' },
);
log('review-code: completed');
return {
ok: true,
output: report,
reviews: { correctness, security, performance },
};
}
`.trim();
}
function generateFindIssuesScript(_args?: Record<string, unknown>): string {
return `
export const meta = {
name: 'find-issues',
description: 'Iterative issue discovery — keep surfacing issues until consecutive rounds find nothing new.',
phases: [
{ title: 'Analyse', detail: 'Analyse the codebase for issues' },
{ title: 'Check dry', detail: 'Verify no new issues remain' },
],
};
export default async function main(args) {
const target = args?.target ?? args?.path ?? '.';
const maxRounds = args?.maxRounds ?? 5;
log('find-issues: starting on ' + target + ' (max ' + maxRounds + ' rounds)');
const allIssues = [];
let dryRounds = 0;
let round = 0;
while (dryRounds < 2 && round < maxRounds) {
round++;
phase('Analyse');
const context = allIssues.length > 0
? 'Previously found issues (exclude these):\\n' + JSON.stringify(allIssues)
: 'No issues found yet.';
const newIssues = await agent(
'Analyse ' + target + ' for bugs, code smells, and anti-patterns.\\n' + context + '\\nReturn a JSON array of issues. If none found, return an empty array.',
{ label: 'round-' + round + '-analysis', phase: 'analyse' },
);
let parsed: unknown[] = [];
try {
if (typeof newIssues === 'string') {
parsed = JSON.parse(newIssues);
} else if (Array.isArray(newIssues)) {
parsed = newIssues;
}
} catch {
parsed = [];
}
if (parsed.length === 0) {
dryRounds++;
phase('Check dry');
log('Round ' + round + ': no new issues found (dry run ' + dryRounds + '/2)');
} else {
dryRounds = 0;
for (const issue of parsed) {
allIssues.push(issue);
}
log('Round ' + round + ': found ' + parsed.length + ' new issue(s)');
}
}
log('find-issues: completed after ' + round + ' rounds, ' + allIssues.length + ' total issues');
return {
ok: true,
output: allIssues,
totalRounds: round,
totalIssues: allIssues.length,
};
}
`.trim();
}
// ---------------------------------------------------------------------------
// Registry
// ---------------------------------------------------------------------------
/**
* All built-in workflow definitions shipped with BooCode.
*/
const BUILTIN_WORKFLOWS: BuiltinWorkflow[] = [
{
name: 'deep-research',
description:
'Performs multi-phase deep research: scope the question, search web sources in parallel, fetch full content, verify findings, and synthesise a structured report.',
phases: [
{ title: 'Scope', detail: 'Define the research question and search criteria' },
{ title: 'Search', detail: 'Query web sources in parallel' },
{ title: 'Fetch', detail: 'Retrieve full content from top sources' },
{ title: 'Verify', detail: 'Cross-reference and validate findings' },
{ title: 'Synthesise', detail: 'Produce a final structured report' },
],
generateScript: generateDeepResearchScript,
},
{
name: 'review-code',
description:
'Multi-perspective code review that analyses code for correctness, security vulnerabilities, and performance issues in parallel, then merges findings into a unified severity-ranked report.',
phases: [
{ title: 'Correctness', detail: 'Check logic, edge cases, and correctness' },
{ title: 'Security', detail: 'Analyse for vulnerabilities and unsafe patterns' },
{ title: 'Performance', detail: 'Identify performance bottlenecks' },
{ title: 'Synthesise', detail: 'Merge perspectives into a unified report' },
],
generateScript: generateReviewCodeScript,
},
{
name: 'find-issues',
description:
'Iterative issue discovery that runs analysis rounds until two consecutive passes find nothing new, ensuring comprehensive coverage without infinite loops.',
phases: [
{ title: 'Analyse', detail: 'Analyse the codebase for issues' },
{ title: 'Check dry', detail: 'Verify no new issues remain' },
],
generateScript: generateFindIssuesScript,
},
];
/**
* Read-only map of built-in workflows keyed by name.
*/
const BUILTIN_WORKFLOW_MAP = new Map<string, BuiltinWorkflow>(
BUILTIN_WORKFLOWS.map((w) => [w.name, w]),
);
/**
* Return all built-in workflow definitions.
*/
export function getBuiltinWorkflows(): BuiltinWorkflow[] {
return BUILTIN_WORKFLOWS;
}
/**
* Look up a built-in workflow by name.
*
* @param name - Workflow name (e.g. 'deep-research').
* @returns The built-in workflow, or undefined if not found.
*/
export function getBuiltinWorkflow(name: string): BuiltinWorkflow | undefined {
return BUILTIN_WORKFLOW_MAP.get(name);
}
/**
* Merge built-in workflow metadata into a list of file-discovered workflow
* entries. Built-in entries take precedence — if a user has a file-based
* workflow with the same name, the built-in version wins.
*
* @param fileWorkflows - Workflow metadata discovered from the filesystem.
* @returns Merged array with built-in workflows injected and duplicate names
* resolved (built-in wins).
*/
export function mergeBuiltinWorkflows(
fileWorkflows: Array<{ name: string; description: string; sourceFile?: string }>,
): Array<{ name: string; description: string; sourceFile?: string }> {
const seen = new Set<string>();
const result: Array<{ name: string; description: string; sourceFile?: string }> = [];
// Built-in workflows first (they take precedence)
for (const builtin of BUILTIN_WORKFLOWS) {
seen.add(builtin.name);
result.push({
name: builtin.name,
description: builtin.description,
// No sourceFile — built-in workflows are generated, not read from disk
});
}
// File-discovered workflows — skip any name already claimed by built-in
for (const fw of fileWorkflows) {
if (seen.has(fw.name)) continue;
seen.add(fw.name);
result.push(fw);
}
return result;
}

View File

@@ -0,0 +1,134 @@
// v2.8.0: Workflow file discovery — walks project-local and global workflow
// directories to find runnable scripts. Built-in workflows from the catalog
// are merged into the results (they take precedence over user-defined files).
// All functions exported for testing.
import { readdirSync, existsSync } from 'node:fs';
import { join, basename, extname } from 'node:path';
import { homedir } from 'node:os';
import { getBuiltinWorkflows, getBuiltinWorkflow } from './catalog.js';
/**
* Sentinel prefix used in `sourceFile` for built-in workflows from the
* catalog so callers (e.g. WorkflowManager) can detect and handle them
* by calling `generateScript()` instead of reading a file from disk.
*/
const BUILTIN_PREFIX = 'builtin:';
/**
* Metadata about a discovered workflow file (or built-in workflow).
*/
export interface WorkflowMeta {
/** Workflow name (file stem without .js extension). */
name: string;
/** Description loaded from the workflow module's `meta.description`.
* Empty string until loadWorkflowMeta() resolves it. */
description: string;
/** Absolute path to the .js file.
* For built-in workflows this is `'builtin:<name>'` — the caller
* should use `getBuiltinWorkflow(name)` and `generateScript()`
* instead of reading this path from disk. */
sourceFile: string;
}
/**
* Test whether a `WorkflowMeta.sourceFile` points to a built-in workflow
* (rather than a file on disk).
*
* @param meta - The workflow metadata to check.
*/
export function isBuiltinWorkflow(meta: WorkflowMeta): boolean {
return meta.sourceFile.startsWith(BUILTIN_PREFIX);
}
/**
* Find all workflow .js files in the standard search paths, merged with
* built-in workflows from the catalog.
*
* Priority order (first match wins for same-named workflows):
* 1. Built-in catalog (always takes precedence)
* 2. <projectRoot>/.boocode/workflows/ (project-local)
* 3. ~/.boocode/workflows/ (global, per-user)
*
* @param projectRoot - Absolute path to the current project root.
*/
export function discoverWorkflows(projectRoot: string): WorkflowMeta[] {
const seen = new Set<string>();
const results: WorkflowMeta[] = [];
// 1. Built-in workflows (highest priority)
for (const builtin of getBuiltinWorkflows()) {
seen.add(builtin.name);
results.push({
name: builtin.name,
description: builtin.description,
sourceFile: `${BUILTIN_PREFIX}${builtin.name}`,
});
}
// 2. Project-local + global file-based workflows
const dirs = [
join(projectRoot, '.boocode', 'workflows'),
join(homedir(), '.boocode', 'workflows'),
];
for (const dir of dirs) {
if (!existsSync(dir)) continue;
try {
const entries = readdirSync(dir);
for (const f of entries) {
if (!f.endsWith('.js')) continue;
const name = basename(f, '.js');
if (seen.has(name)) continue; // built-in shadows project-local,
// project-local shadows global
seen.add(name);
results.push({
name,
description: '',
sourceFile: join(dir, f),
});
}
} catch {
// Permission error on directory — skip silently
continue;
}
}
return results;
}
/**
* Find a single workflow by name across built-in catalog and search paths.
*
* Priority: built-in > project-local > global.
*
* @param name - Workflow name (without .js extension).
* @param projectRoot - Absolute path to the current project root.
*/
export function findWorkflow(
name: string,
projectRoot: string,
): WorkflowMeta | undefined {
// Check built-in catalog first
const builtin = getBuiltinWorkflow(name);
if (builtin) {
return {
name: builtin.name,
description: builtin.description,
sourceFile: `${BUILTIN_PREFIX}${builtin.name}`,
};
}
// Fall back to file-based discovery
return discoverWorkflows(projectRoot).find((w) => w.name === name);
}
/**
* Validate a candidate workflow file path.
* Checks that the file exists and has a .js extension.
*
* @param filePath - Absolute path to check.
*/
export function isValidWorkflowPath(filePath: string): boolean {
return extname(filePath) === '.js' && existsSync(filePath);
}

View File

@@ -0,0 +1,54 @@
// v2.8.0: Dynamic Workflow Engine — public surface.
//
// Re-exports all types and classes from the workflow sub-modules so consumers
// import from a single entry point:
//
// ```typescript
// import { WorkflowManager } from './services/workflow/index.js';
// ```
export { WorkflowManager } from './manager.js';
export type { WorkflowMetaInfo } from './manager.js';
export type { WorkflowEventHandler } from './manager.js';
export { discoverWorkflows, findWorkflow, isValidWorkflowPath, isBuiltinWorkflow } from './discovery.js';
export type { WorkflowMeta } from './discovery.js';
export {
loadWorkflowScript,
loadWorkflowScriptFromCode,
executeWorkflowScript,
executeWorkflowScriptFromCode,
buildSandbox,
transformEsmToCjs,
isEsmSyntax,
} from './sandbox.js';
export {
getBuiltinWorkflows,
getBuiltinWorkflow,
mergeBuiltinWorkflows,
fingerprintAgentTask,
} from './catalog.js';
export type { BuiltinWorkflow } from './catalog.js';
export {
cacheKey,
getCachedResult,
setCachedResult,
invalidateRun,
clearCache,
cacheSize,
} from './resumability.js';
export type { CachedResult } from './resumability.js';
export type {
WorkflowScript,
WorkflowScriptMeta,
WorkflowContext,
AgentTaskSpec,
AgentTaskResult,
WorkflowRun,
WorkflowRunStatus,
WorkflowEvent,
} from './types.js';

View File

@@ -0,0 +1,659 @@
// v2.8.0: WorkflowManager — ties discovery, sandbox, and inference dispatch
// together into a single orchestrator for multi-agent workflow scripts.
//
// Creates isolated sessions+chats for each agent() call within a workflow,
// dispatches inference via the existing pipeline, polls for completion, and
// returns structured results. All failures are returned as errors rather than
// thrown exceptions (catch-safe API).
import { randomUUID } from 'node:crypto';
import type { Sql } from '../../db.js';
import type { Config } from '../../config.js';
import type { FastifyBaseLogger } from 'fastify';
import type { Broker } from '../broker.js';
import type { UserStreamFrame } from '../../types/api.js';
import type {
WorkflowRun,
WorkflowRunStatus,
WorkflowContext,
WorkflowEvent,
AgentTaskSpec,
AgentTaskResult,
WorkflowScriptMeta,
} from './types.js';
import { discoverWorkflows, findWorkflow, isBuiltinWorkflow } from './discovery.js';
import { getBuiltinWorkflow } from './catalog.js';
import { cacheKey, getCachedResult, setCachedResult } from './resumability.js';
import {
executeWorkflowScript,
executeWorkflowScriptFromCode,
isEsmSyntax,
transformEsmToCjs,
} from './sandbox.js';
import { runInference } from '../inference/index.js';
import { readFileSync } from 'node:fs';
import vm from 'node:vm';
/**
* Maximum time to wait for a single agent task to complete (5 minutes).
* Beyond this, the task is treated as failed/timed out.
*/
const AGENT_TASK_TIMEOUT_MS = 300_000;
/**
* Polling interval when waiting for an agent task to finish.
*/
const POLL_INTERVAL_MS = 500;
/**
* Maximum time for the entire workflow run (30 minutes).
*/
const WORKFLOW_TIMEOUT_MS = 1_800_000;
/**
* Token budget tracker. Tracks total token spend across agent calls.
*/
class BudgetTracker {
total: number | null;
#spent = 0;
constructor(total: number | null) {
this.total = total;
}
spend(amount: number): void {
this.#spent += amount;
}
spent(): number {
return this.#spent;
}
remaining(): number {
if (this.total === null) return Infinity;
return Math.max(0, this.total - this.#spent);
}
}
/**
* Creates a no-op bounded publish function that avoids WS dependency
* for background workflow agent tasks. Messages are still persisted to DB.
*/
function noopPublish(): void {
/* intentional no-op */
}
function noopPublishUser(): void {
/* intentional no-op */
}
/**
* Callback type for workflow lifecycle events.
*/
export type WorkflowEventHandler = (event: WorkflowEvent) => void;
/**
* WorkflowManager — the orchestrator for sandboxed multi-agent workflows.
*/
export class WorkflowManager {
/** Active workflow runs by run ID. */
readonly #runs = new Map<string, WorkflowRunState>();
/** Registered event listeners. */
readonly #listeners = new Set<WorkflowEventHandler>();
constructor(
private sql: Sql,
private config: Config,
private log: FastifyBaseLogger,
private projectRoot: string,
private projectId: string,
private broker: Broker,
) {}
// ---- public API ----
/**
* Discover all available workflow scripts.
*/
listWorkflows(): WorkflowMetaInfo[] {
return discoverWorkflows(this.projectRoot).map((m) => ({
name: m.name,
sourceFile: m.sourceFile,
}));
}
/**
* Find a specific workflow by name.
*/
getWorkflow(name: string): WorkflowMetaInfo | undefined {
const found = findWorkflow(name, this.projectRoot);
if (!found) return undefined;
return { name: found.name, sourceFile: found.sourceFile };
}
/**
* Load the metadata (name, description, phases) from a workflow file
* without executing it.
*
* @param name - Workflow name.
* @returns The script's meta, or undefined if not found.
*/
async loadWorkflowMeta(name: string): Promise<WorkflowScriptMeta | undefined> {
const found = findWorkflow(name, this.projectRoot);
if (!found) return undefined;
// Built-in workflows: return meta directly from the catalog
if (isBuiltinWorkflow(found)) {
const builtin = getBuiltinWorkflow(name);
if (!builtin) return { name, description: '' };
return {
name: builtin.name,
description: builtin.description,
phases: builtin.phases,
};
}
try {
// Load meta by executing the script in a throwaway context
const context = this.#createMinimalContext('meta-loader');
const code = readFileSync(found.sourceFile, 'utf8');
const finalCode = isEsmSyntax(code) ? transformEsmToCjs(code) : code;
const sandboxData: Record<string, unknown> & {
module: { exports: Record<string, unknown> };
} = {
...context,
console: { log: () => {} },
module: { exports: {} },
exports: {},
};
vm.createContext(sandboxData as unknown as vm.Context);
new vm.Script(finalCode).runInContext(sandboxData as unknown as vm.Context, {
timeout: 10_000,
filename: found.sourceFile,
});
const meta = sandboxData.module.exports.meta as WorkflowScriptMeta | undefined;
return meta ?? { name, description: '' };
} catch {
return { name, description: '' };
}
}
/**
* Execute a workflow by name.
*
* @param name - The workflow name (without .js extension).
* @param args - Optional arguments to pass to the workflow function.
* @returns The run ID for tracking.
*/
async runWorkflow(
name: string,
args?: Record<string, unknown>,
): Promise<{ runId: string }> {
const found = findWorkflow(name, this.projectRoot);
if (!found) {
throw new Error(`Workflow not found: "${name}". ` +
`Check .boocode/workflows/ or ~/.boocode/workflows/ for a ${name}.js file.`);
}
const runId = randomUUID();
const startedAt = new Date().toISOString();
const state: WorkflowRunState = {
id: runId,
name,
status: 'running',
startedAt,
abortController: new AbortController(),
};
this.#runs.set(runId, state);
this.#emit({ type: 'run_started', runId, name });
// Run asynchronously — caller receives the runId immediately.
void this.#executeRun(state, found.sourceFile, args ?? {});
return { runId };
}
/**
* Get the current status of a workflow run.
*/
getRunStatus(runId: string): WorkflowRun | undefined {
const state = this.#runs.get(runId);
if (!state) return undefined;
return {
id: state.id,
name: state.name,
status: state.status,
started_at: state.startedAt,
finished_at: state.finishedAt,
error: state.error,
};
}
/**
* Cancel a running workflow. Best-effort — agent tasks in-flight will be
* aborted via AbortSignal.
*
* @param runId - The workflow run ID.
* @returns true if the workflow was found and cancelled.
*/
cancelRun(runId: string): boolean {
const state = this.#runs.get(runId);
if (!state || state.status !== 'running') return false;
state.status = 'cancelled';
state.finishedAt = new Date().toISOString();
state.abortController.abort();
this.#emit({ type: 'run_cancelled', runId, name: state.name });
return true;
}
/**
* Subscribe to workflow lifecycle events.
* Returns an unsubscribe function.
*/
onEvent(handler: WorkflowEventHandler): () => void {
this.#listeners.add(handler);
return () => {
this.#listeners.delete(handler);
};
}
// ---- internal execution ----
/**
* Execute the workflow script in the sandbox.
*/
async #executeRun(
state: WorkflowRunState,
sourceFile: string,
args: Record<string, unknown>,
): Promise<void> {
const BULTIN_MARKER = 'builtin:';
const budgetTracker = new BudgetTracker(null); // no fixed total yet
const runId = state.id;
try {
const context: WorkflowContext = {
agent: (prompt, opts) =>
this.#handleAgentCall(runId, prompt, opts ?? { prompt }, state.abortController.signal),
parallel: (thunks) =>
Promise.all(thunks.map((t) => t())),
pipeline: async (items, ...stages) => {
let result = [...items];
for (const stage of stages) {
result = await Promise.all(result.map(stage));
}
return result;
},
phase: (title) => {
this.#emit({ type: 'phase', runId, title });
},
log: (message) => {
this.#emit({ type: 'log', runId, message });
},
budget: {
total: budgetTracker.total,
spent: () => budgetTracker.spent(),
remaining: () => budgetTracker.remaining(),
},
args,
workflow: (nestedName, nestedArgs) =>
this.#handleNestedWorkflow(runId, nestedName, nestedArgs ?? {}, state.abortController.signal),
};
let result: unknown;
if (sourceFile.startsWith(BULTIN_MARKER)) {
// Built-in workflow: generate script from catalog and execute
const workflowName = sourceFile.slice(BULTIN_MARKER.length);
const builtin = getBuiltinWorkflow(workflowName);
if (!builtin) {
throw new Error(`Built-in workflow "${workflowName}" not found in catalog`);
}
const scriptCode = builtin.generateScript(args);
result = await executeWorkflowScriptFromCode(scriptCode, context, args, sourceFile);
} else {
result = await executeWorkflowScript(sourceFile, context, args);
}
// Only update to completed if we haven't been cancelled mid-flight.
if (state.status !== 'cancelled') {
state.status = 'completed';
state.finishedAt = new Date().toISOString();
}
// Store result
state.result = result;
this.#emit({ type: 'run_completed', runId, name: state.name });
} catch (err) {
if (state.status === 'cancelled') return; // already handled
const message = err instanceof Error ? err.message : String(err);
state.status = 'failed';
state.finishedAt = new Date().toISOString();
state.error = message;
this.#emit({ type: 'run_failed', runId, name: state.name, error: message });
}
}
/**
* Handle an `agent()` call from within a workflow.
* Creates a session + chat, dispatches inference, polls for completion.
*/
async #handleAgentCall(
runId: string,
prompt: string,
spec: AgentTaskSpec,
signal: AbortSignal,
): Promise<unknown> {
const label = spec.label ?? `agent-${prompt.slice(0, 40).replace(/\s+/g, '_')}`;
this.#emit({ type: 'agent_task_started', runId, label });
try {
const result = await this.executeAgentTask(prompt, spec, signal);
this.#emit({ type: 'agent_task_completed', runId, label });
return result;
} catch (err) {
this.#emit({ type: 'agent_task_completed', runId, label });
const message = err instanceof Error ? err.message : String(err);
return {
ok: false,
output: null,
error: message,
} satisfies AgentTaskResult;
}
}
/**
* Core agent task execution: create session/chat, dispatch inference, poll.
*
* Exported as a public method for testing.
*/
async executeAgentTask(
prompt: string,
spec: AgentTaskSpec,
signal?: AbortSignal,
): Promise<unknown> {
// ---- 0. Check resumability cache before creating a new task ----
const cacheKeyStr = cacheKey(spec, '');
const cached = getCachedResult(cacheKeyStr);
if (cached) {
return { ...cached, cached: true } satisfies AgentTaskResult;
}
const model = spec.model ?? null;
// ---- 1. Create a session for this agent task ----
const sessionName = `workflow-agent-${spec.label ?? 'task'}`;
const sessionResult = await this.sql.begin(async (tx) => {
const [session] = await tx<{ id: string }[]>`
INSERT INTO sessions (project_id, name, model)
VALUES (${this.projectId}, ${sessionName}, ${model ?? 'qwen3.6-35b-a3b-mxfp4'})
RETURNING id
`;
if (!session) throw new Error('Failed to create workflow agent session');
return session;
});
const sessionId = sessionResult.id;
// ---- 2. Create a chat in this session ----
const chatResult = await this.sql.begin(async (tx) => {
const [chat] = await tx<{ id: string }[]>`
INSERT INTO chats (session_id, name)
VALUES (${sessionId}, ${spec.label ?? null})
RETURNING id
`;
if (!chat) throw new Error('Failed to create workflow agent chat');
return chat;
});
const chatId = chatResult.id;
// ---- 3. Insert user message + streaming assistant message ----
const { userMessageId, assistantMessageId } = await this.sql.begin(async (tx) => {
const [userMsg] = await tx<{ id: string }[]>`
INSERT INTO messages (session_id, chat_id, role, content, status, created_at)
VALUES (${sessionId}, ${chatId}, 'user', ${prompt}, 'complete', clock_timestamp())
RETURNING id
`;
const [assistantMsg] = await tx<{ id: string }[]>`
INSERT INTO messages (session_id, chat_id, role, content, status, created_at)
VALUES (${sessionId}, ${chatId}, 'assistant', '', 'streaming', clock_timestamp())
RETURNING id
`;
return {
userMessageId: userMsg!.id,
assistantMessageId: assistantMsg!.id,
};
});
// ---- 4. Dispatch inference ----
// Create a bounded InferenceContext that won't crash on missing WS
const ctx: import('../inference/types.js').InferenceContext = {
sql: this.sql,
config: this.config,
log: this.log,
publish: noopPublish as unknown as import('../inference/types.js').FramePublisher,
publishUser: noopPublishUser as unknown as (frame: UserStreamFrame) => void,
broker: this.broker,
};
// Create a merged signal (workflow cancellation + optional caller signal)
const mergedController = new AbortController();
const onAbort = () => mergedController.abort();
signal?.addEventListener('abort', onAbort, { once: true });
const inferencePromise = runInference(
ctx,
sessionId,
chatId,
assistantMessageId,
mergedController.signal,
).finally(() => {
signal?.removeEventListener('abort', onAbort);
});
// ---- 5. Poll for completion ----
try {
const result = await this.#pollForCompletion(
chatId,
assistantMessageId,
inferencePromise,
mergedController.signal,
);
// Cache successful results for resumability
if (typeof result === 'object' && result !== null && (result as Record<string, unknown>).ok === true) {
setCachedResult(cacheKeyStr, {
ok: true,
output: (result as Record<string, unknown>).output,
token_usage: (result as Record<string, unknown>).token_usage as
| { prompt: number; completion: number }
| undefined,
});
}
return result;
} catch (err) {
if ((err as Error)?.message === 'cancelled') {
return { ok: false, output: null, error: 'Task was cancelled' } satisfies AgentTaskResult;
}
return {
ok: false,
output: null,
error: err instanceof Error ? err.message : String(err),
} satisfies AgentTaskResult;
}
}
/**
* Poll the messages table until the assistant message status changes
* from 'streaming' to 'complete' / 'failed' / 'cancelled'.
*/
async #pollForCompletion(
chatId: string,
assistantMessageId: string,
inferencePromise: Promise<void>,
signal: AbortSignal,
): Promise<unknown> {
// Wait for either inference to finish or timeout
const timeout = new Promise<never>((_, reject) => {
const timer = setTimeout(() => {
reject(new Error(`Agent task timed out after ${AGENT_TASK_TIMEOUT_MS}ms`));
}, AGENT_TASK_TIMEOUT_MS);
signal.addEventListener('abort', () => {
clearTimeout(timer);
reject(new Error('cancelled'));
}, { once: true });
});
// Poll loop — runs until inference completes, timeout, or cancellation
const pollLoop = (async () => {
// eslint-disable-next-line no-constant-condition
while (true) {
await new Promise((resolve) => setTimeout(resolve, POLL_INTERVAL_MS));
const rows = await this.sql<{
status: string;
content: string;
tool_calls: unknown;
tokens_used: number | null;
}[]>`
SELECT m.status, m.content, m.role,
(SELECT jsonb_agg(p.payload ORDER BY p.sequence)
FROM message_parts p
WHERE p.message_id = m.id AND p.kind = 'tool_call' AND p.hidden_at IS NULL) AS tool_calls,
m.tokens_used
FROM messages m
WHERE m.id = ${assistantMessageId}
`;
const msg = rows[0];
if (!msg) {
throw new Error(`Assistant message ${assistantMessageId} not found`);
}
if (msg.status === 'complete') {
return {
ok: true,
output: msg.content,
token_usage: msg.tokens_used ? { prompt: 0, completion: msg.tokens_used } : undefined,
};
}
if (msg.status === 'failed' || msg.status === 'cancelled') {
return {
ok: false,
output: msg.content || null,
error: `Assistant message ended with status: ${msg.status}`,
};
}
// Still streaming — continue polling
}
})();
// Race: polling vs timeout vs inference error vs cancellation
try {
return await Promise.race([pollLoop, timeout]);
} finally {
// Ensure inference is settled (but don't block on it)
inferencePromise.catch(() => {});
}
}
/**
* Handle a nested `workflow()` call from within a workflow.
* Runs the named workflow with the given args and returns its result.
*/
async #handleNestedWorkflow(
parentRunId: string,
name: string,
args: Record<string, unknown>,
signal: AbortSignal,
): Promise<unknown> {
const found = findWorkflow(name, this.projectRoot);
if (!found) {
return { ok: false, output: null, error: `Nested workflow not found: "${name}"` };
}
const nestedRunId = randomUUID();
const startedAt = new Date().toISOString();
const nestedState: WorkflowRunState = {
id: nestedRunId,
name,
status: 'running',
startedAt,
abortController: new AbortController(),
};
this.#runs.set(nestedRunId, nestedState);
this.#emit({ type: 'run_started', runId: nestedRunId, name });
// Link parent cancellation to nested
signal.addEventListener('abort', () => {
nestedState.abortController.abort();
}, { once: true });
await this.#executeRun(nestedState, found.sourceFile, args);
if (nestedState.status === 'cancelled') {
return { ok: false, output: null, error: 'Nested workflow cancelled' };
}
if (nestedState.status === 'failed') {
return { ok: false, output: null, error: nestedState.error };
}
return { ok: true, output: nestedState.result };
}
/**
* Create a minimal WorkflowContext for non-execution purposes
* (e.g. loading meta).
*/
#createMinimalContext(runId: string): Record<string, unknown> {
return {
agent: () => Promise.reject(new Error('Not available in this context')),
parallel: () => Promise.reject(new Error('Not available in this context')),
pipeline: () => Promise.reject(new Error('Not available in this context')),
phase: () => {},
log: () => {},
budget: { total: null, spent: () => 0, remaining: () => Infinity },
args: {},
workflow: () => Promise.reject(new Error('Not available in this context')),
};
}
/**
* Emit a workflow event to all registered listeners.
*/
#emit(event: WorkflowEvent): void {
for (const handler of this.#listeners) {
try {
handler(event);
} catch {
// Swallow listener errors — one bad listener shouldn't break others
}
}
}
}
// ---- internal types ----
/**
* Metadata returned from listWorkflows / getWorkflow.
*/
export interface WorkflowMetaInfo {
name: string;
sourceFile: string;
}
/**
* Internal mutable state for an active workflow run.
*/
interface WorkflowRunState {
id: string;
name: string;
status: WorkflowRunStatus;
startedAt: string;
finishedAt?: string;
error?: string;
result?: unknown;
abortController: AbortController;
}

Some files were not shown because too many files have changed in this diff Show More