v1.9.7: ask_user_input elicitation tool

2026-05-18 02:15:18 +00:00
parent adb5d7b3bb
commit d85b17081e
9 changed files with 710 additions and 4 deletions
--- a/apps/server/src/routes/messages.ts
+++ b/apps/server/src/routes/messages.ts
@@ -1,7 +1,7 @@
 import type { FastifyInstance } from 'fastify';
 import { z } from 'zod';
 import type { Sql } from '../db.js';
-import type { Chat, Message, Session } from '../types/api.js';
+import type { Chat, Message, Session, ToolCall } from '../types/api.js';

 const SendBody = z.object({
  content: z.string().min(1).max(64_000),
@@ -14,6 +14,39 @@ const ContinueBody = z.object({
  sentinel_message_id: z.string().uuid(),
 });

+// Batch 9.7: ask_user_input answer submission. Defensive shape — the question
+// content is echoed back for traceability but the server does NOT trust it
+// (the source of truth is the assistant message's tool_calls.args.questions).
+const AnswerUserInputBody = z.object({
+  tool_call_id: z.string().min(1),
+  answers: z
+    .array(
+      z.object({
+        question: z.string(),
+        selected_options: z.array(z.string()),
+        free_text: z.string().nullable(),
+      }),
+    )
+    .min(1)
+    .max(3),
+});
+
+// Same shape the model declared via the tool's zod input. Re-derived here so
+// the route can validate args without depending on services/tools.ts (which
+// would pull in fs/path_guard for nothing).
+const AskUserInputArgs = z.object({
+  questions: z
+    .array(
+      z.object({
+        question: z.string(),
+        type: z.enum(['single_select', 'multi_select']),
+        options: z.array(z.string()).min(1),
+      }),
+    )
+    .min(1)
+    .max(3),
+});
+
 interface MessageHandlers {
  enqueueInference: (sessionId: string, chatId: string, assistantMessageId: string, user: string) => void;
  enqueueCompact: (sessionId: string, chatId: string, compactMessageId: string, user: string) => void;
@@ -24,6 +57,13 @@ interface MessageHandlers {
    content: string
  ) => void;
  publishMessagesDeleted: (sessionId: string, chatId: string, messageIds: string[]) => void;
+  // Batch 9.7: lets the answer endpoint emit the tool_result frame that the
+  // pause path intentionally skipped. Matches SkillInvokeHandlers in
+  // routes/skills.ts so index.ts can pass the same broker.publish adapter.
+  publishSessionFrame: (
+    sessionId: string,
+    frame: Record<string, unknown> & { type: string }
+  ) => void;
  cancelInference: (sessionId: string, chatId: string) => Promise<boolean>;
  hasActiveInference: (chatId: string) => boolean;
 }
@@ -389,4 +429,169 @@ export function registerMessageRoutes(
      return result;
    }
  );
+
+  // Batch 9.7: resume an ask_user_input pause. Validates the body matches the
+  // question shape the model declared, UPDATEs the pending tool row's
+  // tool_results to the AnswerSet, publishes the deferred tool_result frame,
+  // and enqueues the next assistant turn. Error codes per spec:
+  //   400 invalid_body / mismatched_answer_shape
+  //   404 chat_not_found / unknown_tool_call_id
+  //   409 tool_call_already_answered
+  app.post<{ Params: { id: string } }>(
+    '/api/chats/:id/answer_user_input',
+    async (req, reply) => {
+      const parsed = AnswerUserInputBody.safeParse(req.body);
+      if (!parsed.success) {
+        reply.code(400);
+        return { error: 'invalid_body', details: parsed.error.flatten() };
+      }
+      const { tool_call_id, answers } = parsed.data;
+
+      const chatRows = await sql<Chat[]>`
+        SELECT id, session_id FROM chats WHERE id = ${req.params.id} AND status = 'open'
+      `;
+      if (chatRows.length === 0) {
+        reply.code(404);
+        return { error: 'chat_not_found' };
+      }
+      const chat = chatRows[0]!;
+      const sessionId = chat.session_id;
+
+      // Find the assistant message that emitted this tool_call. Scoped by
+      // chat_id + role to avoid cross-chat lookups; ordered by created_at DESC
+      // because the most recent issuance wins when an LLM reuses call IDs
+      // across turns (the older, already-answered one is a different row with
+      // populated tool_results downstream).
+      const callerRows = await sql<{ id: string; tool_calls: ToolCall[] | null }[]>`
+        SELECT id, tool_calls FROM messages
+        WHERE chat_id = ${chat.id}
+          AND role = 'assistant'
+          AND tool_calls IS NOT NULL
+        ORDER BY created_at DESC
+      `;
+      let foundCall: ToolCall | null = null;
+      for (const row of callerRows) {
+        const match = row.tool_calls?.find((tc) => tc.id === tool_call_id);
+        if (match) {
+          foundCall = match;
+          break;
+        }
+      }
+      if (!foundCall) {
+        reply.code(404);
+        return { error: 'unknown_tool_call_id' };
+      }
+      if (foundCall.name !== 'ask_user_input') {
+        reply.code(400);
+        return { error: 'tool_call_not_ask_user_input' };
+      }
+
+      // Validate the args themselves — the LLM could have emitted bad JSON.
+      const argsParsed = AskUserInputArgs.safeParse(foundCall.args);
+      if (!argsParsed.success) {
+        reply.code(400);
+        return { error: 'mismatched_answer_shape', detail: 'tool_call args invalid' };
+      }
+      const questions = argsParsed.data.questions;
+      if (answers.length !== questions.length) {
+        reply.code(400);
+        return {
+          error: 'mismatched_answer_shape',
+          detail: `expected ${questions.length} answer(s), got ${answers.length}`,
+        };
+      }
+      for (let i = 0; i < questions.length; i++) {
+        const q = questions[i]!;
+        const a = answers[i]!;
+        for (const sel of a.selected_options) {
+          if (!q.options.includes(sel)) {
+            reply.code(400);
+            return {
+              error: 'mismatched_answer_shape',
+              detail: `answer ${i + 1} contains option not in question: ${sel}`,
+            };
+          }
+        }
+        if (q.type === 'single_select' && a.selected_options.length > 1) {
+          reply.code(400);
+          return {
+            error: 'mismatched_answer_shape',
+            detail: `answer ${i + 1} has multiple selections on single_select`,
+          };
+        }
+        const hasOpt = a.selected_options.length > 0;
+        const hasText = a.free_text !== null && a.free_text.trim().length > 0;
+        if (!hasOpt && !hasText) {
+          reply.code(400);
+          return { error: 'mismatched_answer_shape', detail: `answer ${i + 1} is empty` };
+        }
+      }
+
+      // Find the pending tool row. ORDER BY created_at DESC + LIMIT 1 picks
+      // the most recent row with this tool_call_id; the already-answered
+      // check below guards against UPDATE-ing a stale answer.
+      const toolRows = await sql<{
+        id: string;
+        tool_results: { tool_call_id: string; output: unknown } | null;
+      }[]>`
+        SELECT id, tool_results FROM messages
+        WHERE chat_id = ${chat.id}
+          AND role = 'tool'
+          AND tool_results->>'tool_call_id' = ${tool_call_id}
+        ORDER BY created_at DESC
+        LIMIT 1
+      `;
+      const toolRow = toolRows[0];
+      if (!toolRow) {
+        reply.code(404);
+        return { error: 'unknown_tool_call_id', detail: 'tool message not found' };
+      }
+      if (toolRow.tool_results && toolRow.tool_results.output !== null) {
+        reply.code(409);
+        return { error: 'tool_call_already_answered' };
+      }
+
+      const answerSet = { answers };
+      const newToolResults = {
+        tool_call_id,
+        output: answerSet,
+        truncated: false,
+      };
+
+      const result = await sql.begin(async (tx) => {
+        await tx`
+          UPDATE messages
+          SET tool_results = ${tx.json(newToolResults as never)}
+          WHERE id = ${toolRow.id}
+        `;
+        const [assistantMsg] = await tx<{ id: string }[]>`
+          INSERT INTO messages (session_id, chat_id, role, content, status, created_at)
+          VALUES (${sessionId}, ${chat.id}, 'assistant', '', 'streaming', clock_timestamp())
+          RETURNING id
+        `;
+        await tx`UPDATE sessions SET updated_at = clock_timestamp() WHERE id = ${sessionId}`;
+        await tx`UPDATE chats SET updated_at = clock_timestamp() WHERE id = ${chat.id}`;
+        return {
+          tool_message_id: toolRow.id,
+          assistant_message_id: assistantMsg!.id,
+        };
+      });
+
+      // Publish the deferred tool_result frame. useSessionStream's reducer
+      // updates the matching tool_run.result so AskUserInputCard flips into
+      // its read-only "answered" mode without a refetch.
+      handlers.publishSessionFrame(sessionId, {
+        type: 'tool_result',
+        tool_message_id: result.tool_message_id,
+        tool_call_id,
+        chat_id: chat.id,
+        output: answerSet,
+        truncated: false,
+      });
+      handlers.enqueueInference(sessionId, chat.id, result.assistant_message_id, 'default');
+
+      reply.code(202);
+      return result;
+    },
+  );
 }