openclaw
diff --git a/extensions/qa-lab/src/providers/aimock/server.ts b/extensions/qa-lab/src/providers/aimock/server.ts
Lines changed: 17 additions & 0 deletions
diff --git a/extensions/qa-lab/src/providers/mock-openai/server.test.ts b/extensions/qa-lab/src/providers/mock-openai/server.test.ts
Lines changed: 53 additions & 0 deletions
diff --git a/extensions/qa-lab/src/providers/mock-openai/server.ts b/extensions/qa-lab/src/providers/mock-openai/server.ts
Lines changed: 41 additions & 0 deletions
@@ -19,6 +19,7 @@ type AimockRequestSnapshot = {
   plannedToolCallId?: string;
   plannedToolName?: string;
   toolOutputCallId?: string;
+  toolOutputStructuredError?: true;
 };
 
 function writeJson(res: ServerResponse, status: number, body: unknown) {
@@ -100,6 +101,21 @@ function extractToolOutputCallId(body: ChatCompletionRequest | null | undefined)
   return "";
 }
 
+function extractToolOutputStructuredError(body: ChatCompletionRequest | null | undefined) { // True when the newest "tool" message carries an explicit error flag.
+  const messages = requestMessages(body);
+  for (let index = messages.length - 1; index >= 0; index -= 1) { // Walk from the newest message to the oldest.
+    const message = messages[index] as {
+      role?: unknown;
+      isError?: unknown; // camelCase spelling of the flag
+      is_error?: unknown; // snake_case spelling of the flag
+    };
+    if (message?.role === "tool") {
+      return message.isError === true || message.is_error === true; // Only the literal boolean true counts; older tool messages are never inspected.
+    }
+  }
+  return false; // No "tool" message was found.
+}
+
 function countImageInputs(value: unknown): number {
   if (Array.isArray(value)) {
     return value.reduce((sum, entry) => sum + countImageInputs(entry), 0);
@@ -170,6 +186,7 @@ function toRequestSnapshot(entry: JournalEntry): AimockRequestSnapshot {
     plannedToolCallId: extractPlannedToolCallId(entry),
     plannedToolName: extractPlannedToolName(entry),
     toolOutputCallId: extractToolOutputCallId(body) || undefined,
+    ...(extractToolOutputStructuredError(body) ? { toolOutputStructuredError: true } : {}),
   };
 }
 
 
@@ -3752,6 +3752,59 @@ describe("qa mock openai server", () => {
     expect(debug.allInputText).toContain("Delegate one bounded QA task");
   });
 
+  it("exposes structured Anthropic tool_result errors in debug snapshots", async () => { // Checks that an is_error tool_result sent to /v1/messages shows up in /debug/last-request.
+    const server = await startQaMockOpenAiServer({
+      host: "127.0.0.1",
+      port: 0,
+    });
+    cleanups.push(async () => { // Register server shutdown with the suite's cleanups list.
+      await server.stop();
+    });
+
+    const response = await fetch(`${server.baseUrl}/v1/messages`, { // POST an Anthropic-style messages request to the mock.
+      method: "POST",
+      headers: { "content-type": "application/json" },
+      body: JSON.stringify({
+        model: "claude-opus-4-8",
+        max_tokens: 256,
+        messages: [
+          {
+            role: "assistant",
+            content: [
+              {
+                type: "tool_use", // The tool call that the following tool_result answers.
+                id: "toolu_mock_read_error",
+                name: "read",
+                input: { path: "/missing" },
+              },
+            ],
+          },
+          {
+            role: "user",
+            content: [
+              {
+                type: "tool_result",
+                tool_use_id: "toolu_mock_read_error", // Matches the tool_use id above.
+                is_error: true, // The structured error flag under test.
+                content: "ENOENT: no such file or directory",
+              },
+            ],
+          },
+        ],
+      }),
+    });
+    expect(response.status).toBe(200);
+
+    const debugResponse = await fetch(`${server.baseUrl}/debug/last-request`); // Read back the snapshot recorded for the request above.
+    expect(debugResponse.status).toBe(200);
+    const debug = (await debugResponse.json()) as {
+      toolOutputCallId: string;
+      toolOutputStructuredError?: boolean;
+    };
+    expect(debug.toolOutputCallId).toBe("toolu_mock_read_error"); // The snapshot identifies the tool_result by its tool_use id.
+    expect(debug.toolOutputStructuredError).toBe(true); // The is_error flag is surfaced in the snapshot.
+  });
+
   it("streams Anthropic /v1/messages tool_use responses as SSE", async () => {
     const server = await startQaMockOpenAiServer({
       host: "127.0.0.1",
 
@@ -106,6 +106,7 @@ type MockOpenAiRequestSnapshot = {
   plannedToolName?: string;
   plannedToolArgs?: Record<string, unknown>;
   toolOutputCallId?: string;
+  toolOutputStructuredError?: true;
 };
 
 // Anthropic /v1/messages request/response shapes the mock actually needs.
@@ -125,6 +126,7 @@ type AnthropicMessageContentBlock =
   | {
       type: "tool_result";
       tool_use_id: string;
+      is_error?: boolean;
       content: string | Array<{ type: "text"; text: string }>;
     }
   | { type: "image"; source: Record<string, unknown> };
@@ -395,6 +397,13 @@ function extractFunctionCallOutputCallId(item: ResponsesInputItem) {
   );
 }
 
+function functionCallOutputIsStructuredError(item: ResponsesInputItem) { // Reports whether a function_call_output item is explicitly flagged as an error.
+  if (item.type !== "function_call_output") {
+    return false; // Any other item type is never treated as a structured error.
+  }
+  return item.is_error === true || item.isError === true; // Either spelling is accepted; the value must be the literal boolean true.
+}
+
 function extractToolOutput(input: ResponsesInputItem[]) {
   const lastUserIndex = findLastUserIndex(input);
   for (let index = input.length - 1; index > lastUserIndex; index -= 1) {
@@ -425,6 +434,35 @@ function extractToolOutput(input: ResponsesInputItem[]) {
   return "";
 }
 
+function extractToolOutputStructuredError(input: ResponsesInputItem[]) { // Structured-error flag of the tool output item selected from `input`; false when none qualifies.
+  const lastUserIndex = findLastUserIndex(input);
+  for (let index = input.length - 1; index > lastUserIndex; index -= 1) { // Pass 1: only items after lastUserIndex, newest first.
+    const item = input[index];
+    const output = extractFunctionCallOutputText(item);
+    if (output) { // Items whose extracted output text is falsy are skipped.
+      return functionCallOutputIsStructuredError(item);
+    }
+  }
+  for (let index = input.length - 1; index >= 0; index -= 1) { // Pass 2: the whole input, newest first.
+    const item = input[index];
+    const output = extractFunctionCallOutputText(item);
+    if (output) {
+      const laterUserTexts = input // Texts of user items that come after this output, with falsy results dropped.
+        .slice(index + 1)
+        .filter((laterItem) => laterItem.role === "user" && Array.isArray(laterItem.content))
+        .map((laterItem) => extractInputText(laterItem.content as unknown[]))
+        .filter(Boolean);
+      if (
+        laterUserTexts.length > 0 &&
+        laterUserTexts.every((text) => isToolOutputContinuationText(text))
+      ) { // Accept this output only when at least one later user text exists and all of them pass isToolOutputContinuationText.
+        return functionCallOutputIsStructuredError(item);
+      }
+    }
+  }
+  return false; // Neither pass found a qualifying tool output.
+}
+
 function extractToolOutputCallId(input: ResponsesInputItem[]) {
   const lastUserIndex = findLastUserIndex(input);
   for (let index = input.length - 1; index > lastUserIndex; index -= 1) {
@@ -2867,6 +2905,7 @@ function convertAnthropicMessagesToResponsesInput(params: {
             type: "function_call_output",
             call_id: block.tool_use_id,
             output,
+            ...(block.is_error === true ? { is_error: true } : {}),
           });
         }
         continue;
@@ -3235,6 +3274,7 @@ export async function startQaMockOpenAiServer(params?: { host?: string; port?: n
           plannedToolName: extractPlannedToolName(events),
           plannedToolArgs: extractPlannedToolArgs(events),
           toolOutputCallId: extractToolOutputCallId(input) || undefined,
+          ...(extractToolOutputStructuredError(input) ? { toolOutputStructuredError: true } : {}),
         };
         requests.push(lastRequest);
         if (requests.length > MOCK_OPENAI_DEBUG_REQUEST_LIMIT) {
@@ -3293,6 +3333,7 @@ export async function startQaMockOpenAiServer(params?: { host?: string; port?: n
           plannedToolName: extractPlannedToolName(events),
           plannedToolArgs: extractPlannedToolArgs(events),
           toolOutputCallId: extractToolOutputCallId(input) || undefined,
+          ...(extractToolOutputStructuredError(input) ? { toolOutputStructuredError: true } : {}),
         };
         requests.push(lastRequest);
         if (requests.length > MOCK_OPENAI_DEBUG_REQUEST_LIMIT) {