Merge 28bf07d613 into bc432d8435

2026-01-30 18:26:11 +08:00 · 2026-01-30 18:26:11 +08:00 · 1b9da76f17
commit 1b9da76f17
parent bc432d8435 28bf07d613
2 changed files with 232 additions and 2 deletions
--- a/src/agents/session-transcript-repair.test.ts
+++ b/src/agents/session-transcript-repair.test.ts
@ -1,6 +1,6 @@
 import type { AgentMessage } from "@mariozechner/pi-agent-core";
 import { describe, expect, it } from "vitest";
-import { sanitizeToolUseResultPairing } from "./session-transcript-repair.js";
+import { isIncompleteToolCall, sanitizeToolUseResultPairing } from "./session-transcript-repair.js";

 describe("sanitizeToolUseResultPairing", () => {
  it("moves tool results directly after tool calls and inserts missing results", () => {
@ -109,4 +109,201 @@ describe("sanitizeToolUseResultPairing", () => {
    expect(out.some((m) => m.role === "toolResult")).toBe(false);
    expect(out.map((m) => m.role)).toEqual(["user", "assistant"]);
  });
+
+  it("skips incomplete tool calls (partialJson, no arguments) and drops their synthetic results", () => {
+    // Transcript left behind by a terminated stream: the assistant turn ends
+    // in a tool call that only carries `partialJson` (no `arguments`), and
+    // session persistence has already appended a synthetic error toolResult
+    // for that call id.
+    const assistantTurn = {
+      role: "assistant",
+      content: [
+        { type: "text", text: "Let me write that file:" },
+        {
+          type: "toolCall",
+          id: "toolu_terminated",
+          name: "write",
+          partialJson: '{"path": "/tmp/test.md", "content": "# Hello',
+        },
+      ],
+    } satisfies AgentMessage;
+    const syntheticResult = {
+      role: "toolResult",
+      toolCallId: "toolu_terminated",
+      toolName: "write",
+      content: [
+        {
+          type: "text",
+          text: "[moltbot] missing tool result in session history; inserted synthetic error result for transcript repair.",
+        },
+      ],
+      isError: true,
+    } satisfies AgentMessage;
+    const userTurn = { role: "user", content: "what happened?" } satisfies AgentMessage;
+
+    const repaired = sanitizeToolUseResultPairing([assistantTurn, syntheticResult, userTurn]);
+
+    // Skipping the unfinished call leaves the assistant turn with zero tool
+    // calls, so the orphaned synthetic result must be gone and nothing new
+    // may be synthesized in its place.
+    expect(repaired.some((message) => message.role === "toolResult")).toBe(false);
+    expect(repaired.map((message) => message.role)).toEqual(["assistant", "user"]);
+  });
+
+  it("keeps complete tool calls even when partialJson is present", () => {
+    // Leftover `partialJson` from the streaming buffer does not make a call
+    // incomplete: populated `arguments` mean it finished, so it is paired
+    // with its result as usual.
+    const assistantTurn = {
+      role: "assistant",
+      content: [
+        {
+          type: "toolCall",
+          id: "call_ok",
+          name: "read",
+          arguments: { path: "/tmp/test.md" },
+          partialJson: '{"path": "/tmp/test.md"}',
+        },
+      ],
+    } satisfies AgentMessage;
+    const readResult = {
+      role: "toolResult",
+      toolCallId: "call_ok",
+      toolName: "read",
+      content: [{ type: "text", text: "file contents" }],
+      isError: false,
+    } satisfies AgentMessage;
+
+    const repaired = sanitizeToolUseResultPairing([assistantTurn, readResult]);
+
+    // Exactly the two original messages, in their original order.
+    expect(repaired.map((message) => message.role)).toEqual(["assistant", "toolResult"]);
+  });
+
+  it("handles mixed complete and incomplete tool calls in one assistant message", () => {
+    // Two parallel tool calls, with the stream terminated during the second:
+    // `call_done` finished and has a real result, `call_partial` only has a
+    // truncated buffer plus a synthetic error result.
+    const assistantTurn = {
+      role: "assistant",
+      content: [
+        { type: "toolCall", id: "call_done", name: "read", arguments: { path: "/a" } },
+        {
+          type: "toolCall",
+          id: "call_partial",
+          name: "write",
+          partialJson: '{"path": "/b", "content": "half...',
+        },
+      ],
+    } satisfies AgentMessage;
+    const realResult = {
+      role: "toolResult",
+      toolCallId: "call_done",
+      toolName: "read",
+      content: [{ type: "text", text: "ok" }],
+      isError: false,
+    } satisfies AgentMessage;
+    const syntheticResult = {
+      role: "toolResult",
+      toolCallId: "call_partial",
+      toolName: "write",
+      content: [{ type: "text", text: "[moltbot] synthetic" }],
+      isError: true,
+    } satisfies AgentMessage;
+    const userTurn = { role: "user", content: "continue" } satisfies AgentMessage;
+
+    const repaired = sanitizeToolUseResultPairing([
+      assistantTurn,
+      realResult,
+      syntheticResult,
+      userTurn,
+    ]);
+    const keptResults = repaired.filter((message) => message.role === "toolResult");
+
+    // Only the finished call keeps a result; the synthetic one is dropped.
+    expect(keptResults).toHaveLength(1);
+    expect((keptResults[0] as { toolCallId?: string }).toolCallId).toBe("call_done");
+    expect(repaired.map((message) => message.role)).toEqual(["assistant", "toolResult", "user"]);
+  });
+
+  it("handles incomplete tool call with empty arguments object", () => {
+    // Variant where the provider left `arguments` as {} because the stream
+    // was interrupted before any argument parsing completed; the truncated
+    // buffer is the only trace of the intended input.
+    const assistantTurn = {
+      role: "assistant",
+      content: [
+        {
+          type: "toolCall",
+          id: "call_empty_args",
+          name: "exec",
+          arguments: {},
+          partialJson: '{"command": "ls',
+        },
+      ],
+    } satisfies AgentMessage;
+    const userTurn = { role: "user", content: "?" } satisfies AgentMessage;
+
+    const repaired = sanitizeToolUseResultPairing([assistantTurn, userTurn]);
+
+    // No synthetic result may be inserted for the unfinished call.
+    expect(repaired.some((message) => message.role === "toolResult")).toBe(false);
+    expect(repaired.map((message) => message.role)).toEqual(["assistant", "user"]);
+  });
+});
+
+describe("isIncompleteToolCall", () => {
+  it("returns true for partialJson with no arguments", () => {
+    // Only a truncated buffer exists; `arguments` was never set.
+    const truncatedCall = {
+      type: "toolCall",
+      id: "x",
+      name: "write",
+      partialJson: '{"path": "/tmp',
+    };
+    expect(isIncompleteToolCall(truncatedCall)).toBe(true);
+  });
+
+  it("returns true for partialJson with empty arguments", () => {
+    // `arguments` is present but empty while the buffer is cut off mid-value.
+    const emptyArgsCall = {
+      type: "toolCall",
+      id: "x",
+      name: "exec",
+      arguments: {},
+      partialJson: '{"command": "ls',
+    };
+    expect(isIncompleteToolCall(emptyArgsCall)).toBe(true);
+  });
+
+  it("returns false for complete tool call with partialJson", () => {
+    // Populated `arguments` win over a leftover streaming buffer.
+    const finishedCall = {
+      type: "toolCall",
+      id: "x",
+      name: "read",
+      arguments: { path: "/tmp/test" },
+      partialJson: '{"path": "/tmp/test"}',
+    };
+    expect(isIncompleteToolCall(finishedCall)).toBe(false);
+  });
+
+  it("returns false for tool call without partialJson", () => {
+    // No buffer at all: nothing suggests the stream was interrupted.
+    const plainCall = {
+      type: "toolCall",
+      id: "x",
+      name: "read",
+      arguments: { path: "/tmp/test" },
+    };
+    expect(isIncompleteToolCall(plainCall)).toBe(false);
+  });
+
+  it("returns false when partialJson is empty string", () => {
+    // An empty buffer is treated the same as a missing one.
+    const emptyBufferCall = {
+      type: "toolCall",
+      id: "x",
+      name: "read",
+      partialJson: "",
+    };
+    expect(isIncompleteToolCall(emptyBufferCall)).toBe(false);
+  });
 });
--- a/src/agents/session-transcript-repair.ts
+++ b/src/agents/session-transcript-repair.ts
@ -5,6 +5,35 @@ type ToolCallLike = {
  name?: string;
 };

+/**
+ * Check whether a tool call block is incomplete (terminated mid-stream).
+ *
+ * When a streaming response is interrupted (`stopReason: "error"`,
+ * `errorMessage: "terminated"`), the assistant message may contain tool call
+ * blocks with only `partialJson` and no valid `arguments`.  These were never
+ * executed, so inserting a synthetic `toolResult` for them causes Anthropic's
+ * API to reject the request with "unexpected tool_use_id".
+ *
+ * A block is reported as incomplete when `partialJson` is a non-empty string
+ * (streaming was in progress) AND one of the following holds:
+ *   1. `arguments` is `undefined` or `null`, or
+ *   2. `arguments` is an empty plain object (`{}`) and `partialJson` does not
+ *      parse as a complete JSON empty object.
+ *
+ * The second half of rule 2 protects tools that take no parameters: a
+ * finished call legitimately has `arguments: {}`, and if its buffer
+ * (`"{}"`) is still attached it must not be mistaken for a truncated one.
+ *
+ * Every other `arguments` value (a populated object, an array, a primitive)
+ * is treated as a normal call, even if `partialJson` happens to be set.
+ *
+ * @param block - Raw content block taken from an assistant message.
+ * @returns `true` when the block looks like a tool call cut off mid-stream.
+ */
+function isIncompleteToolCall(block: Record<string, unknown>): boolean {
+  const buffered = block.partialJson;
+  // A missing or empty streaming buffer gives no sign of an interrupted stream.
+  if (typeof buffered !== "string" || buffered.length === 0) return false;
+
+  const args = block.arguments;
+  // No arguments at all → incomplete
+  if (args === undefined || args === null) return true;
+
+  const hasEmptyObjectArgs =
+    typeof args === "object" && !Array.isArray(args) && Object.keys(args as object).length === 0;
+  // Populated objects, arrays and primitives are left to the normal pairing path.
+  if (!hasEmptyObjectArgs) return false;
+
+  // `{}` alone is ambiguous: either nothing was parsed before the stream was
+  // cut, or the tool simply takes no parameters.  The buffer decides: only a
+  // buffer that is itself a complete JSON empty object agrees with `{}`.
+  let parsed: unknown;
+  try {
+    parsed = JSON.parse(buffered);
+  } catch {
+    // Truncated / malformed JSON → the arguments never finished streaming.
+    return true;
+  }
+  const bufferIsEmptyObject =
+    typeof parsed === "object" &&
+    parsed !== null &&
+    !Array.isArray(parsed) &&
+    Object.keys(parsed).length === 0;
+  return !bufferIsEmptyObject;
+}
+
 function extractToolCallsFromAssistant(
  msg: Extract<AgentMessage, { role: "assistant" }>,
 ): ToolCallLike[] {
@ -18,6 +47,10 @@ function extractToolCallsFromAssistant(
    if (typeof rec.id !== "string" || !rec.id) continue;

    if (rec.type === "toolCall" || rec.type === "toolUse" || rec.type === "functionCall") {
+      // Skip incomplete tool calls from terminated/errored streaming responses.
+      // These were never executed, so they must not receive a synthetic toolResult.
+      if (isIncompleteToolCall(rec as Record<string, unknown>)) continue;
+
      toolCalls.push({
        id: rec.id,
        name: typeof rec.name === "string" ? rec.name : undefined,
@ -54,7 +87,7 @@ function makeMissingToolResult(params: {
  } as Extract<AgentMessage, { role: "toolResult" }>;
 }

-export { makeMissingToolResult };
+export { isIncompleteToolCall, makeMissingToolResult };

 export function sanitizeToolUseResultPairing(messages: AgentMessage[]): AgentMessage[] {
  return repairToolUseResultPairing(messages).messages;