fix: repair tool_use/tool_result pairing for Claude on any provider

When using Claude models via non-Anthropic providers (github-copilot, openrouter, amazon-bedrock, etc), the repairToolUseResultPairing sanitizer was not running, causing 400 errors when sessions had orphaned tool_use blocks without matching tool_result. Added isClaudeModel() helper that detects Claude by modelId, and wired it into: - repairToolUseResultPairing (fixes the 400 error) - validateAnthropicTurns (Claude needs Anthropic-style turn validation) - allowSyntheticToolResults (allows inserting synthetic results for missing) Added comprehensive test suite covering: - Direct Anthropic provider - Claude via github-copilot, openrouter, opencode, amazon-bedrock - Non-Claude models (GPT, Llama, Gemini) - Edge cases (null/empty modelId) - Case-insensitive detection Fixes: '400 messages.220: tool_use ids were found without tool_result blocks'
2026-01-27 11:54:54 -03:00 · 2026-01-27 11:54:54 -03:00 · 3f6fcabd9d
commit 3f6fcabd9d
parent 3f83afe4a6
2 changed files with 253 additions and 3 deletions
--- a/src/agents/transcript-policy.test.ts
+++ b/src/agents/transcript-policy.test.ts
@ -0,0 +1,238 @@
 import { describe, expect, it } from "vitest";
 import { resolveTranscriptPolicy } from "./transcript-policy.js";
 describe("resolveTranscriptPolicy", () => {
  describe("Anthropic provider (direct)", () => {
    it("enables Claude-specific sanitizers for anthropic provider", () => {
      const policy = resolveTranscriptPolicy({
        provider: "anthropic",
        modelId: "claude-sonnet-4-20250514",
      });
      expect(policy.repairToolUseResultPairing).toBe(true);
      expect(policy.validateAnthropicTurns).toBe(true);
      expect(policy.allowSyntheticToolResults).toBe(true);
    });
    it("enables Claude-specific sanitizers for anthropic-messages API", () => {
      const policy = resolveTranscriptPolicy({
        modelApi: "anthropic-messages",
        modelId: "claude-3-opus-20240229",
      });
      expect(policy.repairToolUseResultPairing).toBe(true);
      expect(policy.validateAnthropicTurns).toBe(true);
      expect(policy.allowSyntheticToolResults).toBe(true);
    });
  });
  describe("Claude models via non-Anthropic providers", () => {
    it("enables Claude-specific sanitizers for github-copilot with Claude model", () => {
      const policy = resolveTranscriptPolicy({
        provider: "github-copilot",
        modelId: "claude-sonnet-4",
      });
      expect(policy.repairToolUseResultPairing).toBe(true);
      expect(policy.validateAnthropicTurns).toBe(true);
      expect(policy.allowSyntheticToolResults).toBe(true);
    });
    it("enables Claude-specific sanitizers for openrouter with Claude model", () => {
      const policy = resolveTranscriptPolicy({
        provider: "openrouter",
        modelId: "anthropic/claude-3.5-sonnet",
      });
      expect(policy.repairToolUseResultPairing).toBe(true);
      expect(policy.validateAnthropicTurns).toBe(true);
      expect(policy.allowSyntheticToolResults).toBe(true);
    });
    it("enables Claude-specific sanitizers for opencode with Claude model", () => {
      const policy = resolveTranscriptPolicy({
        provider: "opencode",
        modelId: "claude-3-haiku-20240307",
      });
      expect(policy.repairToolUseResultPairing).toBe(true);
      expect(policy.validateAnthropicTurns).toBe(true);
      expect(policy.allowSyntheticToolResults).toBe(true);
    });
    it("enables Claude-specific sanitizers for amazon-bedrock with Claude model", () => {
      const policy = resolveTranscriptPolicy({
        provider: "amazon-bedrock",
        modelId: "anthropic.claude-3-sonnet-20240229-v1:0",
      });
      expect(policy.repairToolUseResultPairing).toBe(true);
      expect(policy.validateAnthropicTurns).toBe(true);
      expect(policy.allowSyntheticToolResults).toBe(true);
    });
    it("handles case-insensitive Claude model detection", () => {
      const policy = resolveTranscriptPolicy({
        provider: "openrouter",
        modelId: "CLAUDE-3-OPUS",
      });
      expect(policy.repairToolUseResultPairing).toBe(true);
      expect(policy.validateAnthropicTurns).toBe(true);
      expect(policy.allowSyntheticToolResults).toBe(true);
    });
  });
  describe("OpenAI short-circuit", () => {
    it("disables Claude-specific sanitizers for OpenAI provider even with Claude in modelId", () => {
      // Edge case: OpenAI provider should short-circuit regardless of modelId
      const policy = resolveTranscriptPolicy({
        provider: "openai",
        modelId: "gpt-4-claude-variant", // hypothetical edge case
      });
      expect(policy.repairToolUseResultPairing).toBe(false);
      expect(policy.validateAnthropicTurns).toBe(false);
      expect(policy.allowSyntheticToolResults).toBe(false);
    });
    it("disables Claude-specific sanitizers for openai-codex provider", () => {
      const policy = resolveTranscriptPolicy({
        provider: "openai-codex",
        modelId: "codex-davinci",
      });
      expect(policy.repairToolUseResultPairing).toBe(false);
      expect(policy.validateAnthropicTurns).toBe(false);
      expect(policy.allowSyntheticToolResults).toBe(false);
    });
  });
  describe("Google models", () => {
    it("enables repairToolUseResultPairing and allowSyntheticToolResults for Google", () => {
      const policy = resolveTranscriptPolicy({
        modelApi: "google-gemini-cli",
        modelId: "gemini-2.0-flash",
      });
      expect(policy.repairToolUseResultPairing).toBe(true);
      expect(policy.validateAnthropicTurns).toBe(false);
      expect(policy.allowSyntheticToolResults).toBe(true);
      expect(policy.validateGeminiTurns).toBe(true);
      expect(policy.applyGoogleTurnOrdering).toBe(true);
    });
  });
  describe("non-Claude models via third-party providers", () => {
    it("does not enable Claude-specific sanitizers for GPT models on openrouter", () => {
      const policy = resolveTranscriptPolicy({
        provider: "openrouter",
        modelId: "openai/gpt-4-turbo",
      });
      expect(policy.repairToolUseResultPairing).toBe(false);
      expect(policy.validateAnthropicTurns).toBe(false);
      expect(policy.allowSyntheticToolResults).toBe(false);
    });
    it("does not enable Claude-specific sanitizers for Llama models on github-copilot", () => {
      const policy = resolveTranscriptPolicy({
        provider: "github-copilot",
        modelId: "llama-3.1-70b",
      });
      expect(policy.repairToolUseResultPairing).toBe(false);
      expect(policy.validateAnthropicTurns).toBe(false);
      expect(policy.allowSyntheticToolResults).toBe(false);
    });
    it("does not enable Claude sanitizers for Gemini models on openrouter (but enables Gemini-specific)", () => {
      const policy = resolveTranscriptPolicy({
        provider: "openrouter",
        modelId: "google/gemini-pro",
      });
      // Gemini on openrouter gets special thought signature handling but not Claude sanitizers
      expect(policy.repairToolUseResultPairing).toBe(false);
      expect(policy.validateAnthropicTurns).toBe(false);
      expect(policy.allowSyntheticToolResults).toBe(false);
      expect(policy.sanitizeThoughtSignatures).toEqual({
        allowBase64Only: true,
        includeCamelCase: true,
      });
    });
  });
  describe("Mistral models", () => {
    it("enables Mistral-specific sanitizers", () => {
      const policy = resolveTranscriptPolicy({
        provider: "mistral",
        modelId: "mistral-large",
      });
      expect(policy.sanitizeToolCallIds).toBe(true);
      expect(policy.toolCallIdMode).toBe("strict9");
      expect(policy.sanitizeMode).toBe("full");
    });
    it("detects Mistral models by modelId hint", () => {
      const policy = resolveTranscriptPolicy({
        provider: "openrouter",
        modelId: "mistralai/mixtral-8x7b",
      });
      expect(policy.sanitizeToolCallIds).toBe(true);
      expect(policy.toolCallIdMode).toBe("strict9");
    });
  });
  describe("edge cases", () => {
    it("handles null/undefined modelId gracefully", () => {
      const policy = resolveTranscriptPolicy({
        provider: "github-copilot",
        modelId: null,
      });
      expect(policy.repairToolUseResultPairing).toBe(false);
      expect(policy.validateAnthropicTurns).toBe(false);
      expect(policy.allowSyntheticToolResults).toBe(false);
    });
    it("handles empty string modelId gracefully", () => {
      const policy = resolveTranscriptPolicy({
        provider: "openrouter",
        modelId: "",
      });
      expect(policy.repairToolUseResultPairing).toBe(false);
      expect(policy.validateAnthropicTurns).toBe(false);
      expect(policy.allowSyntheticToolResults).toBe(false);
    });
    it("handles undefined params gracefully", () => {
      const policy = resolveTranscriptPolicy({});
      expect(policy.repairToolUseResultPairing).toBe(false);
      expect(policy.validateAnthropicTurns).toBe(false);
      expect(policy.allowSyntheticToolResults).toBe(false);
    });
  });
  describe("google-antigravity Claude models", () => {
    it("enables antigravity-specific settings for Claude via google-antigravity", () => {
      const policy = resolveTranscriptPolicy({
        modelApi: "google-antigravity",
        provider: "google-antigravity",
        modelId: "claude-3-5-sonnet",
      });
      expect(policy.preserveSignatures).toBe(true);
      expect(policy.normalizeAntigravityThinkingBlocks).toBe(true);
      // Also enables Claude-specific sanitizers
      expect(policy.repairToolUseResultPairing).toBe(true);
      expect(policy.validateAnthropicTurns).toBe(true);
      expect(policy.allowSyntheticToolResults).toBe(true);
    });
  });
 });
--- a/src/agents/transcript-policy.ts
+++ b/src/agents/transcript-policy.ts
@ -62,6 +62,16 @@ function isMistralModel(params: { provider?: string | null; modelId?: string | n
  return MISTRAL_MODEL_HINTS.some((hint) => modelId.includes(hint));
 }
 /**
 * Detects Claude models by checking if the modelId contains 'claude'.
 * This catches Claude models accessed via non-Anthropic providers like
 * github-copilot, openrouter, etc.
 */
 function isClaudeModel(modelId?: string | null): boolean {
  if (!modelId) return false;
  return modelId.toLowerCase().includes("claude");
 }
 export function resolveTranscriptPolicy(params: {
  modelApi?: string | null;
  provider?: string | null;
@ -81,6 +91,8 @@ export function resolveTranscriptPolicy(params: {
    provider,
    modelId,
  });
  // Detect Claude models by modelId (catches github-copilot, openrouter, etc.)
  const isClaude = isClaudeModel(modelId);
  const needsNonImageSanitize = isGoogle || isAnthropic || isMistral || isOpenRouterGemini;
@ -90,7 +102,7 @@ export function resolveTranscriptPolicy(params: {
    : sanitizeToolCallIds
      ? "strict"
      : undefined;
-  const repairToolUseResultPairing = isGoogle || isAnthropic;
+  const repairToolUseResultPairing = isGoogle || isAnthropic || isClaude;
  const sanitizeThoughtSignatures = isOpenRouterGemini
    ? { allowBase64Only: true, includeCamelCase: true }
    : undefined;
@ -106,7 +118,7 @@ export function resolveTranscriptPolicy(params: {
    normalizeAntigravityThinkingBlocks,
    applyGoogleTurnOrdering: !isOpenAi && isGoogle,
    validateGeminiTurns: !isOpenAi && isGoogle,
-    validateAnthropicTurns: !isOpenAi && isAnthropic,
+    validateAnthropicTurns: !isOpenAi && (isAnthropic || isClaude),
-    allowSyntheticToolResults: !isOpenAi && (isGoogle || isAnthropic),
+    allowSyntheticToolResults: !isOpenAi && (isGoogle || isAnthropic || isClaude),
  };
 }