fix(agent): strip thinking tags from text content

2026-01-14 14:55:48 +01:00
parent 8146c43aa3
commit 3b7d103758
2 changed files with 121 additions and 1 deletions
--- a/src/agents/pi-embedded-utils.test.ts
+++ b/src/agents/pi-embedded-utils.test.ts
@@ -358,4 +358,84 @@ File contents here`,
    const result = extractAssistantText(msg);
    expect(result).toBe("Here's what I found:\nDone checking.");
  });
  it("strips thinking tags from text content", () => {
    // A closed <think> block in front of the reply must be removed entirely,
    // leaving only the user-visible answer.
    const rawText =
      "<think>El usuario quiere retomar una tarea...</think>Aquí está tu respuesta.";
    const message: AssistantMessage = {
      role: "assistant",
      content: [{ type: "text", text: rawText }],
      timestamp: Date.now(),
    };

    expect(extractAssistantText(message)).toBe("Aquí está tu respuesta.");
  });
  it("strips thinking tags without closing tag", () => {
    // An opening tag that is never closed hides everything after it, so the
    // extracted text is expected to be empty.
    const rawText = "<think>Pensando sobre el problema...";
    const message: AssistantMessage = {
      role: "assistant",
      content: [{ type: "text", text: rawText }],
      timestamp: Date.now(),
    };

    expect(extractAssistantText(message)).toBe("");
  });
  it("strips thinking tags with various formats", () => {
    // The long-form <thinking> spelling is removed mid-sentence; the text on
    // both sides is joined without any separator.
    const rawText = "Before<thinking>internal reasoning</thinking>After";
    const message: AssistantMessage = {
      role: "assistant",
      content: [{ type: "text", text: rawText }],
      timestamp: Date.now(),
    };

    expect(extractAssistantText(message)).toBe("BeforeAfter");
  });
  it("strips antthinking tags", () => {
    // The <antthinking> variant is treated like any other thinking tag.
    const rawText = "<antthinking>Some reasoning</antthinking>The actual answer.";
    const message: AssistantMessage = {
      role: "assistant",
      content: [{ type: "text", text: rawText }],
      timestamp: Date.now(),
    };

    expect(extractAssistantText(message)).toBe("The actual answer.");
  });
  it("handles nested or multiple thinking blocks", () => {
    // Two separate <think> blocks in one text part: each is removed and the
    // three visible fragments are concatenated in order.
    const rawText =
      "Start<think>first thought</think>Middle<think>second thought</think>End";
    const message: AssistantMessage = {
      role: "assistant",
      content: [{ type: "text", text: rawText }],
      timestamp: Date.now(),
    };

    expect(extractAssistantText(message)).toBe("StartMiddleEnd");
  });
 });
--- a/src/agents/pi-embedded-utils.ts
+++ b/src/agents/pi-embedded-utils.ts
@@ -47,6 +47,44 @@ function stripDowngradedToolCallText(text: string): string {
  return cleaned.trim();
 }
 /**
  * Remove thinking tags and the content they enclose from `text`.
  *
  * This is a safety net for cases where the model outputs `<think>`-style
  * tags that slip through other filtering mechanisms. Recognised tag names
  * (case-insensitive, optional whitespace inside the angle brackets) are
  * `think`, `thinking`, `thought` and `antthinking`.
  *
  * Behaviour:
  * - Text between an opening tag and the next closing tag is dropped.
  * - An opening tag that is never closed drops everything after it.
  * - A closing tag with no preceding opening tag is removed on its own; the
  *   visible text on both sides of it is kept.
  * - Tags are not depth-counted: the first closing tag ends the hidden region.
  *
  * @param text - Raw text that may contain thinking tags.
  * @returns `text` unchanged when it is empty or mentions none of the tag
  *   names; otherwise the visible text with surrounding whitespace trimmed.
  */
 function stripThinkingTagsFromText(text: string): string {
  if (!text) return text;
  // Quick check to avoid the tag scan when no tag name appears at all.
  if (!/(?:think(?:ing)?|thought|antthinking)/i.test(text)) return text;
  // Capture group 1 holds the "/" of a closing tag (empty for an opening tag).
  const tagRe = /<\s*(\/?)\s*(?:think(?:ing)?|thought|antthinking)\s*>/gi;
  let result = "";
  let lastIndex = 0;
  let inThinking = false;
  for (const match of text.matchAll(tagRe)) {
    const idx = match.index ?? 0;
    const isClose = match[1] === "/";
    if (!inThinking) {
      // Everything since the previous tag is visible text. Keep it for stray
      // closing tags too, otherwise the text in front of them would be lost.
      result += text.slice(lastIndex, idx);
      // Only an opening tag starts a hidden region.
      inThinking = !isClose;
    } else if (isClose) {
      // Closing tag - the content skipped since the opening tag stays hidden.
      inThinking = false;
    }
    // Resume after the tag itself so the tag text is never emitted.
    lastIndex = idx + match[0].length;
  }
  // Append remaining text if we're not inside thinking.
  if (!inThinking) {
    result += text.slice(lastIndex);
  }
  return result.trim();
 }
 export function extractAssistantText(msg: AssistantMessage): string {
  const isTextBlock = (block: unknown): block is { type: "text"; text: string } => {
    if (!block || typeof block !== "object") return false;
@@ -58,7 +96,9 @@ export function extractAssistantText(msg: AssistantMessage): string {
    ? msg.content
        .filter(isTextBlock)
        .map((c) =>
-          stripDowngradedToolCallText(stripMinimaxToolCallXml(c.text)).trim(),
+          stripThinkingTagsFromText(
            stripDowngradedToolCallText(stripMinimaxToolCallXml(c.text)),
          ).trim(),
        )
        .filter(Boolean)
    : [];