42 changes: 35 additions & 7 deletions src/copaw/agents/model_factory.py
@@ -73,14 +73,43 @@ class FileBlockSupportFormatter(base_formatter_class):
"""Formatter with file block support for tool results."""

async def _format(self, msgs):
"""Override to sanitize tool messages before formatting.
"""Override to sanitize tool messages and preserve thinking blocks.

This prevents OpenAI API errors from improperly paired
tool messages.
- Sanitizes improperly paired tool messages.
- After base formatting, injects ``reasoning_content`` from
thinking blocks into assistant messages so that APIs like
Kimi K2.5 (which require it) don't reject the request.
"""
msgs = _sanitize_tool_messages(msgs)
messages = await super()._format(msgs)
return _strip_top_level_message_name(messages)

# Collect thinking content per assistant msg (in order).
Collaborator: Should we apply this kind of fix to AgentScope library's formatter instead of CoPaw? @rayrayraykk @DavdGao

Member: Agree

Collaborator: @lailoo can you make this fix to the AgentScope library instead? It will help keep this code base focused on the application, not the model interaction layer.

Author (@lailoo, Mar 3, 2026): Good point! I'll move this fix to the AgentScope library instead. Will create a PR there and link it back here. @ekzhu

Collaborator: Thank you! Closing this PR.

assistant_thinking: list[str] = []
for msg in msgs:
if msg.role == "assistant":
parts = [
b.get("thinking", "")
for b in msg.get_content_blocks()
if b.get("type") == "thinking"
]
assistant_thinking.append(
"\n".join(p for p in parts if p),
)

formatted = await super()._format(msgs)

# Inject reasoning_content into formatted assistant messages.
if assistant_thinking:
Copilot AI (Mar 1, 2026): The injection loop is guarded by if assistant_thinking:, but assistant_thinking is populated for every assistant message even when none contain thinking blocks (empty strings). This causes an unnecessary second pass over formatted on most calls; consider guarding with if any(assistant_thinking): (or tracking a has_thinking flag) so the injection work is skipped when there is nothing to inject.

Suggested change:
if assistant_thinking:
if any(assistant_thinking):
asst_idx = 0
for fmt_msg in formatted:
if fmt_msg.get("role") == "assistant":
if (
asst_idx < len(assistant_thinking)
and assistant_thinking[asst_idx]
):
fmt_msg["reasoning_content"] = assistant_thinking[asst_idx]
asst_idx += 1
Comment on lines +100 to +110

1. Token undercount vs reasoning (Bug, Reliability)

The formatter now injects reasoning_content into outgoing assistant messages, but the token counting logic used for /history and auto memory compaction only counts content. This under-estimates prompt size for thinking models and can delay compaction until after requests start failing due to context limits.

Issue context:
- FileBlockSupportFormatter._format() adds reasoning_content to formatted assistant messages.
- safe_count_message_tokens() relies on _extract_text_from_messages(), which currently concatenates only content fields.
- Memory compaction and /history both use this token estimate.

Fix focus areas:
- src/copaw/agents/utils/token_counting.py[58-86]
- src/copaw/agents/hooks/memory_compaction.py[161-169]
- src/copaw/agents/command_handler.py[245-251]
- src/copaw/agents/model_factory.py[75-112]

Suggested change:
- In _extract_text_from_messages(), append msg.get("reasoning_content") (when present) into parts, similarly to content.
- (Optional but recommended) Consider also incorporating text from tool call arguments if present in the formatted schema, to further reduce undercounting for tool-heavy conversations.
- Add/extend a unit test to ensure token counting increases when reasoning_content is present in formatted messages.
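The suggested change above can be sketched as follows. This is a minimal illustration under assumptions: only the function name _extract_text_from_messages comes from the review; the body and the message shape here are hypothetical, not CoPaw's actual implementation.

```python
# Hypothetical sketch of the reviewer's suggestion: include
# reasoning_content (and, optionally, tool call arguments) when
# extracting text for token estimation.
def _extract_text_from_messages(messages: list[dict]) -> str:
    parts: list[str] = []
    for msg in messages:
        content = msg.get("content")
        if isinstance(content, str):
            parts.append(content)
        # Reviewer's fix: also count injected reasoning_content.
        reasoning = msg.get("reasoning_content")
        if reasoning:
            parts.append(reasoning)
        # Optional: count tool call arguments to reduce undercounting
        # in tool-heavy conversations.
        for call in msg.get("tool_calls") or []:
            args = call.get("function", {}).get("arguments")
            if args:
                parts.append(args)
    return "\n".join(parts)


msgs = [
    {
        "role": "assistant",
        "content": "Let me check.",
        "reasoning_content": "I should call get_current_time.",
        "tool_calls": [
            {"function": {"name": "get_current_time", "arguments": "{}"}},
        ],
    },
]
text = _extract_text_from_messages(msgs)
```

With this sketch, the extracted text (and hence the token estimate) grows when reasoning_content is present, which is exactly what the suggested unit test would verify.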

Comment on lines +100 to +110

⚠️ Potential issue | 🟡 Minor

Web query: OpenAI API reasoning_content field, assistant messages, tool_calls specification.

Result: in the current OpenAI API docs, the chat/assistant message schema does not define a reasoning_content field. For reasoning models, "reasoning" is represented separately (in the Responses API) as reasoning items, not as an assistant-message field. For Chat Completions, an assistant message is essentially:

  • role: "assistant"
  • content: required unless you provide tool_calls (or the deprecated function_call)
  • tool_calls: an array of tool calls generated by the model, whose items include id (tool call id), type (currently "function"), and function: { name, arguments }, where arguments is a JSON string

In the Responses API, reasoning is carried as a distinct reasoning object/item with id, summary[] (summary text parts), optional content[] containing reasoning_text, and optional encrypted_content (when requested via include). The docs also note you should include these reasoning items back in input for later turns if you are manually managing context.

Web query: Kimi K2.5 / DeepSeek reasoning_content field, OpenAI-compatible API, tool_calls.

Result:

  • Kimi K2.5 (Moonshot): in thinking mode, K2.5 returns a separate reasoning_content alongside content (the answer); the K2.5 repo's example reads it as response.choices[0].message.reasoning_content. Thinking can be disabled via extra_body (e.g., {"thinking": {"type": "disabled"}} for the official API, or {"chat_template_kwargs": {"thinking": False}} for vLLM/SGLang). Some Moonshot "thinking" docs note the OpenAI SDK types may not expose reasoning_content directly, so you may need to access it defensively (e.g., hasattr/getattr). For tool calling, Moonshot recommends tool_calls (not legacy function_call), supports parallel tool calls, and stresses that every returned tool_call.id must be matched by a later role="tool" message with the correct tool_call_id, with the assistant message that contained tool_calls appended to history.
  • DeepSeek: the reasoning model returns both reasoning_content (chain of thought) and content (final answer) as separate fields. DeepSeek's reasoning model guide says not to feed reasoning_content back into later messages (it can error), but its newer thinking-mode tool-calls guide says that during a single question's multi-step "thinking + tool calls" loop you must send reasoning_content back so the model can continue; when the next user question starts, remove the prior reasoning_content.
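The defensive-access note above (that the OpenAI SDK's typed message classes may not expose reasoning_content) is typically handled with getattr and a default. A minimal sketch follows; StubMessage is a hypothetical stand-in for an SDK response message, not a real API object.

```python
# Sketch of defensively reading reasoning_content from an
# OpenAI-SDK-style message object that may not declare the field.
class StubMessage:
    """Hypothetical stand-in for response.choices[0].message."""

    def __init__(self) -> None:
        self.content = "The time is 14:30."
        self.reasoning_content = "User asked for the time."


def get_reasoning(message: object) -> str:
    # getattr with a default avoids AttributeError when the SDK's
    # typed message class does not expose reasoning_content.
    return getattr(message, "reasoning_content", "") or ""


reasoning = get_reasoning(StubMessage())
plain = get_reasoning(object())  # attribute absent, falls back to ""
```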


Gate reasoning_content injection to tool-call assistant messages only.

The tests verify reasoning_content exclusively on assistant messages with tool_calls (lines 65 and 182 in the test file). Backend documentation for DeepSeek and Kimi K2.5 also indicates reasoning_content is most relevant in tool-calling contexts. Injecting into all assistant messages with thinking blocks risks rejection by stricter backends.

Proposed diff:

             if assistant_thinking:
                 asst_idx = 0
                 for fmt_msg in formatted:
                     if fmt_msg.get("role") == "assistant":
                         if (
+                            fmt_msg.get("tool_calls")
+                            and
                             asst_idx < len(assistant_thinking)
                             and assistant_thinking[asst_idx]
                         ):
                             fmt_msg["reasoning_content"] = assistant_thinking[asst_idx]
                         asst_idx += 1


return _strip_top_level_message_name(formatted)

@staticmethod
def convert_tool_result_to_string(
@@ -282,8 +311,7 @@ def _create_remote_model_instance(
base_url = llm_cfg.base_url
else:
logger.warning(
"No active LLM configured — "
"falling back to DASHSCOPE_API_KEY env var",
"No active LLM configured — " "falling back to DASHSCOPE_API_KEY env var",
)
model_name = "qwen3-max"
api_key = os.getenv("DASHSCOPE_API_KEY", "")
204 changes: 204 additions & 0 deletions tests/test_thinking_block_fix.py
@@ -0,0 +1,204 @@
# -*- coding: utf-8 -*-
"""Verify fix for #155: thinking blocks preserved as reasoning_content."""
import asyncio
import json

from agentscope.message import (
Msg,
ThinkingBlock,
TextBlock,
ToolUseBlock,
ToolResultBlock,
)
from agentscope.model import OpenAIChatModel

from copaw.agents.model_factory import _create_formatter_instance


def test_reasoning_content_preserved():
"""Thinking blocks must appear as reasoning_content in formatted output."""
formatter = _create_formatter_instance(OpenAIChatModel)

msgs = [
Msg(
name="system",
role="system",
content="You are a helpful assistant.",
),
Msg(name="user", role="user", content="What time is it now?"),
Msg(
name="assistant",
role="assistant",
content=[
ThinkingBlock(
type="thinking",
thinking="I should call get_current_time to answer this.",
),
TextBlock(type="text", text="Let me check."),
ToolUseBlock(
type="tool_use",
id="call_001",
name="get_current_time",
input={},
),
],
),
Msg(
name="system",
role="system",
content=[
ToolResultBlock(
type="tool_result",
id="call_001",
name="get_current_time",
output="2026-03-01 14:30:00 CST",
),
],
),
]

formatted = asyncio.run(formatter.format(msgs))

assistant_msgs = [
m
for m in formatted
if m.get("role") == "assistant" and m.get("tool_calls")
]
assert len(assistant_msgs) == 1, (
f"Expected 1 assistant msg with tool_calls, "
f"got {len(assistant_msgs)}. "
f"All formatted: {json.dumps(formatted, ensure_ascii=False)}"
)

msg = assistant_msgs[0]
reasoning = msg.get("reasoning_content")
assert reasoning, (
f"reasoning_content missing! "
f"Formatted msg: {json.dumps(msg, ensure_ascii=False, indent=2)}"
)
assert "get_current_time" in reasoning
print(f"✅ PASS — reasoning_content preserved: {reasoning}")


def test_no_reasoning_when_no_thinking():
"""Messages without thinking blocks should not get reasoning_content."""
formatter = _create_formatter_instance(OpenAIChatModel)

msgs = [
Msg(name="system", role="system", content="Hi"),
Msg(name="user", role="user", content="Hello"),
Msg(
name="assistant",
role="assistant",
content=[TextBlock(type="text", text="Hi there!")],
),
]

formatted = asyncio.run(formatter.format(msgs))
assistant_msgs = [m for m in formatted if m.get("role") == "assistant"]
assert len(assistant_msgs) == 1

msg = assistant_msgs[0]
assert (
"reasoning_content" not in msg
), (
"reasoning_content should not be present "
"when there are no thinking blocks"
)
print("✅ PASS — no reasoning_content when no thinking blocks")


def test_multiple_assistant_messages():
"""Each assistant message gets its own reasoning_content."""
formatter = _create_formatter_instance(OpenAIChatModel)

msgs = [
Msg(name="system", role="system", content="Hi"),
Msg(name="user", role="user", content="Do two things"),
Msg(
name="assistant",
role="assistant",
content=[
ThinkingBlock(
type="thinking",
thinking="First task thinking",
),
TextBlock(type="text", text="Doing first thing."),
ToolUseBlock(
type="tool_use",
id="c1",
name="tool_a",
input={},
),
],
),
Msg(
name="system",
role="system",
content=[
ToolResultBlock(
type="tool_result",
id="c1",
name="tool_a",
output="done",
),
],
Comment on lines +138 to +145

Copilot AI (Mar 1, 2026): Several lines in this test file exceed the repo's max line length (79) and will fail flake8/black (e.g., the one-line ToolResultBlock call here). Please run black and/or wrap these long argument lists across multiple lines so E501 doesn't block CI/pre-commit.
),
Msg(
name="assistant",
role="assistant",
content=[
ThinkingBlock(
type="thinking",
thinking="Second task thinking",
),
TextBlock(type="text", text="Doing second thing."),
ToolUseBlock(
type="tool_use",
id="c2",
name="tool_b",
input={},
),
],
),
Msg(
name="system",
role="system",
content=[
ToolResultBlock(
type="tool_result",
id="c2",
name="tool_b",
output="done",
),
],
),
]

formatted = asyncio.run(formatter.format(msgs))
assistant_msgs = [
m
for m in formatted
if m.get("role") == "assistant" and m.get("tool_calls")
]
assert (
len(assistant_msgs) == 2
), f"Expected 2 assistant msgs, got {len(assistant_msgs)}"

assert (
assistant_msgs[0].get("reasoning_content") == "First task thinking"
)
assert (
assistant_msgs[1].get("reasoning_content") == "Second task thinking"
)
print(
"✅ PASS — multiple assistant messages "
"each get correct reasoning_content"
)


if __name__ == "__main__":
test_reasoning_content_preserved()
test_no_reasoning_when_no_thinking()
test_multiple_assistant_messages()
print("\nAll tests passed!")