Merge branch 'main' into fix/951-react-agent-tool-execution-error-handling

chensk0601 · web-flow · commit 2d7ad5f3a5ef · 2026-03-27T13:27:12.000+08:00
diff --git a/agentscope-extensions/agentscope-extensions-autocontext-memory/src/main/java/io/agentscope/core/memory/autocontext/AutoContextMemory.java b/agentscope-extensions/agentscope-extensions-autocontext-memory/src/main/java/io/agentscope/core/memory/autocontext/AutoContextMemory.java
@@ -1228,6 +1228,99 @@ private boolean offloadingLargePayload(List<Msg> rawMessages, boolean lastKeep)
             Msg msg = rawMessages.get(i);
             String textContent = msg.getTextContent();
 
+            // ASSISTANT messages with ToolUseBlock (tool_calls) must NOT be offloaded as a plain
+            // text stub. Doing so strips the ToolUseBlock, leaving the subsequent TOOL result
+            // messages without a preceding tool_calls assistant message, which violates the API
+            // constraint: "messages with role 'tool' must be a response to a preceding message
+            // with 'tool_calls'". These pairs are handled exclusively by Strategy 1.
+            if (MsgUtils.isToolUseMessage(msg)) {
+                continue;
+            }
+
+            // TOOL result messages can have their output content offloaded, but the
+            // ToolResultBlock structure (id, name) MUST be preserved so that the API formatter
+            // can still emit the correct tool_call_id / name fields. We handle them separately.
+            if (MsgUtils.isToolResultMessage(msg)) {
+                ToolResultBlock originalResult = msg.getFirstContentBlock(ToolResultBlock.class);
+                if (originalResult != null) {
+                    // Use the ToolResultBlock output text for size checking, because
+                    // Msg.getTextContent() only extracts top-level TextBlocks and returns
+                    // empty string for TOOL messages whose content is a ToolResultBlock.
+                    String outputText =
+                            originalResult.getOutput().stream()
+                                    .filter(TextBlock.class::isInstance)
+                                    .map(TextBlock.class::cast)
+                                    .map(TextBlock::getText)
+                                    .collect(Collectors.joining("\n"));
+                    if (outputText.length() > threshold) {
+                        String toolResultUuid = UUID.randomUUID().toString();
+                        List<Msg> offloadMsg = new ArrayList<>();
+                        offloadMsg.add(msg);
+                        offload(toolResultUuid, offloadMsg);
+                        log.info(
+                                "Offloaded large tool result message: index={}, size={} chars,"
+                                        + " uuid={}",
+                                i,
+                                outputText.length(),
+                                toolResultUuid);
+
+                        String preview =
+                                outputText.length() > autoContextConfig.offloadSinglePreview
+                                        ? outputText.substring(
+                                                        0, autoContextConfig.offloadSinglePreview)
+                                                + "..."
+                                        : outputText;
+                        String offloadHint =
+                                preview
+                                        + "\n"
+                                        + String.format(
+                                                Prompts.CONTEXT_OFFLOAD_TAG_FORMAT, toolResultUuid);
+
+                        // Preserve ToolResultBlock structure (id, name, metadata) so the API
+                        // formatter can emit the correct tool_call_id / name, and downstream
+                        // consumers retain semantic flags (e.g. agentscope_suspended) after
+                        // offloading.  Only the output text is replaced with the offload hint.
+                        ToolResultBlock compressedResult =
+                                ToolResultBlock.of(
+                                        originalResult.getId(),
+                                        originalResult.getName(),
+                                        TextBlock.builder().text(offloadHint).build(),
+                                        originalResult.getMetadata());
+
+                        Map<String, Object> trCompressMeta = new HashMap<>();
+                        trCompressMeta.put("offloaduuid", toolResultUuid);
+                        Map<String, Object> trMetadata = new HashMap<>();
+                        trMetadata.put("_compress_meta", trCompressMeta);
+
+                        Msg replacementToolMsg =
+                                Msg.builder()
+                                        .role(msg.getRole())
+                                        .name(msg.getName())
+                                        .content(compressedResult)
+                                        .metadata(trMetadata)
+                                        .build();
+
+                        int tokenBefore = TokenCounterUtil.calculateToken(List.of(msg));
+                        int tokenAfter =
+                                TokenCounterUtil.calculateToken(List.of(replacementToolMsg));
+                        Map<String, Object> trEventMetadata = new HashMap<>();
+                        trEventMetadata.put("inputToken", tokenBefore);
+                        trEventMetadata.put("outputToken", tokenAfter);
+                        trEventMetadata.put("time", 0.0);
+
+                        String eventType =
+                                lastKeep
+                                        ? CompressionEvent.LARGE_MESSAGE_OFFLOAD_WITH_PROTECTION
+                                        : CompressionEvent.LARGE_MESSAGE_OFFLOAD;
+                        recordCompressionEvent(eventType, i, i, rawMessages, null, trEventMetadata);
+
+                        rawMessages.set(i, replacementToolMsg);
+                        hasOffloaded = true;
+                    }
+                }
+                continue;
+            }
+
             String uuid = null;
             // Check if message content exceeds threshold
             if (textContent != null && textContent.length() > threshold) {
diff --git a/agentscope-extensions/agentscope-extensions-autocontext-memory/src/test/java/io/agentscope/core/memory/autocontext/AutoContextMemoryTest.java b/agentscope-extensions/agentscope-extensions-autocontext-memory/src/test/java/io/agentscope/core/memory/autocontext/AutoContextMemoryTest.java
@@ -1631,6 +1631,271 @@ void testGetPlanStateContextWithDoneSubtaskWithoutOutcome() throws Exception {
                 "Should contain expected outcome");
     }
 
+    // ==================== Tool Call Pairing Safety Tests ====================
+
+    @Test
+    @DisplayName(
+            "Should NOT offload ASSISTANT tool-call message as plain TextBlock stub during large"
+                    + " payload offloading (Strategy 2/3)")
+    void testLargePayloadOffloadingSkipsAssistantToolUseMessage() {
+        // Regression test for: DashScope 400 "messages with role 'tool' must be a response to a
+        // preceding message with 'tool_calls'".
+        // When an ASSISTANT message carrying ToolUseBlock is large and gets offloaded as a plain
+        // TextBlock stub, the downstream TOOL result messages become orphaned.
+        TestModel model = new TestModel("Summary");
+        AutoContextConfig cfg =
+                AutoContextConfig.builder()
+                        .msgThreshold(5)
+                        .largePayloadThreshold(50) // low threshold so the large message triggers
+                        .lastKeep(2)
+                        .minConsecutiveToolMessages(100) // disable Strategy 1
+                        .minCompressionTokenThreshold(Integer.MAX_VALUE) // disable LLM compression
+                        .build();
+        AutoContextMemory mem = new AutoContextMemory(cfg, model);
+
+        // Round 0: user → large ASSISTANT tool-call → TOOL result → ASSISTANT final
+        mem.addMessage(createTextMessage("User query", MsgRole.USER));
+
+        // Large ASSISTANT tool-use message: only a ToolUseBlock, no TextBlock (input is 200 chars)
+        String largeInput = "x".repeat(200);
+        Msg largeToolUseMsg =
+                Msg.builder()
+                        .role(MsgRole.ASSISTANT)
+                        .name("assistant")
+                        .content(
+                                ToolUseBlock.builder()
+                                        .id("call_large")
+                                        .name("search")
+                                        .input(Map.of("query", largeInput))
+                                        .build())
+                        .build();
+        mem.addMessage(largeToolUseMsg);
+        mem.addMessage(createToolResultMessage("search", "call_large", "tool output"));
+        mem.addMessage(createTextMessage("Assistant final response", MsgRole.ASSISTANT));
+
+        // Extra messages to push over msgThreshold
+        mem.addMessage(createTextMessage("Follow-up user question", MsgRole.USER));
+        mem.addMessage(createTextMessage("Follow-up assistant answer", MsgRole.ASSISTANT));
+
+        boolean compressed = mem.compressIfNeeded(); // NOTE(review): result is never asserted
+        List<Msg> messages = mem.getMessages();
+
+        // Key assertion: no TOOL result may be orphaned. Had the ASSISTANT tool-call message been
+        // degraded to a plain TextBlock stub, the TOOL result after it would fail this scan.
+        // The check is indirect: it relies on MsgUtils.isToolUseMessage matching the predecessor.
+        boolean hasOrphanedToolMsg = false;
+        for (int i = 0; i < messages.size(); i++) {
+            Msg msg = messages.get(i);
+            if (MsgUtils.isToolResultMessage(msg)) {
+                // Walk backwards over any consecutive TOOL results (parallel calls); the first
+                // other message reached must be a tool-use message, or this result is orphaned.
+                boolean precededByToolCall = false;
+                for (int j = i - 1; j >= 0; j--) {
+                    Msg prev = messages.get(j);
+                    if (MsgUtils.isToolUseMessage(prev)) {
+                        precededByToolCall = true;
+                        break;
+                    }
+                    if (MsgUtils.isToolResultMessage(prev)) {
+                        // Consecutive TOOL results from the same assistant tool-call message
+                        continue;
+                    }
+                    // Hit a non-tool message before finding a tool-call → orphaned
+                    break;
+                }
+                if (!precededByToolCall) {
+                    hasOrphanedToolMsg = true;
+                }
+            }
+        }
+        assertFalse(
+                hasOrphanedToolMsg,
+                "TOOL result messages must always be preceded by an ASSISTANT tool-call message."
+                        + " Offloading the ASSISTANT tool-call as a plain stub orphans them.");
+    }
+
+    @Test
+    @DisplayName(
+            "Should offload large TOOL result output while preserving ToolResultBlock id and name")
+    void testLargeToolResultOffloadPreservesIdAndName() {
+        // When a TOOL result message is large, Strategy 2/3 should compress its output text
+        // but MUST preserve the ToolResultBlock structure (id, name) so the API formatter
+        // can still emit the correct tool_call_id / name fields.
+        TestModel model = new TestModel("Summary");
+        AutoContextConfig cfg =
+                AutoContextConfig.builder()
+                        .msgThreshold(5)
+                        .largePayloadThreshold(50) // low threshold
+                        .lastKeep(2)
+                        .minConsecutiveToolMessages(100) // disable Strategy 1
+                        .minCompressionTokenThreshold(Integer.MAX_VALUE) // disable LLM compression
+                        .build();
+        AutoContextMemory mem = new AutoContextMemory(cfg, model);
+
+        // Round 0: user → ASSISTANT tool-call → large TOOL result → ASSISTANT final
+        mem.addMessage(createTextMessage("User query", MsgRole.USER));
+        mem.addMessage(createToolUseMessage("search", "call_tool_id_001"));
+
+        // Build a TOOL result whose 200-char text output exceeds largePayloadThreshold (50)
+        String largeOutput = "y".repeat(200);
+        Msg largeToolResultMsg =
+                Msg.builder()
+                        .role(MsgRole.TOOL)
+                        .name("search")
+                        .content(
+                                ToolResultBlock.builder()
+                                        .id("call_tool_id_001")
+                                        .name("search")
+                                        .output(
+                                                List.of(
+                                                        TextBlock.builder()
+                                                                .text(largeOutput)
+                                                                .build()))
+                                        .build())
+                        .build();
+        mem.addMessage(largeToolResultMsg);
+        mem.addMessage(createTextMessage("Assistant final response", MsgRole.ASSISTANT));
+
+        // Extra messages to push over msgThreshold
+        mem.addMessage(createTextMessage("Follow-up user question", MsgRole.USER));
+        mem.addMessage(createTextMessage("Follow-up assistant answer", MsgRole.ASSISTANT));
+
+        mem.compressIfNeeded();
+        List<Msg> messages = mem.getMessages();
+
+        // Find the first TOOL result message in memory (compressed or not)
+        Msg toolResultMsg =
+                messages.stream().filter(MsgUtils::isToolResultMessage).findFirst().orElse(null);
+
+        // NOTE(review): this guard only checks that a TOOL result message exists. If none is found
+        // the id/name/hint assertions are skipped silently; consider assertNotNull first.
+        if (toolResultMsg != null) {
+            ToolResultBlock block = toolResultMsg.getFirstContentBlock(ToolResultBlock.class);
+            assertNotNull(
+                    block,
+                    "Compressed TOOL result message must still contain a ToolResultBlock"
+                            + " (not be degraded to plain TextBlock)");
+            assertEquals(
+                    "call_tool_id_001",
+                    block.getId(),
+                    "ToolResultBlock id must be preserved after offloading");
+            assertEquals(
+                    "search",
+                    block.getName(),
+                    "ToolResultBlock name must be preserved after offloading");
+            // Only the first TextBlock of the output is inspected for the offload hint
+            String outputText =
+                    block.getOutput().stream()
+                            .filter(b -> b instanceof TextBlock)
+                            .map(b -> ((TextBlock) b).getText())
+                            .findFirst()
+                            .orElse("");
+            assertTrue(
+                    outputText.contains("CONTEXT_OFFLOAD"),
+                    "Compressed tool result output should contain offload hint. Got: "
+                            + outputText);
+        }
+
+        // Also verify no TOOL result is orphaned (scan back past consecutive TOOL results)
+        for (int i = 0; i < messages.size(); i++) {
+            Msg msg = messages.get(i);
+            if (MsgUtils.isToolResultMessage(msg)) {
+                boolean precededByToolCall = false;
+                for (int j = i - 1; j >= 0; j--) {
+                    Msg prev = messages.get(j);
+                    if (MsgUtils.isToolUseMessage(prev)) {
+                        precededByToolCall = true;
+                        break;
+                    }
+                    if (MsgUtils.isToolResultMessage(prev)) {
+                        continue;
+                    }
+                    break;
+                }
+                assertTrue(
+                        precededByToolCall,
+                        "Every TOOL result must be preceded by an ASSISTANT tool-call message");
+            }
+        }
+    }
+
+    @Test
+    @DisplayName(
+            "Should maintain valid tool_calls/tool_result pairing after offloading large plain"
+                    + " messages in a mixed conversation")
+    void testToolCallPairingIntegrityAfterMixedOffloading() {
+        // Simulates the production scenario from the bug report:
+        // A long conversation with multiple tool-call rounds plus large plain messages.
+        // After Strategy 2/3 runs, every TOOL result must still follow an ASSISTANT tool-call.
+        TestModel model = new TestModel("Summary");
+        AutoContextConfig cfg =
+                AutoContextConfig.builder()
+                        .msgThreshold(8)
+                        .largePayloadThreshold(50)
+                        .lastKeep(3)
+                        .minConsecutiveToolMessages(100) // disable Strategy 1
+                        .minCompressionTokenThreshold(Integer.MAX_VALUE) // disable LLM compression
+                        .build();
+        AutoContextMemory mem = new AutoContextMemory(cfg, model);
+
+        // Round 0: normal tool call round (small output)
+        mem.addMessage(createTextMessage("User asks tool", MsgRole.USER));
+        mem.addMessage(createToolUseMessage("tool_a", "id_a1"));
+        mem.addMessage(createToolResultMessage("tool_a", "id_a1", "small result"));
+        mem.addMessage(createTextMessage("Assistant reply 0", MsgRole.ASSISTANT));
+
+        // Round 1: large USER message (200 chars, above the threshold of 50) + tool call round
+        String largeUserText = "L".repeat(200);
+        mem.addMessage(
+                createTextMessage(largeUserText, MsgRole.USER)); // large – candidate for offload
+        mem.addMessage(createToolUseMessage("tool_b", "id_b1"));
+        mem.addMessage(createToolResultMessage("tool_b", "id_b1", "result b"));
+        mem.addMessage(createTextMessage("Assistant reply 1", MsgRole.ASSISTANT));
+
+        // Round 2: current round (presumably protected by lastKeep(3); confirm against config)
+        mem.addMessage(createTextMessage("Current user question", MsgRole.USER));
+        mem.addMessage(createTextMessage("Current assistant answer", MsgRole.ASSISTANT));
+
+        mem.compressIfNeeded();
+        List<Msg> messages = mem.getMessages();
+
+        // Invariant: for every TOOL result, scanning backwards must reach a tool-use message
+        // before reaching any message that is neither a tool-use nor a TOOL result.
+        for (int i = 0; i < messages.size(); i++) {
+            if (!MsgUtils.isToolResultMessage(messages.get(i))) {
+                continue;
+            }
+            boolean found = false;
+            for (int j = i - 1; j >= 0; j--) {
+                Msg prev = messages.get(j);
+                if (MsgUtils.isToolUseMessage(prev)) {
+                    found = true;
+                    break;
+                }
+                if (MsgUtils.isToolResultMessage(prev)) {
+                    continue; // skip sibling TOOL results (parallel calls) and keep scanning
+                }
+                break;
+            }
+            assertTrue(
+                    found,
+                    "TOOL result at index "
+                            + i
+                            + " is orphaned – no preceding ASSISTANT tool-call found."
+                            + " Full message sequence: "
+                            + messages.stream()
+                                    .map(
+                                            m ->
+                                                    m.getRole()
+                                                            + "(toolUse="
+                                                            + MsgUtils.isToolUseMessage(m)
+                                                            + ",toolResult="
+                                                            + MsgUtils.isToolResultMessage(m)
+                                                            + ")")
+                                    .toList());
+        }
+    }
+
     @Test
     @DisplayName("Should return plan context with different plan states")
     void testGetPlanStateContextWithDifferentPlanStates() throws Exception {