fix: handle tool execution timeout/error causing IllegalStateException (#951)

chensk0601 · chensk0601 · commit 86c49aa967b0 · 2026-03-14T15:00:11.000+08:00
ReActAgent throws IllegalStateException when tool calls time out or fail, because no tool result is written to memory, leaving orphaned pending tool call states that crash the agent on subsequent requests. Root cause: - Tool execution timeout/error propagates without writing results to memory; - Pending tool call state remains, blocking subsequent doCall() invocations; - validateAndAddToolResults() throws when the user message has no tool results. Changes: - doCall(): detect pending tool calls without user-provided results and auto-generate error results to clear the pending state; - executeToolCalls(): add onErrorResume to catch tool execution failures and generate error tool results instead of propagating exceptions; - Add generateAndAddErrorToolResults() helper to create error results for orphaned pending tool calls. This ensures the agent recovers gracefully from tool failures instead of crashing, and the model receives proper error feedback to continue processing. Closes #951
diff --git a/agentscope-core/src/main/java/io/agentscope/core/ReActAgent.java b/agentscope-core/src/main/java/io/agentscope/core/ReActAgent.java
@@ -252,9 +252,72 @@ protected Mono<Msg> doCall(List<Msg> msgs) {
             return executeIteration(0);
         }
 
-        // Has pending tools -> validate and add tool results
-        validateAndAddToolResults(msgs, pendingIds);
-        return hasPendingToolUse() ? acting(0) : executeIteration(0);
+        // Has pending tools but no input -> resume (execute pending tools directly)
+        if (msgs == null || msgs.isEmpty()) {
+            return hasPendingToolUse() ? acting(0) : executeIteration(0);
+        }
+
+        // Has pending tools + input -> check if user provided tool results
+        List<ToolResultBlock> providedResults =
+                msgs.stream()
+                        .flatMap(m -> m.getContentBlocks(ToolResultBlock.class).stream())
+                        .toList();
+
+        if (!providedResults.isEmpty()) {
+            // User provided tool results -> validate and add
+            validateAndAddToolResults(msgs, pendingIds);
+            return hasPendingToolUse() ? acting(0) : executeIteration(0);
+        }
+
+        // User sent a new message without tool results -> auto-recover from orphaned pending state
+        log.warn(
+                "Pending tool calls detected without results, auto-generating error results."
+                        + " Pending IDs: {}",
+                pendingIds);
+        generateAndAddErrorToolResults(pendingIds);
+        addToMemory(msgs);
+        return executeIteration(0);
+    }
+
+    /**
+     * Writes an "[ERROR]" tool result message to memory for every tool call in the message
+     * returned by {@code findLastAssistantMsg()} whose ID is contained in {@code pendingIds},
+     * recovering from calls left without a result. No-op when that lookup returns {@code null}.
+     *
+     * @param pendingIds IDs of the pending tool uses; IDs absent from that message are skipped
+     */
+    private void generateAndAddErrorToolResults(Set<String> pendingIds) {
+        Msg lastAssistant = findLastAssistantMsg();
+        if (lastAssistant == null) {
+            return;
+        }
+
+        List<ToolUseBlock> pendingToolCalls =
+                lastAssistant.getContentBlocks(ToolUseBlock.class).stream()
+                        .filter(toolUse -> pendingIds.contains(toolUse.getId()))
+                        .toList();
+
+        for (ToolUseBlock toolCall : pendingToolCalls) {
+            ToolResultBlock errorResult =
+                    ToolResultBlock.builder()
+                            .id(toolCall.getId())
+                            .output(
+                                    List.of(
+                                            TextBlock.builder()
+                                                    .text(
+                                                            "[ERROR] Previous tool execution failed"
+                                                                    + " or was interrupted. Tool: "
+                                                                    + toolCall.getName())
+                                                    .build()))
+                            .build();
+            Msg toolResultMsg =
+                    ToolResultMessageBuilder.buildToolResultMsg(errorResult, toolCall, getName());
+            memory.addMessage(toolResultMsg);
+            log.info(
+                    "Auto-generated error result for pending tool call: {} ({})",
+                    toolCall.getName(),
+                    toolCall.getId());
+        }
     }
 
     /**
@@ -592,6 +655,10 @@ private Msg buildSuspendedMsg(List<Map.Entry<ToolUseBlock, ToolResultBlock>> pen
     /**
      * Execute tool calls and return paired results.
      *
+     * <p>If tool execution fails (timeout, error, etc.), this method generates error tool results
+     * for all pending tool calls instead of propagating the error. This ensures the agent can
+     * continue processing and the model receives proper error feedback.
+     *
      * @param toolCalls The list of tool calls (potentially modified by PreActingEvent hooks)
      * @return Mono containing list of (ToolUseBlock, ToolResultBlock) pairs
      */
@@ -602,7 +669,41 @@ private Mono<List<Map.Entry<ToolUseBlock, ToolResultBlock>>> executeToolCalls(
                         results ->
                                 IntStream.range(0, toolCalls.size())
                                         .mapToObj(i -> Map.entry(toolCalls.get(i), results.get(i)))
-                                        .toList());
+                                        .toList())
+                .onErrorResume(
+                        error -> {
+                            // Generate error tool results for all pending tool calls
+                            log.error(
+                                    "Tool execution failed, generating error results for {} tool"
+                                            + " calls: {}",
+                                    toolCalls.size(),
+                                    error.getMessage());
+                            List<Map.Entry<ToolUseBlock, ToolResultBlock>> errorResults =
+                                    toolCalls.stream()
+                                            .map(
+                                                    toolCall -> {
+                                                        ToolResultBlock errorResult =
+                                                                ToolResultBlock.builder()
+                                                                        .id(toolCall.getId())
+                                                                        .output(
+                                                                                List.of(
+                                                                                        TextBlock
+                                                                                                .builder()
+                                                                                                .text(
+                                                                                                        "[ERROR]"
+                                                                                                            + " Tool"
+                                                                                                            + " execution"
+                                                                                                            + " failed:"
+                                                                                                            + " "
+                                                                                                                + error
+                                                                                                                        .getMessage())
+                                                                                                .build()))
+                                                                        .build();
+                                                        return Map.entry(toolCall, errorResult);
+                                                    })
+                                            .toList();
+                            return Mono.just(errorResults);
+                        });
     }
 
     /**
diff --git a/agentscope-core/src/test/java/io/agentscope/core/hook/HookStopAgentTest.java b/agentscope-core/src/test/java/io/agentscope/core/hook/HookStopAgentTest.java
@@ -52,7 +52,6 @@
 import org.junit.jupiter.api.Test;
 import reactor.core.publisher.Flux;
 import reactor.core.publisher.Mono;
-import reactor.test.StepVerifier;
 
 /**
  * Comprehensive tests for the Hook Stop Agent feature.
@@ -345,10 +344,15 @@ void testResumeWithToolResultMsg() {
         }
 
         @Test
-        @DisplayName("New message with pending tool calls throws error")
+        @DisplayName("New message with pending tool calls auto-recovers")
         void testNewMsgWithPendingToolUseContinuesActing() {
             Msg toolUseMsg = createToolUseMsg("tool1", "test_tool", Map.of());
-            setupModelToReturnToolUse(toolUseMsg);
+            Msg textResponse =
+                    createAssistantTextMsg("Recovered after auto-generated error results");
+
+            when(mockModel.stream(anyList(), anyList(), any()))
+                    .thenReturn(createFluxFromMsg(toolUseMsg))
+                    .thenReturn(createFluxFromMsg(textResponse));
 
             Hook stopHook = createPostReasoningStopHook();
 
@@ -368,15 +372,11 @@ void testNewMsgWithPendingToolUseContinuesActing() {
                     result1.hasContentBlocks(ToolUseBlock.class),
                     "First call should return ToolUse message");
 
-            // Send a new regular message - should throw error due to pending tool calls
+            // Send a new regular message - should auto-recover by generating error results
             Msg newMsg = createUserMsg("new message");
+            Msg result2 = agent.call(newMsg).block(TEST_TIMEOUT);
 
-            StepVerifier.create(agent.call(newMsg))
-                    .expectErrorMatches(
-                            e ->
-                                    e instanceof IllegalStateException
-                                            && e.getMessage().contains("pending tool calls"))
-                    .verify();
+            assertNotNull(result2, "Agent should auto-recover and return a result");
         }
     }
 
@@ -642,10 +642,14 @@ void testNormalCallAfterCompletion() {
         }
 
         @Test
-        @DisplayName("Agent throws error when adding regular message with pending tool calls")
+        @DisplayName("Agent auto-recovers when adding regular message with pending tool calls")
         void testAgentHandlesPendingToolCallsGracefully() {
             Msg toolUseMsg = createToolUseMsg("tool1", "test_tool", Map.of());
-            setupModelToReturnToolUse(toolUseMsg);
+            Msg textResponse = createAssistantTextMsg("Recovered");
+
+            when(mockModel.stream(anyList(), anyList(), any()))
+                    .thenReturn(createFluxFromMsg(toolUseMsg))
+                    .thenReturn(createFluxFromMsg(textResponse));
 
             Hook stopHook = createPostReasoningStopHook();
 
@@ -661,14 +665,10 @@ void testAgentHandlesPendingToolCallsGracefully() {
 
             agent.call(createUserMsg("test")).block(TEST_TIMEOUT);
 
-            // With new design, agent will throw error when adding regular message
-            // with pending tool calls
-            StepVerifier.create(agent.call(createUserMsg("new")))
-                    .expectErrorMatches(
-                            e ->
-                                    e instanceof IllegalStateException
-                                            && e.getMessage().contains("pending tool calls"))
-                    .verify();
+            // With new design, agent will auto-recover by generating error results
+            // for pending tool calls and continue processing
+            Msg result = agent.call(createUserMsg("new")).block(TEST_TIMEOUT);
+            assertNotNull(result, "Agent should auto-recover and return a result");
         }
     }