From 777f3f02968de7ca6b1273059de5be3e8e9c039a Mon Sep 17 00:00:00 2001
From: Tao Chen <taochen@microsoft.com>
Date: Wed, 8 Oct 2025 11:59:13 -0700
Subject: [PATCH] Invoke the model one more time after auto invoke has
 exhausted

---
 .../connectors/ai/chat_completion_client_base.py  | 15 +++++++++------
 1 file changed, 9 insertions(+), 6 deletions(-)

diff --git a/python/semantic_kernel/connectors/ai/chat_completion_client_base.py b/python/semantic_kernel/connectors/ai/chat_completion_client_base.py
index 974d59af92be..d26abeca9c7d 100644
--- a/python/semantic_kernel/connectors/ai/chat_completion_client_base.py
+++ b/python/semantic_kernel/connectors/ai/chat_completion_client_base.py
@@ -99,9 +99,7 @@ async def get_chat_message_contents(
         Returns:
             A list of chat message contents representing the response(s) from the LLM.
         """
-        from semantic_kernel.connectors.ai.function_calling_utils import (
-            merge_function_results,
-        )
+        from semantic_kernel.connectors.ai.function_calling_utils import merge_function_results
 
         # Create a copy of the settings to avoid modifying the original settings
         settings = copy.deepcopy(settings)
@@ -210,9 +208,7 @@ async def get_streaming_chat_message_contents(
         Yields:
             A stream representing the response(s) from the LLM.
         """
-        from semantic_kernel.connectors.ai.function_calling_utils import (
-            merge_streaming_function_results,
-        )
+        from semantic_kernel.connectors.ai.function_calling_utils import merge_streaming_function_results
 
         # Create a copy of the settings to avoid modifying the original settings
         settings = copy.deepcopy(settings)
@@ -316,6 +312,13 @@ async def get_streaming_chat_message_contents(
 
                 if any(result.terminate for result in results if result is not None):
                     break
+            else:
+                # Do a final call, without function calling when the max has been reached.
+                self._reset_function_choice_settings(settings)
+                async for streaming_chat_message_contents in self._inner_get_streaming_chat_message_contents(
+                    chat_history, settings
+                ):
+                    yield streaming_chat_message_contents
 
     async def get_streaming_chat_message_content(
         self,