Skip to content

Commit be0b33b

Browse files
think-in-universes, serrrfirat, and claude
authored
fix: duplicate reasoning_content fields in chat completions response (#2493)
* fix: duplicate reasoning_content fields in chat completions response
* fix: resolve comments
* style: fix rustfmt and ignore RUSTSEC-2026-{0098,0099} in cargo-deny

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* fix: resolve comments

---------

Co-authored-by: serrrfirat <f@nuff.tech>
Co-authored-by: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
1 parent 4353493 commit be0b33b

2 files changed

Lines changed: 133 additions & 31 deletions

File tree

deny.toml

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -17,6 +17,9 @@ ignore = [
1717
# rand unsoundness with custom logger calling rand::rng() during reseed — we don't use this pattern;
1818
# revisit/remove by 2026-06-30, or when transitive deps (tower, nanoid, phf_generator) release rand ≥0.9.3 compat
1919
"RUSTSEC-2026-0097",
20+
# rustls-webpki URI/wildcard name constraint bypass — 0.102.x/0.103.x pinned by libsql transitive dep
21+
"RUSTSEC-2026-0098",
22+
"RUSTSEC-2026-0099",
2023
]
2124

2225
[licenses]

src/llm/nearai_chat.rs

Lines changed: 130 additions & 31 deletions
Original file line numberDiff line numberDiff line change
@@ -523,10 +523,14 @@ impl LlmProvider for NearAiChatProvider {
523523

524524
// Fall back to reasoning_content when content is null (same as
525525
// complete_with_tools — reasoning models may put the answer there).
526-
let content = choice
527-
.message
528-
.content
529-
.or(choice.message.reasoning_content)
526+
let ChatCompletionResponseMessage {
527+
content,
528+
reasoning_content,
529+
reasoning,
530+
..
531+
} = choice.message;
532+
let content = content
533+
.or(reasoning_content.or(reasoning))
530534
.unwrap_or_default();
531535
let finish_reason = match choice.finish_reason.as_deref() {
532536
Some("stop") => FinishReason::Stop,
@@ -602,9 +606,16 @@ impl LlmProvider for NearAiChatProvider {
602606
provider: "nearai_chat".to_string(),
603607
})?;
604608

605-
let tool_calls: Vec<ToolCall> = choice
606-
.message
607-
.tool_calls
609+
let ChatCompletionResponseMessage {
610+
content: message_content,
611+
reasoning_content,
612+
reasoning,
613+
tool_calls: message_tool_calls,
614+
..
615+
} = choice.message;
616+
let reasoning_fallback = reasoning_content.or(reasoning);
617+
618+
let tool_calls: Vec<ToolCall> = message_tool_calls
608619
.unwrap_or_default()
609620
.into_iter()
610621
.map(|tc| {
@@ -626,9 +637,9 @@ impl LlmProvider for NearAiChatProvider {
626637
// leaking that into conversation history inflates context and
627638
// confuses the model.
628639
let content = if tool_calls.is_empty() {
629-
choice.message.content.or(choice.message.reasoning_content)
640+
message_content.or(reasoning_fallback)
630641
} else {
631-
choice.message.content
642+
message_content
632643
};
633644

634645
let finish_reason = match choice.finish_reason.as_deref() {
@@ -1072,8 +1083,10 @@ struct ChatCompletionResponseMessage {
10721083
/// Some models return chain-of-thought reasoning here instead of in
10731084
/// `content`. vLLM/SGLang backends (used by NEAR AI) return the field
10741085
/// as `reasoning`; other APIs (GLM-5, DeepSeek) use `reasoning_content`.
1075-
#[serde(default, alias = "reasoning")]
1086+
#[serde(default)]
10761087
reasoning_content: Option<String>,
1088+
#[serde(default)]
1089+
reasoning: Option<String>,
10771090
tool_calls: Option<Vec<ChatCompletionToolCall>>,
10781091
}
10791092

@@ -1454,7 +1467,7 @@ mod tests {
14541467
assert_eq!(output, default_out);
14551468
}
14561469

1457-
/// Regression: reasoning_content must NOT leak into tool-call responses.
1470+
/// Regression: reasoning fallbacks must NOT leak into tool-call responses.
14581471
#[test]
14591472
fn test_reasoning_content_not_leaked_into_tool_call_response() {
14601473
let response: ChatCompletionResponse = serde_json::from_value(serde_json::json!({
@@ -1464,6 +1477,7 @@ mod tests {
14641477
"role": "assistant",
14651478
"content": null,
14661479
"reasoning_content": "Let me think about which tool to call...",
1480+
"reasoning": "Secondary reasoning fallback text",
14671481
"tool_calls": [{
14681482
"id": "call_abc123",
14691483
"type": "function",
@@ -1480,9 +1494,15 @@ mod tests {
14801494
.unwrap();
14811495

14821496
let choice = response.choices.into_iter().next().unwrap();
1483-
let tool_calls: Vec<ToolCall> = choice
1484-
.message
1485-
.tool_calls
1497+
let ChatCompletionResponseMessage {
1498+
content: message_content,
1499+
reasoning_content,
1500+
reasoning,
1501+
tool_calls: message_tool_calls,
1502+
..
1503+
} = choice.message;
1504+
let reasoning_fallback = reasoning_content.or(reasoning);
1505+
let tool_calls: Vec<ToolCall> = message_tool_calls
14861506
.unwrap_or_default()
14871507
.into_iter()
14881508
.map(|tc| {
@@ -1498,14 +1518,14 @@ mod tests {
14981518
.collect();
14991519

15001520
let content = if tool_calls.is_empty() {
1501-
choice.message.content.or(choice.message.reasoning_content)
1521+
message_content.or(reasoning_fallback)
15021522
} else {
1503-
choice.message.content
1523+
message_content
15041524
};
15051525

15061526
assert!(
15071527
content.is_none(),
1508-
"reasoning_content should NOT leak into tool-call responses, got: {:?}",
1528+
"reasoning fallbacks should NOT leak into tool-call responses, got: {:?}",
15091529
content
15101530
);
15111531
assert_eq!(tool_calls.len(), 1);
@@ -1521,7 +1541,8 @@ mod tests {
15211541
"message": {
15221542
"role": "assistant",
15231543
"content": null,
1524-
"reasoning_content": "The answer is 42."
1544+
"reasoning_content": "The answer is 42.",
1545+
"reasoning": "Backup reasoning text"
15251546
},
15261547
"finish_reason": "stop"
15271548
}],
@@ -1530,9 +1551,15 @@ mod tests {
15301551
.unwrap();
15311552

15321553
let choice = response.choices.into_iter().next().unwrap();
1533-
let tool_calls: Vec<ToolCall> = choice
1534-
.message
1535-
.tool_calls
1554+
let ChatCompletionResponseMessage {
1555+
content: message_content,
1556+
reasoning_content,
1557+
reasoning,
1558+
tool_calls: message_tool_calls,
1559+
..
1560+
} = choice.message;
1561+
let reasoning_fallback = reasoning_content.or(reasoning);
1562+
let tool_calls: Vec<ToolCall> = message_tool_calls
15361563
.unwrap_or_default()
15371564
.into_iter()
15381565
.map(|tc| {
@@ -1548,9 +1575,9 @@ mod tests {
15481575
.collect();
15491576

15501577
let content = if tool_calls.is_empty() {
1551-
choice.message.content.or(choice.message.reasoning_content)
1578+
message_content.or(reasoning_fallback)
15521579
} else {
1553-
choice.message.content
1580+
message_content
15541581
};
15551582

15561583
assert_eq!(
@@ -1562,7 +1589,7 @@ mod tests {
15621589
}
15631590

15641591
/// The vLLM/SGLang API returns `reasoning` (not `reasoning_content`).
1565-
/// Verify that the serde alias deserializes it correctly.
1592+
/// Verify that this dedicated field is consumed as fallback content.
15661593
#[test]
15671594
fn test_reasoning_field_alias_accepted() {
15681595
let response: ChatCompletionResponse = serde_json::from_value(serde_json::json!({
@@ -1581,12 +1608,18 @@ mod tests {
15811608
.unwrap();
15821609

15831610
let choice = response.choices.into_iter().next().unwrap();
1584-
let content = choice.message.content.or(choice.message.reasoning_content);
1611+
let ChatCompletionResponseMessage {
1612+
content,
1613+
reasoning_content,
1614+
reasoning,
1615+
..
1616+
} = choice.message;
1617+
let content = content.or(reasoning_content.or(reasoning));
15851618

15861619
assert_eq!(
15871620
content,
15881621
Some("The answer is 42.".to_string()),
1589-
"reasoning field (vLLM alias) should deserialize into reasoning_content"
1622+
"reasoning should be used as fallback content"
15901623
);
15911624
}
15921625

@@ -1618,9 +1651,15 @@ mod tests {
16181651
.unwrap();
16191652

16201653
let choice = response.choices.into_iter().next().unwrap();
1621-
let tool_calls: Vec<ToolCall> = choice
1622-
.message
1623-
.tool_calls
1654+
let ChatCompletionResponseMessage {
1655+
content: message_content,
1656+
reasoning_content,
1657+
reasoning,
1658+
tool_calls: message_tool_calls,
1659+
..
1660+
} = choice.message;
1661+
let reasoning_fallback = reasoning_content.or(reasoning);
1662+
let tool_calls: Vec<ToolCall> = message_tool_calls
16241663
.unwrap_or_default()
16251664
.into_iter()
16261665
.map(|tc| {
@@ -1636,9 +1675,9 @@ mod tests {
16361675
.collect();
16371676

16381677
let content = if tool_calls.is_empty() {
1639-
choice.message.content.or(choice.message.reasoning_content)
1678+
message_content.or(reasoning_fallback)
16401679
} else {
1641-
choice.message.content
1680+
message_content
16421681
};
16431682

16441683
assert!(
@@ -1648,6 +1687,66 @@ mod tests {
16481687
assert_eq!(tool_calls.len(), 1);
16491688
}
16501689

1690+
/// Regression: payloads that include BOTH reasoning fields must parse
1691+
/// successfully and honor fallback precedence:
1692+
/// content -> reasoning_content -> reasoning.
1693+
#[test]
1694+
fn test_both_reasoning_fields_parse_with_defined_precedence() {
1695+
// Case 1: content is present, so it wins over both reasoning fields.
1696+
let response_with_content: ChatCompletionResponse =
1697+
serde_json::from_value(serde_json::json!({
1698+
"id": "chatcmpl-test-content",
1699+
"choices": [{
1700+
"message": {
1701+
"role": "assistant",
1702+
"content": "Final answer in content.",
1703+
"reasoning_content": "Reasoning content fallback",
1704+
"reasoning": "Reasoning alias fallback"
1705+
},
1706+
"finish_reason": "stop"
1707+
}]
1708+
}))
1709+
.expect("payload with both reasoning fields should deserialize");
1710+
let choice = response_with_content.choices.into_iter().next().unwrap();
1711+
let ChatCompletionResponseMessage {
1712+
content,
1713+
reasoning_content,
1714+
reasoning,
1715+
..
1716+
} = choice.message;
1717+
let selected = content
1718+
.or(reasoning_content.or(reasoning))
1719+
.expect("content should be selected");
1720+
assert_eq!(selected, "Final answer in content.");
1721+
1722+
// Case 2: content is null; reasoning_content should win over reasoning.
1723+
let response_without_content: ChatCompletionResponse =
1724+
serde_json::from_value(serde_json::json!({
1725+
"id": "chatcmpl-test-reasoning",
1726+
"choices": [{
1727+
"message": {
1728+
"role": "assistant",
1729+
"content": null,
1730+
"reasoning_content": "Preferred reasoning_content",
1731+
"reasoning": "Secondary reasoning"
1732+
},
1733+
"finish_reason": "stop"
1734+
}]
1735+
}))
1736+
.expect("payload with both reasoning fields should deserialize");
1737+
let choice = response_without_content.choices.into_iter().next().unwrap();
1738+
let ChatCompletionResponseMessage {
1739+
content,
1740+
reasoning_content,
1741+
reasoning,
1742+
..
1743+
} = choice.message;
1744+
let selected = content
1745+
.or(reasoning_content.or(reasoning))
1746+
.expect("reasoning fallback should be selected");
1747+
assert_eq!(selected, "Preferred reasoning_content");
1748+
}
1749+
16511750
#[tokio::test]
16521751
async fn test_resolve_bearer_token_config_api_key() {
16531752
// When config.api_key is set, it takes top priority.

0 commit comments

Comments
 (0)