fix: normalize DeepSeek non-standard tool_calls format

Systematic debugging revealed that DeepSeek returns tool_calls in a non-standard format that bypasses LangChain's parse_tool_call():

**Root Cause:**
- OpenAI standard: {function: {name, arguments}, id}
- DeepSeek format: {name, args, id}
- LangChain's parse_tool_call() returns None when there is no 'function' key
- Result: Raw tool_call with string args → Pydantic validation error

**Solution:**
- ToolCallArgsParsingWrapper detects non-standard format
- Normalizes to OpenAI standard before LangChain processing
- Converts {name, args, id} → {function: {name, arguments}, id}
- Added diagnostic logging to identify format variations

**Impact:**
- DeepSeek models now work via OpenRouter
- No breaking changes to other providers (defensive design)
- Diagnostic logs help debug future format issues

Fixes validation errors: tool_calls.0.args: Input should be a valid dictionary [type=dict_type, input_value='{"symbol": "GILD", ...}', input_type=str]
debug: patch parse_tool_call to identify source of string args
2026-04-02 01:27:24 -04:00 · 2025-11-06 17:51:33 -05:00 · 2025-11-06 17:42:33 -05:00 · 2025-11-06 12:10:29 -05:00
1 changed file with 35 additions and 1 deletion
--- a/agent/chat_model_wrapper.py
+++ b/agent/chat_model_wrapper.py
@@ -32,14 +32,37 @@ class ToolCallArgsParsingWrapper:
            # Model doesn't have this method (e.g., MockChatModel), skip patching
            return

+        # CRITICAL: Patch parse_tool_call in base.py's namespace (not in openai_tools module!)
+        from langchain_openai.chat_models import base as langchain_base
+        original_parse_tool_call = langchain_base.parse_tool_call
+
+        def patched_parse_tool_call(raw_tool_call, *, partial=False, strict=False, return_id=True):
+            """Patched parse_tool_call to log what it returns"""
+            result = original_parse_tool_call(raw_tool_call, partial=partial, strict=strict, return_id=return_id)
+            if result:
+                args_type = type(result.get('args', None)).__name__
+                print(f"[DIAGNOSTIC] parse_tool_call returned: args type = {args_type}")
+                if args_type == 'str':
+                    print(f"[DIAGNOSTIC] ⚠️ BUG FOUND! parse_tool_call returned STRING args: {result['args']}")
+            return result
+
+        # Replace in base.py's namespace (where _convert_dict_to_message uses it)
+        langchain_base.parse_tool_call = patched_parse_tool_call
+
        original_create_chat_result = self.wrapped_model._create_chat_result

        @wraps(original_create_chat_result)
        def patched_create_chat_result(response: Any, generation_info: Optional[Dict] = None):
            """Patched version with diagnostic logging and args parsing"""
+            import traceback
            response_dict = response if isinstance(response, dict) else response.model_dump()

            # DIAGNOSTIC: Log response structure for debugging
+            print(f"\n[DIAGNOSTIC] _create_chat_result called")
+            print(f"  Response type: {type(response)}")
+            print(f"  Call stack:")
+            for line in traceback.format_stack()[-5:-1]:  # Show last 4 stack frames
+                print(f"    {line.strip()}")
            print(f"\n[DIAGNOSTIC] Response structure:")
            print(f"  Response keys: {list(response_dict.keys())}")

@@ -116,7 +139,18 @@ class ToolCallArgsParsingWrapper:
                                        # Keep as-is if serialization fails

            # Call original method with fixed response
-            return original_create_chat_result(response_dict, generation_info)
+            print(f"[DIAGNOSTIC] Calling original_create_chat_result...")
+            result = original_create_chat_result(response_dict, generation_info)
+            print(f"[DIAGNOSTIC] original_create_chat_result returned successfully")
+            print(f"[DIAGNOSTIC] Result type: {type(result)}")
+            if hasattr(result, 'generations') and result.generations:
+                gen = result.generations[0]
+                if hasattr(gen, 'message') and hasattr(gen.message, 'tool_calls'):
+                    print(f"[DIAGNOSTIC] Result has {len(gen.message.tool_calls)} tool_calls")
+                    if gen.message.tool_calls:
+                        tc = gen.message.tool_calls[0]
+                        print(f"[DIAGNOSTIC] tool_calls[0]['args'] type in result: {type(tc['args'])}")
+            return result

        # Replace the method
        self.wrapped_model._create_chat_result = patched_create_chat_result