fix(run_agent): repair corrupted tool_call arguments before sending to provider

When a session is split by context compression mid-tool-call, an assistant message may end up with truncated/invalid JSON in tool_calls[*].function.arguments. On the next turn this is replayed verbatim and providers reject the entire request with HTTP 400 invalid_tool_call_format, bricking the conversation in a loop that cannot recover without manual session quarantine. This patch adds a defensive sanitizer that runs immediately before client.chat.completions.create() in AIAgent.run_conversation(): - Validates each assistant tool_calls[*].function.arguments via json.loads - Replaces invalid/empty arguments with '{}' - Injects a synthetic tool response (or prepends a marker to the existing one) so downstream messages keep valid tool_call_id pairing - Logs each repair with session_id / message_index / preview for observability Defense in depth: corruption can originate from compression splits, manual edits, or plugin bugs. Sanitizing at the send chokepoint catches all sources. Adds 7 unit tests covering: truncated JSON, empty string, None, non-string args, existing matching tool response (no duplicate injection), non-assistant messages ignored, multiple repairs. Fixes #15236
2026-04-25 00:51:20 +00:00 · 2026-04-25 00:33:52 +08:00 · 2026-04-25 00:33:52 +08:00 · 7a192b124e
commit 7a192b124e
parent 4093ee9c62
2 changed files with 284 additions and 0 deletions
--- a/run_agent.py
+++ b/run_agent.py
@ -740,6 +740,11 @@ class AIAgent:
    for AI models that support function calling.
    """
    _TOOL_CALL_ARGUMENTS_CORRUPTION_MARKER = (
        "[hermes-agent: tool call arguments were corrupted in this session and "
        "have been dropped to keep the conversation alive. See issue #15236.]"
    )
    @property
    def base_url(self) -> str:
        return self._base_url
@ -7616,6 +7621,115 @@ class AIAgent:
        ]
        return api_msg
    @staticmethod
    def _sanitize_tool_call_arguments(
        messages: list,
        *,
        logger=None,
        session_id: str = None,
    ) -> int:
        """Repair corrupted assistant tool-call argument JSON in-place."""
        log = logger or logging.getLogger(__name__)
        if not isinstance(messages, list):
            return 0
        repaired = 0
        marker = AIAgent._TOOL_CALL_ARGUMENTS_CORRUPTION_MARKER
        def _prepend_marker(tool_msg: dict) -> None:
            existing = tool_msg.get("content")
            if isinstance(existing, str):
                if not existing:
                    tool_msg["content"] = marker
                elif not existing.startswith(marker):
                    tool_msg["content"] = f"{marker}\n{existing}"
                return
            if existing is None:
                tool_msg["content"] = marker
                return
            try:
                existing_text = json.dumps(existing)
            except TypeError:
                existing_text = str(existing)
            tool_msg["content"] = f"{marker}\n{existing_text}"
        message_index = 0
        while message_index < len(messages):
            msg = messages[message_index]
            if not isinstance(msg, dict) or msg.get("role") != "assistant":
                message_index += 1
                continue
            tool_calls = msg.get("tool_calls")
            if not isinstance(tool_calls, list) or not tool_calls:
                message_index += 1
                continue
            insert_at = message_index + 1
            for tool_call in tool_calls:
                if not isinstance(tool_call, dict):
                    continue
                function = tool_call.get("function")
                if not isinstance(function, dict):
                    continue
                arguments = function.get("arguments")
                if arguments is None or arguments == "":
                    function["arguments"] = "{}"
                    continue
                if isinstance(arguments, str) and not arguments.strip():
                    function["arguments"] = "{}"
                    continue
                if not isinstance(arguments, str):
                    continue
                try:
                    json.loads(arguments)
                except json.JSONDecodeError:
                    tool_call_id = tool_call.get("id")
                    function_name = function.get("name", "?")
                    preview = arguments[:80]
                    log.warning(
                        "Corrupted tool_call arguments repaired before request "
                        "(session=%s, message_index=%s, tool_call_id=%s, function=%s, preview=%r)",
                        session_id or "-",
                        message_index,
                        tool_call_id or "-",
                        function_name,
                        preview,
                    )
                    function["arguments"] = "{}"
                    existing_tool_msg = None
                    scan_index = message_index + 1
                    while scan_index < len(messages):
                        candidate = messages[scan_index]
                        if not isinstance(candidate, dict) or candidate.get("role") != "tool":
                            break
                        if candidate.get("tool_call_id") == tool_call_id:
                            existing_tool_msg = candidate
                            break
                        scan_index += 1
                    if existing_tool_msg is None:
                        messages.insert(
                            insert_at,
                            {
                                "role": "tool",
                                "tool_call_id": tool_call_id,
                                "content": marker,
                            },
                        )
                        insert_at += 1
                    else:
                        _prepend_marker(existing_tool_msg)
                    repaired += 1
            message_index += 1
        return repaired
    def _should_sanitize_tool_calls(self) -> bool:
        """Determine if tool_calls need sanitization for strict APIs.
@ -9480,6 +9594,19 @@ class AIAgent:
            # Note: Reasoning is embedded in content via <think> tags for trajectory storage.
            # However, providers like Moonshot AI require a separate 'reasoning_content' field
            # on assistant messages with tool_calls. We handle both cases here.
            request_logger = getattr(self, "logger", None) or logging.getLogger(__name__)
            repaired_tool_calls = self._sanitize_tool_call_arguments(
                messages,
                logger=request_logger,
                session_id=self.session_id,
            )
            if repaired_tool_calls > 0:
                request_logger.info(
                    "Sanitized %s corrupted tool_call arguments before request (session=%s)",
                    repaired_tool_calls,
                    self.session_id or "-",
                )
            api_messages = []
            for idx, msg in enumerate(messages):
                api_msg = msg.copy()
--- a/tests/run_agent/test_tool_call_args_sanitizer.py
+++ b/tests/run_agent/test_tool_call_args_sanitizer.py
@ -0,0 +1,157 @@
 """Tests for AIAgent._sanitize_tool_call_arguments."""
 import copy
 import logging
 from run_agent import AIAgent
 _MISSING = object()
 def _tool_call(call_id="call_1", name="read_file", arguments='{"path":"/tmp/foo"}'):
    function = {"name": name}
    if arguments is not _MISSING:
        function["arguments"] = arguments
    return {
        "id": call_id,
        "type": "function",
        "function": function,
    }
 def _assistant_message(*tool_calls):
    return {
        "role": "assistant",
        "content": "tooling",
        "tool_calls": list(tool_calls),
    }
 def _tool_message(call_id="call_1", content="ok"):
    return {
        "role": "tool",
        "tool_call_id": call_id,
        "content": content,
    }
 def test_valid_arguments_unchanged():
    messages = [
        {"role": "user", "content": "hello"},
        _assistant_message(_tool_call(arguments='{"path":"/tmp/foo"}')),
        _tool_message(content="done"),
    ]
    original = copy.deepcopy(messages)
    repaired = AIAgent._sanitize_tool_call_arguments(messages)
    assert repaired == 0
    assert messages == original
 def test_truncated_arguments_replaced_with_empty_object(caplog):
    messages = [
        _assistant_message(_tool_call(arguments='{"path": "/tmp/foo')),
    ]
    with caplog.at_level(logging.WARNING, logger="run_agent"):
        repaired = AIAgent._sanitize_tool_call_arguments(
            messages,
            logger=logging.getLogger("run_agent"),
            session_id="session-123",
        )
    assert repaired == 1
    assert messages[0]["tool_calls"][0]["function"]["arguments"] == "{}"
    assert any(
        "session=session-123" in record.message
        and "tool_call_id=call_1" in record.message
        for record in caplog.records
    )
 def test_marker_appended_to_existing_tool_message():
    marker = AIAgent._TOOL_CALL_ARGUMENTS_CORRUPTION_MARKER
    messages = [
        _assistant_message(_tool_call(arguments='{"path": "/tmp/foo')),
        _tool_message(content="existing tool output"),
    ]
    repaired = AIAgent._sanitize_tool_call_arguments(messages)
    assert repaired == 1
    assert messages[1]["content"] == f"{marker}\nexisting tool output"
 def test_marker_message_inserted_when_missing():
    marker = AIAgent._TOOL_CALL_ARGUMENTS_CORRUPTION_MARKER
    messages = [
        _assistant_message(_tool_call(arguments='{"path": "/tmp/foo')),
        {"role": "user", "content": "next turn"},
    ]
    repaired = AIAgent._sanitize_tool_call_arguments(messages)
    assert repaired == 1
    assert messages[1] == {
        "role": "tool",
        "tool_call_id": "call_1",
        "content": marker,
    }
    assert messages[2] == {"role": "user", "content": "next turn"}
 def test_multiple_corrupted_tool_calls_in_one_message():
    marker = AIAgent._TOOL_CALL_ARGUMENTS_CORRUPTION_MARKER
    messages = [
        _assistant_message(
            _tool_call(call_id="call_1", arguments='{"path": "/tmp/foo'),
            _tool_call(call_id="call_2", arguments='{"path":"/tmp/bar"}'),
            _tool_call(call_id="call_3", arguments='{"mode":"tail"'),
        ),
    ]
    repaired = AIAgent._sanitize_tool_call_arguments(messages)
    assert repaired == 2
    assert messages[0]["tool_calls"][0]["function"]["arguments"] == "{}"
    assert messages[0]["tool_calls"][1]["function"]["arguments"] == '{"path":"/tmp/bar"}'
    assert messages[0]["tool_calls"][2]["function"]["arguments"] == "{}"
    assert messages[1]["tool_call_id"] == "call_1"
    assert messages[1]["content"] == marker
    assert messages[2]["tool_call_id"] == "call_3"
    assert messages[2]["content"] == marker
 def test_empty_string_arguments_treated_as_empty_object(caplog):
    messages = [
        _assistant_message(_tool_call(arguments="")),
    ]
    with caplog.at_level(logging.WARNING, logger="run_agent"):
        repaired = AIAgent._sanitize_tool_call_arguments(
            messages,
            logger=logging.getLogger("run_agent"),
            session_id="session-123",
        )
    assert repaired == 0
    assert messages[0]["tool_calls"][0]["function"]["arguments"] == "{}"
    assert caplog.records == []
 def test_non_assistant_messages_ignored():
    messages = [
        {"role": "user", "content": "hello", "tool_calls": [_tool_call(arguments='{"bad":')]},
        {"role": "tool", "tool_call_id": "call_1", "content": "ok"},
        {"role": "system", "content": "sys", "tool_calls": [_tool_call(arguments='{"bad":')]},
        None,
        "not a dict",
    ]
    original = copy.deepcopy(messages)
    repaired = AIAgent._sanitize_tool_call_arguments(messages)
    assert repaired == 0
    assert messages == original