diff --git a/tests/agent/test_auxiliary_client.py b/tests/agent/test_auxiliary_client.py
index 47e0a3d4f90..8d82bdeb573 100644
--- a/tests/agent/test_auxiliary_client.py
+++ b/tests/agent/test_auxiliary_client.py
@@ -163,6 +163,21 @@ class TestBuildCallKwargsMaxTokens:
         assert kwargs["max_tokens"] == 1234
         assert "max_completion_tokens" not in kwargs
 
+    def test_keeps_max_tokens_for_nvidia_nim(self):
+        """The requested limit stays under the ``max_tokens`` key for the NVIDIA endpoint."""
+        from agent.auxiliary_client import _build_call_kwargs
+
+        kwargs = _build_call_kwargs(
+            provider="nvidia",
+            model="minimaxai/minimax-m3",
+            messages=[{"role": "user", "content": "hi"}],
+            max_tokens=4096,
+            base_url="https://integrate.api.nvidia.com/v1",
+        )
+        assert kwargs["max_tokens"] == 4096
+        # Same check as the preceding test: the limit must not also be sent under the other key.
+        assert "max_completion_tokens" not in kwargs
+
 
 class TestNousTagsScoping:
     def test_tags_injected_when_provider_is_nous(self, monkeypatch):