mirror of
https://github.com/NousResearch/hermes-agent.git
synced 2026-04-25 00:51:20 +00:00
Follow up salvaged PR #12668 by threading base_url through the remaining direct-call sites so kimi-k2.5 uses temperature=1.0 on api.moonshot.ai and keeps 0.6 on api.kimi.com/coding. Add focused regression tests for run_agent, trajectory_compressor, and mini_swe_runner.
55 lines
1.8 KiB
Python
55 lines
1.8 KiB
Python
from types import SimpleNamespace
|
|
from unittest.mock import MagicMock, patch
|
|
|
|
|
|
def test_run_task_forces_kimi_fixed_temperature():
    """Check that a ``kimi-for-coding`` run sends ``temperature=0.6``.

    ``openai.OpenAI`` is patched so that calling it yields a mock client
    whose chat-completion call returns one canned "done" message with an
    empty ``tool_calls`` list. The runner is configured with the
    ``api.kimi.com/coding`` base URL and a single iteration; the test then
    inspects the keyword arguments of the most recent ``create`` call.
    """
    # Canned completion: a single choice carrying a plain "done" message.
    reply = SimpleNamespace(content="done", tool_calls=[])
    completion = SimpleNamespace(choices=[SimpleNamespace(message=reply)])

    fake_client = MagicMock()
    fake_client.chat.completions.create.return_value = completion

    with patch("openai.OpenAI", return_value=fake_client):
        # Imported while the patch is active, matching the original test.
        from mini_swe_runner import MiniSWERunner

        swe_runner = MiniSWERunner(
            model="kimi-for-coding",
            base_url="https://api.kimi.com/coding/v1",
            api_key="test-key",
            env_type="local",
            max_iterations=1,
        )
        # Replace the environment hooks with mocks
        # (presumably so no real environment is created -- confirm against the runner).
        swe_runner._create_env = MagicMock()
        swe_runner._cleanup_env = MagicMock()

        outcome = swe_runner.run_task("2+2")

        assert outcome["completed"] is True
        sent_kwargs = fake_client.chat.completions.create.call_args.kwargs
        assert sent_kwargs["temperature"] == 0.6
|
|
|
|
|
|
def test_run_task_public_moonshot_kimi_k2_5_forces_temperature_1():
    """Check that ``kimi-k2.5`` on ``api.moonshot.ai`` sends ``temperature=1.0``.

    ``openai.OpenAI`` is patched so that calling it yields a mock client
    whose ``base_url`` attribute is the Moonshot URL and whose
    chat-completion call returns one canned "done" message with an empty
    ``tool_calls`` list. The runner is configured with that same base URL
    and a single iteration; the test then inspects the keyword arguments of
    the most recent ``create`` call.
    """
    moonshot_url = "https://api.moonshot.ai/v1"

    # Canned completion: a single choice carrying a plain "done" message.
    reply = SimpleNamespace(content="done", tool_calls=[])
    completion = SimpleNamespace(choices=[SimpleNamespace(message=reply)])

    fake_client = MagicMock()
    # The mock client exposes the same base URL that is passed to the runner.
    fake_client.base_url = moonshot_url
    fake_client.chat.completions.create.return_value = completion

    with patch("openai.OpenAI", return_value=fake_client):
        # Imported while the patch is active, matching the original test.
        from mini_swe_runner import MiniSWERunner

        swe_runner = MiniSWERunner(
            model="kimi-k2.5",
            base_url=moonshot_url,
            api_key="test-key",
            env_type="local",
            max_iterations=1,
        )
        # Replace the environment hooks with mocks
        # (presumably so no real environment is created -- confirm against the runner).
        swe_runner._create_env = MagicMock()
        swe_runner._cleanup_env = MagicMock()

        outcome = swe_runner.run_task("2+2")

        assert outcome["completed"] is True
        sent_kwargs = fake_client.chat.completions.create.call_args.kwargs
        assert sent_kwargs["temperature"] == 1.0
|