hermes-agent/tests/agent/test_gemini_fast_fallback.py
2026-05-05 10:14:48 -07:00

62 lines
1.9 KiB
Python

"""Regression tests for #13636 — CloudCode / Gemini CLI rate-limit fallback.
_pool_may_recover_from_rate_limit() is the hinge between credential-pool
rotation and fallback-provider activation. For CloudCode (Gemini CLI /
Gemini OAuth) the 429 is an account-wide throttle, so waiting for pool
rotation is pointless — prefer fallback immediately.
"""
from unittest.mock import MagicMock
from run_agent import _pool_may_recover_from_rate_limit
def _pool(entries: int = 2):
p = MagicMock()
p.has_available.return_value = True
p.entries.return_value = list(range(entries))
return p
def test_cloudcode_provider_skips_pool_rotation() -> None:
    """Expect ``False`` for the ``google-gemini-cli`` provider on a cloudcode-pa URL.

    The pool is a three-entry mock that reports credentials as available.
    """
    may_recover = _pool_may_recover_from_rate_limit(
        _pool(entries=3),
        provider="google-gemini-cli",
        base_url="cloudcode-pa://google",
    )
    assert may_recover is False
def test_cloudcode_base_url_skips_pool_rotation_even_on_alias_provider() -> None:
    """Expect ``False`` when only the base URL uses the ``cloudcode-pa://`` scheme.

    The provider label here is ``custom-provider`` and the pool is a
    three-entry mock that reports credentials as available.
    """
    # Even if the provider label is something else, a cloudcode-pa:// URL
    # signals the account-wide quota regime.
    may_recover = _pool_may_recover_from_rate_limit(
        _pool(entries=3),
        provider="custom-provider",
        base_url="cloudcode-pa://google",
    )
    assert may_recover is False
def test_non_cloudcode_multi_entry_pool_still_recovers() -> None:
    """Expect ``True`` for a three-entry available pool on the openrouter provider."""
    may_recover = _pool_may_recover_from_rate_limit(
        _pool(entries=3),
        provider="openrouter",
        base_url="https://openrouter.ai/api/v1",
    )
    assert may_recover is True
def test_single_entry_pool_skips_rotation_regardless_of_provider() -> None:
    """Expect ``False`` for a one-entry available pool on the openrouter provider."""
    # Pre-existing single-entry-pool exception (#11314) still holds.
    may_recover = _pool_may_recover_from_rate_limit(
        _pool(entries=1),
        provider="openrouter",
        base_url="https://openrouter.ai/api/v1",
    )
    assert may_recover is False
def test_exhausted_pool_skips_rotation() -> None:
    """Expect ``False`` when the pool's ``has_available()`` returns ``False``.

    The function under test is called with the pool as its only argument.
    """
    exhausted = MagicMock()
    exhausted.has_available.return_value = False
    assert _pool_may_recover_from_rate_limit(exhausted) is False
def test_no_pool_skips_rotation() -> None:
    """Expect ``False`` when ``None`` is passed in place of a pool."""
    assert _pool_may_recover_from_rate_limit(None) is False