"""Regression tests for #35314 — empty model on the post-interrupt recovery turn. After a ``stream_interrupt_abort`` during an active gateway session, the recovery turn was sometimes built with ``model=""`` (a transient config-cache miss returned an empty ``user_config``). Every API call then failed HTTP 400 "No models provided", "trying fallback..." was logged but never executed (the user had no fallback configured), and the session went silent until the user re-sent. These tests pin two fixes: 1. ``_resolve_session_agent_runtime`` caches the last successfully-resolved model per session and recovers it when a fresh resolution comes back empty. 2. ``_has_pending_fallback`` gates the "trying fallback..." status so it is only announced when a fallback chain actually exists. """ import threading import gateway.run as gateway_run def _make_runner(): runner = object.__new__(gateway_run.GatewayRunner) runner._session_model_overrides = {} runner._last_resolved_model = {} runner._service_tier = None runner._agent_cache = {} runner._agent_cache_lock = threading.Lock() return runner def _patch_resolution(monkeypatch, *, model_from_config: str, provider: str = "openrouter"): """Stub gateway model + runtime resolution to a known state.""" monkeypatch.setattr(gateway_run, "_resolve_gateway_model", lambda cfg=None: model_from_config) monkeypatch.setattr( gateway_run, "_resolve_runtime_agent_kwargs", lambda: { "provider": provider, "api_key": "x", "base_url": "https://openrouter.ai/api/v1", "api_mode": "chat_completions", }, ) def test_normal_turn_caches_last_resolved_model(monkeypatch): _patch_resolution(monkeypatch, model_from_config="deepseek/deepseek-v4-flash") runner = _make_runner() sk = "agent:main:discord:dm:123" model, _ = runner._resolve_session_agent_runtime(session_key=sk, user_config={"model": {"default": "x"}}) assert model == "deepseek/deepseek-v4-flash" # Cached per-session AND process-wide for first-seen-session recovery. assert runner._last_resolved_model[sk] == "deepseek/deepseek-v4-flash" assert runner._last_resolved_model["*"] == "deepseek/deepseek-v4-flash" def test_empty_model_recovers_session_last_good(monkeypatch): runner = _make_runner() sk = "agent:main:discord:dm:123" # Turn 1: config has the model — cache it. _patch_resolution(monkeypatch, model_from_config="deepseek/deepseek-v4-flash") runner._resolve_session_agent_runtime(session_key=sk, user_config={"model": {"default": "x"}}) # Turn 2: simulate the transient empty config read (the #35314 race). _patch_resolution(monkeypatch, model_from_config="", provider="") model, _ = runner._resolve_session_agent_runtime(session_key=sk, user_config={}) assert model == "deepseek/deepseek-v4-flash", "recovery turn must reuse last-known-good, not build model=''" def test_empty_model_new_session_recovers_global_last_good(monkeypatch): runner = _make_runner() # Prime a different session so the process-wide "*" slot is populated. _patch_resolution(monkeypatch, model_from_config="deepseek/deepseek-v4-flash") runner._resolve_session_agent_runtime(session_key="agent:main:discord:dm:111", user_config={"model": {}}) # A brand-new session that hits an empty config read still recovers via "*". _patch_resolution(monkeypatch, model_from_config="", provider="") model, _ = runner._resolve_session_agent_runtime(session_key="agent:main:discord:dm:999", user_config={}) assert model == "deepseek/deepseek-v4-flash" def test_cold_start_empty_model_does_not_crash(monkeypatch): """No last-good anywhere + empty config → returns '' gracefully (no exception).""" _patch_resolution(monkeypatch, model_from_config="", provider="") runner = _make_runner() model, _ = runner._resolve_session_agent_runtime(session_key="agent:main:discord:dm:1", user_config={}) assert model == "" def test_bare_runner_without_cache_attr_does_not_crash(monkeypatch): """object.__new__ runners (test helpers / pitfall #17) lack _last_resolved_model. The getattr guard must tolerate the missing attribute. """ _patch_resolution(monkeypatch, model_from_config="deepseek/deepseek-v4-flash") runner = object.__new__(gateway_run.GatewayRunner) runner._session_model_overrides = {} runner._service_tier = None # Deliberately omit _last_resolved_model. model, _ = runner._resolve_session_agent_runtime(session_key="x", user_config={"model": {}}) assert model == "deepseek/deepseek-v4-flash" # ── _has_pending_fallback gate ────────────────────────────────────────────── def _bare_agent(): import run_agent return object.__new__(run_agent.AIAgent) def test_has_pending_fallback_empty_chain(): agent = _bare_agent() agent._fallback_chain = [] agent._fallback_index = 0 assert agent._has_pending_fallback() is False def test_has_pending_fallback_with_chain(): agent = _bare_agent() agent._fallback_chain = [{"provider": "openai", "model": "gpt-5"}] agent._fallback_index = 0 assert agent._has_pending_fallback() is True def test_has_pending_fallback_exhausted_chain(): agent = _bare_agent() agent._fallback_chain = [{"provider": "openai", "model": "gpt-5"}] agent._fallback_index = 1 assert agent._has_pending_fallback() is False def test_has_pending_fallback_missing_attrs(): """Bare agent with no fallback attributes set must default to False, not crash.""" agent = _bare_agent() assert agent._has_pending_fallback() is False