test(e2e): add authorization, session lifecycle, and resilience tests

New test classes:
- TestSessionLifecycle: /new followed by /status, and idempotent resets
- TestAuthorization: unauthorized users get a pairing code, not command output
- TestSendFailureResilience: the pipeline survives send() failures

Additional command coverage: /provider, /verbose, /personality, /yolo.

Note: the /provider test is marked xfail because it exposed a real bug: model_cfg is referenced while still unbound when config.yaml is absent (run.py:3247).
2026-06-14 09:11:54 +00:00 · 2026-04-01 17:47:34 -03:00 · 2026-04-01 17:47:34 -03:00 · 04e60cfacd
commit 04e60cfacd
parent ecd9bf2ca0
2 changed files with 170 additions and 0 deletions
--- a/tests/e2e/conftest.py
+++ b/tests/e2e/conftest.py
@ -105,6 +105,11 @@ def make_runner(session_entry: SessionEntry) -> "GatewayRunner":
    runner._capture_gateway_honcho_if_configured = lambda *a, **kw: None
    runner._emit_gateway_run_progress = AsyncMock()

+    # Pairing store (used by authorization rejection path)
+    runner.pairing_store = MagicMock()
+    runner.pairing_store._is_rate_limited = MagicMock(return_value=False)
+    runner.pairing_store.generate_code = MagicMock(return_value="ABC123")
+
    return runner


--- a/tests/e2e/test_telegram_commands.py
+++ b/tests/e2e/test_telegram_commands.py
@ -9,10 +9,15 @@ Each test drives a message through the full async pipeline:
 No LLM involved — only gateway-level commands are tested.
 """

+import asyncio
+from unittest.mock import AsyncMock
+
 import pytest

+from gateway.platforms.base import SendResult
 from tests.e2e.conftest import (
    make_adapter,
+    make_event,
    make_runner,
    make_session_entry,
    make_source,
@ -102,3 +107,163 @@ class TestTelegramSlashCommands:

        send_status = await send_and_capture(adapter, "/status")
        send_status.assert_called_once()
+
+    @pytest.mark.asyncio
+    @pytest.mark.xfail(
+        reason="Bug: _handle_provider_command references unbound model_cfg when config.yaml is absent",
+        strict=False,
+    )
+    async def test_provider_shows_current_provider(self, adapter):
+        """The /provider command should yield exactly one reply mentioning "provider".
+
+        Marked as a non-strict xfail; the ``reason`` above names the known bug.
+        """
+        captured_send = await send_and_capture(adapter, "/provider")
+        captured_send.assert_called_once()
+
+        # The reply text is read from the ``content`` keyword if it is set,
+        # otherwise from the second positional argument of the send call.
+        last_call = captured_send.call_args
+        reply = last_call.kwargs.get("content") or last_call.args[1]
+        assert "provider" in reply.lower()
+
+    @pytest.mark.asyncio
+    async def test_verbose_responds(self, adapter):
+        """The /verbose command should yield exactly one reply about verbose mode."""
+        captured_send = await send_and_capture(adapter, "/verbose")
+        captured_send.assert_called_once()
+
+        last_call = captured_send.call_args
+        reply = last_call.kwargs.get("content") or last_call.args[1]
+        # Two outcomes are accepted: the reply shows the mode cycle, or it
+        # tells the user to enable the feature in config.
+        mentions_verbose = "verbose" in reply.lower()
+        assert mentions_verbose or "tool_progress" in reply
+
+    @pytest.mark.asyncio
+    async def test_personality_lists_options(self, adapter):
+        """The /personality command should yield exactly one reply about personalities."""
+        captured_send = await send_and_capture(adapter, "/personality")
+        captured_send.assert_called_once()
+
+        last_call = captured_send.call_args
+        reply = last_call.kwargs.get("content") or last_call.args[1]
+        # The stem "personalit" covers both "personality" and "personalities".
+        assert "personalit" in reply.lower()
+
+    @pytest.mark.asyncio
+    async def test_yolo_toggles_mode(self, adapter):
+        """The /yolo command should yield exactly one reply that mentions "yolo"."""
+        captured_send = await send_and_capture(adapter, "/yolo")
+        captured_send.assert_called_once()
+
+        last_call = captured_send.call_args
+        reply = last_call.kwargs.get("content") or last_call.args[1]
+        assert "yolo" in reply.lower()
+
+
+class TestSessionLifecycle:
+    """Exercise command sequences that touch session state (/new, /status)."""
+
+    @pytest.fixture()
+    def source(self):
+        """Message source built by ``make_source()`` with its defaults."""
+        return make_source()
+
+    @pytest.fixture()
+    def session_entry(self, source):
+        """Session entry created for ``source``."""
+        return make_session_entry(source)
+
+    @pytest.fixture()
+    def runner(self, session_entry):
+        """Gateway runner built around ``session_entry``."""
+        return make_runner(session_entry)
+
+    @pytest.fixture()
+    def adapter(self, runner):
+        """Adapter created from ``runner``."""
+        return make_adapter(runner)
+
+    @pytest.mark.asyncio
+    async def test_new_then_status_reflects_reset(self, adapter, runner, session_entry):
+        """Send /new, then /status, and check the status reply names the session."""
+        await send_and_capture(adapter, "/new")
+        runner.session_store.reset_session.assert_called_once()
+
+        status_send = await send_and_capture(adapter, "/status")
+        status_send.assert_called_once()
+
+        status_call = status_send.call_args
+        status_text = status_call.kwargs.get("content") or status_call.args[1]
+        # The status output must contain the first 8 characters of the
+        # entry's session ID.
+        short_id = session_entry.session_id[:8]
+        assert short_id in status_text
+
+    @pytest.mark.asyncio
+    async def test_new_is_idempotent(self, adapter, runner):
+        """Two consecutive /new commands must both complete and each trigger a reset."""
+        for _ in range(2):
+            await send_and_capture(adapter, "/new")
+
+        assert runner.session_store.reset_session.call_count == 2
+
+
+class TestAuthorization:
+    """Verify the pipeline handles unauthorized users."""
+
+    @pytest.fixture()
+    def source(self):
+        """Message source built by ``make_source()`` with its defaults."""
+        return make_source()
+
+    @pytest.fixture()
+    def session_entry(self, source):
+        """Session entry created for ``source``."""
+        return make_session_entry(source)
+
+    @pytest.fixture()
+    def runner(self, session_entry):
+        """Gateway runner built around ``session_entry``."""
+        return make_runner(session_entry)
+
+    @pytest.fixture()
+    def adapter(self, runner):
+        """Adapter created from ``runner``."""
+        return make_adapter(runner)
+
+    @staticmethod
+    def _sent_texts(send_mock):
+        """Return the message text of every recorded ``send`` call, oldest first.
+
+        The text is taken from the ``content`` keyword when it is present,
+        otherwise from the second positional argument. A call carrying
+        neither contributes an empty string, so callers can always apply
+        string checks to the result.
+        """
+        texts = []
+        for recorded in send_mock.call_args_list:
+            text = recorded.kwargs.get("content")
+            if text is None and len(recorded.args) > 1:
+                text = recorded.args[1]
+            texts.append(text or "")
+        return texts
+
+    @pytest.mark.asyncio
+    async def test_unauthorized_user_gets_pairing_response(self, adapter, runner):
+        """Unauthorized DM should trigger pairing code, not a command response."""
+        runner._is_user_authorized = lambda _source: False
+
+        event = make_event("/help")
+        adapter.send.reset_mock()
+        await adapter.handle_message(event)
+        # NOTE(review): presumably gives work started by handle_message time
+        # to reach send() -- confirm against the adapter implementation.
+        await asyncio.sleep(0.3)
+
+        # The adapter.send is called directly by the authorization path
+        # (not via _send_with_retry), so check it was called with a pairing message
+        adapter.send.assert_called()
+        # "ABC123" is the code the mocked pairing store in conftest generates.
+        pairing_markers = ("recognize", "pair")
+        assert any(
+            "ABC123" in text or any(marker in text.lower() for marker in pairing_markers)
+            for text in self._sent_texts(adapter.send)
+        )
+
+    @pytest.mark.asyncio
+    async def test_unauthorized_user_does_not_get_help(self, adapter, runner):
+        """Unauthorized user should NOT see the help command output."""
+        runner._is_user_authorized = lambda _source: False
+
+        event = make_event("/help")
+        adapter.send.reset_mock()
+        await adapter.handle_message(event)
+        # NOTE(review): presumably gives work started by handle_message time
+        # to reach send() -- confirm against the adapter implementation.
+        await asyncio.sleep(0.3)
+
+        # Sending nothing at all is acceptable, but no message that was sent
+        # may contain the help text ("/new" serves as its marker). Every
+        # recorded call is inspected, not only the last one.
+        for text in self._sent_texts(adapter.send):
+            assert "/new" not in text
+
+
+class TestSendFailureResilience:
+    """Check that a failing send() does not break message handling."""
+
+    @pytest.fixture()
+    def source(self):
+        """Message source built by ``make_source()`` with its defaults."""
+        return make_source()
+
+    @pytest.fixture()
+    def session_entry(self, source):
+        """Session entry created for ``source``."""
+        return make_session_entry(source)
+
+    @pytest.fixture()
+    def runner(self, session_entry):
+        """Gateway runner built around ``session_entry``."""
+        return make_runner(session_entry)
+
+    @pytest.fixture()
+    def adapter(self, runner):
+        """Adapter created from ``runner``."""
+        return make_adapter(runner)
+
+    @pytest.mark.asyncio
+    async def test_send_failure_does_not_crash_pipeline(self, adapter):
+        """handle_message must not raise when send() reports a failed result."""
+        failed_result = SendResult(success=False, error="network timeout")
+        adapter.send = AsyncMock(return_value=failed_result)
+        # Register the adapter's current handler again after swapping send().
+        adapter.set_message_handler(adapter._message_handler)
+
+        help_event = make_event("/help")
+        # An exception escaping here would fail the test: send failures are
+        # expected to be handled inside the pipeline.
+        await adapter.handle_message(help_event)
+        await asyncio.sleep(0.3)
+
+        adapter.send.assert_called()