mirror of
https://github.com/NousResearch/hermes-agent.git
synced 2026-06-17 09:41:58 +00:00
* fix(s6): prevent profile create from auto-starting gateway service When hermes profile create runs inside an s6 container, _maybe_register_gateway_service() calls register_profile_gateway() which creates the service directory and triggers s6-svscanctl -a. Previously the service always started immediately, causing profiles that share the main gateway's bot token (e.g. Kanban worker profiles) to fail with a token-lock conflict and persist gateway_state: running — becoming zombies that resurrect on every container restart. Wire the existing start_now parameter through the S6 implementation: when start_now=False, write a marker file (same pattern as container_boot.py _register_gateway_slot) so s6-supervise leaves the service stopped until the user explicitly runs hermes -p <profile> gateway start. 4 files, +61/-6, 4 new tests (all passing). * test(docker): wait for gateway running state before restart --------- Co-authored-by: liuhao1024 <sunsky.lau@gmail.com>
227 lines
8.1 KiB
Python
227 lines
8.1 KiB
Python
"""Tests for the Phase 4 s6 hooks in hermes_cli.profiles.
|
|
|
|
Specifically: _maybe_register_gateway_service,
|
|
_maybe_unregister_gateway_service. The integration with
|
|
create_profile and delete_profile is covered indirectly by the
|
|
existing TestCreateProfile and TestDeleteProfile classes in
|
|
tests/hermes_cli/test_profiles.py; here we only exercise the new
|
|
helper surface that doesn't touch the filesystem.
|
|
"""
|
|
from __future__ import annotations
|
|
|
|
from typing import Any
|
|
|
|
import pytest
|
|
|
|
from hermes_cli.profiles import (
|
|
_maybe_register_gateway_service,
|
|
_maybe_unregister_gateway_service,
|
|
)
|
|
|
|
|
|
# ---------------------------------------------------------------------------
|
|
# _maybe_register_gateway_service / _maybe_unregister_gateway_service
|
|
# ---------------------------------------------------------------------------
|
|
|
|
|
|
class _HostManager:
|
|
"""Mimics a host backend that doesn't support runtime registration."""
|
|
kind = "systemd"
|
|
|
|
def supports_runtime_registration(self) -> bool:
|
|
return False
|
|
|
|
def register_profile_gateway(self, *args: Any, **kwargs: Any) -> None:
|
|
raise AssertionError("host backend register_profile_gateway should not be called")
|
|
|
|
def unregister_profile_gateway(self, *args: Any, **kwargs: Any) -> None:
|
|
raise AssertionError("host backend unregister_profile_gateway should not be called")
|
|
|
|
|
|
class _S6Manager:
|
|
"""Mimics S6ServiceManager just enough for the hooks."""
|
|
kind = "s6"
|
|
|
|
def __init__(self) -> None:
|
|
self.registered: list[str] = []
|
|
self.unregistered: list[str] = []
|
|
self.raise_on_register: Exception | None = None
|
|
self.raise_on_unregister: Exception | None = None
|
|
|
|
def supports_runtime_registration(self) -> bool:
|
|
return True
|
|
|
|
def register_profile_gateway(
|
|
self, profile: str, *,
|
|
extra_env: dict[str, str] | None = None,
|
|
start_now: bool = True,
|
|
) -> None:
|
|
if self.raise_on_register is not None:
|
|
raise self.raise_on_register
|
|
self.registered.append(profile)
|
|
self.last_start_now = start_now
|
|
|
|
def unregister_profile_gateway(self, profile: str) -> None:
|
|
if self.raise_on_unregister is not None:
|
|
raise self.raise_on_unregister
|
|
self.unregistered.append(profile)
|
|
|
|
|
|
def _patch_detect_s6(monkeypatch: pytest.MonkeyPatch) -> None:
|
|
"""Pretend we're inside an s6 container so the host short-circuit
|
|
in :func:`_maybe_register_gateway_service` /
|
|
:func:`_maybe_unregister_gateway_service` doesn't fire.
|
|
|
|
Without this, ``detect_service_manager()`` runs its real
|
|
implementation (host Linux/macOS in CI), returns ``"systemd"`` or
|
|
``"launchd"``, and the hooks return early before reaching the
|
|
patched ``get_service_manager``. Each s6-call-through test
|
|
explicitly opts into this so the host-no-op tests can still
|
|
exercise the early-return path.
|
|
"""
|
|
monkeypatch.setattr(
|
|
"hermes_cli.service_manager.detect_service_manager",
|
|
lambda: "s6",
|
|
)
|
|
|
|
|
|
def test_register_noop_on_host(monkeypatch: pytest.MonkeyPatch) -> None:
|
|
# NOTE: deliberately DO NOT patch detect_service_manager — we want
|
|
# the real host detection to kick in and short-circuit before
|
|
# get_service_manager is ever called. The lambda below is a
|
|
# defense-in-depth assertion that get_service_manager is never
|
|
# reached on host.
|
|
monkeypatch.setattr(
|
|
"hermes_cli.service_manager.get_service_manager",
|
|
lambda: _HostManager(),
|
|
)
|
|
# Should NOT raise the AssertionError from _HostManager.register
|
|
_maybe_register_gateway_service("hostprof")
|
|
|
|
|
|
def test_register_calls_through_on_s6(monkeypatch: pytest.MonkeyPatch) -> None:
|
|
_patch_detect_s6(monkeypatch)
|
|
mgr = _S6Manager()
|
|
monkeypatch.setattr(
|
|
"hermes_cli.service_manager.get_service_manager", lambda: mgr,
|
|
)
|
|
_maybe_register_gateway_service("coder")
|
|
assert mgr.registered == ["coder"]
|
|
|
|
|
|
def test_register_passes_start_now_false(monkeypatch: pytest.MonkeyPatch) -> None:
|
|
"""_maybe_register_gateway_service must register with start_now=False
|
|
so that profile creation does not auto-start a gateway that may
|
|
conflict with the main gateway's bot-token lock."""
|
|
_patch_detect_s6(monkeypatch)
|
|
mgr = _S6Manager()
|
|
monkeypatch.setattr(
|
|
"hermes_cli.service_manager.get_service_manager", lambda: mgr,
|
|
)
|
|
_maybe_register_gateway_service("coder")
|
|
assert mgr.last_start_now is False, (
|
|
"profile creation must not auto-start the gateway service"
|
|
)
|
|
|
|
|
|
def test_register_swallows_duplicate_value_error(
|
|
monkeypatch: pytest.MonkeyPatch,
|
|
) -> None:
|
|
"""A pre-existing s6 registration (from container-boot reconcile)
|
|
is a benign condition — register must not propagate ValueError."""
|
|
_patch_detect_s6(monkeypatch)
|
|
mgr = _S6Manager()
|
|
mgr.raise_on_register = ValueError("already registered")
|
|
monkeypatch.setattr(
|
|
"hermes_cli.service_manager.get_service_manager", lambda: mgr,
|
|
)
|
|
# Should NOT raise
|
|
_maybe_register_gateway_service("coder")
|
|
|
|
|
|
def test_register_swallows_arbitrary_error(
|
|
monkeypatch: pytest.MonkeyPatch, capsys: pytest.CaptureFixture[str],
|
|
) -> None:
|
|
"""Even an unexpected exception from the manager must not bring
|
|
down `hermes profile create` — print and continue."""
|
|
_patch_detect_s6(monkeypatch)
|
|
mgr = _S6Manager()
|
|
mgr.raise_on_register = RuntimeError("svscanctl exploded")
|
|
monkeypatch.setattr(
|
|
"hermes_cli.service_manager.get_service_manager", lambda: mgr,
|
|
)
|
|
_maybe_register_gateway_service("coder")
|
|
captured = capsys.readouterr()
|
|
assert "Could not register" in captured.out
|
|
|
|
|
|
def test_register_swallows_no_backend_runtime_error(
|
|
monkeypatch: pytest.MonkeyPatch,
|
|
) -> None:
|
|
"""When `get_service_manager()` raises RuntimeError (no backend
|
|
detected), the hook must silently no-op."""
|
|
_patch_detect_s6(monkeypatch)
|
|
def _no_backend() -> None:
|
|
raise RuntimeError("no supported service manager detected")
|
|
monkeypatch.setattr(
|
|
"hermes_cli.service_manager.get_service_manager", _no_backend,
|
|
)
|
|
# Should NOT raise
|
|
_maybe_register_gateway_service("anywhere")
|
|
|
|
|
|
def test_register_silent_when_detect_throws(
|
|
monkeypatch: pytest.MonkeyPatch, capsys: pytest.CaptureFixture[str],
|
|
) -> None:
|
|
"""If detect_service_manager itself raises (e.g. a partial s6
|
|
install on a host machine), the hook must stay silent — no
|
|
confusing s6 warning printed to a user who has never touched a
|
|
container."""
|
|
def _broken_detect() -> str:
|
|
raise RuntimeError("detection blew up")
|
|
monkeypatch.setattr(
|
|
"hermes_cli.service_manager.detect_service_manager", _broken_detect,
|
|
)
|
|
# If get_service_manager is reached, the test will assert via
|
|
# _HostManager.register. It must NOT be reached.
|
|
monkeypatch.setattr(
|
|
"hermes_cli.service_manager.get_service_manager",
|
|
lambda: _HostManager(),
|
|
)
|
|
_maybe_register_gateway_service("anywhere")
|
|
captured = capsys.readouterr()
|
|
assert "Could not register" not in captured.out
|
|
assert captured.out == ""
|
|
|
|
|
|
def test_unregister_noop_on_host(monkeypatch: pytest.MonkeyPatch) -> None:
|
|
# Same as test_register_noop_on_host: rely on real host detection.
|
|
monkeypatch.setattr(
|
|
"hermes_cli.service_manager.get_service_manager",
|
|
lambda: _HostManager(),
|
|
)
|
|
_maybe_unregister_gateway_service("hostprof")
|
|
|
|
|
|
def test_unregister_calls_through_on_s6(monkeypatch: pytest.MonkeyPatch) -> None:
|
|
_patch_detect_s6(monkeypatch)
|
|
mgr = _S6Manager()
|
|
monkeypatch.setattr(
|
|
"hermes_cli.service_manager.get_service_manager", lambda: mgr,
|
|
)
|
|
_maybe_unregister_gateway_service("coder")
|
|
assert mgr.unregistered == ["coder"]
|
|
|
|
|
|
def test_unregister_swallows_errors(
|
|
monkeypatch: pytest.MonkeyPatch, capsys: pytest.CaptureFixture[str],
|
|
) -> None:
|
|
_patch_detect_s6(monkeypatch)
|
|
mgr = _S6Manager()
|
|
mgr.raise_on_unregister = RuntimeError("svc gone weird")
|
|
monkeypatch.setattr(
|
|
"hermes_cli.service_manager.get_service_manager", lambda: mgr,
|
|
)
|
|
_maybe_unregister_gateway_service("coder")
|
|
captured = capsys.readouterr()
|
|
assert "Could not unregister" in captured.out
|