mirror of
https://github.com/NousResearch/hermes-agent.git
synced 2026-05-29 06:31:32 +00:00
Tasks 0.2-0.6 of the s6-overlay supervision plan. Locks the user-visible behavior we must preserve through the Phase 2 init-system swap: - test_main_invocation.py (Task 0.2): docker run <image> with no args, chat subcommand passthrough, bare executable passthrough, bash pattern, exit-code propagation - test_tui_passthrough.py (Task 0.3): TTY allocation via docker -t using the host's script(1) for a PTY - test_dashboard.py (Task 0.4): HERMES_DASHBOARD=1 opt-in, HERMES_DASHBOARD_PORT override - test_profile_gateway.py (Task 0.5): per-profile gateway start/stop and profile-delete-stops-gateway. Both marked xfail(strict=True) because the current tini image refuses gateway lifecycle commands inside the container; Phase 4 Task 4.3 flips them to passing. - test_zombie_reaping.py (Task 0.6): PID 1 reaps orphaned zombies. tini does this today; s6-overlay's /init must continue to do so. Refs: docs/plans/2026-05-07-s6-overlay-dynamic-subagent-gateways.md
79 lines
2.8 KiB
Python
79 lines
2.8 KiB
Python
"""Harness: docker run <image> [cmd...] invocation patterns.
|
|
|
|
These tests MUST pass on the current tini-based image AND continue to
|
|
pass after the Phase 2 s6 migration. Any behavior drift is a regression.
|
|
|
|
The harness expects ``built_image`` and ``container_name`` fixtures from
|
|
``tests/docker/conftest.py``. When Docker isn't available every test
|
|
here is skipped at collection time.
|
|
"""
|
|
from __future__ import annotations
|
|
|
|
import subprocess
|
|
|
|
|
|
def test_no_args_starts_hermes(built_image: str) -> None:
    """``docker run <image>`` should start hermes cleanly.

    The container is invoked with ``--version`` so the call exits without
    needing a configured model. Exit code 0 (version printed) and 1
    (config bootstrapping failure on a fresh volume) are both accepted,
    but a Python stack trace on either output stream is a failure.

    Args:
        built_image: Tag of the image under test, supplied by the
            ``built_image`` fixture.
    """
    r = subprocess.run(
        ["docker", "run", "--rm", built_image, "--version"],
        capture_output=True, text=True, timeout=60,
    )
    assert r.returncode in (0, 1), (
        f"Unexpected exit {r.returncode}: stderr={r.stderr!r}"
    )
    # Scan stdout as well as stderr: the contract is "never a stack trace",
    # and a wrapper or init system could route a crash report to either
    # stream.
    combined = r.stdout + r.stderr
    assert "Traceback" not in combined, (
        f"Stack trace in container output: "
        f"stdout={r.stdout!r} stderr={r.stderr!r}"
    )
|
|
|
|
|
|
def test_chat_subcommand_passthrough(built_image: str) -> None:
    """``docker run <image> chat --help`` should reach ``hermes chat --help``.

    ``--help`` is used so the call does not depend on an upstream model
    being configured. The run must exit 0 and its output (stdout and
    stderr together, case-insensitive) must mention ``chat`` or ``usage``.
    """
    argv = ["docker", "run", "--rm", built_image, "chat", "--help"]
    proc = subprocess.run(argv, capture_output=True, text=True, timeout=60)

    assert proc.returncode == 0

    output = f"{proc.stdout}{proc.stderr}".lower()
    assert any(marker in output for marker in ("chat", "usage"))
|
|
|
|
|
|
def test_bare_executable_passthrough(built_image: str) -> None:
    """``docker run <image> sleep 1`` should run ``sleep`` itself.

    The entrypoint is expected to notice that ``sleep`` is an executable
    on PATH and bypass the hermes wrapper, which is what makes long-lived
    sandbox containers (and this kind of test) possible. Only a zero exit
    status is checked here.
    """
    command = ["docker", "run", "--rm", built_image, "sleep", "1"]
    completed = subprocess.run(
        command,
        capture_output=True,
        text=True,
        timeout=30,
    )
    assert completed.returncode == 0
|
|
|
|
|
|
def test_bash_pattern(built_image: str) -> None:
    """``docker run <image> bash -c 'echo ok'`` should run bash directly.

    Passes when the container exits 0 and ``ok`` appears on stdout.
    """
    shell_args = ("bash", "-c", "echo ok")
    result = subprocess.run(
        ["docker", "run", "--rm", built_image, *shell_args],
        capture_output=True,
        text=True,
        timeout=30,
    )
    assert result.returncode == 0
    assert "ok" in result.stdout
|
|
|
|
|
|
def test_container_exit_code_matches_inner_exit(built_image: str) -> None:
    """The inner process's exit status must become the container's status.

    CI relies on this: ``docker run <image> hermes batch ...`` has to
    report a non-zero status when the batch fails, and the Phase 2 (s6)
    migration must not change that. The check uses ``sh -c 'exit 42'``
    and expects ``docker run`` to return 42.
    """
    docker_cmd = ["docker", "run", "--rm", built_image, "sh", "-c", "exit 42"]
    outcome = subprocess.run(
        docker_cmd,
        capture_output=True,
        text=True,
        timeout=30,
    )
    assert outcome.returncode == 42
|