mirror of
https://github.com/NousResearch/hermes-agent.git
synced 2026-06-09 08:21:50 +00:00
Daemon thread polls _is_orphaned (original ppid check + psutil create_time PID-reuse guard, no PR_SET_PDEATHSIG). On orphan, drains an in-flight command up to a grace window then os._exit(0). Started before the HermesCLI build to cover the spawn window. Task: swl-qrf.8
123 lines
3.9 KiB
Python
123 lines
3.9 KiB
Python
"""Persistent slash-command worker — one HermesCLI per TUI session.
|
|
|
|
Protocol: reads JSON lines from stdin {id, command}, writes {id, ok, output|error} to stdout.
|
|
"""
|
|
|
|
import argparse
|
|
import contextlib
|
|
import io
|
|
import json
|
|
import os
|
|
import sys
|
|
import threading
|
|
import time
|
|
|
|
import psutil
|
|
|
|
import cli as cli_mod
|
|
from cli import HermesCLI
|
|
from rich.console import Console
|
|
|
|
# Env-overridable so the integration test can drive sub-second timing.
|
|
_WATCHDOG_POLL_S = float(os.environ.get("HERMES_SLASH_WATCHDOG_POLL_S", 2.0))
|
|
_ORPHAN_GRACE_S = float(os.environ.get("HERMES_SLASH_WATCHDOG_GRACE_S", 5.0))
|
|
_in_flight = threading.Event() # set while a command is executing
|
|
|
|
|
|
def _is_orphaned(original_ppid, parent_create_time, getppid=os.getppid) -> bool:
|
|
"""True once our spawning gateway is gone. Compare to the ORIGINAL ppid
|
|
(never ==1: Linux reparents to a subreaper) and guard PID reuse via
|
|
create_time."""
|
|
if getppid() != original_ppid:
|
|
return True
|
|
try:
|
|
if not psutil.pid_exists(original_ppid):
|
|
return True
|
|
return psutil.Process(original_ppid).create_time() != parent_create_time
|
|
except psutil.Error:
|
|
return True
|
|
|
|
|
|
def _start_parent_death_watchdog(original_ppid, parent_create_time) -> None:
|
|
def _loop():
|
|
while not _is_orphaned(original_ppid, parent_create_time):
|
|
time.sleep(_WATCHDOG_POLL_S)
|
|
deadline = time.monotonic() + _ORPHAN_GRACE_S
|
|
while _in_flight.is_set() and time.monotonic() < deadline:
|
|
time.sleep(0.05) # let an in-flight command finish/flush
|
|
os._exit(0)
|
|
|
|
threading.Thread(target=_loop, daemon=True).start()
|
|
|
|
|
|
def _run(cli: HermesCLI, command: str) -> str:
|
|
cmd = (command or "").strip()
|
|
if not cmd:
|
|
return ""
|
|
if not cmd.startswith("/"):
|
|
cmd = f"/{cmd}"
|
|
|
|
buf = io.StringIO()
|
|
|
|
# Rich Console captures its file handle at construction time, so
|
|
# contextlib.redirect_stdout won't affect it. Swap the console's
|
|
# underlying file to our buffer so self.console.print() is captured.
|
|
cli.console = Console(file=buf, force_terminal=True, width=120)
|
|
|
|
old = getattr(cli_mod, "_cprint", None)
|
|
if old is not None:
|
|
cli_mod._cprint = lambda text: print(text)
|
|
|
|
try:
|
|
with contextlib.redirect_stdout(buf), contextlib.redirect_stderr(buf):
|
|
cli.process_command(cmd)
|
|
finally:
|
|
if old is not None:
|
|
cli_mod._cprint = old
|
|
|
|
return buf.getvalue().rstrip()
|
|
|
|
|
|
def main():
|
|
p = argparse.ArgumentParser(add_help=False)
|
|
p.add_argument("--session-key", required=True)
|
|
p.add_argument("--model", default="")
|
|
args = p.parse_args()
|
|
|
|
os.environ["HERMES_SESSION_KEY"] = args.session_key
|
|
os.environ["HERMES_INTERACTIVE"] = "1"
|
|
|
|
# Start before the (hundreds-of-ms) HermesCLI build — that window is itself
|
|
# an orphan risk if the gateway dies mid-spawn.
|
|
orig_ppid = os.getppid()
|
|
try:
|
|
parent_create_time = psutil.Process(orig_ppid).create_time()
|
|
except psutil.Error:
|
|
parent_create_time = 0.0
|
|
_start_parent_death_watchdog(orig_ppid, parent_create_time)
|
|
|
|
with contextlib.redirect_stdout(io.StringIO()), contextlib.redirect_stderr(io.StringIO()):
|
|
cli = HermesCLI(model=args.model or None, compact=True, resume=args.session_key, verbose=False)
|
|
|
|
for raw in sys.stdin:
|
|
line = raw.strip()
|
|
if not line:
|
|
continue
|
|
|
|
_in_flight.set()
|
|
rid = None
|
|
try:
|
|
req = json.loads(line)
|
|
rid = req.get("id")
|
|
out = _run(cli, req.get("command", ""))
|
|
sys.stdout.write(json.dumps({"id": rid, "ok": True, "output": out}) + "\n")
|
|
sys.stdout.flush()
|
|
except Exception as e:
|
|
sys.stdout.write(json.dumps({"id": rid, "ok": False, "error": str(e)}) + "\n")
|
|
sys.stdout.flush()
|
|
finally:
|
|
_in_flight.clear()
|
|
|
|
|
|
if __name__ == "__main__":
|
|
main()
|