mirror of
https://github.com/NousResearch/hermes-agent.git
synced 2026-06-24 10:52:21 +00:00
The subprocess-stdin guard (TUI gateway fd-inheritance protection) flagged the `permissions grant` call. None of the cua-driver probes/grant read stdin, so DEVNULL is correct; apply it to the shared `_run` helper and the grant call.
189 lines
6.7 KiB
Python
189 lines
6.7 KiB
Python
"""
|
|
Cross-platform Computer Use readiness + macOS permission helpers.
|
|
|
|
cua-driver runs on macOS, Windows, and Linux, but "ready to drive" means
|
|
something different on each:
|
|
|
|
* macOS — explicit TCC grants (Accessibility + Screen Recording). cua-driver
|
|
reports/requests them via ``permissions status`` / ``permissions grant``.
|
|
The grants attach to cua-driver's OWN identity (``com.trycua.driver`` /
|
|
the installed ``CuaDriver.app``), NOT Hermes — so no Hermes entitlement is
|
|
involved, and ``grant`` launches CuaDriver via LaunchServices so the macOS
|
|
dialog is attributed correctly.
|
|
* Windows — no TCC toggles; the UIAccess worker (``cua-driver-uia.exe``) may
|
|
trip a SmartScreen prompt on first run. Readiness == driver health.
|
|
* Linux — assistive control via the X11/XWayland stack. Readiness == driver
|
|
health.
|
|
|
|
The universal signal on every platform is ``cua-driver doctor --json`` (binary
|
|
integrity + platform support). ``computer_use_status`` folds that together with
|
|
the macOS permission detail into one payload for the desktop card, the
|
|
``hermes computer-use permissions`` CLI, and ``/api/tools/computer-use/status``.
|
|
"""
|
|
|
|
from __future__ import annotations
|
|
|
|
import json
|
|
import os
|
|
import shutil
|
|
import subprocess
|
|
import sys
|
|
from typing import Any, Dict, List, Optional
|
|
|
|
# Platforms with a cua-driver runtime backend (mirrors the toolset platform_gate).
|
|
_RUNTIME_PLATFORMS = frozenset({"darwin", "win32", "linux"})
|
|
_BOOLS = ("accessibility", "screen_recording", "screen_recording_capturable")
|
|
|
|
|
|
def _driver_cmd(override: Optional[str]) -> str:
|
|
if override:
|
|
return override
|
|
try:
|
|
from hermes_cli.tools_config import _cua_driver_cmd
|
|
|
|
return _cua_driver_cmd()
|
|
except Exception:
|
|
return os.environ.get("HERMES_CUA_DRIVER_CMD", "").strip() or "cua-driver"
|
|
|
|
|
|
def _child_env() -> Dict[str, str]:
|
|
"""cua-driver child env honoring the Hermes telemetry opt-in policy."""
|
|
try:
|
|
from tools.computer_use.cua_backend import cua_driver_child_env
|
|
|
|
return cua_driver_child_env()
|
|
except Exception:
|
|
return dict(os.environ)
|
|
|
|
|
|
def _run(binary: str, *args: str, timeout: float) -> subprocess.CompletedProcess:
|
|
return subprocess.run(
|
|
[binary, *args],
|
|
capture_output=True,
|
|
text=True,
|
|
timeout=timeout,
|
|
env=_child_env(),
|
|
stdin=subprocess.DEVNULL,
|
|
)
|
|
|
|
|
|
def _json_out(binary: str, *args: str, timeout: float) -> Any:
|
|
"""Run ``binary args`` and parse stdout as JSON, or ``None`` on any failure."""
|
|
raw = (_run(binary, *args, timeout=timeout).stdout or "").strip()
|
|
return json.loads(raw) if raw else None
|
|
|
|
|
|
def _doctor(binary: str) -> Optional[Dict[str, Any]]:
|
|
"""``cua-driver doctor --json`` → ``{ok, checks:[{label,status,message}]}``."""
|
|
try:
|
|
data = _json_out(binary, "doctor", "--json", timeout=12)
|
|
except Exception:
|
|
return None
|
|
if not isinstance(data, dict):
|
|
return None
|
|
checks: List[Dict[str, str]] = [
|
|
{
|
|
"label": str(p.get("label", "")),
|
|
"status": str(p.get("status", "")),
|
|
"message": str(p.get("message", "")),
|
|
}
|
|
for p in data.get("probes", [])
|
|
if isinstance(p, dict)
|
|
]
|
|
return {"ok": bool(data.get("ok")), "checks": checks}
|
|
|
|
|
|
def _mac_permissions(binary: str, out: Dict[str, Any]) -> None:
|
|
"""Fold ``cua-driver permissions status --json`` booleans into ``out``."""
|
|
try:
|
|
data = _json_out(binary, "permissions", "status", "--json", timeout=10)
|
|
except subprocess.TimeoutExpired:
|
|
out["error"] = "cua-driver permissions status timed out"
|
|
return
|
|
except Exception as exc: # spawn failure or malformed JSON
|
|
out["error"] = f"cua-driver permissions status failed: {exc}"
|
|
return
|
|
if isinstance(data, dict):
|
|
out.update({k: data[k] for k in _BOOLS if isinstance(data.get(k), bool)})
|
|
if isinstance(data.get("source"), dict):
|
|
out["source"] = data["source"]
|
|
|
|
|
|
def computer_use_status(driver_cmd: Optional[str] = None) -> Dict[str, Any]:
|
|
"""Unified, OS-aware Computer Use readiness for the desktop card.
|
|
|
|
``ready`` is the single signal the UI keys off: on macOS it's both TCC
|
|
grants; elsewhere it's driver health (no TCC model). ``None`` means
|
|
unknown (binary missing / probe failed). ``can_grant`` is macOS-only.
|
|
"""
|
|
plat = sys.platform
|
|
binary = shutil.which(_driver_cmd(driver_cmd))
|
|
out: Dict[str, Any] = {
|
|
"platform": plat,
|
|
"platform_supported": plat in _RUNTIME_PLATFORMS,
|
|
"installed": bool(binary),
|
|
"version": None,
|
|
"ready": None,
|
|
"can_grant": plat == "darwin",
|
|
"checks": [],
|
|
"source": None,
|
|
"error": None,
|
|
**{k: None for k in _BOOLS},
|
|
}
|
|
if not binary:
|
|
return out
|
|
|
|
try:
|
|
out["version"] = (_run(binary, "--version", timeout=5).stdout or "").strip() or None
|
|
except Exception:
|
|
pass
|
|
|
|
doctor = _doctor(binary)
|
|
if doctor is not None:
|
|
out["checks"] = doctor["checks"]
|
|
|
|
if plat == "darwin":
|
|
_mac_permissions(binary, out)
|
|
if out["error"] is None:
|
|
out["ready"] = out["accessibility"] is True and out["screen_recording"] is True
|
|
elif doctor is not None:
|
|
# No TCC model off macOS — readiness is driver health.
|
|
out["ready"] = doctor["ok"]
|
|
return out
|
|
|
|
|
|
def request_permissions_grant(driver_cmd: Optional[str] = None) -> int:
|
|
"""Run ``cua-driver permissions grant`` (macOS); stream its output.
|
|
|
|
Launches CuaDriver via LaunchServices so the TCC dialog is attributed to
|
|
``com.trycua.driver``, then waits for the grant. Returns the driver's exit
|
|
code (0 ok), 2 if the binary is missing, 64 on a non-macOS platform (which
|
|
has no TCC permission model to grant).
|
|
"""
|
|
if sys.platform != "darwin":
|
|
print("Computer Use permissions are a macOS concept; nothing to grant here.")
|
|
return 64
|
|
|
|
binary = shutil.which(_driver_cmd(driver_cmd))
|
|
if not binary:
|
|
print("cua-driver: not installed. Run: hermes computer-use install")
|
|
return 2
|
|
|
|
print(
|
|
"Requesting Accessibility + Screen Recording for CuaDriver.\n"
|
|
"macOS will show a dialog attributed to CuaDriver (com.trycua.driver) — "
|
|
"approve it, then return here."
|
|
)
|
|
try:
|
|
return int(
|
|
subprocess.run(
|
|
[binary, "permissions", "grant"],
|
|
env=_child_env(),
|
|
stdin=subprocess.DEVNULL,
|
|
).returncode
|
|
)
|
|
except KeyboardInterrupt: # pragma: no cover - interactive
|
|
return 130
|
|
except Exception as exc: # pragma: no cover - defensive
|
|
print(f"cua-driver permissions grant failed: {exc}", file=sys.stderr)
|
|
return 2
|