mirror of
https://github.com/NousResearch/hermes-agent.git
synced 2026-06-29 11:42:04 +00:00
* feat(kanban): typed block reasons + unblock-loop breaker Stops the kanban blocked-task loop: a worker blocks a task, a cron unblocks it, the worker re-blocks for the same reason, repeat forever. block_task now takes a typed kind and a persistent block_recurrences counter on the tasks table: - kind=dependency routes to todo (parent-gated, auto-resumed), never the human 'blocked' bucket a cron would keep unblocking. - needs_input/capability/transient/untyped land in blocked; each same-cause re-block after an unblock increments block_recurrences, and at BLOCK_RECURRENCE_LIMIT (default 2) the task routes to triage for a human instead of blocked. - unblock_task no longer resets block_recurrences (the amnesia that let the loop run unbounded); complete_task clears it on success. Wired through the worker kanban_block tool (new kind arg) and the hermes kanban block --kind CLI flag, both reporting where the task actually landed. Docs + 11 new tests; 536 existing kanban tests green. * test(kanban): make second-block notify test use a distinct block cause test_notifier_second_blocked_delivers blocked the same task twice with the same (untyped) reason, which now trips the new unblock-loop breaker and routes the second block to triage instead of blocked — so only one 'blocked' notification fired. The test's actual intent is that TWO distinct block cycles each notify; give the two cycles different kinds (needs_input then capability) so they're genuinely separate blocks. The same-cause loop→triage path is covered by test_kanban_block_kinds.py.
202 lines
8 KiB
Python
202 lines
8 KiB
Python
"""Tests for typed block reasons + the unblock-loop breaker.
|
|
|
|
Covers the built-in fix for the kanban "blocked loop" — a worker blocks a
|
|
task, a cron unblocks it, the worker re-blocks for the same reason, repeat
|
|
forever. The fix gives ``block_task`` a typed ``kind`` and a persistent
|
|
``block_recurrences`` counter:
|
|
|
|
* ``dependency`` blocks route to ``todo`` (parent-gated, auto-resumed) and
|
|
never enter the human ``blocked`` bucket a cron would keep unblocking.
|
|
* ``needs_input`` / ``capability`` / un-typed blocks land in ``blocked``;
|
|
each same-cause re-block after an unblock increments ``block_recurrences``,
|
|
and at ``BLOCK_RECURRENCE_LIMIT`` the task routes to ``triage`` for a human.
|
|
* ``unblock_task`` deliberately does NOT reset ``block_recurrences`` (the
|
|
amnesia that let the loop run unbounded).
|
|
* A successful ``complete_task`` resets the loop memory.
|
|
"""
|
|
|
|
from __future__ import annotations
|
|
|
|
from pathlib import Path
|
|
|
|
import pytest
|
|
|
|
from hermes_cli import kanban_db as kb
|
|
|
|
|
|
@pytest.fixture
|
|
def kanban_home(tmp_path: Path, monkeypatch: pytest.MonkeyPatch) -> Path:
|
|
home = tmp_path / ".hermes"
|
|
home.mkdir()
|
|
monkeypatch.setenv("HERMES_HOME", str(home))
|
|
monkeypatch.setattr(Path, "home", lambda: tmp_path)
|
|
kb.init_db()
|
|
return home
|
|
|
|
|
|
def _running_task(conn, title="t"):
|
|
"""Create a task and drive it to ``running`` so block_task can act."""
|
|
tid = kb.create_task(conn, title=title, assignee="worker")
|
|
with kb.write_txn(conn):
|
|
conn.execute("UPDATE tasks SET status='ready' WHERE id=?", (tid,))
|
|
claimed = kb.claim_task(conn, tid, claimer="worker")
|
|
assert claimed is not None
|
|
return tid
|
|
|
|
|
|
def _make_running_again(conn, tid):
|
|
with kb.write_txn(conn):
|
|
conn.execute("UPDATE tasks SET status='ready' WHERE id=?", (tid,))
|
|
assert kb.claim_task(conn, tid, claimer="worker") is not None
|
|
|
|
|
|
# ---------------------------------------------------------------------------
|
|
# Loop breaker
|
|
# ---------------------------------------------------------------------------
|
|
|
|
|
|
def test_first_typed_block_lands_in_blocked(kanban_home: Path) -> None:
|
|
with kb.connect_closing() as conn:
|
|
tid = _running_task(conn)
|
|
assert kb.block_task(conn, tid, reason="which key?", kind="needs_input")
|
|
t = kb.get_task(conn, tid)
|
|
assert t.status == "blocked"
|
|
assert t.block_kind == "needs_input"
|
|
assert t.block_recurrences == 1
|
|
|
|
|
|
def test_unblock_does_not_reset_recurrence_counter(kanban_home: Path) -> None:
|
|
"""The crux of the fix: unblock must preserve the loop counter."""
|
|
with kb.connect_closing() as conn:
|
|
tid = _running_task(conn)
|
|
kb.block_task(conn, tid, reason="x", kind="needs_input")
|
|
assert kb.get_task(conn, tid).block_recurrences == 1
|
|
assert kb.unblock_task(conn, tid)
|
|
t = kb.get_task(conn, tid)
|
|
assert t.status == "ready"
|
|
assert t.block_recurrences == 1 # NOT reset to 0
|
|
assert t.block_kind == "needs_input" # kind preserved for comparison
|
|
|
|
|
|
def test_same_cause_reblock_routes_to_triage(kanban_home: Path) -> None:
|
|
"""Dale's loop: block → unblock → re-block same kind → triage."""
|
|
with kb.connect_closing() as conn:
|
|
tid = _running_task(conn)
|
|
kb.block_task(conn, tid, reason="need creds", kind="needs_input")
|
|
kb.unblock_task(conn, tid)
|
|
_make_running_again(conn, tid)
|
|
kb.block_task(conn, tid, reason="still need creds", kind="needs_input")
|
|
t = kb.get_task(conn, tid)
|
|
assert t.status == "triage"
|
|
assert t.block_recurrences == 2
|
|
|
|
|
|
def test_untyped_block_loop_also_protected(kanban_home: Path) -> None:
|
|
"""Legacy un-typed blocks (kind=None) still trip the breaker."""
|
|
with kb.connect_closing() as conn:
|
|
tid = _running_task(conn)
|
|
kb.block_task(conn, tid, reason="a")
|
|
kb.unblock_task(conn, tid)
|
|
_make_running_again(conn, tid)
|
|
kb.block_task(conn, tid, reason="a again")
|
|
assert kb.get_task(conn, tid).status == "triage"
|
|
|
|
|
|
def test_different_kinds_do_not_compound(kanban_home: Path) -> None:
|
|
"""A re-block for a DIFFERENT reason resets the counter to 1."""
|
|
with kb.connect_closing() as conn:
|
|
tid = _running_task(conn)
|
|
kb.block_task(conn, tid, reason="a", kind="needs_input")
|
|
kb.unblock_task(conn, tid)
|
|
_make_running_again(conn, tid)
|
|
kb.block_task(conn, tid, reason="b", kind="capability")
|
|
t = kb.get_task(conn, tid)
|
|
assert t.status == "blocked"
|
|
assert t.block_recurrences == 1
|
|
|
|
|
|
def test_block_loop_detected_event_emitted(kanban_home: Path) -> None:
|
|
with kb.connect_closing() as conn:
|
|
tid = _running_task(conn)
|
|
kb.block_task(conn, tid, reason="x", kind="capability")
|
|
kb.unblock_task(conn, tid)
|
|
_make_running_again(conn, tid)
|
|
kb.block_task(conn, tid, reason="x", kind="capability")
|
|
events = [e for e in kb.list_events(conn, tid)
|
|
if e.kind == "block_loop_detected"]
|
|
assert events, "expected a block_loop_detected event"
|
|
payload = events[-1].payload or {}
|
|
assert payload.get("recurrences") == 2
|
|
assert payload.get("kind") == "capability"
|
|
|
|
|
|
# ---------------------------------------------------------------------------
|
|
# Dependency routing
|
|
# ---------------------------------------------------------------------------
|
|
|
|
|
|
def test_dependency_block_routes_to_todo(kanban_home: Path) -> None:
|
|
"""Dependency waits never enter the human 'blocked' bucket."""
|
|
with kb.connect_closing() as conn:
|
|
tid = _running_task(conn)
|
|
assert kb.block_task(conn, tid, reason="need X first", kind="dependency")
|
|
t = kb.get_task(conn, tid)
|
|
assert t.status == "todo"
|
|
assert t.block_kind == "dependency"
|
|
|
|
|
|
def test_dependency_then_parent_done_promotes(kanban_home: Path) -> None:
|
|
"""A dependency-parked child becomes ready once its parent completes."""
|
|
with kb.connect_closing() as conn:
|
|
parent = kb.create_task(conn, title="parent", assignee="worker")
|
|
child = _running_task(conn, title="child")
|
|
kb.link_tasks(conn, parent_id=parent, child_id=child)
|
|
kb.block_task(conn, child, reason="wait", kind="dependency")
|
|
assert kb.get_task(conn, child).status == "todo"
|
|
# Finish the parent, then let recompute_ready run.
|
|
with kb.write_txn(conn):
|
|
conn.execute("UPDATE tasks SET status='ready' WHERE id=?", (parent,))
|
|
kb.claim_task(conn, parent, claimer="worker")
|
|
kb.complete_task(conn, parent, result="done")
|
|
kb.recompute_ready(conn)
|
|
assert kb.get_task(conn, child).status == "ready"
|
|
|
|
|
|
# ---------------------------------------------------------------------------
|
|
# Completion resets loop memory
|
|
# ---------------------------------------------------------------------------
|
|
|
|
|
|
def test_completion_clears_block_memory(kanban_home: Path) -> None:
|
|
with kb.connect_closing() as conn:
|
|
tid = _running_task(conn)
|
|
kb.block_task(conn, tid, reason="x", kind="capability")
|
|
kb.unblock_task(conn, tid)
|
|
assert kb.get_task(conn, tid).block_recurrences == 1
|
|
kb.complete_task(conn, tid, result="done")
|
|
t = kb.get_task(conn, tid)
|
|
assert t.status == "done"
|
|
assert t.block_recurrences == 0
|
|
assert t.block_kind is None
|
|
|
|
|
|
# ---------------------------------------------------------------------------
|
|
# Validation + back-compat
|
|
# ---------------------------------------------------------------------------
|
|
|
|
|
|
def test_invalid_kind_rejected(kanban_home: Path) -> None:
|
|
with kb.connect_closing() as conn:
|
|
tid = _running_task(conn)
|
|
with pytest.raises(ValueError):
|
|
kb.block_task(conn, tid, reason="x", kind="bogus")
|
|
|
|
|
|
def test_block_without_kind_is_backward_compatible(kanban_home: Path) -> None:
|
|
"""Existing callers that pass no kind keep the old single-block behaviour."""
|
|
with kb.connect_closing() as conn:
|
|
tid = _running_task(conn)
|
|
assert kb.block_task(conn, tid, reason="legacy")
|
|
t = kb.get_task(conn, tid)
|
|
assert t.status == "blocked"
|
|
assert t.block_kind is None
|