mirror of
https://github.com/NousResearch/hermes-agent.git
synced 2026-06-28 11:32:22 +00:00
The /learn authoring prompt taught only a subset of the HARDLINE skill rules, and it stated the <=60-char description rule without making the model enforce it. As a result, generated descriptions overshot (up to 202 chars), and the 60-char system-prompt skill index then silently truncated them.

- description: add the index-truncation rationale, a count-and-trim self-check, and a good/bad length example so the model actually hits <=60.
- add platforms-gating rule (OS-bound primitives -> declare platforms:).
- add author-credits-human-first rule.
- round out the Hermes-tool framing with the full wrapped-tool mapping and references/templates layout.

Closes #52367.
90 lines
3.8 KiB
Python
90 lines
3.8 KiB
Python
"""Tests for /learn — open-ended skill distillation.

Covers the shared prompt builder (agent.learn_prompt.build_learn_prompt) and
the slash-command registry wiring. /learn has no engine and no model tool: it
builds a standards-guided prompt that the live agent runs as a normal turn, so
these are the load-bearing behavior contracts.
"""
|
|
|
|
from agent.learn_prompt import build_learn_prompt, _AUTHORING_STANDARDS
|
|
|
|
|
|
class TestBuildLearnPrompt:
    """Behavior contracts for the prompt returned by ``build_learn_prompt``."""

    def test_embeds_the_user_request_verbatim(self):
        """The request text appears unchanged inside the built prompt."""
        request = "the REST client in ~/projects/acme-sdk, focus on auth"
        assert request in build_learn_prompt(request)

    def test_always_includes_the_authoring_standards(self):
        """The standards block is embedded whatever the request looks like.

        The standards are what make distilled skills match house style, so
        they must travel with every prompt regardless of input.
        """
        sample_requests = ("", "a url https://x/y", "what we just did")
        for request in sample_requests:
            built = build_learn_prompt(request)
            assert _AUTHORING_STANDARDS in built

    def test_instructs_saving_via_skill_manage_not_a_raw_file(self):
        """The prompt names ``skill_manage`` as the way to save the skill."""
        assert "skill_manage" in build_learn_prompt("learn the thing")

    def test_references_gather_tools_for_open_ended_sourcing(self):
        """The gathering tools are mentioned by name in the prompt.

        Open-ended sourcing relies on the agent's own tools, named so it
        knows dirs/URLs/conversation/paste all route through existing tools.
        """
        built = build_learn_prompt("learn from somewhere")
        gather_tools = ("read_file", "search_files", "web_extract")
        for tool_name in gather_tools:
            assert tool_name in built

    def test_empty_request_falls_back_to_the_conversation(self):
        """Bare /learn should distill "what we just did", not error."""
        bare = build_learn_prompt("")
        assert "conversation" in bare.lower()
        # The save instruction must still be present on the fallback path.
        assert "skill_manage" in bare

    def test_whitespace_only_request_is_treated_as_empty(self):
        """A whitespace-only request builds the same prompt as an empty one."""
        from_whitespace = build_learn_prompt(" \n ")
        from_empty = build_learn_prompt("")
        assert from_whitespace == from_empty

    def test_description_length_rule_is_in_the_standards(self):
        """The single most-violated rule must be explicit in the prompt."""
        assert "60" in _AUTHORING_STANDARDS

    def test_teaches_the_full_hardline_standards(self):
        """Lock in coverage of the CONTRIBUTING.md skill rules.

        /learn must teach ALL the rules, not just the description length,
        otherwise distilled skills miss platform gating, author credit, and
        the tool-framing table.
        """
        lowered = _AUTHORING_STANDARDS.lower()

        # #1 description: the count-and-trim self-check (the reported bug).
        assert "count" in lowered
        assert "60" in lowered

        # #3 platforms gating against OS-bound primitives.
        assert "platforms" in lowered

        # #4 author credits the human first.
        assert "author" in lowered

        # #2 Hermes-tool framing names the wrapped tools, not shell utilities.
        wrapped_tools = ("read_file", "search_files", "patch", "write_file")
        for tool_name in wrapped_tools:
            assert tool_name in lowered

        # #6 scripts/references/templates layout (checked case-sensitively).
        assert "scripts/" in _AUTHORING_STANDARDS
|
|
|
|
|
|
class TestLearnRegistryWiring:
    """Checks that /learn is wired into the slash-command registry."""

    def test_learn_is_registered_and_resolves(self):
        """``resolve_command("learn")`` yields a command named ``learn``."""
        from hermes_cli.commands import resolve_command

        learn_cmd = resolve_command("learn")
        assert learn_cmd is not None
        assert learn_cmd.name == "learn"

    def test_learn_is_in_tools_and_skills_category(self):
        """The resolved command reports the "Tools & Skills" category."""
        from hermes_cli.commands import resolve_command

        learn_cmd = resolve_command("learn")
        assert learn_cmd.category == "Tools & Skills"

    def test_learn_works_on_the_gateway(self):
        """/learn is listed among the gateway's known commands.

        /learn must reach the gateway runner (it's a both-surfaces command),
        not be CLI-only.
        """
        from hermes_cli.commands import GATEWAY_KNOWN_COMMANDS

        assert "learn" in GATEWAY_KNOWN_COMMANDS

    def test_learn_is_not_cli_only(self):
        """The resolved command's ``cli_only`` flag is falsy."""
        from hermes_cli.commands import resolve_command

        learn_cmd = resolve_command("learn")
        assert not learn_cmd.cli_only
|