diff --git a/gateway/run.py b/gateway/run.py index abdb3324c..b75b0e1f0 100644 --- a/gateway/run.py +++ b/gateway/run.py @@ -925,8 +925,8 @@ class GatewayRunner: def _load_reasoning_config() -> dict | None: """Load reasoning effort from config.yaml. - Reads agent.reasoning_effort from config.yaml. Valid: "xhigh", - "high", "medium", "low", "minimal", "none". Returns None to use + Reads agent.reasoning_effort from config.yaml. Valid: "none", + "minimal", "low", "medium", "high", "xhigh". Returns None to use default (medium). """ from hermes_constants import parse_reasoning_effort @@ -4903,7 +4903,7 @@ class GatewayRunner: effort = args.strip() if effort == "none": parsed = {"enabled": False} - elif effort in ("xhigh", "high", "medium", "low", "minimal"): + elif effort in ("minimal", "low", "medium", "high", "xhigh"): parsed = {"enabled": True, "effort": effort} else: return ( diff --git a/hermes_constants.py b/hermes_constants.py index eded659ec..638d36a33 100644 --- a/hermes_constants.py +++ b/hermes_constants.py @@ -72,7 +72,7 @@ def display_hermes_home() -> str: return str(home) -VALID_REASONING_EFFORTS = ("xhigh", "high", "medium", "low", "minimal") +VALID_REASONING_EFFORTS = ("minimal", "low", "medium", "high", "xhigh") def parse_reasoning_effort(effort: str) -> dict | None: diff --git a/skills/autonomous-ai-agents/hermes-agent/SKILL.md b/skills/autonomous-ai-agents/hermes-agent/SKILL.md index 74445c267..6d8cd1c61 100644 --- a/skills/autonomous-ai-agents/hermes-agent/SKILL.md +++ b/skills/autonomous-ai-agents/hermes-agent/SKILL.md @@ -250,7 +250,7 @@ Type these during an interactive chat session. /model [name] Show or change model /provider Show provider info /personality [name] Set personality -/reasoning [level] Set reasoning (none|low|medium|high|xhigh|show|hide) +/reasoning [level] Set reasoning (none|minimal|low|medium|high|xhigh|show|hide) /verbose Cycle: off → new → all → verbose /voice [on|off|tts] Voice mode /yolo Toggle approval bypass diff --git a/website/docs/user-guide/configuration.md b/website/docs/user-guide/configuration.md index 0ac24db18..819a379eb 100644 --- a/website/docs/user-guide/configuration.md +++ b/website/docs/user-guide/configuration.md @@ -747,7 +747,7 @@ Control how much "thinking" the model does before responding: ```yaml agent: - reasoning_effort: "" # empty = medium (default). Options: xhigh (max), high, medium, low, minimal, none + reasoning_effort: "" # empty = medium (default). Options: none, minimal, low, medium, high, xhigh (max) ``` When unset (default), reasoning effort defaults to "medium" — a balanced level that works well for most tasks. Setting a value overrides it — higher reasoning effort gives better results on complex tasks at the cost of more tokens and latency. diff --git a/website/docs/user-guide/features/batch-processing.md b/website/docs/user-guide/features/batch-processing.md index 3cab1eba2..59554e34d 100644 --- a/website/docs/user-guide/features/batch-processing.md +++ b/website/docs/user-guide/features/batch-processing.md @@ -79,7 +79,7 @@ Entries can optionally include: | Parameter | Description | |-----------|-------------| -| `--reasoning_effort` | Effort level: `xhigh`, `high`, `medium`, `low`, `minimal`, `none` | +| `--reasoning_effort` | Effort level: `none`, `minimal`, `low`, `medium`, `high`, `xhigh` | | `--reasoning_disabled` | Completely disable reasoning/thinking tokens | ### Advanced Options