diff --git a/AGENTS.md b/AGENTS.md
index 0c8550d459d..d8ba934c521 100644
--- a/AGENTS.md
+++ b/AGENTS.md
@@ -540,10 +540,14 @@ Full authoring guide: `website/docs/developer-guide/model-provider-plugin.md`.
 
 ### Dashboard / context-engine / image-gen plugin directories
 
-`plugins/context_engine/`, `plugins/image_gen/`, `plugins/example-dashboard/`,
-etc. follow the same pattern (ABC + orchestrator + per-plugin directory).
-Context engines plug into `agent/context_engine.py`; image-gen providers
-into `agent/image_gen_provider.py`.
+`plugins/context_engine/`, `plugins/image_gen/`, etc. follow the same
+pattern (ABC + orchestrator + per-plugin directory). Context engines
+plug into `agent/context_engine.py`; image-gen providers into
+`agent/image_gen_provider.py`. Reference / docs-companion plugins
+(`example-dashboard`, `strike-freedom-cockpit`, `plugin-llm-example`,
+`plugin-llm-async-example`) live in the
+[`hermes-example-plugins`](https://github.com/NousResearch/hermes-example-plugins)
+companion repo, not in this tree.
 
 ---
 
diff --git a/agent/plugin_llm.py b/agent/plugin_llm.py
new file mode 100644
index 00000000000..e9c2a869dd7
--- /dev/null
+++ b/agent/plugin_llm.py
@@ -0,0 +1,1046 @@
+"""
+Plugin LLM facade — host-owned LLM access for trusted plugins.
+==============================================================
+
+Plugins built on Hermes Agent often need to make their own LLM calls
+out-of-band — a hook that rewrites a tool error before the user sees
+it, a gateway adapter that translates inbound text, a slash command
+that summarises a paste, a scheduled job that scores yesterday's
+activity into a single line on a status board.
+
+Today the only stable plugin surfaces extend an existing Hermes
+subsystem: ``register_tool``, ``register_platform``,
+``register_memory_provider``, etc. None of those help when the
+plugin's job is to make its own model call. This module is the
+supported lane for that case.
+
+The plugin gets ``ctx.llm`` exposed on its
+:class:`~hermes_cli.plugins.PluginContext`:
+
+* ``complete(messages, ...)`` — chat completion against the user's
+  active model + auth.
+* ``complete_structured(instructions=..., input=[...], json_schema=...)``
+  — bounded structured inference with optional image inputs, JSON
+  schema validation, and parsed JSON output.
+* async siblings ``acomplete()`` / ``acomplete_structured()`` for
+  plugins running on asyncio loops (gateway adapters, hooks).
+
+Provider/model/agent_id/profile are explicit keyword arguments — no
+embedded slugs, no shorthands. This mirrors Hermes' main config
+shape (``model.provider`` + ``model.model``) so plugin authors who
+already understand the host config don't have to learn anything new.
+
+The host owns provider routing, auth resolution, timeouts, and
+fallback. The plugin never sees raw OAuth tokens or API keys. All
+override knobs (``provider=``, ``model=``, ``agent_id=``,
+``profile=``) are gated behind explicit per-plugin trust flags in
+``config.yaml``::
+
+    plugins:
+      entries:
+        my-plugin:
+          llm:
+            allow_provider_override: true
+            allow_model_override: true
+            allowed_providers: [openrouter, anthropic]   # optional
+            allowed_models:    [openai/gpt-4o-mini]       # optional
+            allow_agent_id_override: false
+            allow_profile_override: false
+
+Untrusted plugins still get the default surface — they just can't
+steer provider, model, agent, or auth-profile selection. The trust
+gate is fail-closed: a missing config block means "no overrides,"
+not "anything goes."
+
+Backed by :func:`agent.auxiliary_client.call_llm`, which already
+handles every provider, fallback chain, and per-task override Hermes
+supports.
+"""
+
+from __future__ import annotations
+
+import base64
+import json
+import logging
+import re
+from dataclasses import dataclass, field
+from typing import Any, Awaitable, Callable, Dict, List, Optional, Sequence, Union
+
+logger = logging.getLogger(__name__)
+
+
+# ---------------------------------------------------------------------------
+# Public dataclasses
+# ---------------------------------------------------------------------------
+
+
+@dataclass
+class PluginLlmTextInput:
+    """Plain-text block in a structured input list."""
+    # ``type`` mirrors the ``"type"`` key of the equivalent dict form and defaults to ``"text"``.
+    text: str
+    type: str = "text"
+
+
+@dataclass
+class PluginLlmImageInput:
+    """Image block in a structured input list.
+
+    Either ``data`` (raw bytes) or ``url`` (http(s) or data: URL) should be
+    provided; when both are set, the message builder in this module uses
+    ``url``. ``mime_type`` defaults to ``image/png`` and labels the base64
+    ``data:`` URL built from ``data``, so set it for non-PNG bytes.
+    """
+    # Plain dataclass: nothing is validated at construction time.
+    data: Optional[bytes] = None
+    url: Optional[str] = None
+    mime_type: str = "image/png"
+    file_name: str = ""
+    type: str = "image"
+
+
+PluginLlmInput = Union[PluginLlmTextInput, PluginLlmImageInput, Dict[str, Any]]
+"""A single structured input block.
+
+Plugins may pass either the dataclasses above or plain dicts with the
+same shape — dicts are normalized internally. Dict shape::
+
+    {"type": "text", "text": "..."}
+    {"type": "image", "data": <bytes>, "mime_type": "image/png", "file_name": "receipt.png"}
+    {"type": "image", "url": "https://..."}
+"""
+
+
+@dataclass
+class PluginLlmUsage:
+    """Token + cost usage for a completion. All fields optional — providers
+    differ on what they return. ``cost_usd`` is the host's best estimate."""
+    # NOTE(review): _extract_usage in this module never sets cost_usd — confirm who fills it.
+    input_tokens: int = 0
+    output_tokens: int = 0
+    total_tokens: int = 0
+    cache_read_tokens: int = 0
+    cache_write_tokens: int = 0
+    cost_usd: Optional[float] = None
+
+
+@dataclass
+class PluginLlmCompleteResult:
+    """Result of :meth:`PluginLlm.complete` (and its async sibling ``acomplete``)."""
+    # ``audit`` is filled by those methods with plugin_id / purpose / profile.
+    text: str
+    provider: str
+    model: str
+    agent_id: str
+    usage: PluginLlmUsage = field(default_factory=PluginLlmUsage)
+    audit: Dict[str, Any] = field(default_factory=dict)
+
+
+@dataclass
+class PluginLlmStructuredResult:
+    """Result of :meth:`PluginLlm.complete_structured`.
+
+    ``parsed`` is set only when ``json_mode=True`` or ``json_schema`` is
+    provided AND the response was valid JSON. ``content_type`` is
+    ``"json"`` in that case, ``"text"`` otherwise (e.g. the model
+    refused or the response wasn't requested as JSON)."""
+    # A schema mismatch is raised as ``ValueError`` by ``_parse_structured_text``, not recorded here.
+    text: str
+    provider: str
+    model: str
+    agent_id: str
+    usage: PluginLlmUsage = field(default_factory=PluginLlmUsage)
+    parsed: Optional[Any] = None
+    content_type: str = "text"
+    audit: Dict[str, Any] = field(default_factory=dict)
+
+
+# ---------------------------------------------------------------------------
+# Trust gate
+# ---------------------------------------------------------------------------
+
+
+@dataclass(frozen=True)
+class _TrustPolicy:
+    """Resolved trust gate for one plugin's LLM access."""
+    # Every flag defaults to its restrictive value, so ``_TrustPolicy(plugin_id=x)`` denies all overrides.
+    plugin_id: str
+    allow_provider_override: bool = False
+    allowed_providers: Optional[frozenset] = None  # None = no allowlist; empty set = nothing matches
+    allow_any_provider: bool = False  # True when the allowed_providers list contains "*"
+    allow_model_override: bool = False
+    allowed_models: Optional[frozenset] = None  # None = no allowlist; empty set = nothing matches
+    allow_any_model: bool = False  # True when the allowed_models list contains "*"
+    allow_agent_id_override: bool = False
+    allow_profile_override: bool = False
+
+
+def _normalize_ref(raw: str) -> str:
+    """Trim and lower-case ``raw`` for allowlist matching; falsy input yields ``""``."""
+    return raw.strip().lower() if raw else ""
+
+
+def _coerce_allowlist(raw: Any) -> tuple[Optional[frozenset], bool]:
+    """Coerce a YAML list into ``(frozenset_or_None, allow_any)``.
+
+    * Missing / non-list → ``(None, False)``, meaning "no allowlist."
+    * Otherwise the string items are normalized with :func:`_normalize_ref`;
+      non-string and blank items are dropped.
+    * ``allow_any`` is ``True`` when any item is ``"*"``. The wildcard is
+      never stored in the set, so ``["*"]`` → ``(frozenset(), True)`` and
+      ``["*", "x"]`` → ``(frozenset({"x"}), True)``.
+    * A list with no usable items (e.g. ``[]``) → ``(frozenset(), False)``,
+      which matches nothing.
+    """
+    if not isinstance(raw, list):
+        return None, False
+    normalized = [_normalize_ref(item) for item in raw if isinstance(item, str)]
+    # One return covers every list shape: the set is just the non-wildcard entries.
+    return frozenset(ref for ref in normalized if ref and ref != "*"), "*" in normalized
+
+
+def _resolve_trust_policy(plugin_id: str) -> _TrustPolicy:
+    """Build the trust policy from ``plugins.entries.<plugin_id>.llm``.
+
+    An empty ``plugin_id``, a config load failure, or any missing /
+    non-dict level on that path yields the default-deny policy. Nothing
+    is cached: every call re-reads the config, so edits apply without
+    restarting the agent.
+    """
+    # Shared fail-closed result for every early exit below.
+    deny_all = _TrustPolicy(plugin_id=plugin_id or "")
+    if not plugin_id:
+        return deny_all
+
+    try:
+        from hermes_cli.config import load_config
+        node: Any = load_config() or {}
+    except Exception:  # pragma: no cover — config IO failure
+        return deny_all
+
+    # Descend plugins → entries → <plugin_id> → llm; stop at the first non-dict.
+    for key in ("plugins", "entries", plugin_id, "llm"):
+        node = node.get(key)
+        if not isinstance(node, dict):
+            return deny_all
+    llm_cfg: Dict[str, Any] = node
+
+    def _flag(name: str) -> bool:
+        # Absent keys read as False; present values are coerced with bool().
+        return bool(llm_cfg.get(name, False))
+
+    # Each allowlist comes back as a (frozenset-or-None, wildcard-flag) pair.
+    models, any_model = _coerce_allowlist(llm_cfg.get("allowed_models"))
+    providers, any_provider = _coerce_allowlist(llm_cfg.get("allowed_providers"))
+
+    return _TrustPolicy(
+        plugin_id=plugin_id,
+        allow_provider_override=_flag("allow_provider_override"),
+        allowed_providers=providers,
+        allow_any_provider=any_provider,
+        allow_model_override=_flag("allow_model_override"),
+        allowed_models=models,
+        allow_any_model=any_model,
+        allow_agent_id_override=_flag("allow_agent_id_override"),
+        allow_profile_override=_flag("allow_profile_override"),
+    )
+
+
+class PluginLlmTrustError(PermissionError):
+    """Raised by the trust gate when a plugin requests an LLM override its config does not allow."""
+
+
+def _check_overrides(
+    policy: _TrustPolicy,
+    *,
+    requested_provider: Optional[str],
+    requested_model: Optional[str],
+    requested_agent_id: Optional[str],
+    requested_profile: Optional[str],
+) -> tuple[Optional[str], Optional[str], Optional[str], Optional[str]]:
+    """Apply the trust gate and return ``(provider, model, agent_id, profile)``.
+
+    Overrides are checked in that order and the first one the policy
+    rejects raises :class:`PluginLlmTrustError`. A falsy request counts as
+    "not requested": provider, model and profile then come back as ``None``
+    and ``agent_id`` is returned exactly as given. ``provider`` / ``model``
+    are also matched against ``allowed_providers`` / ``allowed_models``.
+    """
+    final_provider: Optional[str] = None
+    final_model: Optional[str] = None
+    final_profile: Optional[str] = None
+    # Provider: the flag must be on, then the optional allowlist must match.
+    if requested_provider:
+        if not policy.allow_provider_override:
+            raise PluginLlmTrustError(
+                f"Plugin {policy.plugin_id!r} cannot override the provider "
+                f"(set plugins.entries.{policy.plugin_id}.llm.allow_provider_override "
+                f"to true to allow)."
+            )
+        normalized = _normalize_ref(requested_provider)  # trimmed + lower-cased for matching only
+        if (
+            not policy.allow_any_provider
+            and policy.allowed_providers is not None  # None = no allowlist, anything passes
+            and normalized not in policy.allowed_providers
+        ):
+            raise PluginLlmTrustError(
+                f"Plugin {policy.plugin_id!r} provider override "
+                f"{requested_provider!r} is not in plugins.entries."
+                f"{policy.plugin_id}.llm.allowed_providers."
+            )
+        final_provider = requested_provider.strip()  # original casing is kept
+    # Model: same two-step check as the provider.
+    if requested_model:
+        if not policy.allow_model_override:
+            raise PluginLlmTrustError(
+                f"Plugin {policy.plugin_id!r} cannot override the model "
+                f"(set plugins.entries.{policy.plugin_id}.llm.allow_model_override "
+                f"to true to allow)."
+            )
+        normalized = _normalize_ref(requested_model)  # trimmed + lower-cased for matching only
+        if (
+            not policy.allow_any_model
+            and policy.allowed_models is not None  # None = no allowlist, anything passes
+            and normalized not in policy.allowed_models
+        ):
+            raise PluginLlmTrustError(
+                f"Plugin {policy.plugin_id!r} model override "
+                f"{requested_model!r} is not in plugins.entries."
+                f"{policy.plugin_id}.llm.allowed_models."
+            )
+        final_model = requested_model.strip()  # original casing is kept
+    # Agent id: flag only, no allowlist; the value is passed through unstripped.
+    if requested_agent_id and not policy.allow_agent_id_override:
+        raise PluginLlmTrustError(
+            f"Plugin {policy.plugin_id!r} cannot run completions against a "
+            f"non-default agent id (set plugins.entries.{policy.plugin_id}."
+            f"llm.allow_agent_id_override to true to allow)."
+        )
+    # Profile: flag only, no allowlist; the value is returned stripped.
+    if requested_profile:
+        if not policy.allow_profile_override:
+            raise PluginLlmTrustError(
+                f"Plugin {policy.plugin_id!r} cannot override the auth profile "
+                f"(set plugins.entries.{policy.plugin_id}.llm.allow_profile_override "
+                f"to true to allow)."
+            )
+        final_profile = requested_profile.strip()
+
+    return final_provider, final_model, requested_agent_id, final_profile
+
+
+# ---------------------------------------------------------------------------
+# Input normalization
+# ---------------------------------------------------------------------------
+
+
+def _normalize_input_block(block: PluginLlmInput) -> Dict[str, Any]:
+    """Coerce a structured input block to a plain dict for the message
+    builder. Unknown shapes, and image blocks (dataclass or dict) with no
+    ``data`` and no non-empty ``url``, raise ``ValueError``."""
+    if isinstance(block, PluginLlmTextInput):
+        return {"type": "text", "text": block.text}
+    if isinstance(block, PluginLlmImageInput):
+        if block.data is None and not block.url:  # same guard as the dict form below
+            raise ValueError("image input block requires 'data' bytes or 'url'")
+        d: Dict[str, Any] = {
+            "type": "image", "mime_type": block.mime_type, "file_name": block.file_name
+        }
+        if block.data is not None:
+            d["data"] = block.data
+        if block.url:
+            d["url"] = block.url
+        return d
+    if not isinstance(block, dict):
+        raise ValueError(f"Unsupported input block: {type(block).__name__}")
+    kind = block.get("type")
+    if kind == "text":
+        if not isinstance(block.get("text"), str):
+            raise ValueError("text input block requires 'text' string")
+        return {"type": "text", "text": block["text"]}
+    if kind != "image":
+        raise ValueError(f"Unknown input block type: {kind!r}")
+    if block.get("data") is None and not block.get("url"):  # an explicit None counts as missing
+        raise ValueError("image input block requires 'data' bytes or 'url'")
+    return {
+        "type": "image",
+        "data": block.get("data"),
+        "url": block.get("url"),
+        "mime_type": block.get("mime_type") or "image/png",
+        "file_name": block.get("file_name") or "",
+    }
+
+
+def _build_structured_messages(
+    *,
+    instructions: str,
+    inputs: Sequence[PluginLlmInput],
+    json_mode: bool,
+    json_schema: Optional[Any],
+    schema_name: Optional[str],
+    system_prompt: Optional[str],
+) -> List[Dict[str, Any]]:
+    """Assemble the OpenAI-style ``messages`` list for a structured call.
+
+    An optional system message carries ``system_prompt`` plus, when JSON
+    output is requested, a JSON-only directive. The single user message
+    opens with a text part holding the instructions (with ``Schema name``
+    and ``JSON schema`` sections appended when given), followed by one
+    part per input block; images are encoded as ``image_url`` parts.
+    """
+    # Either knob asks for JSON output.
+    wants_json = json_mode or json_schema is not None
+
+    system_chunks: List[str] = [system_prompt.strip()] if system_prompt else []
+    if wants_json:
+        system_chunks.append(
+            "Respond with a single JSON object that matches the requested shape. "
+            "Do not include prose or markdown fences."
+        )
+    conversation: List[Dict[str, Any]] = []
+    if system_chunks:
+        conversation.append({"role": "system", "content": "\n\n".join(system_chunks)})
+
+    # The first user part is always text: instructions plus optional schema hints.
+    lead = instructions.strip()
+    if schema_name:
+        lead = f"{lead}\n\nSchema name: {schema_name}"
+    if json_schema is not None:
+        try:
+            rendered = json.dumps(json_schema, ensure_ascii=False, sort_keys=True)
+        except (TypeError, ValueError):
+            rendered = str(json_schema)
+        lead = f"{lead}\n\nJSON schema:\n{rendered}"
+    parts: List[Dict[str, Any]] = [{"type": "text", "text": lead}]
+
+    # Input blocks follow in caller order.
+    for raw_block in inputs:
+        item = _normalize_input_block(raw_block)
+        if item["type"] == "text":
+            parts.append({"type": "text", "text": item["text"]})
+            continue
+        if item["type"] != "image":
+            continue
+        target = item.get("url")
+        if not target:
+            # No URL: inline the raw bytes as a base64 ``data:`` URL.
+            payload = item.get("data") or b""
+            if not isinstance(payload, (bytes, bytearray)):
+                raise ValueError("image input 'data' must be bytes")
+            encoded = base64.b64encode(payload).decode("ascii")
+            mime = item.get("mime_type") or "image/png"
+            target = f"data:{mime};base64,{encoded}"
+        parts.append({"type": "image_url", "image_url": {"url": target}})
+
+    conversation.append({"role": "user", "content": parts})
+    return conversation
+
+
+# ---------------------------------------------------------------------------
+# JSON parsing
+# ---------------------------------------------------------------------------
+
+
+_FENCE_RE = re.compile(r"```(?:json)?\s*(.+?)```", re.DOTALL | re.IGNORECASE)
+
+
+def _strip_code_fences(text: str) -> str:
+    """Return the body of the first fenced code block in ``text``, or the whole
+    of ``text`` when no fence is found. The result is always whitespace-stripped."""
+    fenced = _FENCE_RE.search(text)
+    # group(1) is the fence body without the backticks or the optional ``json`` tag.
+    payload = text if fenced is None else fenced.group(1)
+    return payload.strip()
+
+
+def _parse_structured_text(
+    *, text: str, json_mode: bool, json_schema: Optional[Any]
+) -> tuple[Optional[Any], str]:
+    """Return ``(parsed, content_type)``: ``(value, "json")`` when JSON was
+    requested and ``text`` parsed, ``(None, "text")`` otherwise. Raises
+    ``ValueError`` when ``json_schema`` is given, ``jsonschema`` is
+    installed, and the parsed value fails validation."""
+    if not text or not (json_mode or json_schema is not None):
+        return None, "text"
+    try:
+        parsed = json.loads(_strip_code_fences(text))
+    except (json.JSONDecodeError, ValueError):
+        return None, "text"
+    if json_schema is None:
+        return parsed, "json"
+
+    try:  # Import alone, so only a truly missing package disables validation.
+        import jsonschema  # type: ignore[import-untyped]
+    except ImportError:
+        # jsonschema is optional; skip strict validation when absent.
+        logger.debug("jsonschema unavailable; skipping schema validation")
+        return parsed, "json"
+    try:
+        jsonschema.validate(parsed, json_schema)
+    except jsonschema.ValidationError as exc:
+        raise ValueError(
+            f"Plugin LLM structured output did not match schema: {exc.message}"
+        ) from exc
+    return parsed, "json"
+
+
+# ---------------------------------------------------------------------------
+# Usage extraction
+# ---------------------------------------------------------------------------
+
+
+def _extract_usage(response: Any) -> PluginLlmUsage:
+    """Read token counts from ``response.usage`` into a :class:`PluginLlmUsage`.
+    Each counter is read as an attribute or dict key under either of two names;
+    a missing value, or one ``int()`` rejects, counts as 0 (as does no ``usage``)."""
+    raw = getattr(response, "usage", None)
+    if raw is None:
+        return PluginLlmUsage()
+    as_mapping = raw if isinstance(raw, dict) else {}
+
+    def _count(name: str) -> int:
+        value = getattr(raw, name, None)
+        value = as_mapping.get(name) if value is None else value
+        try:
+            return 0 if value is None else int(value)
+        except (TypeError, ValueError):
+            return 0
+
+    tokens_in = _count("prompt_tokens") or _count("input_tokens")
+    tokens_out = _count("completion_tokens") or _count("output_tokens")
+    return PluginLlmUsage(
+        input_tokens=tokens_in,
+        output_tokens=tokens_out,
+        total_tokens=_count("total_tokens") or (tokens_in + tokens_out),
+        cache_read_tokens=_count("cache_read_input_tokens") or _count("cache_read_tokens"),
+        cache_write_tokens=_count("cache_creation_input_tokens") or _count("cache_write_tokens"),
+    )
+
+
+def _extract_text(response: Any) -> str:
+    """Return the assistant text of an OpenAI-shaped response, or ``""``.
+
+    String content is returned as-is; list content is reduced to the
+    concatenation of its text parts. Anything else yields ``""``.
+    """
+    def _part_text(piece: Any) -> Optional[str]:
+        # Dict parts must be tagged type == "text"; object parts only need a str ``.text``.
+        if isinstance(piece, dict):
+            candidate = piece.get("text") if piece.get("type") == "text" else None
+        else:
+            candidate = getattr(piece, "text", None)
+        return candidate if isinstance(candidate, str) else None
+
+    try:
+        body = getattr(response.choices[0].message, "content", None)
+        if isinstance(body, list):
+            return "".join(t for t in map(_part_text, body) if t is not None)
+        return body if isinstance(body, str) else ""
+    except (AttributeError, IndexError, TypeError):
+        return ""
+
+
+def _resolve_attribution(
+    *,
+    provider_override: Optional[str],
+    model_override: Optional[str],
+    response: Any,
+) -> tuple[str, str]:
+    """Pick the ``(provider, model)`` pair recorded on a result object.
+
+    Provider:
+
+    1. ``provider_override`` when the plugin supplied one.
+    2. Otherwise whatever :func:`_read_main_provider` reports, trimmed.
+    3. ``"auto"`` when that is empty or the lookup fails.
+
+    Model:
+
+    1. A non-blank ``response.model`` string, trimmed. It outranks even an
+       explicit ``model_override``: the served id can differ from the
+       requested one (e.g. ``gpt-4o`` → ``gpt-4o-2024-08-06``) and the
+       audit trail should show what actually ran.
+    2. Otherwise ``model_override`` when the plugin supplied one.
+    3. Otherwise whatever :func:`_read_main_model` reports, trimmed.
+    4. ``"default"`` when that is empty or the lookup fails.
+    """
+    # Host lookups are imported lazily and guarded so attribution never fails a call.
+    provider = provider_override
+    if not provider:
+        try:
+            from agent.auxiliary_client import _read_main_provider
+            provider = (_read_main_provider() or "").strip() or "auto"
+        except Exception:  # pragma: no cover — defensive
+            provider = "auto"
+
+    # Prefer the model id echoed back on the response.
+    reported = getattr(response, "model", None)
+    if isinstance(reported, str) and reported.strip():
+        return provider, reported.strip()
+    if model_override:
+        return provider, model_override
+
+    # Last resort: the host's current main model.
+    try:
+        from agent.auxiliary_client import _read_main_model
+        model = (_read_main_model() or "").strip() or "default"
+    except Exception:  # pragma: no cover — defensive
+        model = "default"
+
+    return provider, model
+
+
+# ---------------------------------------------------------------------------
+# PluginLlm facade
+# ---------------------------------------------------------------------------
+
+
+class PluginLlm:
+    """Host-owned LLM access for one trusted plugin.
+
+    Instances are constructed by :class:`hermes_cli.plugins.PluginContext`
+    and exposed as ``ctx.llm``. Plugins should not instantiate this
+    directly — the constructor binds plugin identity for trust-gate
+    enforcement.
+    """
+
+    def __init__(
+        self, *, plugin_id: str,
+        policy_loader: Optional[Callable[[str], _TrustPolicy]] = None,
+        sync_caller: Optional[Callable[..., Any]] = None,
+        async_caller: Optional[Callable[..., Awaitable[Any]]] = None,
+    ) -> None:
+        """Bind the plugin identity used for trust checks, audit and logging."""
+        self._plugin_id = plugin_id
+        # Optional injected callers are stored as given (``None`` when omitted).
+        self._sync_caller, self._async_caller = sync_caller, async_caller
+        # A falsy ``policy_loader`` falls back to the config-backed resolver.
+        self._policy_loader = policy_loader or _resolve_trust_policy
+
+    # -- public sync API ----------------------------------------------------
+
+    def complete(
+        self,
+        messages: List[Dict[str, Any]],
+        *,
+        provider: Optional[str] = None,
+        model: Optional[str] = None,
+        temperature: Optional[float] = None,
+        max_tokens: Optional[int] = None,
+        timeout: Optional[float] = None,
+        agent_id: Optional[str] = None,
+        profile: Optional[str] = None,
+        purpose: Optional[str] = None,
+    ) -> PluginLlmCompleteResult:
+        """Run one host-owned chat completion and return its text and usage.
+
+        ``messages`` uses the standard OpenAI chat shape. ``provider``,
+        ``model``, ``agent_id`` and ``profile`` are optional overrides; each
+        must be enabled under ``plugins.entries.<id>.llm.allow_*_override``
+        or :class:`PluginLlmTrustError` is raised before the call is made.
+        ``purpose`` is a free-form label copied into ``audit`` and the log.
+        """
+        # The policy is loaded per call and the trust gate runs first.
+        provider_ok, model_ok, agent_ok, profile_ok = _check_overrides(
+            self._policy_loader(self._plugin_id),
+            requested_provider=provider,
+            requested_model=model,
+            requested_agent_id=agent_id,
+            requested_profile=profile,
+        )
+        used_provider, used_model, raw = self._invoke_sync(
+            messages=messages,
+            provider_override=provider_ok,
+            model_override=model_ok,
+            profile_override=profile_ok,
+            temperature=temperature,
+            max_tokens=max_tokens,
+            timeout=timeout,
+        )
+        label = purpose or ""
+        reply = _extract_text(raw)
+        tally = _extract_usage(raw)
+        outcome = PluginLlmCompleteResult(
+            text=reply,
+            provider=used_provider,
+            model=used_model,
+            agent_id=agent_ok or "default",
+            usage=tally,
+            audit={
+                "plugin_id": self._plugin_id,
+                "purpose": label,
+                "profile": profile_ok or "",
+            },
+        )
+        logger.info(
+            "plugin_llm.complete plugin=%s provider=%s model=%s purpose=%s "
+            "tokens=%d",
+            self._plugin_id, used_provider, used_model, label,
+            tally.total_tokens,
+        )
+        return outcome
+
+    def complete_structured(
+        self,
+        *,
+        instructions: str,
+        input: Sequence[PluginLlmInput],
+        json_schema: Optional[Any] = None,
+        json_mode: bool = False,
+        schema_name: Optional[str] = None,
+        system_prompt: Optional[str] = None,
+        provider: Optional[str] = None,
+        model: Optional[str] = None,
+        temperature: Optional[float] = None,
+        max_tokens: Optional[int] = None,
+        timeout: Optional[float] = None,
+        agent_id: Optional[str] = None,
+        profile: Optional[str] = None,
+        purpose: Optional[str] = None,
+    ) -> PluginLlmStructuredResult:
+        """Run one bounded, host-owned structured completion.
+
+        ``input`` is a non-empty sequence of text / image blocks (see
+        :class:`PluginLlmTextInput` / :class:`PluginLlmImageInput`). With
+        ``json_mode=True`` or a ``json_schema`` the reply is parsed as JSON and
+        returned in :attr:`PluginLlmStructuredResult.parsed`; a reply that
+        does not parse comes back with ``content_type="text"`` instead.
+
+        Schema validation needs the optional ``jsonschema`` package and is
+        skipped with a debug log when it is missing. Raises ``ValueError`` for
+        blank ``instructions``, empty ``input`` or a schema mismatch, and
+        :class:`PluginLlmTrustError` for an override the plugin may not use.
+        """
+        if not instructions or not instructions.strip():
+            raise ValueError("complete_structured requires non-empty instructions")
+        if not input:
+            raise ValueError("complete_structured requires at least one input block")
+
+        provider_ok, model_ok, agent_ok, profile_ok = _check_overrides(
+            self._policy_loader(self._plugin_id),
+            requested_provider=provider,
+            requested_model=model,
+            requested_agent_id=agent_id,
+            requested_profile=profile,
+        )
+
+        prompt = _build_structured_messages(
+            instructions=instructions,
+            inputs=list(input),
+            json_mode=json_mode,
+            json_schema=json_schema,
+            schema_name=schema_name,
+            system_prompt=system_prompt,
+        )
+        response_format = self._json_response_format(json_mode=json_mode, json_schema=json_schema)
+
+        used_provider, used_model, raw = self._invoke_sync(
+            messages=prompt,
+            provider_override=provider_ok,
+            model_override=model_ok,
+            profile_override=profile_ok,
+            temperature=temperature,
+            max_tokens=max_tokens,
+            timeout=timeout,
+            extra_body=response_format,
+        )
+        reply = _extract_text(raw)
+        tally = _extract_usage(raw)
+        value, kind = _parse_structured_text(
+            text=reply, json_mode=json_mode, json_schema=json_schema
+        )
+        outcome = PluginLlmStructuredResult(
+            text=reply,
+            provider=used_provider,
+            model=used_model,
+            agent_id=agent_ok or "default",
+            usage=tally,
+            parsed=value,
+            content_type=kind,
+            audit={
+                "plugin_id": self._plugin_id,
+                "purpose": purpose or "",
+                "profile": profile_ok or "",
+                "schema_name": schema_name or "",
+            },
+        )
+        logger.info(
+            "plugin_llm.complete_structured plugin=%s provider=%s model=%s "
+            "purpose=%s content_type=%s tokens=%d",
+            self._plugin_id, used_provider, used_model, purpose or "",
+            kind, tally.total_tokens,
+        )
+        return outcome
+
+    # -- public async API ---------------------------------------------------
+
+    async def acomplete(
+        self,
+        messages: List[Dict[str, Any]],
+        *,
+        provider: Optional[str] = None,
+        model: Optional[str] = None,
+        temperature: Optional[float] = None,
+        max_tokens: Optional[int] = None,
+        timeout: Optional[float] = None,
+        agent_id: Optional[str] = None,
+        profile: Optional[str] = None,
+        purpose: Optional[str] = None,
+    ) -> PluginLlmCompleteResult:
+        """Async sibling of :meth:`complete` (same trust gate, result shape and log line)."""
+        eff_provider, eff_model, eff_agent, eff_profile = _check_overrides(
+            self._policy_loader(self._plugin_id),
+            requested_provider=provider,
+            requested_model=model,
+            requested_agent_id=agent_id,
+            requested_profile=profile,
+        )
+        real_provider, real_model, response = await self._invoke_async(
+            messages=messages,
+            provider_override=eff_provider,
+            model_override=eff_model,
+            profile_override=eff_profile,
+            temperature=temperature,
+            max_tokens=max_tokens,
+            timeout=timeout,
+        )
+        usage = _extract_usage(response)
+        result = PluginLlmCompleteResult(
+            text=_extract_text(response),
+            provider=real_provider,
+            model=real_model,
+            agent_id=eff_agent or "default",
+            usage=usage,
+            audit={"plugin_id": self._plugin_id, "purpose": purpose or "",
+                   "profile": eff_profile or ""},
+        )
+        logger.info(  # mirrors the audit line emitted by the sync ``complete``
+            "plugin_llm.acomplete plugin=%s provider=%s model=%s purpose=%s tokens=%d",
+            self._plugin_id, real_provider, real_model, purpose or "", usage.total_tokens,
+        )
+        return result
+
+    async def acomplete_structured(
+        self,
+        *,
+        instructions: str,
+        input: Sequence[PluginLlmInput],
+        json_schema: Optional[Any] = None,
+        json_mode: bool = False,
+        schema_name: Optional[str] = None,
+        system_prompt: Optional[str] = None,
+        provider: Optional[str] = None,
+        model: Optional[str] = None,
+        temperature: Optional[float] = None,
+        max_tokens: Optional[int] = None,
+        timeout: Optional[float] = None,
+        agent_id: Optional[str] = None,
+        profile: Optional[str] = None,
+        purpose: Optional[str] = None,
+    ) -> PluginLlmStructuredResult:
+        """Async sibling of :meth:`complete_structured`.
+
+        Logs the same audit line as the sync method so awaited calls stay
+        traceable. Raises ``ValueError`` on blank instructions or empty input."""
+        if not instructions or not instructions.strip():
+            raise ValueError("acomplete_structured requires non-empty instructions")
+        if not input:
+            raise ValueError("acomplete_structured requires at least one input block")
+
+        eff_provider, eff_model, eff_agent, eff_profile = _check_overrides(
+            self._policy_loader(self._plugin_id),
+            requested_provider=provider, requested_model=model,
+            requested_agent_id=agent_id, requested_profile=profile,
+        )
+        messages = _build_structured_messages(
+            instructions=instructions, inputs=list(input),
+            json_mode=json_mode, json_schema=json_schema,
+            schema_name=schema_name, system_prompt=system_prompt,
+        )
+        extra_body = self._json_response_format(json_mode=json_mode, json_schema=json_schema)
+        real_provider, real_model, response = await self._invoke_async(
+            messages=messages,
+            provider_override=eff_provider, model_override=eff_model,
+            profile_override=eff_profile,
+            temperature=temperature, max_tokens=max_tokens, timeout=timeout,
+            extra_body=extra_body,
+        )
+        text = _extract_text(response)
+        usage = _extract_usage(response)
+        parsed, content_type = _parse_structured_text(
+            text=text, json_mode=json_mode, json_schema=json_schema
+        )
+        result = PluginLlmStructuredResult(
+            text=text,
+            provider=real_provider,
+            model=real_model,
+            agent_id=eff_agent or "default",
+            usage=usage,
+            parsed=parsed, content_type=content_type,
+            audit={
+                "plugin_id": self._plugin_id,
+                "purpose": purpose or "",
+                "profile": eff_profile or "",
+                "schema_name": schema_name or "",
+            },
+        )
+        logger.info(
+            "plugin_llm.acomplete_structured plugin=%s provider=%s model=%s "
+            "purpose=%s content_type=%s tokens=%d",
+            self._plugin_id, real_provider, real_model, purpose or "",
+            content_type, usage.total_tokens,
+        )
+        return result
+
+    # -- internals ---------------------------------------------------------
+
+    @staticmethod
+    def _json_response_format(
+        *, json_mode: bool, json_schema: Optional[Any]
+    ) -> Optional[Dict[str, Any]]:
+        """Return the ``extra_body`` fragment that sets ``response_format``.
+
+        A schema, when given, takes precedence and is sent as a non-strict
+        ``json_schema`` format. Without one, ``json_mode`` selects the plain
+        ``json_object`` format; with neither, ``None`` is returned."""
+        if json_schema is None:
+            if json_mode:
+                return {"response_format": {"type": "json_object"}}
+            return None
+        # The schema branch does not consult json_mode at all.
+        schema_spec = {
+            "name": "plugin_structured_output",
+            "schema": json_schema,
+            "strict": False,
+        }
+        response_format = {"type": "json_schema", "json_schema": schema_spec}
+        return {"response_format": response_format}
+
+    def _invoke_sync(
+        self,
+        *,
+        messages: List[Dict[str, Any]],
+        provider_override: Optional[str],
+        model_override: Optional[str],
+        profile_override: Optional[str],
+        temperature: Optional[float],
+        max_tokens: Optional[int],
+        timeout: Optional[float],
+        extra_body: Optional[Dict[str, Any]] = None,
+    ) -> tuple[str, str, Any]:
+        """Invoke the host's ``call_llm`` (or the injected sync caller).
+        ``agent.auxiliary_client`` is lazy-imported to avoid circular deps
+        at plugin discovery time. The host path returns ``(provider, model,
+        response)`` and copies ``extra_body`` instead of mutating it."""
+        if self._sync_caller is not None:
+            return self._sync_caller(
+                messages=messages,
+                provider_override=provider_override,
+                model_override=model_override,
+                profile_override=profile_override,
+                temperature=temperature, max_tokens=max_tokens, timeout=timeout,
+                extra_body=extra_body,
+            )
+        from agent.auxiliary_client import call_llm
+        merged_extra = dict(extra_body or {})
+        if profile_override:
+            # dict() above is shallow: copy the nested metadata dict too, so
+            # the auth profile is not written into the caller's own object.
+            metadata = dict(merged_extra.get("metadata") or {})
+            metadata["auth_profile"] = profile_override
+            merged_extra["metadata"] = metadata
+        response = call_llm(
+            task=None,
+            provider=provider_override, model=model_override,
+            messages=messages,
+            temperature=temperature, max_tokens=max_tokens, timeout=timeout,
+            extra_body=merged_extra or None,
+        )
+        provider, model = _resolve_attribution(
+            provider_override=provider_override,
+            model_override=model_override,
+            response=response,
+        )
+        return provider, model, response
+
+    async def _invoke_async(
+        self,
+        *,
+        messages: List[Dict[str, Any]],
+        provider_override: Optional[str],
+        model_override: Optional[str],
+        profile_override: Optional[str],
+        temperature: Optional[float],
+        max_tokens: Optional[int],
+        timeout: Optional[float],
+        extra_body: Optional[Dict[str, Any]] = None,
+    ) -> tuple[str, str, Any]:
+        """Async twin of :meth:`_invoke_sync`, awaiting ``async_call_llm``.
+        On the host path ``extra_body`` is copied, never mutated in place."""
+        if self._async_caller is not None:
+            return await self._async_caller(
+                messages=messages,
+                provider_override=provider_override,
+                model_override=model_override,
+                profile_override=profile_override,
+                temperature=temperature, max_tokens=max_tokens, timeout=timeout,
+                extra_body=extra_body,
+            )
+        from agent.auxiliary_client import async_call_llm
+        merged_extra = dict(extra_body or {})
+        if profile_override:
+            # dict() above is shallow: copy the nested metadata dict too, so
+            # the auth profile is not written into the caller's own object.
+            metadata = dict(merged_extra.get("metadata") or {})
+            metadata["auth_profile"] = profile_override
+            merged_extra["metadata"] = metadata
+        response = await async_call_llm(
+            task=None,
+            provider=provider_override, model=model_override,
+            messages=messages,
+            temperature=temperature, max_tokens=max_tokens, timeout=timeout,
+            extra_body=merged_extra or None,
+        )
+        provider, model = _resolve_attribution(
+            provider_override=provider_override, model_override=model_override,
+            response=response,
+        )
+        return provider, model, response
+
+
+# ---------------------------------------------------------------------------
+# Test helpers
+# ---------------------------------------------------------------------------
+
+
+def make_plugin_llm_for_test(
+    *,
+    plugin_id: str,
+    policy: _TrustPolicy,
+    sync_caller: Optional[Callable[..., Any]] = None,
+    async_caller: Optional[Callable[..., Awaitable[Any]]] = None,
+) -> PluginLlm:
+    """Build a :class:`PluginLlm` wired to a fixed policy and stub callers.
+
+    Test-only helper, not public plugin API: unit tests use it to avoid
+    round-tripping through config.yaml or hitting a real provider."""
+    def _fixed_policy(_pid: str) -> _TrustPolicy:
+        return policy
+
+    return PluginLlm(
+        plugin_id=plugin_id, policy_loader=_fixed_policy,
+        sync_caller=sync_caller, async_caller=async_caller,
+    )
+
+
+__all__ = [
+    "PluginLlm",
+    "PluginLlmTextInput",
+    "PluginLlmImageInput",
+    "PluginLlmInput",
+    "PluginLlmUsage",
+    "PluginLlmCompleteResult",
+    "PluginLlmStructuredResult",
+    "PluginLlmTrustError",
+    "make_plugin_llm_for_test",
+]
diff --git a/hermes_cli/plugins.py b/hermes_cli/plugins.py
index 15ef7920a15..3a58baa0695 100644
--- a/hermes_cli/plugins.py
+++ b/hermes_cli/plugins.py
@@ -290,6 +290,27 @@ class PluginContext:
     def __init__(self, manifest: PluginManifest, manager: "PluginManager"):
         self.manifest = manifest
         self._manager = manager
+        # Lazy-built host-owned LLM facade — see ctx.llm property below.
+        self._llm: Any = None
+
+    # -- host-owned LLM access ----------------------------------------------
+
+    @property
+    def llm(self) -> Any:
+        """Lazily build and cache this plugin's ``PluginLlm`` facade.
+
+        Created on first access under the manifest ``key`` (or ``name``
+        when the key is empty) and reused afterwards. Trusted plugins use
+        it for host-owned chat or structured completions without their
+        own provider keys; overrides are fail-closed by default and gated
+        through ``plugins.entries.<plugin_id>.llm.*`` config keys.
+
+        See :mod:`agent.plugin_llm` for the full surface."""
+        if self._llm is not None:
+            return self._llm
+        from agent.plugin_llm import PluginLlm
+        self._llm = PluginLlm(plugin_id=self.manifest.key or self.manifest.name)
+        return self._llm
 
     # -- tool registration --------------------------------------------------
 
diff --git a/plugins/example-dashboard/dashboard/dist/index.js b/plugins/example-dashboard/dashboard/dist/index.js
deleted file mode 100644
index 04092348ffb..00000000000
--- a/plugins/example-dashboard/dashboard/dist/index.js
+++ /dev/null
@@ -1,119 +0,0 @@
-/**
- * Example Dashboard Plugin
- *
- * Demonstrates how to build a dashboard plugin using the Hermes Plugin SDK.
- * No build step needed — this is a plain IIFE that uses globals from the SDK.
- */
-(function () {
-  "use strict";
-
-  const SDK = window.__HERMES_PLUGIN_SDK__;
-  const { React } = SDK;
-  const { Card, CardHeader, CardTitle, CardContent, Badge, Button } = SDK.components;
-  const { useState, useEffect } = SDK.hooks;
-  const { cn } = SDK.utils;
-
-  function ExamplePage() {
-    const [greeting, setGreeting] = useState(null);
-    const [loading, setLoading] = useState(false);
-
-    function fetchGreeting() {
-      setLoading(true);
-      SDK.fetchJSON("/api/plugins/example/hello")
-        .then(function (data) { setGreeting(data.message); })
-        .catch(function () { setGreeting("(backend not available)"); })
-        .finally(function () { setLoading(false); });
-    }
-
-    return React.createElement("div", { className: "flex flex-col gap-6" },
-      // Header card
-      React.createElement(Card, null,
-        React.createElement(CardHeader, null,
-          React.createElement("div", { className: "flex items-center gap-3" },
-            React.createElement(CardTitle, { className: "text-lg" }, "Example Plugin"),
-            React.createElement(Badge, { variant: "outline" }, "v1.0.0"),
-          ),
-        ),
-        React.createElement(CardContent, { className: "flex flex-col gap-4" },
-          React.createElement("p", { className: "text-sm text-muted-foreground" },
-            "This is an example dashboard plugin. It demonstrates using the Plugin SDK to build ",
-            "custom tabs with React components, connect to backend API routes, and integrate with ",
-            "the existing Hermes UI system.",
-          ),
-          React.createElement("div", { className: "flex items-center gap-3" },
-            React.createElement(Button, {
-              onClick: fetchGreeting,
-              disabled: loading,
-              className: cn(
-                "inline-flex items-center gap-2 border border-border bg-background/40 px-4 py-2",
-                "text-sm font-courier transition-colors hover:bg-foreground/10 cursor-pointer",
-              ),
-            }, loading ? "Loading..." : "Call Backend API"),
-            greeting && React.createElement("span", {
-              className: "text-sm font-courier text-muted-foreground",
-            }, greeting),
-          ),
-        ),
-      ),
-
-      // Info card about the SDK
-      React.createElement(Card, null,
-        React.createElement(CardHeader, null,
-          React.createElement(CardTitle, { className: "text-base" }, "Plugin SDK Reference"),
-        ),
-        React.createElement(CardContent, null,
-          React.createElement("div", { className: "grid gap-3 text-sm" },
-            React.createElement("div", { className: "flex flex-col gap-1 border border-border p-3" },
-              React.createElement("span", { className: "font-medium" }, "window.__HERMES_PLUGIN_SDK__.React"),
-              React.createElement("span", { className: "text-muted-foreground text-xs" }, "React instance — use instead of importing react"),
-            ),
-            React.createElement("div", { className: "flex flex-col gap-1 border border-border p-3" },
-              React.createElement("span", { className: "font-medium" }, "window.__HERMES_PLUGIN_SDK__.hooks"),
-              React.createElement("span", { className: "text-muted-foreground text-xs" }, "useState, useEffect, useCallback, useMemo, useRef, useContext, createContext"),
-            ),
-            React.createElement("div", { className: "flex flex-col gap-1 border border-border p-3" },
-              React.createElement("span", { className: "font-medium" }, "window.__HERMES_PLUGIN_SDK__.components"),
-              React.createElement("span", { className: "text-muted-foreground text-xs" }, "Card, Badge, Button, Input, Label, Select, Separator, Tabs, etc."),
-            ),
-            React.createElement("div", { className: "flex flex-col gap-1 border border-border p-3" },
-              React.createElement("span", { className: "font-medium" }, "window.__HERMES_PLUGIN_SDK__.api"),
-              React.createElement("span", { className: "text-muted-foreground text-xs" }, "Hermes API client — getStatus(), getSessions(), etc."),
-            ),
-            React.createElement("div", { className: "flex flex-col gap-1 border border-border p-3" },
-              React.createElement("span", { className: "font-medium" }, "window.__HERMES_PLUGIN_SDK__.utils"),
-              React.createElement("span", { className: "text-muted-foreground text-xs" }, "cn(), timeAgo(), isoTimeAgo()"),
-            ),
-          ),
-        ),
-      ),
-    );
-  }
-
-  // Register this plugin — the dashboard picks it up automatically.
-  window.__HERMES_PLUGINS__.register("example", ExamplePage);
-
-  // ─────────────────────────────────────────────────────────────────────
-  // Page-scoped slot demo: inject a small banner at the top of /sessions.
-  //
-  // Built-in pages expose named slots (<page>:top, <page>:bottom) that
-  // plugins can populate without overriding the whole route. The
-  // manifest lists the slots we use in its `slots` array so the shell
-  // knows to render <PluginSlot name="sessions:top" /> there.
-  // ─────────────────────────────────────────────────────────────────────
-  function SessionsTopBanner() {
-    return React.createElement(Card, {
-      className: "border-dashed",
-    },
-      React.createElement(CardContent, { className: "flex items-center gap-3 py-2" },
-        React.createElement(Badge, { variant: "outline" }, "Example"),
-        React.createElement("span", {
-          className: "text-xs text-muted-foreground",
-        }, "This banner was injected into the Sessions page by the example plugin via the ",
-          React.createElement("code", { className: "font-courier" }, "sessions:top"),
-          " slot."),
-      ),
-    );
-  }
-
-  window.__HERMES_PLUGINS__.registerSlot("example", "sessions:top", SessionsTopBanner);
-})();
diff --git a/plugins/example-dashboard/dashboard/manifest.json b/plugins/example-dashboard/dashboard/manifest.json
deleted file mode 100644
index 95fce2f100f..00000000000
--- a/plugins/example-dashboard/dashboard/manifest.json
+++ /dev/null
@@ -1,14 +0,0 @@
-{
-  "name": "example",
-  "label": "Example",
-  "description": "Example dashboard plugin — demonstrates the plugin SDK",
-  "icon": "Sparkles",
-  "version": "1.0.0",
-  "tab": {
-    "path": "/example",
-    "position": "after:skills"
-  },
-  "slots": ["sessions:top"],
-  "entry": "dist/index.js",
-  "api": "plugin_api.py"
-}
diff --git a/plugins/example-dashboard/dashboard/plugin_api.py b/plugins/example-dashboard/dashboard/plugin_api.py
deleted file mode 100644
index 20aed76e26f..00000000000
--- a/plugins/example-dashboard/dashboard/plugin_api.py
+++ /dev/null
@@ -1,14 +0,0 @@
-"""Example dashboard plugin — backend API routes.
-
-Mounted at /api/plugins/example/ by the dashboard plugin system.
-"""
-
-from fastapi import APIRouter
-
-router = APIRouter()
-
-
-@router.get("/hello")
-async def hello():
-    """Simple greeting endpoint to demonstrate plugin API routes."""
-    return {"message": "Hello from the example plugin!", "plugin": "example", "version": "1.0.0"}
diff --git a/plugins/strike-freedom-cockpit/README.md b/plugins/strike-freedom-cockpit/README.md
deleted file mode 100644
index c24c5e3882b..00000000000
--- a/plugins/strike-freedom-cockpit/README.md
+++ /dev/null
@@ -1,70 +0,0 @@
-# Strike Freedom Cockpit — dashboard skin demo
-
-Demonstrates how the dashboard skin+plugin system can be used to build a
-fully custom cockpit-style reskin without touching the core dashboard.
-
-Two pieces:
-
-- `theme/strike-freedom.yaml` — a dashboard theme YAML that paints the
-  palette, typography, layout variant (`cockpit`), component chrome
-  (notched card corners, scanlines, accent colors), and declares asset
-  slots (`hero`, `crest`, `bg`).
-- `dashboard/` — a plugin that populates the `sidebar`, `header-left`,
-  and `footer-right` slots reserved by the cockpit layout. The sidebar
-  renders an MS-STATUS panel with segmented telemetry bars driven by
-  real agent status; the header-left injects a COMPASS crest; the
-  footer-right replaces the default org tagline.
-
-## Install
-
-1. **Theme** — copy the theme YAML into your Hermes home:
-
-   ```
-   cp theme/strike-freedom.yaml ~/.hermes/dashboard-themes/
-   ```
-
-2. **Plugin** — the `dashboard/` directory gets auto-discovered because
-   it lives under `plugins/` in the repo. On a user install, copy the
-   whole plugin directory into `~/.hermes/plugins/`:
-
-   ```
-   cp -r . ~/.hermes/plugins/strike-freedom-cockpit
-   ```
-
-3. Restart the web UI (or `GET /api/dashboard/plugins/rescan`), open it,
-   pick **Strike Freedom** from the theme switcher.
-
-## Customising the artwork
-
-The sidebar plugin reads `--theme-asset-hero` and `--theme-asset-crest`
-from the active theme. Drop your own URLs into the theme YAML:
-
-```yaml
-assets:
-  hero: "/my-images/strike-freedom.png"
-  crest: "/my-images/compass-crest.svg"
-  bg: "/my-images/cosmic-era-bg.jpg"
-```
-
-The plugin reads those at render time — no plugin code changes needed
-to swap artwork across themes.
-
-## What this demo proves
-
-The dashboard skin+plugin system supports (ref: `web/src/themes/types.ts`,
-`web/src/plugins/slots.ts`):
-
-- Palette, typography, font URLs, density, radius — already present
-- **Asset URLs exposed as CSS vars** (bg / hero / crest / logo /
-  sidebar / header + arbitrary `custom.*`)
-- **Raw `customCSS` blocks** injected as scoped `<style>` tags
-- **Per-component style overrides** (card / header / sidebar / backdrop /
-  tab / progress / footer / badge / page) via CSS vars
-- **`layoutVariant`** — `standard`, `cockpit`, or `tiled`
-- **Plugin slots** — 10 named shell slots plugins can inject into
-  (`backdrop`, `header-left/right/banner`, `sidebar`, `pre-main`,
-  `post-main`, `footer-left/right`, `overlay`)
-- **Route overrides** — plugins can replace a built-in page entirely
-  (`tab.override: "/"`) instead of just adding a tab
-- **Hidden plugins** — slot-only plugins that never show in the nav
-  (`tab.hidden: true`) — as used here
diff --git a/plugins/strike-freedom-cockpit/dashboard/dist/index.js b/plugins/strike-freedom-cockpit/dashboard/dist/index.js
deleted file mode 100644
index 7506c80997e..00000000000
--- a/plugins/strike-freedom-cockpit/dashboard/dist/index.js
+++ /dev/null
@@ -1,309 +0,0 @@
-/**
- * Strike Freedom Cockpit — dashboard plugin demo.
- *
- * A slot-only plugin (manifest sets tab.hidden: true) that populates
- * three shell slots when the user has the ``strike-freedom`` theme
- * selected (or any theme that picks layoutVariant: cockpit):
- *
- *   - sidebar       → MS-STATUS panel: ENERGY / SHIELD / POWER bars,
- *                     ZGMF-X20A identity line, pilot block, hero
- *                     render (from --theme-asset-hero when the theme
- *                     provides one).
- *   - header-left   → COMPASS faction crest (uses --theme-asset-crest
- *                     if provided, falls back to a geometric SVG).
- *   - footer-right  → COSMIC ERA tagline that replaces the default
- *                     footer org line.
- *
- * The plugin demonstrates every extension point added alongside the
- * slot system: registerSlot, tab.hidden, reading theme asset CSS vars
- * from plugin code, and rendering above the built-in route content.
- */
-(function () {
-  "use strict";
-
-  const SDK = window.__HERMES_PLUGIN_SDK__;
-  const PLUGINS = window.__HERMES_PLUGINS__;
-  if (!SDK || !PLUGINS || !PLUGINS.registerSlot) {
-    // Old dashboard bundle without slot support — bail silently rather
-    // than breaking the page.
-    return;
-  }
-
-  const { React } = SDK;
-  const { useState, useEffect } = SDK.hooks;
-  const { api } = SDK;
-
-  // ---------------------------------------------------------------------
-  // Helpers
-  // ---------------------------------------------------------------------
-
-  /** Read a CSS custom property from :root. Empty string when unset. */
-  function cssVar(name) {
-    if (typeof document === "undefined") return "";
-    return getComputedStyle(document.documentElement).getPropertyValue(name).trim();
-  }
-
-  /** Segmented chip progress bar — 10 cells filled proportionally to value. */
-  function TelemetryBar(props) {
-    const { label, value, color } = props;
-    const cells = [];
-    for (let i = 0; i < 10; i++) {
-      const filled = Math.round(value / 10) > i;
-      cells.push(
-        React.createElement("span", {
-          key: i,
-          style: {
-            flex: 1,
-            height: 8,
-            background: filled ? color : "rgba(255,255,255,0.06)",
-            transition: "background 200ms",
-            clipPath: "polygon(2px 0, 100% 0, calc(100% - 2px) 100%, 0 100%)",
-          },
-        }),
-      );
-    }
-    return React.createElement(
-      "div",
-      { style: { display: "flex", flexDirection: "column", gap: 4 } },
-      React.createElement(
-        "div",
-        {
-          style: {
-            display: "flex",
-            justifyContent: "space-between",
-            fontSize: "0.65rem",
-            letterSpacing: "0.12em",
-            opacity: 0.75,
-          },
-        },
-        React.createElement("span", null, label),
-        React.createElement("span", { style: { color, fontWeight: 700 } }, value + "%"),
-      ),
-      React.createElement(
-        "div",
-        { style: { display: "flex", gap: 2 } },
-        cells,
-      ),
-    );
-  }
-
-  // ---------------------------------------------------------------------
-  // Sidebar: MS-STATUS panel
-  // ---------------------------------------------------------------------
-
-  function SidebarSlot() {
-    // Pull live-ish numbers from the status API so the plugin isn't just
-    // a static decoration. Fall back to full bars if the API is slow /
-    // unavailable.
-    const [status, setStatus] = useState(null);
-    useEffect(function () {
-      let cancel = false;
-      api.getStatus()
-        .then(function (s) { if (!cancel) setStatus(s); })
-        .catch(function () {});
-      return function () { cancel = true; };
-    }, []);
-
-    // Map real status signals to HUD telemetry. Energy/shield/power
-    // aren't literal concepts on a software agent, so we read them from
-    // adjacent signals: active sessions, gateway connected-platforms,
-    // and agent-online health.
-    const energy = status && status.gateway_online ? 92 : 18;
-    const shield = status && status.connected_platforms
-      ? Math.min(100, 40 + (status.connected_platforms.length * 15))
-      : 70;
-    const power = status && status.active_sessions
-      ? Math.min(100, 55 + (status.active_sessions.length * 10))
-      : 87;
-
-    const hero = cssVar("--theme-asset-hero");
-
-    return React.createElement(
-      "div",
-      {
-        style: {
-          padding: "1rem 0.75rem",
-          display: "flex",
-          flexDirection: "column",
-          gap: "1rem",
-          fontFamily: "var(--theme-font-display, sans-serif)",
-          letterSpacing: "0.08em",
-          textTransform: "uppercase",
-          fontSize: "0.65rem",
-        },
-      },
-      // Header line
-      React.createElement(
-        "div",
-        {
-          style: {
-            borderBottom: "1px solid rgba(64,200,255,0.3)",
-            paddingBottom: 8,
-            display: "flex",
-            flexDirection: "column",
-            gap: 2,
-          },
-        },
-        React.createElement("span", { style: { opacity: 0.6 } }, "ms status"),
-        React.createElement("span", { style: { fontWeight: 700, fontSize: "0.85rem" } }, "zgmf-x20a"),
-        React.createElement("span", { style: { opacity: 0.6, fontSize: "0.6rem" } }, "strike freedom"),
-      ),
-      // Hero slot — only renders when the theme provides one.
-      hero
-        ? React.createElement("div", {
-            style: {
-              width: "100%",
-              aspectRatio: "3 / 4",
-              backgroundImage: hero,
-              backgroundSize: "contain",
-              backgroundPosition: "center",
-              backgroundRepeat: "no-repeat",
-              opacity: 0.85,
-            },
-            "aria-hidden": true,
-          })
-        : React.createElement("div", {
-            style: {
-              width: "100%",
-              aspectRatio: "3 / 4",
-              border: "1px dashed rgba(64,200,255,0.25)",
-              display: "flex",
-              alignItems: "center",
-              justifyContent: "center",
-              fontSize: "0.55rem",
-              opacity: 0.4,
-            },
-          }, "hero slot — set assets.hero in theme"),
-      // Pilot block
-      React.createElement(
-        "div",
-        {
-          style: {
-            borderTop: "1px solid rgba(64,200,255,0.18)",
-            borderBottom: "1px solid rgba(64,200,255,0.18)",
-            padding: "8px 0",
-            display: "flex",
-            flexDirection: "column",
-            gap: 2,
-          },
-        },
-        React.createElement("span", { style: { opacity: 0.5, fontSize: "0.55rem" } }, "pilot"),
-        React.createElement("span", { style: { fontWeight: 700 } }, "hermes agent"),
-        React.createElement("span", { style: { opacity: 0.5, fontSize: "0.55rem" } }, "compass"),
-      ),
-      // Telemetry bars
-      React.createElement(TelemetryBar, { label: "energy",  value: energy, color: "#ffce3a" }),
-      React.createElement(TelemetryBar, { label: "shield",  value: shield, color: "#3fd3ff" }),
-      React.createElement(TelemetryBar, { label: "power",   value: power,  color: "#ff3a5e" }),
-      // System online
-      React.createElement(
-        "div",
-        {
-          style: {
-            marginTop: 4,
-            padding: "6px 8px",
-            border: "1px solid rgba(74,222,128,0.4)",
-            color: "#4ade80",
-            textAlign: "center",
-            fontWeight: 700,
-            fontSize: "0.6rem",
-          },
-        },
-        status && status.gateway_online ? "system online" : "system offline",
-      ),
-    );
-  }
-
-  // ---------------------------------------------------------------------
-  // Header-left: COMPASS crest
-  // ---------------------------------------------------------------------
-
-  function HeaderCrestSlot() {
-    const crest = cssVar("--theme-asset-crest");
-    const inner = crest
-      ? React.createElement("div", {
-          style: {
-            width: 28,
-            height: 28,
-            backgroundImage: crest,
-            backgroundSize: "contain",
-            backgroundPosition: "center",
-            backgroundRepeat: "no-repeat",
-          },
-          "aria-hidden": true,
-        })
-      : React.createElement(
-          "svg",
-          {
-            width: 28,
-            height: 28,
-            viewBox: "0 0 28 28",
-            fill: "none",
-            stroke: "currentColor",
-            strokeWidth: 1.5,
-            "aria-hidden": true,
-          },
-          React.createElement("path", { d: "M14 2 L26 14 L14 26 L2 14 Z" }),
-          React.createElement("path", { d: "M14 8 L20 14 L14 20 L8 14 Z" }),
-          React.createElement("circle", { cx: 14, cy: 14, r: 2, fill: "currentColor" }),
-        );
-    return React.createElement(
-      "div",
-      {
-        style: {
-          display: "flex",
-          alignItems: "center",
-          paddingLeft: 12,
-          paddingRight: 8,
-          color: "var(--color-accent, #3fd3ff)",
-        },
-      },
-      inner,
-    );
-  }
-
-  // ---------------------------------------------------------------------
-  // Footer-right: COSMIC ERA tagline
-  // ---------------------------------------------------------------------
-
-  function FooterTaglineSlot() {
-    return React.createElement(
-      "span",
-      {
-        style: {
-          fontFamily: "var(--theme-font-display, sans-serif)",
-          fontSize: "0.6rem",
-          letterSpacing: "0.18em",
-          textTransform: "uppercase",
-          opacity: 0.75,
-          mixBlendMode: "plus-lighter",
-        },
-      },
-      "compass hermes systems / cosmic era 71",
-    );
-  }
-
-  // ---------------------------------------------------------------------
-  // Hidden tab placeholder — tab.hidden=true means this never renders in
-  // the nav, but we still register something sensible in case someone
-  // manually navigates to /strike-freedom-cockpit (e.g. via a bookmark).
-  // ---------------------------------------------------------------------
-
-  function HiddenPage() {
-    return React.createElement(
-      "div",
-      { style: { padding: "2rem", opacity: 0.6, fontSize: "0.8rem" } },
-      "Strike Freedom cockpit is a slot-only plugin — it populates the sidebar, header, and footer instead of showing a tab page.",
-    );
-  }
-
-  // ---------------------------------------------------------------------
-  // Registration
-  // ---------------------------------------------------------------------
-
-  const NAME = "strike-freedom-cockpit";
-  PLUGINS.register(NAME, HiddenPage);
-  PLUGINS.registerSlot(NAME, "sidebar", SidebarSlot);
-  PLUGINS.registerSlot(NAME, "header-left", HeaderCrestSlot);
-  PLUGINS.registerSlot(NAME, "footer-right", FooterTaglineSlot);
-})();
diff --git a/plugins/strike-freedom-cockpit/dashboard/manifest.json b/plugins/strike-freedom-cockpit/dashboard/manifest.json
deleted file mode 100644
index fec3c79eff9..00000000000
--- a/plugins/strike-freedom-cockpit/dashboard/manifest.json
+++ /dev/null
@@ -1,14 +0,0 @@
-{
-  "name": "strike-freedom-cockpit",
-  "label": "Strike Freedom Cockpit",
-  "description": "MS-STATUS sidebar + header crest for the Strike Freedom theme",
-  "icon": "Shield",
-  "version": "1.0.0",
-  "tab": {
-    "path": "/strike-freedom-cockpit",
-    "position": "end",
-    "hidden": true
-  },
-  "slots": ["sidebar", "header-left", "footer-right"],
-  "entry": "dist/index.js"
-}
diff --git a/plugins/strike-freedom-cockpit/theme/strike-freedom.yaml b/plugins/strike-freedom-cockpit/theme/strike-freedom.yaml
deleted file mode 100644
index ebbcf11841b..00000000000
--- a/plugins/strike-freedom-cockpit/theme/strike-freedom.yaml
+++ /dev/null
@@ -1,126 +0,0 @@
-# Strike Freedom — Hermes dashboard theme demo
-#
-# Copy this file to ~/.hermes/dashboard-themes/strike-freedom.yaml and
-# restart the web UI (or hit `/api/dashboard/plugins/rescan`). Pair with
-# the `strike-freedom-cockpit` plugin (plugins/strike-freedom-cockpit/)
-# for the full cockpit experience — this theme paints the palette,
-# chrome, and layout; the plugin supplies the MS-STATUS sidebar + header
-# crest that the cockpit layout variant reserves space for.
-#
-# Demonstrates every theme extension point added alongside the plugin
-# slot system: palette, typography, layoutVariant, assets, customCSS,
-# componentStyles, colorOverrides.
-name: strike-freedom
-label: "Strike Freedom"
-description: "Cockpit HUD — deep navy + cyan + gold accents"
-
-# ------- palette (3-layer) -------
-palette:
-  background: "#05091a"
-  midground: "#d8f0ff"
-  foreground:
-    hex: "#ffffff"
-    alpha: 0
-  warmGlow: "rgba(255, 199, 55, 0.24)"
-  noiseOpacity: 0.7
-
-# ------- typography -------
-typography:
-  fontSans: '"Orbitron", "Eurostile", "Bank Gothic", "Impact", sans-serif'
-  fontMono: '"Share Tech Mono", "JetBrains Mono", ui-monospace, monospace'
-  fontDisplay: '"Orbitron", "Eurostile", "Impact", sans-serif'
-  fontUrl: "https://fonts.googleapis.com/css2?family=Orbitron:wght@400;500;600;700;800&family=Share+Tech+Mono&display=swap"
-  baseSize: "14px"
-  lineHeight: "1.5"
-  letterSpacing: "0.04em"
-
-# ------- layout -------
-layout:
-  radius: "0"
-  density: "compact"
-
-# ``cockpit`` reserves a 260px left rail that the shell renders when the
-# user is on this theme. A paired plugin populates the rail via the
-# ``sidebar`` slot; with no plugin the rail shows a placeholder.
-layoutVariant: cockpit
-
-# ------- assets -------
-# Use any URL (https, data:, /dashboard-plugins/...) or a pre-wrapped
-# ``url(...)``/``linear-gradient(...)`` expression. The shell exposes
-# each as a CSS var so plugins can read the same imagery.
-assets:
-  bg: "linear-gradient(140deg, #05091a 0%, #0a1530 55%, #102048 100%)"
-  # Plugin reads --theme-asset-hero / --theme-asset-crest to populate
-  # its sidebar hero render + header crest. Replace these URLs with your
-  # own artwork (copy files into ~/.hermes/dashboard-themes/assets/ and
-  # reference them as /dashboard-themes-assets/strike-freedom/hero.png
-  # once that static route is wired up — for now use inline data URLs or
-  # remote URLs).
-  hero: ""
-  crest: ""
-
-# ------- component chrome -------
-# Each bucket's props become CSS vars (--component-<bucket>-<kebab>) that
-# built-in shell components (Card, header, sidebar, backdrop) consume.
-componentStyles:
-  card:
-    # Notched corners on the top-left + bottom-right — classic mecha UI.
-    clipPath: "polygon(12px 0, 100% 0, 100% calc(100% - 12px), calc(100% - 12px) 100%, 0 100%, 0 12px)"
-    background: "linear-gradient(180deg, rgba(10, 22, 52, 0.85) 0%, rgba(5, 9, 26, 0.92) 100%)"
-    boxShadow: "inset 0 0 0 1px rgba(64, 200, 255, 0.28), 0 0 18px -6px rgba(64, 200, 255, 0.4)"
-  header:
-    background: "linear-gradient(180deg, rgba(16, 32, 72, 0.95) 0%, rgba(5, 9, 26, 0.9) 100%)"
-  sidebar:
-    background: "linear-gradient(180deg, rgba(8, 18, 42, 0.88) 0%, rgba(5, 9, 26, 0.85) 100%)"
-  tab:
-    clipPath: "polygon(6px 0, 100% 0, calc(100% - 6px) 100%, 0 100%)"
-  backdrop:
-    backgroundSize: "cover"
-    backgroundPosition: "center"
-    fillerOpacity: "1"
-    fillerBlendMode: "normal"
-
-# ------- color overrides -------
-colorOverrides:
-  primary: "#ffce3a"
-  primaryForeground: "#05091a"
-  accent: "#3fd3ff"
-  accentForeground: "#05091a"
-  ring: "#3fd3ff"
-  success: "#4ade80"
-  warning: "#ffce3a"
-  destructive: "#ff3a5e"
-  border: "rgba(64, 200, 255, 0.28)"
-
-# ------- customCSS -------
-# Raw CSS injected as a scoped <style> tag on theme apply. Use this for
-# selector-level tweaks componentStyles can't express (pseudo-elements,
-# animations, media queries). Bounded to 32 KiB per theme.
-customCSS: |
-  /* Scanline overlay — subtle, only when theme is active. */
-  :root[data-layout-variant="cockpit"] body::before {
-    content: "";
-    position: fixed;
-    inset: 0;
-    pointer-events: none;
-    z-index: 100;
-    background: repeating-linear-gradient(
-      to bottom,
-      transparent 0px,
-      transparent 2px,
-      rgba(64, 200, 255, 0.035) 3px,
-      rgba(64, 200, 255, 0.035) 4px
-    );
-    mix-blend-mode: screen;
-  }
-
-  /* Chevron pips on card corners. */
-  [data-layout-variant="cockpit"] .border-border::before,
-  [data-layout-variant="cockpit"] .border-border::after {
-    content: "";
-    position: absolute;
-    width: 8px;
-    height: 8px;
-    border: 1px solid rgba(64, 200, 255, 0.55);
-    pointer-events: none;
-  }
diff --git a/tests/agent/test_plugin_llm.py b/tests/agent/test_plugin_llm.py
new file mode 100644
index 00000000000..b31f8097a7e
--- /dev/null
+++ b/tests/agent/test_plugin_llm.py
@@ -0,0 +1,991 @@
+"""Unit tests for the plugin LLM facade (``agent.plugin_llm``).
+
+These tests exercise the trust gate, JSON parsing, schema validation,
+image input encoding, and the auxiliary-client invocation contract.
+The auxiliary client itself is stubbed via ``make_plugin_llm_for_test``
+so we don't hit real providers.
+"""
+
+from __future__ import annotations
+
+import asyncio
+import base64
+import json
+from types import SimpleNamespace
+from typing import Any
+from unittest.mock import MagicMock
+
+import pytest
+
+from agent.plugin_llm import (
+    PluginLlm,
+    PluginLlmCompleteResult,
+    PluginLlmImageInput,
+    PluginLlmStructuredResult,
+    PluginLlmTextInput,
+    PluginLlmTrustError,
+    _build_structured_messages,
+    _check_overrides,
+    _coerce_allowlist,
+    _parse_structured_text,
+    _strip_code_fences,
+    _TrustPolicy,
+    make_plugin_llm_for_test,
+)
+
+
+# ---------------------------------------------------------------------------
+# Helpers
+# ---------------------------------------------------------------------------
+
+
+def _fake_response(text: str, *, prompt: int = 4, completion: int = 6) -> SimpleNamespace:
+    """Build an OpenAI-shaped response with the given text + token usage."""
+    return SimpleNamespace(
+        choices=[
+            SimpleNamespace(
+                message=SimpleNamespace(content=text, role="assistant"),
+                finish_reason="stop",
+            )
+        ],
+        usage=SimpleNamespace(
+            prompt_tokens=prompt,
+            completion_tokens=completion,
+            total_tokens=prompt + completion,
+        ),
+    )
+
+
+def _trusted_policy(plugin_id: str = "trusted-plugin", **overrides: Any) -> _TrustPolicy:
+    defaults = dict(
+        allow_provider_override=True,
+        allowed_providers=None,
+        allow_any_provider=True,
+        allow_model_override=True,
+        allowed_models=None,
+        allow_any_model=True,
+        allow_agent_id_override=True,
+        allow_profile_override=True,
+    )
+    defaults.update(overrides)
+    return _TrustPolicy(plugin_id=plugin_id, **defaults)
+
+
+# ---------------------------------------------------------------------------
+# Trust gate
+# ---------------------------------------------------------------------------
+
+
+class TestTrustGate:
+    def test_default_policy_blocks_provider_override(self):
+        policy = _TrustPolicy(plugin_id="locked")
+        with pytest.raises(PluginLlmTrustError, match="cannot override the provider"):
+            _check_overrides(
+                policy,
+                requested_provider="anthropic",
+                requested_model=None,
+                requested_agent_id=None,
+                requested_profile=None,
+            )
+
+    def test_default_policy_blocks_model_override(self):
+        policy = _TrustPolicy(plugin_id="locked")
+        with pytest.raises(PluginLlmTrustError, match="cannot override the model"):
+            _check_overrides(
+                policy,
+                requested_provider=None,
+                requested_model="claude-3-5-sonnet",
+                requested_agent_id=None,
+                requested_profile=None,
+            )
+
+    def test_default_policy_blocks_agent_override(self):
+        policy = _TrustPolicy(plugin_id="locked")
+        with pytest.raises(PluginLlmTrustError, match="non-default agent id"):
+            _check_overrides(
+                policy,
+                requested_provider=None,
+                requested_model=None,
+                requested_agent_id="ada",
+                requested_profile=None,
+            )
+
+    def test_default_policy_blocks_profile_override(self):
+        policy = _TrustPolicy(plugin_id="locked")
+        with pytest.raises(PluginLlmTrustError, match="cannot override the auth profile"):
+            _check_overrides(
+                policy,
+                requested_provider=None,
+                requested_model=None,
+                requested_agent_id=None,
+                requested_profile="work",
+            )
+
+    def test_overrides_independent(self):
+        """Each override is gated independently — turning on
+        ``allow_model_override`` does NOT also grant provider override."""
+        policy = _TrustPolicy(
+            plugin_id="model-only",
+            allow_model_override=True,
+            allow_any_model=True,
+        )
+        # model alone passes
+        _, m, _, _ = _check_overrides(
+            policy,
+            requested_provider=None,
+            requested_model="gpt-4o",
+            requested_agent_id=None,
+            requested_profile=None,
+        )
+        assert m == "gpt-4o"
+        # provider alone is still denied
+        with pytest.raises(PluginLlmTrustError, match="cannot override the provider"):
+            _check_overrides(
+                policy,
+                requested_provider="anthropic",
+                requested_model=None,
+                requested_agent_id=None,
+                requested_profile=None,
+            )
+
+    def test_provider_allowlist_rejects_non_listed(self):
+        policy = _TrustPolicy(
+            plugin_id="restricted",
+            allow_provider_override=True,
+            allowed_providers=frozenset({"openrouter", "anthropic"}),
+            allow_any_provider=False,
+        )
+        with pytest.raises(PluginLlmTrustError, match="not in plugins.entries"):
+            _check_overrides(
+                policy,
+                requested_provider="openai",
+                requested_model=None,
+                requested_agent_id=None,
+                requested_profile=None,
+            )
+
+    def test_provider_allowlist_accepts_listed_case_insensitively(self):
+        policy = _TrustPolicy(
+            plugin_id="restricted",
+            allow_provider_override=True,
+            allowed_providers=frozenset({"openrouter"}),
+            allow_any_provider=False,
+        )
+        p, _, _, _ = _check_overrides(
+            policy,
+            requested_provider="OpenRouter",
+            requested_model=None,
+            requested_agent_id=None,
+            requested_profile=None,
+        )
+        assert p == "OpenRouter"
+
+    def test_model_allowlist_rejects_non_listed(self):
+        policy = _TrustPolicy(
+            plugin_id="restricted",
+            allow_model_override=True,
+            allowed_models=frozenset({"openai/gpt-4o-mini"}),
+            allow_any_model=False,
+        )
+        with pytest.raises(PluginLlmTrustError, match="not in plugins.entries"):
+            _check_overrides(
+                policy,
+                requested_provider=None,
+                requested_model="anthropic/claude-3-opus",
+                requested_agent_id=None,
+                requested_profile=None,
+            )
+
+    def test_model_allowlist_accepts_listed_case_insensitively(self):
+        policy = _TrustPolicy(
+            plugin_id="restricted",
+            allow_model_override=True,
+            allowed_models=frozenset({"openai/gpt-4o-mini"}),
+            allow_any_model=False,
+        )
+        _, m, _, _ = _check_overrides(
+            policy,
+            requested_provider=None,
+            requested_model="OpenAI/GPT-4o-mini",
+            requested_agent_id=None,
+            requested_profile=None,
+        )
+        assert m == "OpenAI/GPT-4o-mini"
+
+    def test_no_overrides_passes_through(self):
+        policy = _TrustPolicy(plugin_id="locked")
+        result = _check_overrides(
+            policy,
+            requested_provider=None,
+            requested_model=None,
+            requested_agent_id=None,
+            requested_profile=None,
+        )
+        assert result == (None, None, None, None)
+
+    def test_all_overrides_when_fully_trusted(self):
+        policy = _trusted_policy()
+        result = _check_overrides(
+            policy,
+            requested_provider="openrouter",
+            requested_model="anthropic/claude-3-5-sonnet",
+            requested_agent_id="ada",
+            requested_profile="work",
+        )
+        assert result == ("openrouter", "anthropic/claude-3-5-sonnet", "ada", "work")
+
+
+class TestAllowlistCoercion:
+    def test_missing_yields_none(self):
+        ranges, allow_any = _coerce_allowlist(None)
+        assert ranges is None
+        assert allow_any is False
+
+    def test_list_of_strings(self):
+        ranges, allow_any = _coerce_allowlist(["A", "B"])
+        assert ranges == frozenset({"a", "b"})
+        assert allow_any is False
+
+    def test_star_alone_means_any(self):
+        ranges, allow_any = _coerce_allowlist(["*"])
+        assert ranges == frozenset()
+        assert allow_any is True
+
+    def test_star_plus_specific_keeps_specifics(self):
+        ranges, allow_any = _coerce_allowlist(["*", "openrouter"])
+        assert ranges == frozenset({"openrouter"})
+        assert allow_any is True
+
+    def test_non_list_yields_none(self):
+        ranges, allow_any = _coerce_allowlist("openrouter")
+        assert ranges is None
+        assert allow_any is False
+
+
+# ---------------------------------------------------------------------------
+# Structured message building
+# ---------------------------------------------------------------------------
+
+
+class TestStructuredMessageBuilding:
+    def test_text_only_input(self):
+        messages = _build_structured_messages(
+            instructions="Extract the action items",
+            inputs=[PluginLlmTextInput(text="meeting notes go here")],
+            json_mode=False,
+            json_schema=None,
+            schema_name=None,
+            system_prompt=None,
+        )
+        assert len(messages) == 1
+        assert messages[0]["role"] == "user"
+        parts = messages[0]["content"]
+        assert parts[0]["type"] == "text"
+        assert "Extract the action items" in parts[0]["text"]
+        assert parts[1] == {"type": "text", "text": "meeting notes go here"}
+
+    def test_json_mode_adds_system_directive(self):
+        messages = _build_structured_messages(
+            instructions="Summarise",
+            inputs=[PluginLlmTextInput(text="content")],
+            json_mode=True,
+            json_schema=None,
+            schema_name=None,
+            system_prompt=None,
+        )
+        assert messages[0]["role"] == "system"
+        assert "JSON object" in messages[0]["content"]
+
+    def test_schema_name_appended_to_header(self):
+        messages = _build_structured_messages(
+            instructions="Extract fields",
+            inputs=[PluginLlmTextInput(text="data")],
+            json_mode=False,
+            json_schema=None,
+            schema_name="action.items",
+            system_prompt=None,
+        )
+        header = messages[0]["content"][0]["text"]
+        assert "Schema name: action.items" in header
+
+    def test_image_bytes_encoded_as_data_url(self):
+        png_bytes = b"\x89PNG\r\n\x1a\nfake"
+        messages = _build_structured_messages(
+            instructions="Read the image",
+            inputs=[
+                PluginLlmImageInput(data=png_bytes, mime_type="image/png"),
+                PluginLlmTextInput(text="prefer printed text"),
+            ],
+            json_mode=False,
+            json_schema=None,
+            schema_name=None,
+            system_prompt=None,
+        )
+        parts = messages[0]["content"]
+        assert parts[1]["type"] == "image_url"
+        url = parts[1]["image_url"]["url"]
+        assert url.startswith("data:image/png;base64,")
+        decoded = base64.b64decode(url.split(",", 1)[1])
+        assert decoded == png_bytes
+        assert parts[2] == {"type": "text", "text": "prefer printed text"}
+
+    def test_image_url_passed_through(self):
+        messages = _build_structured_messages(
+            instructions="Caption this",
+            inputs=[PluginLlmImageInput(url="https://example.com/cat.jpg")],
+            json_mode=False,
+            json_schema=None,
+            schema_name=None,
+            system_prompt=None,
+        )
+        img_part = messages[0]["content"][1]
+        assert img_part["type"] == "image_url"
+        assert img_part["image_url"]["url"] == "https://example.com/cat.jpg"
+
+    def test_dict_inputs_normalized(self):
+        messages = _build_structured_messages(
+            instructions="Test",
+            inputs=[
+                {"type": "text", "text": "hello"},
+                {"type": "image", "url": "https://x.example/y.png"},
+            ],
+            json_mode=False,
+            json_schema=None,
+            schema_name=None,
+            system_prompt=None,
+        )
+        parts = messages[0]["content"]
+        assert parts[1]["text"] == "hello"
+        assert parts[2]["image_url"]["url"] == "https://x.example/y.png"
+
+    def test_invalid_input_block_rejected(self):
+        with pytest.raises(ValueError, match="Unknown input block"):
+            _build_structured_messages(
+                instructions="Test",
+                inputs=[{"type": "audio", "data": b""}],
+                json_mode=False,
+                json_schema=None,
+                schema_name=None,
+                system_prompt=None,
+            )
+
+
+# ---------------------------------------------------------------------------
+# JSON parsing
+# ---------------------------------------------------------------------------
+
+
+class TestJsonParsing:
+    def test_strip_code_fences_with_json_label(self):
+        assert _strip_code_fences('```json\n{"a":1}\n```') == '{"a":1}'
+
+    def test_strip_code_fences_without_label(self):
+        assert _strip_code_fences("```\nfoo\n```") == "foo"
+
+    def test_strip_code_fences_no_fence(self):
+        assert _strip_code_fences('{"a":1}') == '{"a":1}'
+
+    def test_parse_returns_text_when_not_json_mode(self):
+        parsed, ct = _parse_structured_text(
+            text='{"a": 1}', json_mode=False, json_schema=None
+        )
+        assert parsed is None
+        assert ct == "text"
+
+    def test_parse_valid_json_with_json_mode(self):
+        parsed, ct = _parse_structured_text(
+            text='{"language": "French", "is_question": true}',
+            json_mode=True,
+            json_schema=None,
+        )
+        assert parsed == {"language": "French", "is_question": True}
+        assert ct == "json"
+
+    def test_parse_strips_code_fences_before_loading(self):
+        parsed, ct = _parse_structured_text(
+            text='Here you go:\n```json\n{"ok": true}\n```',
+            json_mode=True,
+            json_schema=None,
+        )
+        assert parsed == {"ok": True}
+        assert ct == "json"
+
+    def test_parse_returns_text_on_invalid_json(self):
+        parsed, ct = _parse_structured_text(
+            text="not even close to json",
+            json_mode=True,
+            json_schema=None,
+        )
+        assert parsed is None
+        assert ct == "text"
+
+    def test_schema_validation_rejects_mismatch(self):
+        pytest.importorskip("jsonschema")
+        schema = {
+            "type": "object",
+            "properties": {"language": {"type": "string"}},
+            "required": ["language"],
+        }
+        with pytest.raises(ValueError, match="did not match schema"):
+            _parse_structured_text(
+                text='{"is_question": true}',
+                json_mode=False,
+                json_schema=schema,
+            )
+
+    def test_schema_validation_accepts_match(self):
+        pytest.importorskip("jsonschema")
+        schema = {
+            "type": "object",
+            "properties": {"language": {"type": "string"}},
+            "required": ["language"],
+        }
+        parsed, ct = _parse_structured_text(
+            text='{"language": "French"}',
+            json_mode=False,
+            json_schema=schema,
+        )
+        assert parsed == {"language": "French"}
+        assert ct == "json"
+
+
+# ---------------------------------------------------------------------------
+# End-to-end facade
+# ---------------------------------------------------------------------------
+
+
+class TestPluginLlmFacade:
+    def test_complete_uses_active_model_by_default(self):
+        captured: dict = {}
+
+        def fake_caller(**kwargs):
+            captured.update(kwargs)
+            return "auto", "default", _fake_response("Hello world.")
+
+        llm = make_plugin_llm_for_test(
+            plugin_id="my-plugin",
+            policy=_TrustPolicy(plugin_id="my-plugin"),
+            sync_caller=fake_caller,
+        )
+        result = llm.complete([{"role": "user", "content": "hi"}])
+        assert isinstance(result, PluginLlmCompleteResult)
+        assert result.text == "Hello world."
+        assert captured["provider_override"] is None
+        assert captured["model_override"] is None
+        assert captured["profile_override"] is None
+        assert result.usage.input_tokens == 4
+        assert result.usage.total_tokens == 10
+
+    def test_complete_rejects_provider_override_without_trust(self):
+        llm = make_plugin_llm_for_test(
+            plugin_id="my-plugin",
+            policy=_TrustPolicy(plugin_id="my-plugin"),
+            sync_caller=lambda **_: ("x", "y", _fake_response("")),
+        )
+        with pytest.raises(PluginLlmTrustError, match="cannot override the provider"):
+            llm.complete(
+                [{"role": "user", "content": "hi"}],
+                provider="openrouter",
+            )
+
+    def test_complete_rejects_model_override_without_trust(self):
+        llm = make_plugin_llm_for_test(
+            plugin_id="my-plugin",
+            policy=_TrustPolicy(plugin_id="my-plugin"),
+            sync_caller=lambda **_: ("x", "y", _fake_response("")),
+        )
+        with pytest.raises(PluginLlmTrustError, match="cannot override the model"):
+            llm.complete(
+                [{"role": "user", "content": "hi"}],
+                model="anthropic/claude-3-opus",
+            )
+
+    def test_complete_passes_through_trusted_overrides(self):
+        captured: dict = {}
+
+        def fake_caller(**kwargs):
+            captured.update(kwargs)
+            return "anthropic", "claude-3-opus", _fake_response("ok")
+
+        llm = make_plugin_llm_for_test(
+            plugin_id="my-plugin",
+            policy=_trusted_policy("my-plugin"),
+            sync_caller=fake_caller,
+        )
+        result = llm.complete(
+            [{"role": "user", "content": "hi"}],
+            provider="anthropic",
+            model="claude-3-opus",
+            profile="work",
+            agent_id="ada",
+            temperature=0.0,
+            max_tokens=128,
+            timeout=10.0,
+            purpose="extract",
+        )
+        # The recorded provider/model in the result come from the override,
+        # since the stub caller echoed those values.
+        assert result.provider == "anthropic"
+        assert result.model == "claude-3-opus"
+        assert captured["provider_override"] == "anthropic"
+        assert captured["model_override"] == "claude-3-opus"
+        assert captured["profile_override"] == "work"
+        assert captured["temperature"] == 0.0
+        assert captured["max_tokens"] == 128
+        assert captured["timeout"] == 10.0
+
+    def test_complete_structured_returns_parsed_json(self):
+        def fake_caller(**_kwargs):
+            return "openai", "gpt-4o", _fake_response(
+                '{"language": "French", "is_question": true, "confidence": 0.99}'
+            )
+
+        llm = make_plugin_llm_for_test(
+            plugin_id="my-plugin",
+            policy=_TrustPolicy(plugin_id="my-plugin"),
+            sync_caller=fake_caller,
+        )
+        result = llm.complete_structured(
+            instructions="Detect language",
+            input=[PluginLlmTextInput(text="Comment ça va?")],
+            json_mode=True,
+        )
+        assert isinstance(result, PluginLlmStructuredResult)
+        assert result.parsed == {
+            "language": "French",
+            "is_question": True,
+            "confidence": 0.99,
+        }
+        assert result.content_type == "json"
+
+    def test_complete_structured_returns_text_on_unparseable_response(self):
+        def fake_caller(**_kwargs):
+            return "openai", "gpt-4o", _fake_response("Sorry, I can't help with that.")
+
+        llm = make_plugin_llm_for_test(
+            plugin_id="my-plugin",
+            policy=_TrustPolicy(plugin_id="my-plugin"),
+            sync_caller=fake_caller,
+        )
+        result = llm.complete_structured(
+            instructions="Detect language",
+            input=[PluginLlmTextInput(text="x")],
+            json_mode=True,
+        )
+        assert result.parsed is None
+        assert result.content_type == "text"
+        assert result.text.startswith("Sorry")
+
+    def test_complete_structured_validates_against_schema(self):
+        pytest.importorskip("jsonschema")
+
+        def fake_caller(**_kwargs):
+            return "openai", "gpt-4o", _fake_response('{"unrelated": "field"}')
+
+        llm = make_plugin_llm_for_test(
+            plugin_id="my-plugin",
+            policy=_TrustPolicy(plugin_id="my-plugin"),
+            sync_caller=fake_caller,
+        )
+        schema = {
+            "type": "object",
+            "properties": {"language": {"type": "string"}},
+            "required": ["language"],
+        }
+        with pytest.raises(ValueError, match="did not match schema"):
+            llm.complete_structured(
+                instructions="Detect language",
+                input=[PluginLlmTextInput(text="x")],
+                json_schema=schema,
+            )
+
+    def test_complete_structured_requires_instructions(self):
+        llm = make_plugin_llm_for_test(
+            plugin_id="my-plugin",
+            policy=_TrustPolicy(plugin_id="my-plugin"),
+            sync_caller=MagicMock(),
+        )
+        with pytest.raises(ValueError, match="non-empty instructions"):
+            llm.complete_structured(
+                instructions="   ",
+                input=[PluginLlmTextInput(text="x")],
+            )
+
+    def test_complete_structured_requires_at_least_one_input(self):
+        llm = make_plugin_llm_for_test(
+            plugin_id="my-plugin",
+            policy=_TrustPolicy(plugin_id="my-plugin"),
+            sync_caller=MagicMock(),
+        )
+        with pytest.raises(ValueError, match="at least one input"):
+            llm.complete_structured(
+                instructions="Extract",
+                input=[],
+            )
+
+    def test_complete_structured_emits_response_format_extra_body(self):
+        captured: dict = {}
+
+        def fake_caller(**kwargs):
+            captured.update(kwargs)
+            return "openai", "gpt-4o", _fake_response('{"a": 1}')
+
+        llm = make_plugin_llm_for_test(
+            plugin_id="my-plugin",
+            policy=_TrustPolicy(plugin_id="my-plugin"),
+            sync_caller=fake_caller,
+        )
+        schema = {"type": "object"}
+        llm.complete_structured(
+            instructions="Test",
+            input=[PluginLlmTextInput(text="x")],
+            json_schema=schema,
+        )
+        rf = captured["extra_body"]["response_format"]
+        assert rf["type"] == "json_schema"
+        assert rf["json_schema"]["schema"] == schema
+
+    def test_complete_structured_with_image_passes_image_url_part(self):
+        captured: dict = {}
+
+        def fake_caller(**kwargs):
+            captured.update(kwargs)
+            return "openai", "gpt-4o", _fake_response('{"caption": "ok"}')
+
+        llm = make_plugin_llm_for_test(
+            plugin_id="my-plugin",
+            policy=_TrustPolicy(plugin_id="my-plugin"),
+            sync_caller=fake_caller,
+        )
+        png = b"fake-bytes"
+        llm.complete_structured(
+            instructions="Caption this",
+            input=[PluginLlmImageInput(data=png, mime_type="image/png")],
+            json_mode=True,
+        )
+        msgs = captured["messages"]
+        user_msg = next(m for m in msgs if m["role"] == "user")
+        image_parts = [p for p in user_msg["content"] if p.get("type") == "image_url"]
+        assert len(image_parts) == 1
+        assert image_parts[0]["image_url"]["url"].startswith("data:image/png;base64,")
+
+
+# ---------------------------------------------------------------------------
+# Async surface
+# ---------------------------------------------------------------------------
+
+
+class TestAsyncSurface:
+    def test_acomplete_uses_async_caller(self):
+        async def fake_async(**_kwargs):
+            return "openai", "gpt-4o", _fake_response("async hello")
+
+        llm = make_plugin_llm_for_test(
+            plugin_id="my-plugin",
+            policy=_TrustPolicy(plugin_id="my-plugin"),
+            async_caller=fake_async,
+        )
+
+        async def _run() -> PluginLlmCompleteResult:
+            return await llm.acomplete([{"role": "user", "content": "hi"}])
+
+        result = asyncio.run(_run())
+        assert result.text == "async hello"
+        assert result.provider == "openai"
+
+    def test_acomplete_structured_parses_json(self):
+        async def fake_async(**_kwargs):
+            return "openai", "gpt-4o", _fake_response('{"x": 42}')
+
+        llm = make_plugin_llm_for_test(
+            plugin_id="my-plugin",
+            policy=_TrustPolicy(plugin_id="my-plugin"),
+            async_caller=fake_async,
+        )
+
+        async def _run() -> PluginLlmStructuredResult:
+            return await llm.acomplete_structured(
+                instructions="Extract x",
+                input=[PluginLlmTextInput(text="data")],
+                json_mode=True,
+            )
+
+        result = asyncio.run(_run())
+        assert result.parsed == {"x": 42}
+        assert result.content_type == "json"
+
+
+# ---------------------------------------------------------------------------
+# Config-driven trust gate (round-trip via plugins.entries.<id>.llm)
+# ---------------------------------------------------------------------------
+
+
+class TestConfigDrivenPolicy:
+    def test_policy_loaded_from_yaml(self, tmp_path, monkeypatch):
+        from agent.plugin_llm import _resolve_trust_policy
+
+        hermes_home = tmp_path / ".hermes"
+        hermes_home.mkdir()
+        (hermes_home / "config.yaml").write_text(
+            """
+plugins:
+  entries:
+    my-plugin:
+      llm:
+        allow_provider_override: true
+        allowed_providers: [openrouter, anthropic]
+        allow_model_override: true
+        allowed_models:
+          - openai/gpt-4o-mini
+          - anthropic/claude-3-5-haiku
+        allow_profile_override: false
+""",
+            encoding="utf-8",
+        )
+        monkeypatch.setenv("HERMES_HOME", str(hermes_home))
+        from hermes_cli import config as _config_mod
+        # Reset the cached config via monkeypatch so teardown restores it.
+        monkeypatch.setattr(_config_mod, "_config_cache", None, raising=False)
+
+        policy = _resolve_trust_policy("my-plugin")
+        assert policy.allow_provider_override is True
+        assert policy.allow_model_override is True
+        assert policy.allow_profile_override is False
+        assert policy.allowed_providers == frozenset({"openrouter", "anthropic"})
+        expected_models = {"openai/gpt-4o-mini", "anthropic/claude-3-5-haiku"}
+        assert policy.allowed_models == frozenset(expected_models)
+
+    def test_missing_plugin_entry_yields_default_deny(self, tmp_path, monkeypatch):
+        from agent.plugin_llm import _resolve_trust_policy
+
+        hermes_home = tmp_path / ".hermes"
+        hermes_home.mkdir()
+        (hermes_home / "config.yaml").write_text("plugins: {}\n", encoding="utf-8")
+        monkeypatch.setenv("HERMES_HOME", str(hermes_home))
+        from hermes_cli import config as _config_mod
+        # Reset the cached config via monkeypatch so teardown restores it.
+        monkeypatch.setattr(_config_mod, "_config_cache", None, raising=False)
+
+        policy = _resolve_trust_policy("never-configured")
+        for flag in ("allow_provider_override", "allow_model_override",
+                     "allow_profile_override", "allow_agent_id_override"):
+            assert getattr(policy, flag) is False, flag
+
+
+# ---------------------------------------------------------------------------
+# Plugin context wiring
+# ---------------------------------------------------------------------------
+
+
+class TestPluginContextIntegration:
+    def test_ctx_llm_is_lazy_singleton(self):
+        from hermes_cli.plugins import PluginContext, PluginManifest, PluginManager
+
+        spec = PluginManifest(name="test-plugin", source="test", key="test-plugin")
+        context = PluginContext(spec, PluginManager())
+        # Two reads of the attribute must hand back the very same facade.
+        handle_a, handle_b = context.llm, context.llm
+        assert handle_a is handle_b
+        assert isinstance(handle_a, PluginLlm)
+        owner = handle_a._plugin_id  # type: ignore[attr-defined]
+        assert owner == "test-plugin"
+
+    def test_ctx_llm_uses_manifest_key_for_policy(self):
+        from hermes_cli.plugins import PluginContext, PluginManifest, PluginManager
+
+        # ``name`` and ``key`` differ here, so the assert shows which one is used.
+        spec = PluginManifest(name="bare-name", source="test", key="image_gen/openai")
+        context = PluginContext(spec, PluginManager())
+        facade = context.llm
+        owner = facade._plugin_id  # type: ignore[attr-defined]
+        assert owner == "image_gen/openai"
+
+
+# ---------------------------------------------------------------------------
+# Attribution (result.provider / result.model / audit log)
+# ---------------------------------------------------------------------------
+
+
+class TestAttribution:
+    """Attribution checks for ``_resolve_attribution``: the recorded
+    provider/model come from the overrides, the response, or the main
+    config readers — 'auto' / 'default' placeholders are the last resort."""
+
+    def test_explicit_overrides_recorded_when_no_response_model(self):
+        from agent.plugin_llm import _resolve_attribution
+
+        # No ``model`` attribute on the reply, so the overrides stand.
+        reply = SimpleNamespace(choices=[], usage=None)
+        got_provider, got_model = _resolve_attribution(
+            response=reply,
+            provider_override="openrouter",
+            model_override="anthropic/claude-3-5-sonnet",
+        )
+        assert got_provider == "openrouter"
+        assert got_model == "anthropic/claude-3-5-sonnet"
+
+    def test_response_model_wins_over_model_override(self):
+        """A provider may report a more specific model id than the one
+        requested (``gpt-4o`` → ``gpt-4o-2024-08-06``); the recorded
+        model must be the reported one."""
+        from agent.plugin_llm import _resolve_attribution
+
+        reply = SimpleNamespace(model="gpt-4o-2024-08-06", choices=[])
+        got_provider, got_model = _resolve_attribution(
+            response=reply,
+            provider_override="openrouter",
+            model_override="openai/gpt-4o",
+        )
+        # ``response.model`` only affects the model half of the pair.
+        assert got_provider == "openrouter"
+        assert got_model == "gpt-4o-2024-08-06"
+
+    def test_falls_back_to_main_provider_and_model_when_no_overrides(self, monkeypatch):
+        """With no overrides and no ``response.model``, the pair comes
+        from the main provider/model readers on ``auxiliary_client``
+        instead of the placeholders."""
+        import agent.auxiliary_client as ac
+        from agent import plugin_llm
+
+        # Pin what the patched readers report as the main provider/model.
+        main_provider, main_model = "openrouter", "anthropic/claude-3-5-sonnet"
+        monkeypatch.setattr(ac, "_read_main_provider", lambda: main_provider)
+        monkeypatch.setattr(ac, "_read_main_model", lambda: main_model)
+
+        reply = SimpleNamespace(choices=[])  # deliberately lacks ``model``
+        got_provider, got_model = plugin_llm._resolve_attribution(
+            provider_override=None, model_override=None, response=reply,
+        )
+        assert got_provider == "openrouter"
+        assert got_model == "anthropic/claude-3-5-sonnet"
+
+    def test_response_model_used_even_when_no_overrides(self, monkeypatch):
+        """Without overrides, the model name reported on the response
+        is still the one recorded."""
+        import agent.auxiliary_client as ac
+        from agent import plugin_llm
+
+        monkeypatch.setattr(ac, "_read_main_provider", lambda: "openrouter")
+        monkeypatch.setattr(ac, "_read_main_model", lambda: "openai/gpt-4o")
+
+        # The reply names a dated variant of the configured main model.
+        reply = SimpleNamespace(model="openai/gpt-4o-2024-08-06", choices=[])
+        got_provider, got_model = plugin_llm._resolve_attribution(
+            provider_override=None, model_override=None, response=reply,
+        )
+        # Provider from the patched reader, model from the reply itself.
+        assert got_provider == "openrouter"
+        assert got_model == "openai/gpt-4o-2024-08-06"
+
+    def test_placeholder_fallback_only_when_everything_is_empty(self, monkeypatch):
+        """No override, no ``response.model`` and empty main
+        provider/model: only then do the placeholder strings appear,
+        keeping the recorded pair non-empty."""
+        import agent.auxiliary_client as ac
+        from agent import plugin_llm
+
+        # Both main-config readers report an empty string.
+        for reader in ("_read_main_provider", "_read_main_model"):
+            monkeypatch.setattr(ac, reader, lambda: "")
+
+        reply = SimpleNamespace(choices=[])
+        got_provider, got_model = plugin_llm._resolve_attribution(
+            provider_override=None, model_override=None, response=reply,
+        )
+        # Nothing else supplied a value, so the placeholders are returned.
+        assert got_provider == "auto"
+        assert got_model == "default"
+
+
+# ---------------------------------------------------------------------------
+# Hook-mode integration (ctx.llm called from a post_tool_call callback)
+# ---------------------------------------------------------------------------
+
+
+class TestHookMode:
+    """The docs page promises ``ctx.llm`` works from inside lifecycle
+    hooks. This exercises that path: register a ``post_tool_call``
+    callback that calls ``ctx.llm.complete``, fire the hook through
+    the real ``invoke_hook`` machinery, and check the call landed."""
+
+    def test_complete_works_from_post_tool_call_hook(self):
+        from hermes_cli.plugins import PluginContext, PluginManifest, PluginManager
+
+        manifest = PluginManifest(name="hook-plugin", source="test", key="hook-plugin")
+        manager = PluginManager()
+        ctx = PluginContext(manifest, manager)
+
+        # Replace ctx.llm with a stub that records what the hook called.
+        captured: list = []
+
+        def fake_caller(**kwargs):
+            captured.append(kwargs)
+            return "openrouter", "openai/gpt-4o", _fake_response("rewrote it")
+
+        ctx._llm = make_plugin_llm_for_test(  # type: ignore[attr-defined]
+            plugin_id="hook-plugin",
+            policy=_TrustPolicy(plugin_id="hook-plugin"),
+            sync_caller=fake_caller,
+        )
+
+        # Plugin registers a hook that runs ctx.llm.complete on every tool call.
+        def rewrite_error_hook(*, tool_name, args, result, **_):
+            if "Traceback" in (result or ""):
+                rewritten = ctx.llm.complete(
+                    messages=[
+                        {"role": "system", "content": "Rewrite errors plainly."},
+                        {"role": "user", "content": result},
+                    ],
+                    max_tokens=64,
+                    purpose="hook-plugin.rewrite",
+                )
+                # Real hook would return the rewritten text via
+                # transform_tool_result; here we just capture for the assert.
+                captured.append({"hook_returned": rewritten.text})
+
+        ctx.register_hook("post_tool_call", rewrite_error_hook)
+
+        # Fire the hook the same way the agent core does it.
+        manager.invoke_hook(
+            "post_tool_call",
+            tool_name="terminal",
+            args={"command": "boom"},
+            result="Traceback (most recent call last):\n  RuntimeError",
+        )
+
+        # Verify ctx.llm.complete fired through the hook.
+        assert len(captured) == 2  # one llm call + one hook return record
+        llm_call = captured[0]
+        assert "messages" in llm_call
+        assert any("rewrite" in m.get("content", "").lower()
+                   for m in llm_call["messages"] if isinstance(m, dict))
+        hook_record = captured[1]
+        assert hook_record["hook_returned"] == "rewrote it"
+
+    def test_complete_works_from_post_tool_call_hook_when_async_caller_set(self):
+        """Sync ``complete`` in a hook still works when an async caller is also set."""
+        from hermes_cli.plugins import PluginContext, PluginManifest, PluginManager
+
+        manifest = PluginManifest(name="hook-async", source="test", key="hook-async")
+        manager = PluginManager()
+        ctx = PluginContext(manifest, manager)
+        called: list = []
+
+        def fake_caller(**_):
+            return "openrouter", "model-x", _fake_response("ok")
+
+        async def fake_async(**_):
+            raise AssertionError("sync complete() must not use the async caller")
+
+        ctx._llm = make_plugin_llm_for_test(  # type: ignore[attr-defined]
+            plugin_id="hook-async", policy=_TrustPolicy(plugin_id="hook-async"),
+            sync_caller=fake_caller, async_caller=fake_async,
+        )
+
+        def hook(**kwargs):
+            r = ctx.llm.complete(messages=[{"role": "user", "content": "x"}])
+            called.append(r.text)
+
+        ctx.register_hook("post_tool_call", hook)
+        manager.invoke_hook("post_tool_call", tool_name="x", args={}, result="y")
+        assert called == ["ok"]
diff --git a/website/docs/developer-guide/plugin-llm-access.md b/website/docs/developer-guide/plugin-llm-access.md
new file mode 100644
index 00000000000..5396e3a7a5d
--- /dev/null
+++ b/website/docs/developer-guide/plugin-llm-access.md
@@ -0,0 +1,465 @@
+---
+sidebar_position: 11
+title: "Plugin LLM Access"
+description: "Run any LLM call from inside a plugin via ctx.llm — chat or structured, sync or async. Host-owned auth, fail-closed trust gate, optional JSON Schema validation."
+---
+
+# Plugin LLM Access
+
+`ctx.llm` is the supported way for a plugin to make an LLM call.
+Chat completion, structured extraction, sync, async, with or without
+images — same surface, same trust gate, same host-owned credentials.
+
+Plugins reach for this when they need to do something that involves
+the model but isn't part of the agent's conversation. A hook that
+rewrites a tool error into something a non-engineer can read. A
+gateway adapter that translates an inbound message before queuing
+it. A slash command that summarises a long paste. A scheduled job
+that scores yesterday's activity and writes one line to a status
+board. A pre-filter that decides whether a message is worth waking
+the agent up for at all.
+
+These are jobs the agent shouldn't be in the loop on. They want one
+LLM call, a typed answer, and to be done.
+
+## The smallest possible call
+
+```python
+result = ctx.llm.complete(messages=[{"role": "user", "content": "ping"}])
+return result.text
+```
+
+That's the whole API in one call. No keys, no provider config, no
+SDK initialisation. The plugin runs against whatever provider and
+model the user is currently using — when they switch providers, the
+plugin follows them automatically.
+
+## A more complete chat example
+
+```python
+result = ctx.llm.complete(
+    messages=[
+        {"role": "system", "content": "Rewrite errors as one short sentence a non-engineer can act on."},
+        {"role": "user",   "content": traceback_text},
+    ],
+    max_tokens=64,
+    purpose="hooks.error-rewrite",
+)
+return result.text
+```
+
+`purpose` is a free-form audit string — it shows up in `agent.log`
+and in `result.audit` so operators can see which plugin made which
+call. Optional but recommended for anything that fires often.
+
+## Structured output
+
+When the plugin needs a typed answer, switch to the structured lane:
+
+```python
+result = ctx.llm.complete_structured(
+    instructions="Score this support reply for urgency (0–1) and pick a category.",
+    input=[{"type": "text", "text": message_body}],
+    json_schema=TRIAGE_SCHEMA,
+    purpose="support.triage",
+    temperature=0.0,
+    max_tokens=128,
+)
+
+if result.parsed is not None and result.parsed["urgency"] > 0.8:
+    dispatch_to_oncall(result.parsed["category"], message_body)
+```
+
+The host requests JSON output from the provider, parses it locally
+as a fallback, validates against your schema if `jsonschema` is
+installed, and hands back a Python object on `result.parsed`. If the
+model couldn't produce valid JSON, `result.parsed` is `None` and
+`result.text` carries the raw response.
+
+## What this lane gives you
+
+* **One call, four shapes.** `complete()` for chat,
+  `complete_structured()` for typed JSON, `acomplete()` and
+  `acomplete_structured()` for asyncio. Same arguments, same result
+  objects.
+* **Host-owned credentials.** OAuth tokens, refresh flows, the
+  credential pool, per-task aux overrides — every credential
+  concept Hermes already has applies. The plugin never sees a
+  token; the host attributes the call back through `result.audit`.
+* **Bounded.** Single sync or async call. No streaming, no tool
+  loops, no conversation state to manage. State the input, get the
+  result, return.
+* **Fail-closed trust.** A plugin you've never configured cannot
+  pick its own provider, model, agent, or stored credential. The
+  default posture is "use what the user is using." Operators opt in
+  to specific overrides, per plugin, in `config.yaml`.
+
+## Quick start
+
+Two complete plugins below — one chat, one structured. Each needs
+only a `register(ctx)` function plus one handler, and zero outside
+configuration to run against whatever model the user has active.
+
+### Chat completion — `/tldr`
+
+```python
+def register(ctx):
+    ctx.register_command(
+        name="tldr",
+        handler=lambda raw: _tldr(ctx, raw),
+        description="Summarise the supplied text in one paragraph.",
+        args_hint="<text>",
+    )
+
+
+def _tldr(ctx, raw_args: str) -> str:
+    text = raw_args.strip()
+    if not text:
+        return "Usage: /tldr <text to summarise>"
+    result = ctx.llm.complete(
+        messages=[
+            {"role": "system",
+             "content": "Summarise the user's text in one tight paragraph. No preamble."},
+            {"role": "user", "content": text},
+        ],
+        max_tokens=256,
+        temperature=0.3,
+        purpose="tldr",
+    )
+    return result.text
+```
+
+`result.text` is the model's response; `result.usage` carries token
+counts; `result.provider` and `result.model` carry attribution.
+
+### Structured extraction — `/paste-to-tasks`
+
+```python
+def register(ctx):
+    ctx.register_command(
+        name="paste-to-tasks",
+        handler=lambda raw: _paste_to_tasks(ctx, raw),
+        description="Turn freeform meeting notes into structured tasks.",
+        args_hint="<text>",
+    )
+
+
+_TASKS_SCHEMA = {
+    "type": "object",
+    "properties": {
+        "tasks": {
+            "type": "array",
+            "items": {
+                "type": "object",
+                "properties": {
+                    "owner":  {"type": "string"},
+                    "action": {"type": "string"},
+                    "due":    {"type": "string", "description": "ISO date or empty"},
+                },
+                "required": ["action"],
+            },
+        },
+    },
+    "required": ["tasks"],
+}
+
+
+def _paste_to_tasks(ctx, raw_args: str) -> str:
+    if not raw_args.strip():
+        return "Usage: /paste-to-tasks <meeting notes>"
+    result = ctx.llm.complete_structured(
+        instructions=(
+            "Extract concrete action items from these meeting notes. "
+            "One task per actionable line. If no owner is named, leave 'owner' blank."
+        ),
+        input=[{"type": "text", "text": raw_args}],
+        json_schema=_TASKS_SCHEMA,
+        schema_name="meeting.tasks",
+        purpose="paste-to-tasks",
+        temperature=0.0,
+        max_tokens=512,
+    )
+    if result.parsed is None:
+        return f"Couldn't parse a response. Raw output:\n{result.text}"
+    lines = [f"- [{t.get('owner') or '?'}] {t['action']}" for t in result.parsed["tasks"]]
+    return "\n".join(lines) or "(no tasks found)"
+```
+
+A third worked example, this time with image input, lives in the
+[`hermes-example-plugins`](https://github.com/NousResearch/hermes-example-plugins/tree/main/plugin-llm-example)
+repo (companion repo for reference plugins — not bundled with
+hermes-agent itself). For the async surface (`acomplete()` /
+`acomplete_structured()` with `asyncio.gather()`), see
+[`plugin-llm-async-example`](https://github.com/NousResearch/hermes-example-plugins/tree/main/plugin-llm-async-example)
+in the same repo.
+
+## When to use which
+
+| You want… | Reach for |
+|---|---|
+| A free-form text response (translation, summary, rewrite, generation) | `complete()` |
+| A multi-turn prompt (system + few-shot examples + user) | `complete()` |
+| A typed dict back, validated against a schema | `complete_structured()` |
+| Image-or-text input with a typed dict back | `complete_structured()` |
+| The same call from async code (gateway adapters, async hooks) | `acomplete()` / `acomplete_structured()` |
+
+Everything else — provider selection, model resolution, auth, fallback,
+timeout, vision routing — is the same across all four.
+
+## API surface
+
+`ctx.llm` is an instance of `agent.plugin_llm.PluginLlm`.
+
+### `complete()`
+
+```python
+result = ctx.llm.complete(
+    messages=[{"role": "user", "content": "Hi"}],
+    provider=None,         # optional, gated — Hermes provider id (e.g. "openrouter")
+    model=None,            # optional, gated — whatever string that provider expects
+    temperature=None,
+    max_tokens=None,
+    timeout=None,          # seconds
+    agent_id=None,         # optional, gated
+    profile=None,          # optional, gated — explicit auth-profile name
+    purpose="optional-audit-string",
+)
+# → PluginLlmCompleteResult(text, provider, model, agent_id, usage, audit)
+```
+
+Plain chat completion. `messages` is the standard OpenAI shape — a
+list of `{"role": "...", "content": "..."}` dicts. Multi-turn
+prompts (system + few-shot user/assistant pairs + final user) work
+exactly as they would with the OpenAI SDK.
+
+`provider=` and `model=` are independent and follow the same shape
+as the host's main config (`model.provider` + `model.model`). Set
+just `model=` to use the user's active provider with a different
+model on it. Set both to switch providers entirely. Either argument
+without operator opt-in raises `PluginLlmTrustError`.
+
+### `complete_structured()`
+
+```python
+result = ctx.llm.complete_structured(
+    instructions="What you want extracted.",
+    input=[
+        {"type": "text",  "text": "..."},
+        {"type": "image", "data": b"...", "mime_type": "image/png"},
+        {"type": "image", "url":  "https://..."},
+    ],
+    json_schema={...},     # optional — triggers parsed result + validation
+    json_mode=False,       # set True without a schema to ask for JSON anyway
+    schema_name=None,      # optional human-readable schema name
+    system_prompt=None,
+    provider=None,         # optional, gated
+    model=None,            # optional, gated
+    temperature=None,
+    max_tokens=None,
+    timeout=None,
+    agent_id=None,
+    profile=None,
+    purpose=None,
+)
+# → PluginLlmStructuredResult(text, provider, model, agent_id,
+#                             usage, parsed, content_type, audit)
+```
+
+Inputs are typed text or image blocks (raw bytes get base64 encoded
+as a `data:` URL automatically). When `json_schema` or
+`json_mode=True` is supplied, the host requests JSON output via
+`response_format`, parses it locally as a fallback, and validates
+against your schema if `jsonschema` is installed.
+
+* `result.content_type == "json"` — `result.parsed` is the parsed
+  Python object (schema-validated when `jsonschema` is installed).
+* `result.content_type == "text"` — parsing or validation failed;
+  inspect `result.text` for the raw model response.
+
+### Async
+
+```python
+result = await ctx.llm.acomplete(messages=...)
+result = await ctx.llm.acomplete_structured(instructions=..., input=...)
+```
+
+Same arguments and result types as their sync counterparts. Use
+these from gateway adapters, async hooks, or any plugin code
+already running on an asyncio loop.
+
+### Result attributes
+
+```python
+@dataclass
+class PluginLlmCompleteResult:
+    text: str                    # the assistant's response
+    provider: str                # e.g. "openrouter", "anthropic"
+    model: str                   # whatever the provider returned for this call
+    agent_id: str                # whose model/auth was used
+    usage: PluginLlmUsage        # tokens + cache + cost estimate
+    audit: Dict[str, Any]        # plugin_id, purpose, profile
+
+@dataclass
+class PluginLlmStructuredResult(PluginLlmCompleteResult):
+    parsed: Optional[Any]        # JSON object when content_type == "json"
+    content_type: str            # "json" or "text"
+    # audit also carries schema_name when supplied
+```
+
+`usage` carries `input_tokens`, `output_tokens`, `total_tokens`,
+`cache_read_tokens`, `cache_write_tokens`, and `cost_usd` when the
+provider returns those fields.
+
+## Trust gate
+
+The default behaviour is fail-closed. With no `plugins.entries`
+config block, a plugin can:
+
+* run any of the four methods against the user's active provider
+  and model,
+* set request-shaping arguments (`temperature`, `max_tokens`,
+  `timeout`, `system_prompt`, `purpose`, `messages`, `instructions`,
+  `input`, `json_schema`, `schema_name`, `json_mode`),
+
+…and that's it. `provider=`, `model=`, `agent_id=`, and `profile=`
+arguments raise `PluginLlmTrustError` until the operator opts in.
+
+**Most plugins never need this section.** A plugin that just calls
+`ctx.llm.complete(messages=...)` with no overrides runs against
+whatever the user has active and works zero-config. The block below
+is only relevant when a plugin specifically wants to pin to a
+different model or provider than the user.
+
+```yaml
+plugins:
+  entries:
+    my-plugin:
+      llm:
+        # Allow this plugin to choose a different Hermes provider
+        # (must be one Hermes already knows about — same names as
+        # `hermes model` and config.yaml model.provider).
+        allow_provider_override: true
+
+        # Optionally restrict which providers. Use ["*"] for any.
+        allowed_providers:
+          - openrouter
+          - anthropic
+
+        # Allow this plugin to ask for a specific model.
+        allow_model_override: true
+
+        # Optionally restrict which models. Use ["*"] for any.
+        # Models are matched literally against whatever string the
+        # plugin sends — Hermes does not look anything up.
+        allowed_models:
+          - openai/gpt-4o-mini
+          - anthropic/claude-3-5-haiku
+
+        # Allow cross-agent calls (rare).
+        allow_agent_id_override: false
+
+        # Allow the plugin to request a specific stored auth profile
+        # (e.g. a different OAuth account on the same provider).
+        allow_profile_override: false
+```
+
+The plugin id is the manifest `name:` field for flat plugins, or the
+path-derived key for nested plugins (`image_gen/openai`,
+`memory/honcho`, etc.).
+
+### What the gate enforces
+
+| Override        | Default | Config key                       |
+| --------------- | ------- | -------------------------------- |
+| `provider=`     | denied  | `allow_provider_override: true`  |
+| ↳ allowlist     | —       | `allowed_providers: [...]`       |
+| `model=`        | denied  | `allow_model_override: true`     |
+| ↳ allowlist     | —       | `allowed_models: [...]`          |
+| `agent_id=`     | denied  | `allow_agent_id_override: true`  |
+| `profile=`      | denied  | `allow_profile_override: true`   |
+
+Each override is independently gated. Granting `allow_model_override`
+does **not** also grant `allow_provider_override` — a plugin trusted
+to pick a model is still pinned to the user's active provider unless
+it gets the provider gate as well.
+
+### What the gate does NOT need to enforce
+
+* Request-shaping arguments — `temperature`, `max_tokens`,
+  `timeout`, `system_prompt`, `purpose`, `messages`, `instructions`,
+  `input`, `json_schema`, `schema_name`, `json_mode` — are always
+  allowed; they don't pick credentials or routes.
+* The default deny posture means an unconfigured plugin can still do
+  useful work — it just runs against the active provider and model.
+  Operators only need to think about `plugins.entries` for plugins
+  that want finer routing.
+
+## What the host owns
+
+A complete list of the things `ctx.llm` does for the plugin so you
+don't have to:
+
+* **Provider resolution.** Reads `model.provider` + `model.model`
+  from the user's config (or the explicit overrides when trusted).
+* **Auth.** Pulls API keys, OAuth tokens, or refresh tokens from
+  `~/.hermes/auth.json` / env, including the credential pool when
+  one is configured. The plugin never sees them.
+* **Vision routing.** When image input is supplied and the user's
+  active text model is text-only, the host falls back to the
+  configured vision model automatically.
+* **Fallback chain.** If the user's primary provider 5xxs or 429s,
+  the request goes through Hermes' usual aggregator-aware fallback
+  before it returns an error to the plugin.
+* **Timeout.** Honours your `timeout=` argument, falling back to
+  `auxiliary.<task>.timeout` config or the global aux default.
+* **JSON shaping.** Sends `response_format` to the provider when
+  you ask for JSON, then re-parses locally from a code-fenced
+  response if the provider returned one.
+* **Schema validation.** Validates against your `json_schema` when
+  `jsonschema` is installed; logs a debug line and skips strict
+  validation otherwise.
+* **Audit log.** Each call writes one INFO line to `agent.log` with
+  the plugin id, provider/model, purpose, and token totals.
+
+## What the plugin owns
+
+* **Request shape.** `messages` for chat, `instructions` + `input`
+  for structured. The plugin builds the prompt; the host runs it.
+* **Schema.** Whatever shape you want back. The host doesn't infer
+  it for you.
+* **Error handling.** `complete_structured()` raises `ValueError` on
+  empty inputs and on schema-validation failure. `PluginLlmTrustError`
+  fires when the trust gate denies an override. Anything else
+  (provider 5xx, no credentials configured, timeout) raises whatever
+  `auxiliary_client.call_llm()` raises.
+* **Cost.** Every call runs against the user's paid provider. Don't
+  loop on `complete()` for every gateway message without thinking
+  about token spend.
+
+## Where this fits in the plugin surface
+
+Existing `ctx.*` methods extend an existing Hermes subsystem:
+
+* `ctx.register_tool` — adds a tool the agent can call
+* `ctx.register_platform` — wires a new gateway adapter
+* `ctx.register_image_gen_provider` — replaces an image-gen backend
+* `ctx.register_memory_provider` — replaces the memory backend
+* `ctx.register_context_engine` — replaces the context compressor
+* `ctx.register_hook` — observes a lifecycle event
+
+`ctx.llm` is the first surface that lets a plugin run the same
+model the user is talking to, *out of band*, without any of the
+above. That's its only job. If your plugin needs to register a
+tool the agent invokes, use `register_tool`. If it needs to react
+to a lifecycle event, use `register_hook`. If it needs to make its
+own model call — for any reason, structured or not — `ctx.llm`.
+
+## Reference
+
+* Implementation: [`agent/plugin_llm.py`](https://github.com/NousResearch/hermes-agent/blob/main/agent/plugin_llm.py)
+* Tests: [`tests/agent/test_plugin_llm.py`](https://github.com/NousResearch/hermes-agent/blob/main/tests/agent/test_plugin_llm.py)
+* Reference plugins (companion repo):
+  * [`plugin-llm-example`](https://github.com/NousResearch/hermes-example-plugins/tree/main/plugin-llm-example) — sync structured extraction with image input
+  * [`plugin-llm-async-example`](https://github.com/NousResearch/hermes-example-plugins/tree/main/plugin-llm-async-example) — async with `asyncio.gather()`
+* Auxiliary client (the engine under the hood): see
+  [Provider Runtime](/docs/developer-guide/provider-runtime).
diff --git a/website/docs/user-guide/features/built-in-plugins.md b/website/docs/user-guide/features/built-in-plugins.md
index d153f4faf18..aa346308913 100644
--- a/website/docs/user-guide/features/built-in-plugins.md
+++ b/website/docs/user-guide/features/built-in-plugins.md
@@ -64,8 +64,6 @@ The repo ships these bundled plugins under `plugins/`. All are opt-in — enable
 | `image_gen/xai` | image backend | xAI `grok-2-image` backend |
 | `hermes-achievements` | dashboard tab | Steam-style collectible badges generated from your real Hermes session history |
 | `kanban/dashboard` | dashboard tab | Kanban board UI for the multi-agent dispatcher — tasks, comments, fan-out, board switching. See [Kanban Multi-Agent](./kanban.md). |
-| `example-dashboard` | dashboard example | Reference dashboard plugin for [Extending the Dashboard](./extending-the-dashboard.md) |
-| `strike-freedom-cockpit` | dashboard skin | Sample custom dashboard skin |
 
 Memory providers (`plugins/memory/*`) and context engines (`plugins/context_engine/*`) are listed separately on [Memory Providers](./memory-providers.md) — they're managed through `hermes memory` and `hermes plugins` respectively. The full per-plugin detail for the two long-running hooks-based plugins follows.
 
diff --git a/website/docs/user-guide/features/extending-the-dashboard.md b/website/docs/user-guide/features/extending-the-dashboard.md
index 2cccb6c5814..9f4fd95e15e 100644
--- a/website/docs/user-guide/features/extending-the-dashboard.md
+++ b/website/docs/user-guide/features/extending-the-dashboard.md
@@ -681,7 +681,7 @@ Key points:
 - Multiple plugins can claim the same page-scoped slot. They render stacked in registration order.
 - Zero footprint when no plugin registers: the built-in page renders exactly as before.
 
-The bundled `example-dashboard` plugin ships a live demo that injects a banner into `sessions:top` — install it to see the pattern end-to-end.
+The [`example-dashboard`](https://github.com/NousResearch/hermes-example-plugins/tree/main/example-dashboard) reference plugin (companion repo `hermes-example-plugins`) ships a live demo that injects a banner into `sessions:top` — install it to see the pattern end-to-end.
 
 ### Slot-only plugins (`tab.hidden`)
 
@@ -818,7 +818,7 @@ If a plugin's script fails to load (404, syntax error, exception during IIFE), t
 
 ## Combined theme + plugin demo
 
-The repo ships `plugins/strike-freedom-cockpit/` as a complete reskin demo. It pairs a theme YAML with a slot-only plugin to produce a cockpit-style HUD without forking the dashboard.
+The [`strike-freedom-cockpit`](https://github.com/NousResearch/hermes-example-plugins/tree/main/strike-freedom-cockpit) plugin (companion repo `hermes-example-plugins`) is a complete reskin demo. It pairs a theme YAML with a slot-only plugin to produce a cockpit-style HUD without forking the dashboard.
 
 **What it demonstrates:**
 
@@ -832,17 +832,19 @@ The repo ships `plugins/strike-freedom-cockpit/` as a complete reskin demo. It p
 **Install:**
 
 ```bash
+git clone https://github.com/NousResearch/hermes-example-plugins.git
+
 # Theme
-cp plugins/strike-freedom-cockpit/theme/strike-freedom.yaml \
+cp hermes-example-plugins/strike-freedom-cockpit/theme/strike-freedom.yaml \
    ~/.hermes/dashboard-themes/
 
 # Plugin
-cp -r plugins/strike-freedom-cockpit ~/.hermes/plugins/
+cp -r hermes-example-plugins/strike-freedom-cockpit ~/.hermes/plugins/
 ```
 
 Open the dashboard, pick **Strike Freedom** from the theme switcher. The cockpit sidebar appears, the crest shows in the header, the tagline replaces the footer. Switch back to **Hermes Teal** and the plugin remains installed but invisible (the `sidebar` slot only renders under the `cockpit` layout variant).
 
-Read the plugin source (`plugins/strike-freedom-cockpit/dashboard/dist/index.js`) to see how it reads CSS vars, guards against older dashboards without slot support, and registers three slots from one bundle.
+Read the plugin source (`strike-freedom-cockpit/dashboard/dist/index.js` in the companion repo) to see how it reads CSS vars, guards against older dashboards without slot support, and registers three slots from one bundle.
 
 ---
 
diff --git a/website/docs/user-guide/features/plugins.md b/website/docs/user-guide/features/plugins.md
index 3ceabee2081..8bab522f9dd 100644
--- a/website/docs/user-guide/features/plugins.md
+++ b/website/docs/user-guide/features/plugins.md
@@ -111,6 +111,7 @@ Every `ctx.*` API below is available inside a plugin's `register(ctx)` function.
 | Register an image-generation backend | `ctx.register_image_gen_provider(provider)` — see [Image Generation Provider Plugins](/docs/developer-guide/image-gen-provider-plugin) |
 | Register a context-compression engine | `ctx.register_context_engine(engine)` — see [Context Engine Plugins](/docs/developer-guide/context-engine-plugin) |
 | Register a memory backend | Subclass `MemoryProvider` in `plugins/memory/<name>/__init__.py` — see [Memory Provider Plugins](/docs/developer-guide/memory-provider-plugin) (uses a separate discovery system) |
+| Run a host-owned LLM call | `ctx.llm.complete(...)` / `ctx.llm.complete_structured(...)` — borrows the user's active model and auth for a one-shot completion with optional JSON schema validation; see [Plugin LLM Access](/docs/developer-guide/plugin-llm-access) |
 | Register an inference backend (LLM provider) | `register_provider(ProviderProfile(...))` in `plugins/model-providers/<name>/__init__.py` — see [Model Provider Plugins](/docs/developer-guide/model-provider-plugin) (uses a separate discovery system) |
 
 ## Plugin discovery
diff --git a/website/sidebars.ts b/website/sidebars.ts
index a29f366219a..296f0f61f6e 100644
--- a/website/sidebars.ts
+++ b/website/sidebars.ts
@@ -221,6 +221,7 @@ const sidebars: SidebarsConfig = {
             'developer-guide/context-engine-plugin',
             'developer-guide/model-provider-plugin',
             'developer-guide/image-gen-provider-plugin',
+            'developer-guide/plugin-llm-access',
             'developer-guide/creating-skills',
             'developer-guide/extending-the-cli',
           ],