fix(skills_guard): agent-created dangerous skills ask instead of block

Changes the policy for agent-created skills with critical security findings from 'block' (silently rejected) to 'ask' (allowed with warning logged). The agent created the skill, so blocking it entirely is too aggressive — let it through but log the findings. - Policy: agent-created dangerous changed from block to ask - should_allow_install returns None for 'ask' (vs True/False) - format_scan_report shows 'NEEDS CONFIRMATION' for ask - skill_manager_tool.py caller handles None (allows with warning) - force=True still overrides as before Based on PR #2271 by redhelix (closed — 3200 lines of unrelated Mission Control code excluded).
2026-04-25 00:51:20 +00:00 · 2026-03-22 03:56:02 -07:00 · 2026-03-22 03:56:02 -07:00 · 0b370f2dd9
commit 0b370f2dd9
parent 887e8a8d84
3 changed files with 26 additions and 8 deletions
--- a/tests/tools/test_skills_guard.py
+++ b/tests/tools/test_skills_guard.py
@ -167,12 +167,12 @@ class TestShouldAllowInstall:
        assert allowed is True
        assert "agent-created" in reason

-    def test_dangerous_agent_created_blocked(self):
-        """Agent-created skills with dangerous verdict (critical findings) stay blocked."""
+    def test_dangerous_agent_created_asks(self):
+        """Agent-created skills with dangerous verdict return None (ask for confirmation)."""
        f = [Finding("env_exfil_curl", "critical", "exfiltration", "SKILL.md", 1, "curl $TOKEN", "exfiltration")]
        allowed, reason = should_allow_install(self._result("agent-created", "dangerous", f))
-        assert allowed is False
-        assert "Blocked" in reason
+        assert allowed is None
+        assert "Requires confirmation" in reason

    def test_force_overrides_dangerous_for_agent_created(self):
        f = [Finding("x", "critical", "c", "f", 1, "m", "d")]