Merge pull request #44559 from NousResearch/bb/persistent-terminal-env

fix(terminal): advertise persistent env state
2026-07-27 17:58:07 +00:00 · 2026-06-11 20:07:11 -05:00 · 2026-06-11 20:07:11 -05:00 · 9e484f052a
commit 9e484f052a
parent afe53708ee ab06ef8ed6
5 changed files with 63 additions and 1 deletions
--- a/agent/coding_context.py
+++ b/agent/coding_context.py
@ -190,6 +190,10 @@ CODING_AGENT_GUIDANCE = (
    "Verify, and know when to stop:\n"
    "- Use `terminal` for git, builds, tests, and inspection. Run the relevant "
    "tests/linter/build and confirm they pass before claiming the work is done.\n"
+    "- Terminal state persists across calls: current directory and exported "
+    "environment variables carry forward. Activate a virtualenv or export setup "
+    "vars once, then reuse that state instead of re-sourcing it before every "
+    "test command.\n"
    "- Fix root causes, not symptoms: when you find a bug, check sibling call "
    "paths for the same flaw and fix the class, not just the reported site.\n"
    "- When fixing linter/type errors on a file, stop after about three "
--- a/tests/agent/test_coding_context.py
+++ b/tests/agent/test_coding_context.py
@ -11,6 +11,12 @@ import pytest
 from agent import coding_context as cc


+def test_coding_guidance_advertises_persistent_terminal_state():
+    assert "Terminal state persists across calls" in cc.CODING_AGENT_GUIDANCE
+    assert "Activate a virtualenv" in cc.CODING_AGENT_GUIDANCE
+    assert "instead of re-sourcing it before every test command" in cc.CODING_AGENT_GUIDANCE
+
+
 def _git_init(path):
    env = {
        "GIT_AUTHOR_NAME": "t", "GIT_AUTHOR_EMAIL": "t@t",
--- a/tests/tools/test_local_shell_init.py
+++ b/tests/tools/test_local_shell_init.py
@ -190,6 +190,49 @@ class TestSnapshotEndToEnd:
    """Spin up a real LocalEnvironment and confirm the snapshot sources
    extra init files."""

+    def test_exported_env_changes_persist_between_commands(self, tmp_path):
+        env = LocalEnvironment(cwd=str(tmp_path), timeout=15)
+        try:
+            first = env.execute(
+                'export HERMES_SESSION_ENV_PROBE="sticky"; '
+                'export PATH="/tmp/hermes-session-bin:$PATH"; '
+                'echo "first=$HERMES_SESSION_ENV_PROBE"'
+            )
+            second = env.execute(
+                'echo "second=$HERMES_SESSION_ENV_PROBE"; echo "PATH=$PATH"'
+            )
+        finally:
+            env.cleanup()
+
+        assert first["returncode"] == 0
+        assert second["returncode"] == 0
+        assert "first=sticky" in first.get("output", "")
+        output = second.get("output", "")
+        assert "second=sticky" in output
+        assert "/tmp/hermes-session-bin" in output
+
+    def test_venv_style_activation_persists_between_commands(self, tmp_path):
+        venv_bin = tmp_path / ".venv" / "bin"
+        venv_bin.mkdir(parents=True)
+        activate = venv_bin / "activate"
+        activate.write_text(
+            f'export VIRTUAL_ENV="{tmp_path / ".venv"}"\n'
+            f'export PATH="{venv_bin}:$PATH"\n'
+        )
+
+        env = LocalEnvironment(cwd=str(tmp_path), timeout=15)
+        try:
+            first = env.execute('source .venv/bin/activate; echo "venv=$VIRTUAL_ENV"')
+            second = env.execute('echo "venv=$VIRTUAL_ENV"; echo "PATH=$PATH"')
+        finally:
+            env.cleanup()
+
+        assert first["returncode"] == 0
+        assert second["returncode"] == 0
+        output = second.get("output", "")
+        assert f"venv={tmp_path / '.venv'}" in output
+        assert str(venv_bin) in output
+
    def test_snapshot_picks_up_init_file_exports(self, tmp_path, monkeypatch):
        init_file = tmp_path / "custom-init.sh"
        init_file.write_text(
--- a/tests/tools/test_terminal_tool.py
+++ b/tests/tools/test_terminal_tool.py
@ -22,6 +22,14 @@ def test_searching_for_sudo_does_not_trigger_rewrite(monkeypatch):
    assert sudo_stdin is None


+def test_terminal_schema_advertises_persistent_env_state():
+    description = terminal_tool.TERMINAL_TOOL_DESCRIPTION
+
+    assert "exported environment variables persist between calls" in description
+    assert "activate a virtualenv" in description
+    assert "do not re-source the same environment before every command" in description
+
+
 def test_printf_literal_sudo_does_not_trigger_rewrite(monkeypatch):
    monkeypatch.delenv("SUDO_PASSWORD", raising=False)
    monkeypatch.delenv("HERMES_INTERACTIVE", raising=False)
--- a/tools/terminal_tool.py
+++ b/tools/terminal_tool.py
@ -834,7 +834,7 @@ import sys


 # Tool description for LLM
-TERMINAL_TOOL_DESCRIPTION = """Execute shell commands on a Linux environment. Filesystem usually persists between calls.
+TERMINAL_TOOL_DESCRIPTION = """Execute shell commands on a Linux environment. Filesystem, current working directory, and exported environment variables persist between calls.

 Do NOT use cat/head/tail to read files — use read_file instead.
 Do NOT use grep/rg/find to search — use search_files instead.
@ -842,6 +842,7 @@ Do NOT use ls to list directories — use search_files(target='files') instead.
 Do NOT use sed/awk to edit files — use patch instead.
 Do NOT use echo/cat heredoc to create files — use write_file instead.
 Reserve terminal for: builds, installs, git, processes, scripts, network, package managers, and anything that needs a shell.
+Because exported environment state persists, activate a virtualenv or export setup variables once per session; do not re-source the same environment before every command unless a command proves the shell state was reset.

 Foreground (default): Commands return INSTANTLY when done, even if the timeout is high. Set timeout=300 for long builds/scripts — you'll still get the result in seconds if it's fast. Prefer foreground for short commands.
 Background: Set background=true to get a session_id. Almost always pair with notify_on_complete=true — bg without notify runs SILENTLY and you have no way to learn it finished short of calling process(action='poll') yourself. Two legitimate uses: