fix(tools): preserve live session cwd in terminal_tool, and keep ACP update_cwd authoritative
terminal_tool re-sent the init-time/config cwd on every command, clobbering session-local `cd` state: the environment tracked the new directory in `env.cwd`, but foreground/background calls forced the old cwd back. A small `_resolve_command_cwd` resolver now applies the precedence `workdir > live env.cwd > config/override cwd` to: - foreground `env.execute(...)` - background `process_registry.spawn_local(...)` - background `process_registry.spawn_via_env(...)` Additionally, syncing the cwd onto the live cached env when a `cwd` override is (re-)registered. Preferring live `env.cwd` would otherwise demote the ACP `update_cwd` override (registered via `register_task_env_overrides` on `session/load` / `session/resume`) below an already-set `env.cwd`, silently ignoring an editor's mid-session project-root change once any command had run. `register_task_env_overrides` now pushes a new cwd onto the cached env so an explicit ACP cwd change wins, while ordinary in-session `cd` tracking is preserved. Regression coverage: - foreground/background commands follow live `env.cwd` - explicit `workdir` still overrides everything - registering a cwd override updates the live env cwd (ACP authority) - no-op when no live env exists; non-cwd overrides leave env.cwd untouched Based on #35510 by @Dusk1e. Co-authored-by: Dusk1e <yusufalweshdemir@gmail.com>
This commit is contained in:
@ -1,6 +1,7 @@
|
||||
"""Regression tests for task/session cwd propagation in terminal_tool."""
|
||||
|
||||
import json
|
||||
from types import SimpleNamespace
|
||||
|
||||
import tools.terminal_tool as terminal_tool
|
||||
|
||||
@ -10,6 +11,7 @@ def _minimal_terminal_config(cwd="/default"):
|
||||
"env_type": "local",
|
||||
"cwd": cwd,
|
||||
"timeout": 60,
|
||||
"lifetime_seconds": 3600,
|
||||
}
|
||||
|
||||
|
||||
@ -72,3 +74,147 @@ def test_explicit_workdir_still_wins_over_registered_task_cwd(monkeypatch):
|
||||
|
||||
assert result["exit_code"] == 0
|
||||
assert calls == [{"timeout": 60, "cwd": "/explicit/workdir"}]
|
||||
|
||||
|
||||
def test_foreground_command_prefers_live_env_cwd_over_init_time_cwd(monkeypatch):
|
||||
"""A prior `cd` updates env.cwd; terminal_tool must honor that live cwd."""
|
||||
calls = []
|
||||
|
||||
class FakeEnv:
|
||||
env = {}
|
||||
cwd = "/workspace/live"
|
||||
|
||||
def execute(self, command, **kwargs):
|
||||
calls.append((command, kwargs))
|
||||
return {"output": "ok", "returncode": 0}
|
||||
|
||||
task_id = "session-live-cwd"
|
||||
monkeypatch.setattr(terminal_tool, "_active_environments", {task_id: FakeEnv()})
|
||||
monkeypatch.setattr(terminal_tool, "_last_activity", {})
|
||||
monkeypatch.setattr(terminal_tool, "_task_env_overrides", {task_id: {"cwd": "/workspace/init"}})
|
||||
monkeypatch.setattr(terminal_tool, "_get_env_config", lambda: _minimal_terminal_config(cwd="/workspace/init"))
|
||||
monkeypatch.setattr(terminal_tool, "_start_cleanup_thread", lambda: None)
|
||||
monkeypatch.setattr(terminal_tool, "_resolve_container_task_id", lambda value: value or "default")
|
||||
monkeypatch.setattr(
|
||||
terminal_tool,
|
||||
"_check_all_guards",
|
||||
lambda command, env_type: {"approved": True},
|
||||
)
|
||||
|
||||
result = json.loads(terminal_tool.terminal_tool(command="pwd", task_id=task_id))
|
||||
|
||||
assert result["exit_code"] == 0
|
||||
assert calls == [("pwd", {"timeout": 60, "cwd": "/workspace/live"})]
|
||||
|
||||
|
||||
def test_background_command_prefers_live_env_cwd_over_init_time_cwd(monkeypatch):
|
||||
"""Background process launches must also use the live session cwd."""
|
||||
|
||||
class FakeEnv:
|
||||
env = {}
|
||||
cwd = "/workspace/live"
|
||||
|
||||
class FakeRegistry:
|
||||
def __init__(self):
|
||||
self.calls = []
|
||||
self.pending_watchers = []
|
||||
|
||||
def spawn_local(self, **kwargs):
|
||||
self.calls.append(kwargs)
|
||||
return SimpleNamespace(id="proc_test", pid=1234)
|
||||
|
||||
import tools.process_registry as process_registry_mod
|
||||
|
||||
registry = FakeRegistry()
|
||||
task_id = "session-live-cwd-bg"
|
||||
monkeypatch.setattr(terminal_tool, "_active_environments", {task_id: FakeEnv()})
|
||||
monkeypatch.setattr(terminal_tool, "_last_activity", {})
|
||||
monkeypatch.setattr(terminal_tool, "_task_env_overrides", {task_id: {"cwd": "/workspace/init"}})
|
||||
monkeypatch.setattr(terminal_tool, "_get_env_config", lambda: _minimal_terminal_config(cwd="/workspace/init"))
|
||||
monkeypatch.setattr(terminal_tool, "_start_cleanup_thread", lambda: None)
|
||||
monkeypatch.setattr(terminal_tool, "_resolve_container_task_id", lambda value: value or "default")
|
||||
monkeypatch.setattr(
|
||||
terminal_tool,
|
||||
"_check_all_guards",
|
||||
lambda command, env_type: {"approved": True},
|
||||
)
|
||||
monkeypatch.setattr(process_registry_mod, "process_registry", registry)
|
||||
|
||||
result = json.loads(
|
||||
terminal_tool.terminal_tool(
|
||||
command="sleep 1",
|
||||
task_id=task_id,
|
||||
background=True,
|
||||
)
|
||||
)
|
||||
|
||||
assert result["exit_code"] == 0
|
||||
assert registry.calls == [{
|
||||
"command": "sleep 1",
|
||||
"cwd": "/workspace/live",
|
||||
"task_id": task_id,
|
||||
"session_key": "",
|
||||
"env_vars": {},
|
||||
"use_pty": False,
|
||||
}]
|
||||
|
||||
|
||||
def test_registering_cwd_override_updates_live_env_cwd(monkeypatch):
|
||||
"""An ACP ``update_cwd`` (re-)registered mid-session must win over a
|
||||
previously ``cd``-ed live ``env.cwd``.
|
||||
|
||||
Preferring live ``env.cwd`` (so session-local ``cd`` survives) means a
|
||||
freshly registered ``cwd`` override would otherwise sit *below* the
|
||||
already-set ``env.cwd`` and be silently ignored. ``register_task_env_overrides``
|
||||
syncs the new cwd onto the live cached env so an explicit ACP project-root
|
||||
change takes effect, as the editor client expects.
|
||||
"""
|
||||
|
||||
class FakeEnv:
|
||||
env = {}
|
||||
cwd = "/workspace/old"
|
||||
|
||||
task_id = "acp-session-update"
|
||||
fake_env = FakeEnv()
|
||||
monkeypatch.setattr(terminal_tool, "_active_environments", {task_id: fake_env})
|
||||
monkeypatch.setattr(terminal_tool, "_task_env_overrides", {})
|
||||
|
||||
terminal_tool.register_task_env_overrides(task_id, {"cwd": "/workspace/new"})
|
||||
|
||||
# The live env now reflects the editor's new project root.
|
||||
assert fake_env.cwd == "/workspace/new"
|
||||
|
||||
# A subsequent command resolves to the new cwd (env.cwd precedence).
|
||||
assert terminal_tool._resolve_command_cwd(
|
||||
workdir=None, env=fake_env, default_cwd="/workspace/config"
|
||||
) == "/workspace/new"
|
||||
|
||||
|
||||
def test_registering_cwd_override_noop_when_no_live_env(monkeypatch):
|
||||
"""Registering an override before the env exists must not crash; the cwd
|
||||
is applied at env creation time instead."""
|
||||
monkeypatch.setattr(terminal_tool, "_active_environments", {})
|
||||
monkeypatch.setattr(terminal_tool, "_task_env_overrides", {})
|
||||
|
||||
# Should not raise even though no env is cached yet.
|
||||
terminal_tool.register_task_env_overrides("acp-session-pending", {"cwd": "/workspace/new"})
|
||||
|
||||
assert terminal_tool._task_env_overrides["acp-session-pending"] == {"cwd": "/workspace/new"}
|
||||
|
||||
|
||||
def test_registering_non_cwd_override_leaves_live_env_cwd_untouched(monkeypatch):
|
||||
"""A non-cwd override (e.g. a per-task Modal image) must not disturb the
|
||||
live env's cwd."""
|
||||
|
||||
class FakeEnv:
|
||||
env = {}
|
||||
cwd = "/workspace/keep"
|
||||
|
||||
task_id = "rl-rollout-1"
|
||||
fake_env = FakeEnv()
|
||||
monkeypatch.setattr(terminal_tool, "_active_environments", {task_id: fake_env})
|
||||
monkeypatch.setattr(terminal_tool, "_task_env_overrides", {})
|
||||
|
||||
terminal_tool.register_task_env_overrides(task_id, {"modal_image": "custom:latest"})
|
||||
|
||||
assert fake_env.cwd == "/workspace/keep"
|
||||
|
||||
Reference in New Issue
Block a user