Some Windows editors prepend an invisible UTF-8 BOM (U+FEFF) to text files. We had no awareness of it, so: read_file surfaced a phantom U+FEFF as the first character; patch matches against the true first line could miss; and a write/patch round-trip silently stripped the marker, changing the file's byte signature.

Now:
- read_file / read_file_raw strip a single leading BOM so the model never sees it (only on the first chunk — the marker lives at byte 0).
- patch_replace strips the BOM before fuzzy-matching (so an exact first-line match works) and its post-write verification compares BOM-stripped content.
- write_file restores the BOM when the original file had one and the new content doesn't, mirroring the existing line-ending preservation (detect on disk via a cheap `head -c 3` probe or reuse pre_content, re-prepend across the edit). Guards against double-BOM.

Mid-content U+FEFF is left alone (it's data there, not a file marker).

Tests: TestBomHandling (real LocalEnvironment) — read-strips, raw-read strips, write preserves, no-BOM-when-original-had-none, no-double-BOM, patch round-trip preserves, patch matches first line through a BOM, plus helper unit tests. 208 file-tool tests green.
284 lines
12 KiB
Python
284 lines
12 KiB
Python
"""Tests for file write safety and HERMES_WRITE_SAFE_ROOT sandboxing.
|
|
|
|
Based on PR #1085 by ismoilh (salvaged).
|
|
"""
|
|
|
|
import os
|
|
from pathlib import Path
|
|
|
|
import pytest
|
|
|
|
from tools.file_operations import _is_write_denied
|
|
|
|
|
|
class TestStaticDenyList:
    """Smoke tests for the built-in (static) write deny list."""

    def test_temp_file_not_denied_by_default(self, tmp_path: Path):
        # A plain file under pytest's temp directory must be writable.
        candidate = str(tmp_path / "regular.txt")
        denied = _is_write_denied(candidate)
        assert denied is False

    def test_ssh_key_is_denied(self):
        # The user's private SSH key must be rejected.
        private_key = os.path.expanduser("~/.ssh/id_rsa")
        denied = _is_write_denied(private_key)
        assert denied is True

    def test_etc_shadow_is_denied(self):
        # The system password database must be rejected.
        shadow_path = "/etc/shadow"
        denied = _is_write_denied(shadow_path)
        assert denied is True
|
|
|
|
|
|
class TestSafeWriteRoot:
    """HERMES_WRITE_SAFE_ROOT should sandbox writes to a specific subtree.

    Each test sets (or clears) the environment variable through
    ``monkeypatch`` so the change is undone automatically, then checks the
    verdict of ``_is_write_denied`` for a path relative to the safe root.
    """

    def test_writes_inside_safe_root_are_allowed(self, tmp_path: Path, monkeypatch):
        """A file nested below the safe root is writable."""
        safe_root = tmp_path / "workspace"
        child = safe_root / "subdir" / "file.txt"
        os.makedirs(child.parent, exist_ok=True)

        monkeypatch.setenv("HERMES_WRITE_SAFE_ROOT", str(safe_root))
        assert _is_write_denied(str(child)) is False

    def test_writes_to_safe_root_itself_are_allowed(self, tmp_path: Path, monkeypatch):
        """The safe root directory itself counts as inside the sandbox."""
        safe_root = tmp_path / "workspace"
        os.makedirs(safe_root, exist_ok=True)

        monkeypatch.setenv("HERMES_WRITE_SAFE_ROOT", str(safe_root))
        assert _is_write_denied(str(safe_root)) is False

    def test_writes_outside_safe_root_are_denied(self, tmp_path: Path, monkeypatch):
        """A sibling directory of the safe root is rejected."""
        safe_root = tmp_path / "workspace"
        outside = tmp_path / "other" / "file.txt"
        os.makedirs(safe_root, exist_ok=True)
        os.makedirs(outside.parent, exist_ok=True)

        monkeypatch.setenv("HERMES_WRITE_SAFE_ROOT", str(safe_root))
        assert _is_write_denied(str(outside)) is True

    def test_safe_root_env_ignores_empty_value(self, tmp_path: Path, monkeypatch):
        """An empty variable behaves like no sandbox at all."""
        target = tmp_path / "regular.txt"
        monkeypatch.setenv("HERMES_WRITE_SAFE_ROOT", "")
        assert _is_write_denied(str(target)) is False

    def test_safe_root_unset_allows_all(self, tmp_path: Path, monkeypatch):
        """With the variable removed, an ordinary path is writable."""
        target = tmp_path / "regular.txt"
        monkeypatch.delenv("HERMES_WRITE_SAFE_ROOT", raising=False)
        assert _is_write_denied(str(target)) is False

    def test_safe_root_with_tilde_expansion(self, tmp_path: Path, monkeypatch):
        """~ in HERMES_WRITE_SAFE_ROOT should be expanded."""
        # Re-home "~" onto tmp_path so a literal tilde value resolves to a
        # directory this test owns. os.path.expanduser reads HOME on POSIX
        # and USERPROFILE on Windows, so both are redirected.
        safe_root = tmp_path / "workspace"
        inside = safe_root / "file.txt"
        os.makedirs(safe_root, exist_ok=True)
        monkeypatch.setenv("HOME", str(tmp_path))
        monkeypatch.setenv("USERPROFILE", str(tmp_path))

        # Pass an actual tilde path. If the value were used unexpanded it
        # would not contain `inside`, and the write would be denied.
        monkeypatch.setenv("HERMES_WRITE_SAFE_ROOT", "~/workspace")
        assert _is_write_denied(str(inside)) is False

    def test_safe_root_does_not_override_static_deny(self, tmp_path: Path, monkeypatch):
        """Even if a static-denied path is inside the safe root, it's still denied."""
        # Point safe root at home to include ~/.ssh
        monkeypatch.setenv("HERMES_WRITE_SAFE_ROOT", os.path.expanduser("~"))
        assert _is_write_denied(os.path.expanduser("~/.ssh/id_rsa")) is True
|
|
|
|
|
|
class TestCheckSensitivePathMacOSBypass:
    """Verify _check_sensitive_path blocks /private/etc paths (issue #8734).

    The helper is imported inside each test, as in the original layout.
    A non-None result is treated as "blocked"; None as "allowed".
    """

    def test_etc_hosts_blocked(self):
        from tools.file_tools import _check_sensitive_path

        verdict = _check_sensitive_path("/etc/hosts")
        assert verdict is not None

    def test_private_etc_hosts_blocked(self):
        from tools.file_tools import _check_sensitive_path

        verdict = _check_sensitive_path("/private/etc/hosts")
        assert verdict is not None

    def test_private_etc_ssh_config_blocked(self):
        from tools.file_tools import _check_sensitive_path

        verdict = _check_sensitive_path("/private/etc/ssh/sshd_config")
        assert verdict is not None

    def test_private_var_blocked(self):
        from tools.file_tools import _check_sensitive_path

        verdict = _check_sensitive_path("/private/var/db/something")
        assert verdict is not None

    def test_boot_still_blocked(self):
        from tools.file_tools import _check_sensitive_path

        verdict = _check_sensitive_path("/boot/grub/grub.cfg")
        assert verdict is not None

    def test_safe_path_allowed(self):
        from tools.file_tools import _check_sensitive_path

        verdict = _check_sensitive_path("/tmp/safe_file.txt")
        assert verdict is None
|
|
|
|
|
|
class TestAtomicWrite:
    """write_file / patch land via a temp-file + atomic rename.

    The invariant: a write that fails partway NEVER corrupts the existing
    file, and the swap is a real rename (so a reader either sees the full
    old content or the full new content, never a half-written file). These
    run against a real LocalEnvironment so the actual shell script executes.
    """

    @pytest.fixture
    def ops(self, tmp_path: Path):
        """Return ShellFileOperations bound to a LocalEnvironment in tmp_path."""
        from tools.environments.local import LocalEnvironment
        from tools.file_operations import ShellFileOperations

        env = LocalEnvironment(cwd=str(tmp_path))
        return ShellFileOperations(env, cwd=str(tmp_path))

    def test_overwrite_changes_inode(self, ops, tmp_path: Path):
        # A real rename allocates a new inode for the target; an in-place
        # rewrite would keep the same inode. This proves the swap is atomic.
        target = tmp_path / "f.txt"
        target.write_text("v1")
        ino_before = os.stat(target).st_ino
        res = ops.write_file(str(target), "v2 content")
        assert res.error is None, res.error
        assert target.read_text() == "v2 content"
        assert os.stat(target).st_ino != ino_before

    def test_overwrite_preserves_mode(self, ops, tmp_path: Path):
        # The replacement file must carry over the original permission bits.
        target = tmp_path / "perms.txt"
        target.write_text("old")
        os.chmod(target, 0o640)
        res = ops.write_file(str(target), "new")
        assert res.error is None, res.error
        assert (os.stat(target).st_mode & 0o777) == 0o640

    def test_failed_write_leaves_original_intact(self, ops, tmp_path: Path):
        # A read-only parent directory means the temp file can't be created,
        # so the write fails BEFORE any rename. The original must survive
        # byte-for-byte and no temp file may be left behind.
        if hasattr(os, "geteuid") and os.geteuid() == 0:
            pytest.skip("root bypasses directory permission bits")
        locked = tmp_path / "locked"
        locked.mkdir()
        target = locked / "f.txt"
        target.write_text("ORIGINAL\n")
        os.chmod(locked, 0o500)  # r-x: cannot create entries inside
        try:
            res = ops.write_file(str(target), "SHOULD NOT LAND")
        finally:
            os.chmod(locked, 0o700)  # restore for cleanup
        assert res.error is not None
        assert target.read_text() == "ORIGINAL\n"
        assert [p for p in os.listdir(locked) if ".hermes-tmp" in p] == []

    def test_no_temp_file_leaked_on_success(self, ops, tmp_path: Path):
        target = tmp_path / "f.txt"
        res = ops.write_file(str(target), "hello\n")
        # Confirm the write really succeeded; otherwise the leak check below
        # would pass vacuously when write_file fails before creating anything.
        assert res.error is None, res.error
        assert [p for p in os.listdir(tmp_path) if ".hermes-tmp" in p] == []

    def test_special_chars_roundtrip(self, ops, tmp_path: Path):
        # Shell metacharacters and non-ASCII text must land on disk unchanged.
        target = tmp_path / "special.txt"
        tricky = "q 'single' \"double\" $VAR `cmd` \\back\nünïcödé 日本語\n"
        res = ops.write_file(str(target), tricky)
        assert res.error is None, res.error
        assert target.read_text(encoding="utf-8") == tricky

    def test_patch_routes_through_atomic_write(self, ops, tmp_path: Path):
        # A patch must apply the edit and keep the file's permission bits.
        target = tmp_path / "edit.py"
        target.write_text("a = 1\nb = 2\nc = 3\n")
        os.chmod(target, 0o600)
        res = ops.patch_replace(str(target), "b = 2", "b = 22")
        assert res.success, res.error
        assert target.read_text() == "a = 1\nb = 22\nc = 3\n"
        assert (os.stat(target).st_mode & 0o777) == 0o600
|
|
|
|
|
|
class TestBomHandling:
    """A UTF-8 BOM is hidden from reads and kept across write/patch.

    The BOM (U+FEFF, bytes EF BB BF) is an invisible marker that some
    Windows editors put at the very start of a file. Read output must not
    expose it, yet a file that carried one on disk must still carry exactly
    one after an edit so its byte signature does not change.
    """

    BOM = "\ufeff"

    @pytest.fixture
    def ops(self, tmp_path: Path):
        """Return ShellFileOperations bound to a LocalEnvironment in tmp_path."""
        from tools.environments.local import LocalEnvironment
        from tools.file_operations import ShellFileOperations

        workdir = str(tmp_path)
        return ShellFileOperations(LocalEnvironment(cwd=workdir), cwd=workdir)

    def test_helpers(self):
        from tools.file_operations import _strip_bom, _has_bom

        # (input, expected) pairs for _strip_bom. The last entry has the
        # BOM mid-string, where it is data rather than a marker.
        strip_cases = [
            ("\ufeffhello", ("hello", True)),
            ("hello", ("hello", False)),
            ("", ("", False)),
            ("a\ufeffb", ("a\ufeffb", False)),
        ]
        for raw, expected in strip_cases:
            assert _strip_bom(raw) == expected

        has_cases = [("\ufeffx", True), ("x", False), (None, False)]
        for candidate, expected in has_cases:
            assert _has_bom(candidate) is expected

    def test_read_strips_bom(self, ops, tmp_path: Path):
        bom_bytes = self.BOM.encode("utf-8")
        target = tmp_path / "bom.py"
        # Put a real UTF-8 BOM prefix on disk as raw bytes.
        target.write_bytes(bom_bytes + b"import os\nx = 1\n")
        res = ops.read_file(str(target))
        assert res.error is None, res.error
        # The first line must not contain the phantom U+FEFF.
        first_line = res.content.partition("\n")[0]
        assert self.BOM not in first_line
        assert first_line.endswith("import os")

    def test_read_raw_strips_bom(self, ops, tmp_path: Path):
        bom_bytes = self.BOM.encode("utf-8")
        target = tmp_path / "bom.txt"
        target.write_bytes(bom_bytes + b"hello\nworld\n")
        res = ops.read_file_raw(str(target))
        assert res.error is None, res.error
        assert not res.content.startswith(self.BOM)
        assert res.content == "hello\nworld\n"

    def test_write_preserves_bom(self, ops, tmp_path: Path):
        # The file on disk has a BOM; the replacement content does not.
        bom_bytes = self.BOM.encode("utf-8")
        target = tmp_path / "config.txt"
        target.write_bytes(bom_bytes + b"old\n")
        res = ops.write_file(str(target), "new content\n")
        assert res.error is None, res.error
        on_disk = target.read_bytes()
        assert on_disk.startswith(bom_bytes)  # BOM restored
        assert on_disk == bom_bytes + b"new content\n"

    def test_write_no_bom_when_original_had_none(self, ops, tmp_path: Path):
        bom_bytes = self.BOM.encode("utf-8")
        target = tmp_path / "plain.txt"
        target.write_text("old\n")
        res = ops.write_file(str(target), "new\n")
        assert res.error is None, res.error
        assert not target.read_bytes().startswith(bom_bytes)

    def test_write_does_not_double_bom(self, ops, tmp_path: Path):
        # Both the file and the new content carry a BOM: the result must
        # still contain exactly one.
        bom_bytes = self.BOM.encode("utf-8")
        target = tmp_path / "config.txt"
        target.write_bytes(bom_bytes + b"old\n")
        res = ops.write_file(str(target), self.BOM + "new\n")
        assert res.error is None, res.error
        on_disk = target.read_bytes()
        assert on_disk == bom_bytes + b"new\n"

    def test_patch_roundtrip_preserves_bom(self, ops, tmp_path: Path):
        bom_bytes = self.BOM.encode("utf-8")
        target = tmp_path / "edit.py"
        target.write_bytes(bom_bytes + b"a = 1\nb = 2\nc = 3\n")
        res = ops.patch_replace(str(target), "b = 2", "b = 22")
        assert res.success, res.error
        on_disk = target.read_bytes()
        assert on_disk.startswith(bom_bytes)  # marker survived
        assert on_disk == bom_bytes + b"a = 1\nb = 22\nc = 3\n"

    def test_patch_matches_first_line_through_bom(self, ops, tmp_path: Path):
        # Key scenario: an edit aimed at the BOM-prefixed first line has to
        # match cleanly, and the BOM must still be present afterwards.
        bom_bytes = self.BOM.encode("utf-8")
        target = tmp_path / "mod.py"
        target.write_bytes(bom_bytes + b"import os\nimport sys\n")
        res = ops.patch_replace(str(target), "import os", "import os, json")
        assert res.success, res.error
        on_disk = target.read_bytes()
        assert on_disk == bom_bytes + b"import os, json\nimport sys\n"
|
|
|
|
|
|
if __name__ == "__main__":
    # Propagate pytest's exit status so that running this file directly
    # reports failures to the shell instead of always exiting 0.
    raise SystemExit(pytest.main([__file__, "-v"]))
|