mirror of
https://github.com/bytedance/deer-flow.git
synced 2026-06-09 17:12:01 +00:00
* fix(agents): harden update_agent null-like args * docs: mention undefined null-like update args --------- Co-authored-by: Willem Jiang <willem.jiang@gmail.com>
384 lines
15 KiB
Python
384 lines
15 KiB
Python
"""Tests for update_agent tool — partial updates, atomic writes, and validation.
|
|
|
|
Resolves issue #2616: a custom agent must be able to persist updates to its
|
|
own SOUL.md / config.yaml from inside a normal chat (not only from bootstrap).
|
|
|
|
The tool writes per-user (``{base_dir}/users/{user_id}/agents/{name}/``) so
|
|
that one user's update cannot mutate another user's agent.
|
|
"""
|
|
|
|
from __future__ import annotations
|
|
|
|
from pathlib import Path
|
|
from types import SimpleNamespace
|
|
from unittest.mock import MagicMock, patch
|
|
|
|
import pytest
|
|
import yaml
|
|
from langchain.tools import ToolRuntime
|
|
|
|
from deerflow.config.agents_config import AgentConfig
|
|
from deerflow.tools.builtins.update_agent_tool import update_agent
|
|
|
|
# User id the path/seed helpers in this module default to.
# Matches the autouse fixture in tests/conftest.py.
DEFAULT_USER = "test-user-autouse"
|
|
|
|
|
|
class _DummyRuntime(SimpleNamespace):
    """Namespace-based stand-in for the runtime object handed to ``update_agent.func``.

    Instances are built with keyword arguments; the annotations below only
    document the two attributes the helpers in this module populate.
    """

    # Identifier of the tool call being simulated.
    tool_call_id: str
    # Runtime context mapping (may carry an ``agent_name`` key).
    context: dict
|
|
|
|
|
|
def _runtime(agent_name: str | None = "test-agent", tool_call_id: str = "call_1") -> _DummyRuntime:
    """Return a ``_DummyRuntime`` for calling ``update_agent.func`` directly.

    When *agent_name* is ``None`` the context is left empty; otherwise it
    holds a single ``agent_name`` entry.
    """
    if agent_name is None:
        ctx = {}
    else:
        ctx = {"agent_name": agent_name}
    return _DummyRuntime(context=ctx, tool_call_id=tool_call_id)
|
|
|
|
|
|
def _tool_runtime(agent_name: str | None = "test-agent", tool_call_id: str = "call_1") -> ToolRuntime:
    """Return a real ``ToolRuntime`` for tests that go through ``update_agent.invoke``.

    The context is empty when *agent_name* is ``None`` and otherwise holds a
    single ``agent_name`` entry; every other field is a fixed placeholder.
    """
    ctx = {} if agent_name is None else {"agent_name": agent_name}
    runtime_kwargs = {
        "state": {"sandbox": {"sandbox_id": "local"}, "thread_data": {}},
        "context": ctx,
        "config": {"configurable": {"thread_id": "thread-1"}},
        "stream_writer": lambda _: None,  # discard anything streamed
        "tools": [],
        "tool_call_id": tool_call_id,
        "store": None,
    }
    return ToolRuntime(**runtime_kwargs)
|
|
|
|
|
|
def _make_paths_mock(tmp_path: Path) -> MagicMock:
    """Build a ``MagicMock`` paths object whose locations all live under *tmp_path*.

    Layout exposed by the mock:

    * ``base_dir``                     -> ``tmp_path``
    * ``agents_dir``                   -> ``tmp_path/agents``
    * ``agent_dir(name)``              -> ``tmp_path/agents/<name>``
    * ``user_agents_dir(user_id)``     -> ``tmp_path/users/<user_id>/agents``
    * ``user_agent_dir(user_id, name)``-> ``tmp_path/users/<user_id>/agents/<name>``
    """
    agents_root = tmp_path / "agents"
    users_root = tmp_path / "users"

    def _agent_dir(name):
        return agents_root / name

    def _user_agents_dir(user_id):
        return users_root / user_id / "agents"

    def _user_agent_dir(user_id, name):
        return users_root / user_id / "agents" / name

    mock_paths = MagicMock()
    mock_paths.base_dir = tmp_path
    mock_paths.agents_dir = agents_root
    mock_paths.agent_dir = _agent_dir
    mock_paths.user_agents_dir = _user_agents_dir
    mock_paths.user_agent_dir = _user_agent_dir
    return mock_paths
|
|
|
|
|
|
def _user_agent_dir(tmp_path: Path, name: str = "test-agent", user_id: str = DEFAULT_USER) -> Path:
    """Return ``tmp_path/users/<user_id>/agents/<name>`` (the path is not created)."""
    user_agents_root = tmp_path / "users" / user_id / "agents"
    return user_agents_root / name
|
|
|
|
|
|
def _seed_agent(
    tmp_path: Path,
    name: str = "test-agent",
    *,
    description: str = "old desc",
    soul: str = "old soul",
    skills: list[str] | None = None,
    user_id: str = DEFAULT_USER,
) -> Path:
    """Write a baseline ``config.yaml`` and ``SOUL.md`` for tests to mutate.

    The agent directory is resolved with ``_user_agent_dir`` and created if
    missing. ``skills`` is only written to ``config.yaml`` when it is not
    ``None``. Both files are written as UTF-8.

    Returns:
        The agent directory that was seeded.
    """
    target_dir = _user_agent_dir(tmp_path, name, user_id=user_id)
    target_dir.mkdir(parents=True, exist_ok=True)

    # Key order matters because the dump below keeps insertion order.
    optional_fields = {} if skills is None else {"skills": skills}
    config: dict = {"name": name, "description": description, **optional_fields}

    config_yaml = yaml.safe_dump(config, sort_keys=False)
    (target_dir / "config.yaml").write_text(config_yaml, encoding="utf-8")
    (target_dir / "SOUL.md").write_text(soul, encoding="utf-8")
    return target_dir
|
|
|
|
|
|
@pytest.fixture()
def patched_paths(tmp_path: Path):
    """Patch ``get_paths`` in both the tool module and the agents-config module.

    Yields the shared paths mock rooted at *tmp_path*; both patches are
    undone when the fixture is torn down.
    """
    fake_paths = _make_paths_mock(tmp_path)
    tool_patch = patch("deerflow.tools.builtins.update_agent_tool.get_paths", return_value=fake_paths)
    # load_agent_config also calls get_paths(); patch the same target it uses.
    loader_patch = patch("deerflow.config.agents_config.get_paths", return_value=fake_paths)
    with tool_patch, loader_patch:
        yield fake_paths
|
|
|
|
|
|
@pytest.fixture()
def stub_app_config():
    """Stub ``get_app_config`` so model validation accepts only known names.

    The stub's ``get_model_config`` returns a placeholder object for
    ``"gpt-known"`` and ``"m1"`` and ``None`` for any other name.
    """
    known_models = {"gpt-known", "m1"}

    def _lookup(name):
        if name in known_models:
            return object()
        return None

    app_config = MagicMock()
    app_config.get_model_config.side_effect = _lookup
    with patch("deerflow.tools.builtins.update_agent_tool.get_app_config", return_value=app_config):
        yield app_config
|
|
|
|
|
|
# --- Validation tests ---
|
|
|
|
|
|
def test_update_agent_rejects_missing_agent_name(patched_paths):
    """A runtime context without ``agent_name`` yields the custom-agent-only message."""
    anonymous_runtime = _runtime(agent_name=None)

    outcome = update_agent.func(runtime=anonymous_runtime, soul="new soul")

    first_message = outcome.update["messages"][0]
    assert "only available inside a custom agent's chat" in first_message.content
|
|
|
|
|
|
def test_update_agent_rejects_invalid_agent_name(patched_paths):
    """A path-traversal style agent name is reported as invalid."""
    traversal_runtime = _runtime(agent_name="../../etc/passwd")

    outcome = update_agent.func(runtime=traversal_runtime, soul="x")

    first_message = outcome.update["messages"][0]
    assert "Invalid agent name" in first_message.content
|
|
|
|
|
|
def test_update_agent_rejects_unknown_agent(tmp_path, patched_paths):
    """Updating an agent that was never seeded fails and creates no directory."""
    ghost_runtime = _runtime(agent_name="ghost")

    outcome = update_agent.func(runtime=ghost_runtime, soul="x")

    first_message = outcome.update["messages"][0]
    assert "does not exist" in first_message.content
    ghost_dir = _user_agent_dir(tmp_path, "ghost")
    assert not ghost_dir.exists()
|
|
|
|
|
|
def test_update_agent_requires_at_least_one_field(tmp_path, patched_paths):
    """Calling the tool with no update fields returns an error-status message."""
    _seed_agent(tmp_path)

    outcome = update_agent.func(runtime=_runtime())

    first_message = outcome.update["messages"][0]
    assert first_message.status == "error"
    assert "No fields provided" in first_message.content
|
|
|
|
|
|
def test_update_agent_rejects_unknown_model(tmp_path, patched_paths, stub_app_config):
    """Copilot review: model must be validated against configured models before
    being persisted; otherwise _resolve_model_name silently falls back to the
    default and the user gets repeated warnings on every later turn."""
    _seed_agent(tmp_path)

    result = update_agent.func(runtime=_runtime(), model="not-in-config")

    msg = result.update["messages"][0]
    assert "Unknown model" in msg.content
    # Decode explicitly: the fixture is seeded as UTF-8, so do not depend on the locale default.
    config_text = (_user_agent_dir(tmp_path) / "config.yaml").read_text(encoding="utf-8")
    cfg = yaml.safe_load(config_text)
    assert "model" not in cfg, "Invalid model must not have been written to config.yaml"
|
|
|
|
|
|
def test_update_agent_accepts_known_model(tmp_path, patched_paths, stub_app_config):
    """A model name the stubbed app config knows is written to config.yaml and
    mentioned in the returned message."""
    _seed_agent(tmp_path)

    result = update_agent.func(runtime=_runtime(), model="gpt-known")

    # Decode explicitly instead of relying on the locale's default encoding.
    config_text = (_user_agent_dir(tmp_path) / "config.yaml").read_text(encoding="utf-8")
    cfg = yaml.safe_load(config_text)
    assert cfg["model"] == "gpt-known"
    assert "model" in result.update["messages"][0].content
|
|
|
|
|
|
def test_update_agent_treats_nullish_optional_text_as_omitted(tmp_path, patched_paths):
    """Models sometimes pass literal "null" strings while trying to omit fields.

    Treat those as omitted for optional text fields so they do not get persisted
    as a model name or SOUL.md content and feed repeated update_agent retries.
    """
    agent_dir = _seed_agent(tmp_path, description="old desc", soul="old soul")

    result = update_agent.invoke(
        {
            "runtime": _tool_runtime(),
            "soul": "null",
            "description": "none",
            "model": "undefined",
        }
    )

    msg = result.update["messages"][0]
    assert "No fields provided" in msg.content
    assert msg.status == "error"

    # The seeded files are UTF-8; read them back with the same encoding.
    cfg = yaml.safe_load((agent_dir / "config.yaml").read_text(encoding="utf-8"))
    assert cfg["description"] == "old desc"
    assert "model" not in cfg
    assert (agent_dir / "SOUL.md").read_text(encoding="utf-8") == "old soul"
|
|
|
|
|
|
def test_update_agent_rejects_string_list_fields(tmp_path, patched_paths):
    """skills/tool_groups must be real arrays; string placeholders are invalid."""
    agent_dir = _seed_agent(tmp_path, skills=["existing"])

    assert update_agent.args_schema is not None
    with pytest.raises(ValueError, match="skills"):
        update_agent.args_schema.model_validate({"skills": "alpha,beta"})

    # The seeded config is UTF-8; read it back with the same encoding.
    cfg = yaml.safe_load((agent_dir / "config.yaml").read_text(encoding="utf-8"))
    assert cfg["skills"] == ["existing"]
|
|
|
|
|
|
def test_update_agent_treats_nullish_string_list_fields_as_omitted(tmp_path, patched_paths):
    """Null-like strings for ``skills`` / ``tool_groups`` count as "not provided".

    With nothing else supplied the tool reports "No fields provided" and the
    seeded config.yaml is left as it was.
    """
    agent_dir = _seed_agent(tmp_path, skills=["existing"])

    result = update_agent.invoke(
        {
            "runtime": _tool_runtime(),
            "skills": "null",
            "tool_groups": "none",
        }
    )

    msg = result.update["messages"][0]
    assert "No fields provided" in msg.content
    assert msg.status == "error"

    # The seeded config is UTF-8; read it back with the same encoding.
    cfg = yaml.safe_load((agent_dir / "config.yaml").read_text(encoding="utf-8"))
    assert cfg["skills"] == ["existing"]
    assert "tool_groups" not in cfg
|
|
|
|
|
|
# --- Partial update tests ---
|
|
|
|
|
|
def test_update_agent_updates_soul_only(tmp_path, patched_paths):
    """Passing only ``soul`` rewrites SOUL.md and keeps the existing description."""
    agent_dir = _seed_agent(tmp_path, description="keep me", soul="old soul")

    result = update_agent.func(runtime=_runtime(), soul="brand new soul")

    # Decode explicitly instead of relying on the locale's default encoding.
    assert (agent_dir / "SOUL.md").read_text(encoding="utf-8") == "brand new soul"
    cfg = yaml.safe_load((agent_dir / "config.yaml").read_text(encoding="utf-8"))
    assert cfg["description"] == "keep me", "description must be preserved"
    assert "soul" in result.update["messages"][0].content
|
|
|
|
|
|
def test_update_agent_updates_description_only(tmp_path, patched_paths):
    """Passing only ``description`` rewrites config.yaml and keeps SOUL.md as seeded."""
    agent_dir = _seed_agent(tmp_path, description="old desc", soul="keep this soul")

    result = update_agent.func(runtime=_runtime(), description="new desc")

    # Decode explicitly instead of relying on the locale's default encoding.
    cfg = yaml.safe_load((agent_dir / "config.yaml").read_text(encoding="utf-8"))
    assert cfg["description"] == "new desc"
    assert (agent_dir / "SOUL.md").read_text(encoding="utf-8") == "keep this soul", "SOUL.md must be preserved"
    assert "description" in result.update["messages"][0].content
|
|
|
|
|
|
def test_update_agent_skills_empty_list_disables_all(tmp_path, patched_paths):
    """An explicit empty ``skills`` list is persisted as ``[]``, not treated as omitted."""
    agent_dir = _seed_agent(tmp_path, skills=["a", "b"])

    result = update_agent.func(runtime=_runtime(), skills=[])

    # Decode explicitly instead of relying on the locale's default encoding.
    cfg = yaml.safe_load((agent_dir / "config.yaml").read_text(encoding="utf-8"))
    assert cfg["skills"] == [], "empty list must persist as empty list (not be omitted)"
    assert "skills" in result.update["messages"][0].content
|
|
|
|
|
|
def test_update_agent_skills_omitted_keeps_existing(tmp_path, patched_paths):
    """Updating another field without passing ``skills`` leaves the seeded list intact."""
    agent_dir = _seed_agent(tmp_path, skills=["alpha", "beta"])

    update_agent.func(runtime=_runtime(), description="bumped")

    # Decode explicitly instead of relying on the locale's default encoding.
    cfg = yaml.safe_load((agent_dir / "config.yaml").read_text(encoding="utf-8"))
    assert cfg["skills"] == ["alpha", "beta"], "omitting skills must preserve the existing whitelist"
|
|
|
|
|
|
def test_update_agent_no_op_when_values_match_existing(tmp_path, patched_paths):
    """Re-submitting the description already on disk is reported as "No changes applied"."""
    unchanged_description = "same"
    _seed_agent(tmp_path, description=unchanged_description)

    outcome = update_agent.func(runtime=_runtime(), description=unchanged_description)

    first_message = outcome.update["messages"][0]
    assert "No changes applied" in first_message.content
|
|
|
|
|
|
def test_update_agent_forces_name_to_directory(tmp_path, patched_paths):
    """Copilot review: if the existing config.yaml has a drifted ``name`` field,
    update_agent must rewrite it to match the directory name so on-disk state
    stays consistent with the runtime context."""
    agent_dir = _user_agent_dir(tmp_path)
    agent_dir.mkdir(parents=True)
    # Seed by hand (not via _seed_agent) so ``name`` can disagree with the directory.
    drifted_yaml = yaml.safe_dump({"name": "drifted-name", "description": "old"}, sort_keys=False)
    (agent_dir / "config.yaml").write_text(drifted_yaml, encoding="utf-8")
    (agent_dir / "SOUL.md").write_text("soul", encoding="utf-8")

    update_agent.func(runtime=_runtime(), description="bumped")

    # Read back with the same encoding the fixture was written in.
    cfg = yaml.safe_load((agent_dir / "config.yaml").read_text(encoding="utf-8"))
    assert cfg["name"] == "test-agent", "config.yaml name must follow the directory name, not legacy yaml content"
|
|
|
|
|
|
# --- Atomicity tests ---
|
|
|
|
|
|
def test_update_agent_failure_preserves_existing_files(tmp_path, patched_paths):
    """A failing rename onto SOUL.md leaves the original file and no ``*.tmp`` files.

    ``Path.replace`` is patched to raise ``OSError`` whenever the target ends
    with ``SOUL.md``; every other replace is delegated to the real method.
    """
    agent_dir = _seed_agent(tmp_path, soul="original soul")

    # Capture the real method before patching so other targets still work.
    real_replace = Path.replace

    def _explode(self, target):
        if str(target).endswith("SOUL.md"):
            raise OSError("disk full")
        return real_replace(self, target)

    with patch.object(Path, "replace", _explode):
        result = update_agent.func(runtime=_runtime(), soul="poisoned content")

    # The seeded SOUL.md is UTF-8; read it back with the same encoding.
    assert (agent_dir / "SOUL.md").read_text(encoding="utf-8") == "original soul", "atomic write must not corrupt existing SOUL.md"
    assert "Error" in result.update["messages"][0].content
    leftover_tmps = list(agent_dir.glob("*.tmp"))
    assert leftover_tmps == [], "temp files must be cleaned up on failure"
|
|
|
|
|
|
def test_update_agent_soul_failure_does_not_replace_config(tmp_path, patched_paths):
    """Copilot review: if both config.yaml and SOUL.md are scheduled to be
    written and SOUL.md staging fails *before* any rename, config.yaml must
    NOT be replaced. The fix stages every temp file first and only renames
    after all temps exist on disk."""
    import tempfile

    agent_dir = _seed_agent(tmp_path, description="original-desc", soul="original soul")

    # Capture the real factory before the patch below swaps the module attribute.
    real_named_temp_file = tempfile.NamedTemporaryFile
    staged_calls = 0

    def _explode_on_soul(*args, **kwargs):
        # Purely call-count based: the first temp file is created for real and
        # every later request fails. This assumes SOUL.md is staged second.
        nonlocal staged_calls
        staged_calls += 1
        if staged_calls >= 2:
            raise OSError("disk full while staging SOUL.md")
        return real_named_temp_file(*args, **kwargs)

    with patch("deerflow.tools.builtins.update_agent_tool.tempfile.NamedTemporaryFile", side_effect=_explode_on_soul):
        result = update_agent.func(runtime=_runtime(), description="new-desc", soul="new soul")

    # The seeded files are UTF-8; read them back with the same encoding.
    cfg = yaml.safe_load((agent_dir / "config.yaml").read_text(encoding="utf-8"))
    assert cfg["description"] == "original-desc", "config.yaml must not be replaced when SOUL.md staging fails"
    assert (agent_dir / "SOUL.md").read_text(encoding="utf-8") == "original soul"
    assert "Error" in result.update["messages"][0].content
    assert list(agent_dir.glob("*.tmp")) == [], "staged config.yaml temp must be cleaned up on SOUL.md failure"
|
|
|
|
|
|
# --- Per-user isolation ---
|
|
|
|
|
|
def test_update_agent_only_writes_under_current_user(tmp_path, patched_paths):
    """An update from user 'alice' must never touch user 'bob's agent files."""
    from deerflow.runtime.user_context import reset_current_user, set_current_user

    # Seed an agent for both users with the same name.
    alice_dir = _seed_agent(tmp_path, name="shared", description="alice-desc", soul="alice soul", user_id="alice")
    bob_dir = _seed_agent(tmp_path, name="shared", description="bob-desc", soul="bob soul", user_id="bob")

    # Override the autouse contextvar so update_agent runs as Alice.
    token = set_current_user(SimpleNamespace(id="alice"))
    try:
        update_agent.func(runtime=_runtime(agent_name="shared"), description="alice-bumped")
    finally:
        # Always restore the previous user, even if the tool call raises.
        reset_current_user(token)

    # The seeded files are UTF-8; read them back with the same encoding.
    alice_cfg = yaml.safe_load((alice_dir / "config.yaml").read_text(encoding="utf-8"))
    bob_cfg = yaml.safe_load((bob_dir / "config.yaml").read_text(encoding="utf-8"))
    assert alice_cfg["description"] == "alice-bumped"
    assert bob_cfg["description"] == "bob-desc", "bob's config.yaml must not have been touched"
    assert (bob_dir / "SOUL.md").read_text(encoding="utf-8") == "bob soul"
|
|
|
|
|
|
# --- Loader passthrough sanity check ---
|
|
|
|
|
|
def test_update_agent_round_trips_known_fields(tmp_path, patched_paths):
    """update_agent reads through load_agent_config so all fields the loader
    knows about (name, description, model, tool_groups, skills) round-trip
    on a partial update.

    Note: ``load_agent_config`` strips unknown fields before constructing
    AgentConfig, so legacy/extra YAML keys are NOT preserved across
    updates — by design.
    """
    _seed_agent(tmp_path, description="legacy")

    fake_cfg = AgentConfig(name="test-agent", description="legacy", skills=["s1"], tool_groups=["g1"], model="m1")
    fake_app_config = MagicMock()
    # Accept any model name so the pre-existing "m1" passes validation.
    fake_app_config.get_model_config.return_value = object()

    loader_patch = patch("deerflow.tools.builtins.update_agent_tool.load_agent_config", return_value=fake_cfg)
    app_config_patch = patch("deerflow.tools.builtins.update_agent_tool.get_app_config", return_value=fake_app_config)
    with loader_patch, app_config_patch:
        update_agent.func(runtime=_runtime(), description="bumped")

    # Decode explicitly instead of relying on the locale's default encoding.
    config_text = (_user_agent_dir(tmp_path) / "config.yaml").read_text(encoding="utf-8")
    cfg = yaml.safe_load(config_text)
    assert cfg["description"] == "bumped"
    assert cfg["skills"] == ["s1"]
    assert cfg["tool_groups"] == ["g1"]
    assert cfg["model"] == "m1"
|