Merge remote-tracking branch 'origin/main' into pr-1090

2026-02-24 11:31:40 +00:00
parent 4f8033627e cd5a8ac03d
commit 04218276ab
6 changed files with 281 additions and 75 deletions
--- a/nanobot/agent/memory.py
+++ b/nanobot/agent/memory.py
@@ -125,6 +125,13 @@ class MemoryStore:
                return False
            args = response.tool_calls[0].arguments
            # Some providers return arguments as a JSON string instead of dict
            if isinstance(args, str):
                args = json.loads(args)
            if not isinstance(args, dict):
                logger.warning("Memory consolidation: unexpected arguments type {}", type(args).__name__)
                return False
            if entry := args.get("history_entry"):
                if not isinstance(entry, str):
                    entry = json.dumps(entry, ensure_ascii=False)
--- a/nanobot/agent/tools/web.py
+++ b/nanobot/agent/tools/web.py
@@ -58,12 +58,17 @@ class WebSearchTool(Tool):
    }
    def __init__(self, api_key: str | None = None, max_results: int = 5):
-        self.api_key = api_key or os.environ.get("BRAVE_API_KEY", "")
+        self.api_key = api_key
        self.max_results = max_results
    async def execute(self, query: str, count: int | None = None, **kwargs: Any) -> str:
-        if not self.api_key:
+        api_key = self.api_key or os.environ.get("BRAVE_API_KEY", "")
-            return "Error: BRAVE_API_KEY not configured"
+        if not api_key:
            return (
                "Error: Brave Search API key not configured. "
                "Set it in ~/.nanobot/config.json under tools.web.search.apiKey "
                "(or export BRAVE_API_KEY), then restart the gateway."
            )
        try:
            n = min(max(count or self.max_results, 1), 10)
@@ -71,7 +76,7 @@ class WebSearchTool(Tool):
                r = await client.get(
                    "https://api.search.brave.com/res/v1/web/search",
                    params={"q": query, "count": n},
-                    headers={"Accept": "application/json", "X-Subscription-Token": self.api_key},
+                    headers={"Accept": "application/json", "X-Subscription-Token": api_key},
                    timeout=10.0
                )
                r.raise_for_status()
--- a/nanobot/cli/commands.py
+++ b/nanobot/cli/commands.py
@@ -360,19 +360,19 @@ def gateway(
        return "cli", "direct"
    # Create heartbeat service
-    async def on_heartbeat(prompt: str) -> str:
+    async def on_heartbeat_execute(tasks: str) -> str:
-        """Execute heartbeat through the agent."""
+        """Phase 2: execute heartbeat tasks through the full agent loop."""
        channel, chat_id = _pick_heartbeat_target()
        async def _silent(*_args, **_kwargs):
            pass
        return await agent.process_direct(
-            prompt,
+            tasks,
            session_key="heartbeat",
            channel=channel,
            chat_id=chat_id,
-            on_progress=_silent,  # suppress: heartbeat should not push progress to external channels
+            on_progress=_silent,
        )
    async def on_heartbeat_notify(response: str) -> None:
@@ -383,12 +383,15 @@ def gateway(
            return  # No external channel available to deliver to
        await bus.publish_outbound(OutboundMessage(channel=channel, chat_id=chat_id, content=response))
    hb_cfg = config.gateway.heartbeat
    heartbeat = HeartbeatService(
        workspace=config.workspace_path,
-        on_heartbeat=on_heartbeat,
+        provider=provider,
        model=agent.model,
        on_execute=on_heartbeat_execute,
        on_notify=on_heartbeat_notify,
-        interval_s=30 * 60,  # 30 minutes
+        interval_s=hb_cfg.interval_s,
-        enabled=True
+        enabled=hb_cfg.enabled,
    )
    if channels.enabled_channels:
--- a/nanobot/config/schema.py
+++ b/nanobot/config/schema.py
@@ -228,11 +228,19 @@ class ProvidersConfig(Base):
    github_copilot: ProviderConfig = Field(default_factory=ProviderConfig)  # Github Copilot (OAuth)
 class HeartbeatConfig(Base):
    """Heartbeat service configuration.

    The gateway command reads these values and passes them to
    ``HeartbeatService`` as its ``enabled`` and ``interval_s`` arguments.
    """
    # Whether the heartbeat service is enabled (on by default).
    enabled: bool = True
    # Heartbeat interval, in seconds.
    interval_s: int = 30 * 60  # 30 minutes
 class GatewayConfig(Base):
    """Gateway/server configuration."""
    # Host for the gateway; presumably the bind address (0.0.0.0 = all IPv4
    # interfaces) -- TODO confirm against the server startup code.
    host: str = "0.0.0.0"
    # Port for the gateway; presumably the listen port -- TODO confirm.
    port: int = 18790
    # Nested heartbeat settings; default_factory builds a HeartbeatConfig with
    # its own defaults when the section is not supplied.
    heartbeat: HeartbeatConfig = Field(default_factory=HeartbeatConfig)
 class WebSearchConfig(Base):
--- a/nanobot/heartbeat/service.py
+++ b/nanobot/heartbeat/service.py
@@ -1,61 +1,69 @@
 """Heartbeat service - periodic agent wake-up to check for tasks."""
 from __future__ import annotations
 import asyncio
 from pathlib import Path
-from typing import Any, Callable, Coroutine
+from typing import TYPE_CHECKING, Any, Callable, Coroutine
 from loguru import logger
-# Default interval: 30 minutes
+if TYPE_CHECKING:
-DEFAULT_HEARTBEAT_INTERVAL_S = 30 * 60
+    from nanobot.providers.base import LLMProvider
-# Token the agent replies with when there is nothing to report
+_HEARTBEAT_TOOL = [
-HEARTBEAT_OK_TOKEN = "HEARTBEAT_OK"
+    {
-
+        "type": "function",
-# The prompt sent to agent during heartbeat
+        "function": {
-HEARTBEAT_PROMPT = (
+            "name": "heartbeat",
-    "Read HEARTBEAT.md in your workspace and follow any instructions listed there. "
+            "description": "Report heartbeat decision after reviewing tasks.",
-    f"If nothing needs attention, reply with exactly: {HEARTBEAT_OK_TOKEN}"
+            "parameters": {
-)
+                "type": "object",
-
+                "properties": {
-
+                    "action": {
-def _is_heartbeat_empty(content: str | None) -> bool:
+                        "type": "string",
-    """Check if HEARTBEAT.md has no actionable content."""
+                        "enum": ["skip", "run"],
-    if not content:
+                        "description": "skip = nothing to do, run = has active tasks",
-        return True
+                    },
-    
+                    "tasks": {
-    # Lines to skip: empty, headers, HTML comments, empty checkboxes
+                        "type": "string",
-    skip_patterns = {"- [ ]", "* [ ]", "- [x]", "* [x]"}
+                        "description": "Natural-language summary of active tasks (required for run)",
-    
+                    },
-    for line in content.split("\n"):
+                },
-        line = line.strip()
+                "required": ["action"],
-        if not line or line.startswith("#") or line.startswith("<!--") or line in skip_patterns:
+            },
-            continue
+        },
-        return False  # Found actionable content
+    }
-    
+]
    return True
 class HeartbeatService:
    """
    Periodic heartbeat service that wakes the agent to check for tasks.
-    The agent reads HEARTBEAT.md from the workspace and executes any tasks
+    Phase 1 (decision): reads HEARTBEAT.md and asks the LLM — via a virtual
-    listed there. If it has something to report, the response is forwarded
+    tool call — whether there are active tasks.  This avoids free-text parsing
-    to the user via on_notify. If nothing needs attention, the agent replies
+    and the unreliable HEARTBEAT_OK token.
-    HEARTBEAT_OK and the response is silently dropped.
+
    Phase 2 (execution): only triggered when Phase 1 returns ``run``.  The
    ``on_execute`` callback runs the task through the full agent loop and
    returns the result to deliver.
    """
    def __init__(
        self,
        workspace: Path,
-        on_heartbeat: Callable[[str], Coroutine[Any, Any, str]] | None = None,
+        provider: LLMProvider,
        model: str,
        on_execute: Callable[[str], Coroutine[Any, Any, str]] | None = None,
        on_notify: Callable[[str], Coroutine[Any, Any, None]] | None = None,
-        interval_s: int = DEFAULT_HEARTBEAT_INTERVAL_S,
+        interval_s: int = 30 * 60,
        enabled: bool = True,
    ):
        self.workspace = workspace
-        self.on_heartbeat = on_heartbeat
+        self.provider = provider
        self.model = model
        self.on_execute = on_execute
        self.on_notify = on_notify
        self.interval_s = interval_s
        self.enabled = enabled
@@ -67,7 +75,6 @@ class HeartbeatService:
        return self.workspace / "HEARTBEAT.md"
    def _read_heartbeat_file(self) -> str | None:
        """Read HEARTBEAT.md content."""
        if self.heartbeat_file.exists():
            try:
                return self.heartbeat_file.read_text(encoding="utf-8")
@@ -75,6 +82,29 @@ class HeartbeatService:
                return None
        return None
    async def _decide(self, content: str) -> tuple[str, str]:
        """Phase 1: ask the LLM to decide skip/run via a virtual tool call.

        Args:
            content: Text of HEARTBEAT.md to be reviewed by the model.

        Returns:
            ``(action, tasks)`` where ``action`` is ``"skip"`` or ``"run"`` and
            ``tasks`` is the task summary reported by the model (``""`` when
            none was given). A response without a tool call, or with
            arguments that cannot be interpreted, is treated as ``"skip"``.
        """
        import json  # local import: only needed to decode string-encoded arguments

        response = await self.provider.chat(
            messages=[
                {"role": "system", "content": "You are a heartbeat agent. Call the heartbeat tool to report your decision."},
                {"role": "user", "content": (
                    "Review the following HEARTBEAT.md and decide whether there are active tasks.\n\n"
                    f"{content}"
                )},
            ],
            tools=_HEARTBEAT_TOOL,
            model=self.model,
        )
        if not response.has_tool_calls:
            return "skip", ""

        args = response.tool_calls[0].arguments
        # Some providers return arguments as a JSON string instead of dict
        if isinstance(args, str):
            try:
                args = json.loads(args)
            except json.JSONDecodeError:
                logger.warning("Heartbeat: tool call arguments are not valid JSON")
                return "skip", ""
        if not isinstance(args, dict):
            logger.warning("Heartbeat: unexpected arguments type {}", type(args).__name__)
            return "skip", ""

        # Anything other than an explicit "run" is a skip, so callers never
        # see a value outside the documented pair.
        action = "run" if args.get("action") == "run" else "skip"

        # Callers hand `tasks` to on_execute as a string prompt; serialise
        # structured values instead of passing them through untouched.
        tasks = args.get("tasks") or ""
        if not isinstance(tasks, str):
            tasks = json.dumps(tasks, ensure_ascii=False)
        return action, tasks
    async def start(self) -> None:
        """Start the heartbeat service."""
        if not self.enabled:
@@ -110,28 +140,34 @@ class HeartbeatService:
    async def _tick(self) -> None:
        """Execute a single heartbeat tick."""
        content = self._read_heartbeat_file()
-        
+        if not content:
-        # Skip if HEARTBEAT.md is empty or doesn't exist
+            logger.debug("Heartbeat: HEARTBEAT.md missing or empty")
        if _is_heartbeat_empty(content):
            logger.debug("Heartbeat: no tasks (HEARTBEAT.md empty)")
            return
        logger.info("Heartbeat: checking for tasks...")
        if self.on_heartbeat:
        try:
-                response = await self.on_heartbeat(HEARTBEAT_PROMPT)
+            action, tasks = await self._decide(content)
-                if HEARTBEAT_OK_TOKEN in response.upper():
+
            if action != "run":
                logger.info("Heartbeat: OK (nothing to report)")
-                else:
+                return
            logger.info("Heartbeat: tasks found, executing...")
            if self.on_execute:
                response = await self.on_execute(tasks)
                if response and self.on_notify:
                    logger.info("Heartbeat: completed, delivering response")
                    if self.on_notify:
                    await self.on_notify(response)
        except Exception:
            logger.exception("Heartbeat execution failed")
    async def trigger_now(self) -> str | None:
        """Manually trigger a heartbeat."""
-        if self.on_heartbeat:
+        content = self._read_heartbeat_file()
-            return await self.on_heartbeat(HEARTBEAT_PROMPT)
+        if not content:
            return None
        action, tasks = await self._decide(content)
        if action != "run" or not self.on_execute:
            return None
        return await self.on_execute(tasks)
--- a/tests/test_memory_consolidation_types.py
+++ b/tests/test_memory_consolidation_types.py
@@ -0,0 +1,147 @@
 """Test MemoryStore.consolidate() handles non-string tool call arguments.
 Regression test for https://github.com/HKUDS/nanobot/issues/1042
 When memory consolidation receives dict values instead of strings from the LLM
 tool call response, it should serialize them to JSON instead of raising TypeError.
 """
 import json
 from pathlib import Path
 from unittest.mock import AsyncMock, MagicMock
 import pytest
 from nanobot.agent.memory import MemoryStore
 from nanobot.providers.base import LLMResponse, ToolCallRequest
 def _make_session(message_count: int = 30, memory_window: int = 50):
    """Build a MagicMock session holding ``message_count`` user messages.

    ``memory_window`` is accepted for call-site symmetry but is not used when
    building the session. ``last_consolidated`` starts at 0.
    """
    history = []
    for idx in range(message_count):
        history.append(
            {"role": "user", "content": f"msg{idx}", "timestamp": "2026-01-01 00:00"}
        )

    mock_session = MagicMock()
    mock_session.messages = history
    mock_session.last_consolidated = 0
    return mock_session
 def _make_tool_response(history_entry, memory_update):
    """Wrap the two payloads in an LLMResponse carrying one save_memory tool call."""
    call_arguments = {
        "history_entry": history_entry,
        "memory_update": memory_update,
    }
    save_call = ToolCallRequest(
        id="call_1",
        name="save_memory",
        arguments=call_arguments,
    )
    return LLMResponse(content=None, tool_calls=[save_call])
 class TestMemoryConsolidationTypeHandling:
    """Exercise MemoryStore.consolidate() with differently-typed tool call arguments."""

    @pytest.mark.asyncio
    async def test_string_arguments_work(self, tmp_path: Path) -> None:
        """Baseline: both tool call arguments arrive as plain strings."""
        store = MemoryStore(tmp_path)
        llm_reply = _make_tool_response(
            history_entry="[2026-01-01] User discussed testing.",
            memory_update="# Memory\nUser likes testing.",
        )
        provider = AsyncMock()
        provider.chat = AsyncMock(return_value=llm_reply)
        session = _make_session(message_count=60)

        outcome = await store.consolidate(session, provider, "test-model", memory_window=50)

        assert outcome is True
        assert store.history_file.exists()
        assert "[2026-01-01] User discussed testing." in store.history_file.read_text()
        assert "User likes testing." in store.memory_file.read_text()

    @pytest.mark.asyncio
    async def test_dict_arguments_serialized_to_json(self, tmp_path: Path) -> None:
        """Issue #1042: dict-valued arguments are written as JSON, not rejected with TypeError."""
        store = MemoryStore(tmp_path)
        llm_reply = _make_tool_response(
            history_entry={"timestamp": "2026-01-01", "summary": "User discussed testing."},
            memory_update={"facts": ["User likes testing"], "topics": ["testing"]},
        )
        provider = AsyncMock()
        provider.chat = AsyncMock(return_value=llm_reply)
        session = _make_session(message_count=60)

        outcome = await store.consolidate(session, provider, "test-model", memory_window=50)

        assert outcome is True
        assert store.history_file.exists()
        # The history file must contain the dict serialised as parseable JSON.
        history_text = store.history_file.read_text()
        history_json = json.loads(history_text.strip())
        assert history_json["summary"] == "User discussed testing."
        # Same expectation for the memory file.
        memory_text = store.memory_file.read_text()
        memory_json = json.loads(memory_text)
        assert "User likes testing" in memory_json["facts"]

    @pytest.mark.asyncio
    async def test_string_arguments_as_raw_json(self, tmp_path: Path) -> None:
        """The whole arguments payload arrives as an undecoded JSON string."""
        store = MemoryStore(tmp_path)
        provider = AsyncMock()
        # Arguments are deliberately left as a JSON string rather than a dict.
        raw_arguments = json.dumps({
            "history_entry": "[2026-01-01] User discussed testing.",
            "memory_update": "# Memory\nUser likes testing.",
        })
        save_call = ToolCallRequest(
            id="call_1",
            name="save_memory",
            arguments=raw_arguments,
        )
        llm_reply = LLMResponse(content=None, tool_calls=[save_call])
        provider.chat = AsyncMock(return_value=llm_reply)
        session = _make_session(message_count=60)

        outcome = await store.consolidate(session, provider, "test-model", memory_window=50)

        assert outcome is True
        assert "User discussed testing." in store.history_file.read_text()

    @pytest.mark.asyncio
    async def test_no_tool_call_returns_false(self, tmp_path: Path) -> None:
        """A plain-text reply without a save_memory call yields False and writes no history."""
        store = MemoryStore(tmp_path)
        text_only_reply = LLMResponse(content="I summarized the conversation.", tool_calls=[])
        provider = AsyncMock()
        provider.chat = AsyncMock(return_value=text_only_reply)
        session = _make_session(message_count=60)

        outcome = await store.consolidate(session, provider, "test-model", memory_window=50)

        assert outcome is False
        assert not store.history_file.exists()

    @pytest.mark.asyncio
    async def test_skips_when_few_messages(self, tmp_path: Path) -> None:
        """With only 10 messages and memory_window=50, the provider is never called."""
        store = MemoryStore(tmp_path)
        provider = AsyncMock()
        session = _make_session(message_count=10)

        outcome = await store.consolidate(session, provider, "test-model", memory_window=50)

        assert outcome is True
        provider.chat.assert_not_called()