feat(memory): Phase 1 — STM ToolResultsCache + ReleaseFocus + cache flag in YAML specs

Adds two STM components and a transparent cache hook in the agent loop so read-only tools don't re-do work the agent already did in this session. New STM components: - ToolResultsCache — {tool_name: {key: result}}, session-scoped. to_dict() exposes only the key inventory (not payloads) to keep the prompt cheap. - ReleaseFocus — current_release_path + working_set list, updated automatically when a path-keyed inspector runs. YAML spec layer: - New optional 'cache: { key: <param_name> }' block in ToolSpec. - Validated at load time: cache.key must be a declared parameter. - Surfaced on Tool dataclass as cache_key: str | None. Agent._execute_tool_call: - Pre-exec cache lookup; hit short-circuits and adds _from_cache=true. - Post-exec: stores successful results, updates release_focus for path-keyed tools, refreshes episodic.last_search_results when find_torrent's hit served the response (so get_torrent_by_index keeps pointing at the right list). Cacheable tools (5): analyze_release, probe_media, list_folder, find_media_imdb_id, find_torrent.
2026-05-15 10:44:14 +02:00
parent 2db3198ef2
commit 3c7c6695f2
12 changed files with 269 additions and 7 deletions
@@ -140,7 +140,7 @@ class Agent:
        memory.save()
        return final_response

-    def _execute_tool_call(self, tool_call: dict[str, Any]) -> dict[str, Any]:
+    def _execute_tool_call(self, tool_call: dict[str, Any]) -> dict[str, Any]:  # noqa: PLR0911
        """
        Execute a single tool call.

@@ -183,25 +183,86 @@ class Agent:
            }

        tool = self.tools[tool_name]
+        memory = get_memory()
+
+        # Cache lookup — for tools flagged cacheable, short-circuit on hit.
+        cache_key_value = self._cache_key_for(tool, args)
+        if cache_key_value is not None:
+            cached = memory.stm.tool_results.get(tool_name, cache_key_value)
+            if cached is not None:
+                logger.info(
+                    f"Tool cache HIT: {tool_name}[{cache_key_value}]"
+                )
+                self._post_tool_side_effects(tool_name, args, cached, from_cache=True)
+                return {**cached, "_from_cache": True}

        # Execute tool
        try:
            result = tool.func(**args)
-            return result
        except KeyboardInterrupt:
            # Don't catch KeyboardInterrupt - let it propagate
            raise
        except TypeError as e:
            # Bad arguments
-            memory = get_memory()
            memory.episodic.add_error(tool_name, f"bad_args: {e}")
            return {"error": "bad_args", "message": str(e), "tool": tool_name}
        except Exception as e:
            # Other errors
-            memory = get_memory()
            memory.episodic.add_error(tool_name, str(e))
            return {"error": "execution_failed", "message": str(e), "tool": tool_name}

+        # Persist + side effects only on successful results.
+        if isinstance(result, dict) and result.get("status") == "ok":
+            if cache_key_value is not None:
+                memory.stm.tool_results.put(tool_name, cache_key_value, result)
+            self._post_tool_side_effects(tool_name, args, result, from_cache=False)
+            memory.save()
+
+        return result
+
+    @staticmethod
+    def _cache_key_for(tool: Tool, args: dict[str, Any]) -> str | None:
+        """Return the cache key value for this call, or None if not cacheable."""
+        if tool.cache_key is None:
+            return None
+        value = args.get(tool.cache_key)
+        if value is None:
+            return None
+        return str(value)
+
+    def _post_tool_side_effects(
+        self,
+        tool_name: str,
+        args: dict[str, Any],
+        result: dict[str, Any],
+        *,
+        from_cache: bool,
+    ) -> None:
+        """
+        Tool-agnostic side effects applied after a successful run or cache hit.
+
+        Today:
+          - Update release_focus when a path-keyed inspector runs.
+          - Refresh episodic.last_search_results on find_torrent cache hits so
+            get_torrent_by_index keeps pointing at the right list.
+        """
+        memory = get_memory()
+        tool = self.tools.get(tool_name)
+
+        # Release focus: any path-keyed inspector updates current_release_path.
+        if tool is not None and tool.cache_key in {"source_path"}:
+            path = args.get(tool.cache_key)
+            if isinstance(path, str) and path:
+                memory.stm.release_focus.focus(path)
+
+        # Episodic refresh when find_torrent's cache short-circuits the call.
+        if from_cache and tool_name == "find_torrent":
+            torrents = result.get("torrents") or []
+            query = args.get("media_title") or ""
+            memory.episodic.store_search_results(
+                query=query, results=torrents, search_type="torrent"
+            )
+
    async def step_streaming(
        self, user_input: str, completion_id: str, created_ts: int, model: str
    ) -> AsyncGenerator[dict[str, Any]]:
@@ -20,6 +20,7 @@ class Tool:
    description: str
    func: Callable[..., dict[str, Any]]
    parameters: dict[str, Any]
+    cache_key: str | None = None  # Parameter name to use as STM cache key.


 _PY_TYPE_TO_JSON = {
@@ -84,11 +85,14 @@ def _create_tool_from_function(func: Callable, spec: ToolSpec | None = None) ->
        "required": required,
    }

+    cache_key = spec.cache.key if spec is not None and spec.cache is not None else None
+
    return Tool(
        name=func.__name__,
        description=description,
        func=func,
        parameters=parameters,
+        cache_key=cache_key,
    )


@@ -61,6 +61,18 @@ class ReturnsSpec:
        )


+@dataclass(frozen=True)
+class CacheSpec:
+    """Marks a tool as cacheable in STM.tool_results, keyed by one of its parameters."""
+
+    key: str  # Name of the parameter whose value is the cache key.
+
+    @classmethod
+    def from_dict(cls, data: dict) -> CacheSpec:
+        _require(data, "key", "cache")
+        return cls(key=str(data["key"]).strip())
+
+
@dataclass(frozen=True)
 class ToolSpec:
    """Full semantic spec for one tool."""
@@ -73,6 +85,7 @@ class ToolSpec:
    next_steps: str | None
    parameters: dict[str, ParameterSpec]      # name -> ParameterSpec
    returns: dict[str, ReturnsSpec]           # status_key -> ReturnsSpec
+    cache: CacheSpec | None = None            # If present, tool is cached.

    @classmethod
    def from_yaml_path(cls, path: Path) -> ToolSpec:
@@ -108,7 +121,12 @@ class ToolSpec:
            for rkey, rdata in returns_raw.items()
        }

-        return cls(
+        cache_raw = data.get("cache")
+        if cache_raw is not None and not isinstance(cache_raw, dict):
+            raise ToolSpecError("cache must be a mapping")
+        cache = CacheSpec.from_dict(cache_raw) if cache_raw else None
+
+        spec = cls(
            name=str(data["name"]).strip(),
            summary=str(data["summary"]).strip(),
            description=str(data["description"]).strip(),
@@ -117,7 +135,14 @@ class ToolSpec:
            next_steps=_strip_or_none(data.get("next_steps")),
            parameters=parameters,
            returns=returns,
+            cache=cache,
        )
+        if cache is not None and cache.key not in parameters:
+            raise ToolSpecError(
+                f"cache.key '{cache.key}' is not a declared parameter "
+                f"(declared: {sorted(parameters)})"
+            )
+        return spec

    def compile_description(self) -> str:
        """
@@ -37,6 +37,9 @@ next_steps: |
  - media_type in (other, unknown) → ask the user what to do; do not
    auto-route.

+cache:
+  key: source_path
+
 parameters:
  release_name:
    description: Raw release folder or file name as it appears on disk.
@@ -27,6 +27,9 @@ next_steps: |
  - On status=error (not_found): show the error and ask the user for
    a more precise title.

+cache:
+  key: media_title
+
 parameters:
  media_title:
    description: Title to search for. Free-form — TMDB does the matching.
@@ -27,6 +27,9 @@ next_steps: |
  - Once chosen: call add_torrent_by_index(N) — that wraps
    get_torrent_by_index + add_torrent_to_qbittorrent.

+cache:
+  key: media_title
+
 parameters:
  media_title:
    description: Title to search for on Knaben. Free-form.
@@ -29,6 +29,9 @@ next_steps: |
  - After listing a library folder: use the result to disambiguate a
    destination during resolve_*_destination.

+cache:
+  key: path
+
 parameters:
  folder_type:
    description: Logical folder key (download, torrent, movie, tv_show, ...).
@@ -27,6 +27,9 @@ next_steps: |
    "this is 7.1 DTS, want to keep it?"); rarely chained directly to
    another tool.

+cache:
+  key: source_path
+
 parameters:
  source_path:
    description: Absolute path to the video file to probe.