feat(refit): complete S1-S6 — case abstraction, grounding, log-odds, plugins, coref, multi-source

Consolidates the long-running refit work (DESIGN.md as authoritative spec) into a single baseline commit. Six stages landed together: S1 Case + EvidenceSource abstraction; tools parameterised by source_id (case.py, main.py multi-source bootstrap, .bin extension support) S2 Grounding gateway in add_phenomenon: verified_facts cite real ToolInvocation ids; substring / normalised match enforced; agent + task scope checked. Phenomenon.description split into verified_facts (grounded) + interpretation (free text). [invocation: inv-xxx] prefix on every wrapped tool result so the LLM can cite. S3 Confidence as additive log-odds: edge_type → log10(LR) calibration table; commutative updates; supported / refuted thresholds derived from log_odds; hypothesis × evidence matrix view. S4 iOS plugin: unzip_archive + parse_plist / sqlite_tables / sqlite_query / parse_ios_keychain / read_idevice_info; IOSArtifactAgent; SOURCE_TYPE_AGENTS routing. S5 Cross-source entity resolution: typed identifiers on Entity, observe_identity gateway, auto coref hypothesis with shared / conflicting strong/weak LR edges, reversible same_as edges, actor_clusters() view. S6 Android partition probe + AndroidArtifactAgent; MediaAgent with OCR fallback; orchestrator Phase 1 iterates every analysable source; platform-aware get_triage_agent_type; ReportAgent renders actor clusters + per-source breakdown. 142 unit tests / 1 skipped — full coverage of the new gateway, log-odds math, coref hypothesis fall-out, and orchestrator multi-source dispatch. Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
2026-05-21 02:12:10 -10:00
parent 444d58726a
commit 81ade8f7ac
24 changed files with 5137 additions and 244 deletions
--- a/tool_registry.py
+++ b/tool_registry.py
@@ -1,6 +1,8 @@
 """Central tool registry — catalogs all available forensic tools.

-Tools are registered once at startup with bound image_path and offset.
+Tools are registered once at startup. Sleuth Kit tools resolve their image
+path and partition offset from graph.active_source at call time, so a single
+registered tool follows whichever evidence source is currently active.
 The AgentFactory uses this catalog to compose agents dynamically.
 """

@@ -14,6 +16,11 @@ import re
 from dataclasses import dataclass, field
 from typing import Any

+from evidence_graph import GroundingError
+from tools import archive as arc
+from tools import media as med
+from tools import mobile_android as android
+from tools import mobile_ios as ios
 from tools import parsers
 from tools import registry as reg
 from tools import sleuthkit as tsk
@@ -35,6 +42,13 @@ CACHEABLE_TOOLS: set[str] = {
    "parse_registry_key", "search_registry", "get_user_activity",
    "read_text_file", "read_binary_preview", "search_text_file",
    "read_text_file_section", "list_extracted_dir", "parse_pcap_strings",
+    "find_files",
+    # iOS (read-only file parses):
+    "parse_plist", "sqlite_tables", "sqlite_query",
+    "parse_ios_keychain", "read_idevice_info",
+    # Android + media (read-only):
+    "probe_android_partitions", "ocr_image",
+    # NB: unzip_archive and set_active_partition are NOT cached — they have side effects.
 }


@@ -45,24 +59,106 @@ def _cache_key(tool_name: str, kwargs: dict) -> str:
    return f"{tool_name}:{args_hash}"


+def _looks_like_error(text: str) -> bool:
+    """Heuristic for unsuccessful tool output (mirrors the prior cache filter)."""
+    return text.startswith("Error") or text.startswith("[Command failed") or text.startswith("[icat failed")
+
+
 def _make_cached(tool_name: str, executor: Any) -> Any:
-    """Wrap an executor with an in-memory result cache."""
+    """Thin in-memory cache wrapper around a tool executor.
+
+    Kept as a standalone primitive (no graph dependency) so unit tests can
+    exercise caching in isolation. Production wiring composes this with
+    invocation logging via :func:`_make_invocation_executor`.
+    """

    async def wrapper(**kwargs) -> str:
        key = _cache_key(tool_name, kwargs)
-        cached = _tool_result_cache.get(key)
-        if cached is not None:
-            logger.debug("Cache hit: %s(%s)", tool_name, kwargs)
-            return cached
+        hit = _tool_result_cache.get(key)
+        if hit is not None:
+            return hit
        result = await executor(**kwargs)
-        # Only cache successful results (not errors)
-        if not result.startswith("Error") and not result.startswith("[Command failed"):
+        if not _looks_like_error(result):
            _tool_result_cache[key] = result
        return result

    return wrapper


+def _make_invocation_executor(
+    tool_name: str,
+    executor: Any,
+    graph: Any,
+    *,
+    cacheable: bool,
+    auto_record_category: str | None = None,
+) -> Any:
+    """Single uniform wrapper around a forensic tool executor.
+
+    Responsibilities (in order):
+      1. Serve from the result cache when ``cacheable=True`` and the key
+         is hot. Cached hits still produce a fresh ToolInvocation record
+         marked ``cached=True`` so the agent can cite their work.
+      2. Call the underlying executor on cache miss; store on success.
+      3. Record a :class:`ToolInvocation` on the graph (this is the
+         provenance unit the grounding gateway looks up).
+      4. (Optionally) auto-record the raw output as a Phenomenon with a
+         single ``type=raw`` fact citing the invocation just made. This
+         replaces the pre-S2 ``_make_auto_record`` shortcut.
+      5. Return the result with a ``[invocation: inv-xxx]`` header so
+         the LLM learns the ID to put in ``add_phenomenon`` facts.
+    """
+
+    async def wrapper(**kwargs) -> str:
+        cached_flag = False
+        cache_hit_key: str | None = None
+        text: str | None = None
+
+        if cacheable:
+            cache_hit_key = _cache_key(tool_name, kwargs)
+            hit = _tool_result_cache.get(cache_hit_key)
+            if hit is not None:
+                logger.debug("Cache hit: %s(%s)", tool_name, kwargs)
+                text, cached_flag = hit, True
+
+        if text is None:
+            text = await executor(**kwargs)
+            if cacheable and cache_hit_key and not _looks_like_error(text):
+                _tool_result_cache[cache_hit_key] = text
+
+        inv_id = await graph.record_tool_invocation(
+            tool=tool_name, args=kwargs, output=text, cached=cached_flag,
+        )
+
+        # Auto-record the raw output as a phenomenon (single grounded fact).
+        # Skipped on error outputs and when no graph is present.
+        if auto_record_category and not _looks_like_error(text):
+            agent = getattr(graph, "_current_agent", "") or "unknown"
+            first_line = text.split("\n", 1)[0][:80]
+            try:
+                await graph.add_phenomenon(
+                    source_agent=agent,
+                    category=auto_record_category,
+                    title=f"{tool_name}: {first_line}",
+                    interpretation="(auto-recorded raw tool output)",
+                    verified_facts=[{
+                        "type": "raw",
+                        "value": text[:2000],
+                        "invocation_id": inv_id,
+                    }],
+                    source_tool=tool_name,
+                )
+            except GroundingError as e:
+                # Should never happen for auto-record (we just wrote the
+                # invocation; value is a literal prefix of output). Log
+                # loudly if it does — that's a bug, not a hallucination.
+                logger.error("Auto-record grounding failed for %s: %s", tool_name, e)
+
+        return f"[invocation: {inv_id}]\n{text}"
+
+    return wrapper
+
+
 def get_cache_stats() -> dict[str, int]:
    """Return cache statistics for diagnostics."""
    return {"entries": len(_tool_result_cache)}
@@ -77,12 +173,11 @@ ASSET_CATEGORIES = [
 ]


-def _auto_categorize(filename: str) -> str:
-    """Infer asset category from filename."""
+def _auto_categorize_windows(filename: str) -> str:
+    """Original Windows-leaning heuristic for disk-image-extracted artifacts."""
    name_lower = filename.lower()
    ext = os.path.splitext(name_lower)[1]

-    # Check full name (with extension) and base name against known hive names
    if name_lower in _REGISTRY_HIVE_NAMES:
        return "registry_hive"
    if ext == ".pf":
@@ -93,7 +188,7 @@ def _auto_categorize(filename: str) -> str:
        return "address_book"
    if name_lower == "info2" or re.match(r"dc\d+\.exe", name_lower):
        return "recycle_bin"
-    # Extension-based checks before keyword-based (e.g. mirc.ini → config, not chat)
+    # Extension-based checks before keyword-based (e.g. mirc.ini → config, not chat).
    if ext in (".ini", ".csv", ".dat", ".cfg"):
        return "config_file"
    if ext in (".log", ".lst"):
@@ -107,6 +202,49 @@ def _auto_categorize(filename: str) -> str:
    return "other"


+def _auto_categorize_ios(filename: str) -> str:
+    """iOS extraction heuristic — plist / sqlite / keychain land here.
+
+    Domain-rooted iOS extractions yield specific filenames (sms.db,
+    AddressBook.sqlitedb, keychain-2.db, *.plist) that the Windows
+    categorizer would dump into 'other' — fixing P4.
+    """
+    name_lower = filename.lower()
+    ext = os.path.splitext(name_lower)[1]
+
+    if name_lower == "keychain-2.db":
+        return "ios_keychain"
+    if name_lower in ("sms.db", "chatstorage.sqlite"):
+        return "messaging_db"
+    if name_lower in ("addressbook.sqlitedb", "addressbookimages.sqlitedb"):
+        return "address_book"
+    if name_lower == "idevice_info.txt":
+        return "device_info"
+    if ext in (".sqlite", ".sqlite3", ".sqlitedb", ".db"):
+        return "sqlite_db"
+    if ext == ".plist":
+        return "plist"
+    if ext in (".log",):
+        return "text_log"
+    return "other"
+
+
+# Per-source-type categorizers — dispatched by _auto_categorize at call time
+# based on graph.active_source.type. Solves P4 (Windows-only categorization).
+_CATEGORIZERS = {
+    "disk_image": _auto_categorize_windows,
+    "mobile_extraction": _auto_categorize_ios,
+    "archive": _auto_categorize_windows,
+    "media_collection": lambda fn: "other",
+}
+
+
+def _auto_categorize(filename: str, source_type: str = "disk_image") -> str:
+    """Dispatch to a source-type-aware categorizer (defaults to Windows)."""
+    fn = _CATEGORIZERS.get(source_type, _auto_categorize_windows)
+    return fn(filename)
+
+
@dataclass
 class ToolDefinition:
    """A registered tool available for agent composition."""
@@ -123,44 +261,53 @@ class ToolDefinition:
 TOOL_CATALOG: dict[str, ToolDefinition] = {}


-def _make_auto_record(tool_name: str, category: str, executor: Any, graph: Any) -> Any:
-    """Wrap a forensic tool to auto-record its result as a phenomenon."""
-
-    async def wrapper(**kwargs) -> str:
-        result = await executor(**kwargs)
-        if graph is None or not result or result.startswith("Error") or result.startswith("["):
-            return result
-        # Auto-record: the tool produced a forensic fact
-        agent = getattr(graph, "_current_agent", "") or "unknown"
-        title = f"{tool_name}: {result.split(chr(10))[0][:80]}"
-        await graph.add_phenomenon(
-            source_agent=agent,
-            category=category,
-            title=title,
-            description=result[:2000],
-            source_tool=tool_name,
-        )
-        return result
-
-    return wrapper
+# Set of (tool_name, category) pairs that auto-record a phenomenon when run.
+# Replaces the pre-S2 ``_make_auto_record`` per-tool wrapping; the central
+# instrumentation pass at the end of register_all_tools applies these.
+AUTO_RECORD_TOOLS: dict[str, str] = {
+    "list_installed_software": "registry",
+    "get_system_info": "registry",
+    "get_timezone_info": "registry",
+    "get_computer_name": "registry",
+    "get_shutdown_time": "registry",
+    "enumerate_users": "registry",
+    "get_network_interfaces": "registry",
+    "get_email_config": "registry",
+    "parse_prefetch": "filesystem",
+}


-def register_all_tools(
-    image_path: str,
-    partition_offset: int,
-    graph: Any = None,
-    extracted_dir: str = "extracted",
-) -> None:
-    """Populate TOOL_CATALOG with all available tools, pre-bound to image/offset."""
+def register_all_tools(graph: Any) -> None:
+    """Populate TOOL_CATALOG with all available forensic tools.
+
+    Tools no longer close over a fixed image path. The Sleuth Kit tools
+    resolve the image path and partition offset from ``graph.active_source``
+    at call time, so the same registered tool follows whichever evidence
+    source the orchestrator has made active.
+    """
    TOOL_CATALOG.clear()

+    def _img() -> str:
+        """Resolve the active source's image path at tool-call time."""
+        src = getattr(graph, "active_source", None)
+        if src is None or not src.path:
+            raise RuntimeError(
+                "No active evidence source — call graph.set_active_source() first."
+            )
+        return src.path
+
+    def _off() -> int:
+        """Resolve the active source's partition offset at tool-call time."""
+        src = getattr(graph, "active_source", None)
+        return src.partition_offset if src is not None else 0
+
    # ---- Sleuth Kit tools ----

    TOOL_CATALOG["partition_info"] = ToolDefinition(
        name="partition_info",
        description="Get the partition table layout of the disk image. Run this first to understand disk structure.",
        input_schema={"type": "object", "properties": {}},
-        executor=lambda: tsk.partition_info(image_path),
+        executor=lambda: tsk.partition_info(_img()),
        module="sleuthkit",
        tags=["filesystem", "disk", "partition"],
    )
@@ -169,7 +316,7 @@ def register_all_tools(
        name="filesystem_info",
        description="Get detailed filesystem information (type, block size, volume name, etc.) for the selected partition.",
        input_schema={"type": "object", "properties": {}},
-        executor=lambda: tsk.filesystem_info(image_path, partition_offset),
+        executor=lambda: tsk.filesystem_info(_img(), _off()),
        module="sleuthkit",
        tags=["filesystem", "disk"],
    )
@@ -185,7 +332,7 @@ def register_all_tools(
            },
        },
        executor=lambda inode=None, recursive=False: tsk.list_directory(
-            image_path, partition_offset, inode, recursive
+            _img(), _off(), inode, recursive
        ),
        module="sleuthkit",
        tags=["filesystem", "directory", "listing"],
@@ -204,12 +351,13 @@ def register_all_tools(
                )

        # Resolve real disk path first
-        orig_path = (await tsk.find_file(image_path, inode, partition_offset)).strip()
+        orig_path = (await tsk.find_file(_img(), inode, _off())).strip()
        if not orig_path or "not found" in orig_path.lower():
            return f"Error: inode {inode} not found on the disk image."

        # Derive local filename from real disk path
        filename = os.path.basename(orig_path)
+        extracted_dir = graph.extracted_dir
        local_path = os.path.join(extracted_dir, filename)

        # Handle name collisions by appending inode
@@ -219,12 +367,15 @@ def register_all_tools(
            filename = os.path.basename(local_path)

        # Extract
-        result = await tsk.extract_file(image_path, inode, local_path, partition_offset)
+        result = await tsk.extract_file(_img(), inode, local_path, _off())
        if result.startswith("[icat failed"):
            return result

        size = os.path.getsize(local_path) if os.path.exists(local_path) else 0
-        category = _auto_categorize(os.path.basename(orig_path))
+        src_type = (
+            graph.active_source.type if graph.active_source else "disk_image"
+        )
+        category = _auto_categorize(os.path.basename(orig_path), src_type)

        # Register
        if graph is not None:
@@ -275,7 +426,7 @@ def register_all_tools(
            },
            "required": ["inode"],
        },
-        executor=lambda inode: tsk.find_file(image_path, inode, partition_offset),
+        executor=lambda inode: tsk.find_file(_img(), inode, _off()),
        module="sleuthkit",
        tags=["filesystem"],
    )
@@ -290,7 +441,7 @@ def register_all_tools(
            },
            "required": ["pattern"],
        },
-        executor=lambda pattern: tsk.search_strings(image_path, pattern),
+        executor=lambda pattern: tsk.search_strings(_img(), pattern),
        module="sleuthkit",
        tags=["filesystem", "search", "strings"],
    )
@@ -299,7 +450,7 @@ def register_all_tools(
        name="count_deleted_files",
        description="List and count all deleted files. Shows total count, executables, and extension breakdown.",
        input_schema={"type": "object", "properties": {}},
-        executor=lambda: tsk.count_deleted_files(image_path, partition_offset),
+        executor=lambda: tsk.count_deleted_files(_img(), _off()),
        module="sleuthkit",
        tags=["filesystem", "deleted", "recovery"],
    )
@@ -308,7 +459,7 @@ def register_all_tools(
        name="build_filesystem_timeline",
        description="Build a MAC timeline from the filesystem (Modified/Accessed/Changed times for all files).",
        input_schema={"type": "object", "properties": {}},
-        executor=lambda: tsk.build_timeline(image_path, partition_offset),
+        executor=lambda: tsk.build_timeline(_img(), _off()),
        module="sleuthkit",
        tags=["filesystem", "timeline"],
    )
@@ -341,8 +492,7 @@ def register_all_tools(
            },
            "required": ["hive_path"],
        },
-        executor=_make_auto_record("list_installed_software", "registry",
-                                   lambda hive_path: reg.list_installed_software(hive_path), graph),
+        executor=lambda hive_path: reg.list_installed_software(hive_path),
        module="registry",
        tags=["registry", "software", "installed"],
    )
@@ -390,8 +540,7 @@ def register_all_tools(
            },
            "required": ["hive_path"],
        },
-        executor=_make_auto_record("get_system_info", "registry",
-                                   lambda hive_path: reg.get_system_info(hive_path), graph),
+        executor=lambda hive_path: reg.get_system_info(hive_path),
        module="registry",
        tags=["registry", "system"],
    )
@@ -406,8 +555,7 @@ def register_all_tools(
            },
            "required": ["hive_path"],
        },
-        executor=_make_auto_record("get_timezone_info", "registry",
-                                   lambda hive_path: reg.get_timezone_info(hive_path), graph),
+        executor=lambda hive_path: reg.get_timezone_info(hive_path),
        module="registry",
        tags=["registry", "timezone", "system"],
    )
@@ -422,8 +570,7 @@ def register_all_tools(
            },
            "required": ["hive_path"],
        },
-        executor=_make_auto_record("get_computer_name", "registry",
-                                   lambda hive_path: reg.get_computer_name(hive_path), graph),
+        executor=lambda hive_path: reg.get_computer_name(hive_path),
        module="registry",
        tags=["registry", "system", "hostname"],
    )
@@ -438,8 +585,7 @@ def register_all_tools(
            },
            "required": ["hive_path"],
        },
-        executor=_make_auto_record("get_shutdown_time", "registry",
-                                   lambda hive_path: reg.get_shutdown_time(hive_path), graph),
+        executor=lambda hive_path: reg.get_shutdown_time(hive_path),
        module="registry",
        tags=["registry", "system", "shutdown"],
    )
@@ -454,8 +600,7 @@ def register_all_tools(
            },
            "required": ["hive_path"],
        },
-        executor=_make_auto_record("enumerate_users", "registry",
-                                   lambda hive_path: reg.enumerate_users(hive_path), graph),
+        executor=lambda hive_path: reg.enumerate_users(hive_path),
        module="registry",
        tags=["registry", "user", "accounts", "sam"],
    )
@@ -470,8 +615,7 @@ def register_all_tools(
            },
            "required": ["hive_path"],
        },
-        executor=_make_auto_record("get_network_interfaces", "registry",
-                                   lambda hive_path: reg.get_network_interfaces(hive_path), graph),
+        executor=lambda hive_path: reg.get_network_interfaces(hive_path),
        module="registry",
        tags=["registry", "network", "adapter", "ip"],
    )
@@ -486,8 +630,7 @@ def register_all_tools(
            },
            "required": ["hive_path"],
        },
-        executor=_make_auto_record("get_email_config", "registry",
-                                   lambda hive_path: reg.get_email_config(hive_path), graph),
+        executor=lambda hive_path: reg.get_email_config(hive_path),
        module="registry",
        tags=["registry", "email", "account"],
    )
@@ -504,8 +647,7 @@ def register_all_tools(
            },
            "required": ["file_path"],
        },
-        executor=_make_auto_record("parse_prefetch", "filesystem",
-                                   lambda file_path: parsers.parse_prefetch(file_path), graph),
+        executor=lambda file_path: parsers.parse_prefetch(file_path),
        module="parsers",
        tags=["filesystem", "prefetch", "execution"],
    )
@@ -577,7 +719,13 @@ def register_all_tools(

    TOOL_CATALOG["list_extracted_dir"] = ToolDefinition(
        name="list_extracted_dir",
-        description="List files in an extracted directory with sizes.",
+        description=(
+            "Summarise an extracted directory tree: total counts, "
+            "extension breakdown, top-level layout, largest files. "
+            "Scales to 10k+-file trees without truncating into uselessness. "
+            "For targeted searches (find every *.plist, locate sms.db, ...) "
+            "use find_files instead."
+        ),
        input_schema={
            "type": "object",
            "properties": {
@@ -590,6 +738,31 @@ def register_all_tools(
        tags=["filesystem", "listing", "extracted"],
    )

+    TOOL_CATALOG["find_files"] = ToolDefinition(
+        name="find_files",
+        description=(
+            "Recursively find files under a directory by glob pattern. "
+            "Use this on tree-mode sources (iOS extractions, archives, "
+            "Android-mounted partitions) to locate specific artefacts in "
+            "huge trees. Patterns are fnmatch-style; '**' means 'any "
+            "depth'. Examples: '**/sms.db', '**/keychain-2.db', "
+            "'**/ChatStorage.sqlite', '**/*.plist', 'HomeDomain/Library/**'. "
+            "Results sort by size descending; capped at max_results."
+        ),
+        input_schema={
+            "type": "object",
+            "properties": {
+                "root": {"type": "string", "description": "Directory to search under."},
+                "pattern": {"type": "string", "description": "fnmatch glob pattern (use '**' for any depth)."},
+                "max_results": {"type": "integer", "description": "Result cap (default 500)."},
+            },
+            "required": ["root", "pattern"],
+        },
+        executor=lambda root, pattern, max_results=500: parsers.find_files(root, pattern, max_results),
+        module="parsers",
+        tags=["filesystem", "search", "extracted", "glob"],
+    )
+
    TOOL_CATALOG["parse_pcap_strings"] = ToolDefinition(
        name="parse_pcap_strings",
        description="Extract HTTP headers, hosts, User-Agent, cookies, and URLs from a PCAP/capture file.",
@@ -605,11 +778,224 @@ def register_all_tools(
        tags=["network", "pcap", "http", "capture"],
    )

-    # ---- Apply result caching to deterministic read-only tools ----
-    # Must come AFTER all tools are registered. Auto-record wrapped tools
-    # (e.g. get_system_info) are NOT in CACHEABLE_TOOLS since they write
-    # to the evidence graph as a side effect.
+    # ---- Archive tools (tree-mode prep) ----
+
+    TOOL_CATALOG["unzip_archive"] = ToolDefinition(
+        name="unzip_archive",
+        description=(
+            "Extract a .zip archive into a target directory. Defensive against "
+            "zip-slip; skips symlinks. Idempotent on rerun. Pass `password` for "
+            "password-protected zips — only the legacy ZipCrypto algorithm is "
+            "supported by stdlib (AES zips need an external `7z x` step)."
+        ),
+        input_schema={
+            "type": "object",
+            "properties": {
+                "zip_path": {"type": "string", "description": "Path to the .zip file."},
+                "dest_dir": {"type": "string", "description": "Directory to extract into (created if missing)."},
+                "password": {"type": "string", "description": "Password for encrypted zips (omit for plain archives)."},
+            },
+            "required": ["zip_path", "dest_dir"],
+        },
+        executor=lambda zip_path, dest_dir, password=None: arc.unzip_archive(zip_path, dest_dir, password),
+        module="archive",
+        tags=["archive", "zip", "extract", "ingest"],
+    )
+
+    # ---- iOS plugin tools (DESIGN.md §4.7) ----
+
+    TOOL_CATALOG["parse_plist"] = ToolDefinition(
+        name="parse_plist",
+        description=(
+            "Parse a .plist file (XML or binary) and return its contents as JSON. "
+            "Bytes are rendered as hex; dates as ISO-8601."
+        ),
+        input_schema={
+            "type": "object",
+            "properties": {
+                "file_path": {"type": "string", "description": "Path to .plist file."},
+            },
+            "required": ["file_path"],
+        },
+        executor=lambda file_path: ios.parse_plist(file_path),
+        module="mobile_ios",
+        tags=["ios", "plist", "parse"],
+    )
+
+    TOOL_CATALOG["sqlite_tables"] = ToolDefinition(
+        name="sqlite_tables",
+        description=(
+            "List user tables in a sqlite database with row counts and column "
+            "names. Use this to scout an unfamiliar .sqlite / .db file before "
+            "querying it."
+        ),
+        input_schema={
+            "type": "object",
+            "properties": {
+                "db_path": {"type": "string", "description": "Path to .sqlite/.db file."},
+            },
+            "required": ["db_path"],
+        },
+        executor=lambda db_path: ios.sqlite_tables(db_path),
+        module="mobile_ios",
+        tags=["sqlite", "schema", "ios", "android"],
+    )
+
+    TOOL_CATALOG["sqlite_query"] = ToolDefinition(
+        name="sqlite_query",
+        description=(
+            "Run a single read-only SELECT against a sqlite file. "
+            "Multi-statement queries and non-SELECT statements are rejected. "
+            "Use this for sms.db / ChatStorage.sqlite / AddressBook.sqlitedb / etc."
+        ),
+        input_schema={
+            "type": "object",
+            "properties": {
+                "db_path": {"type": "string", "description": "Path to .sqlite/.db file."},
+                "query": {"type": "string", "description": "A single SELECT statement."},
+                "max_rows": {"type": "integer", "description": "Row cap (default 100)."},
+            },
+            "required": ["db_path", "query"],
+        },
+        executor=lambda db_path, query, max_rows=100: ios.sqlite_query(db_path, query, max_rows),
+        module="mobile_ios",
+        tags=["sqlite", "query", "ios", "android"],
+    )
+
+    TOOL_CATALOG["parse_ios_keychain"] = ToolDefinition(
+        name="parse_ios_keychain",
+        description=(
+            "Locate and summarise iOS keychain entries (keychain-2.db). "
+            "Pass either the db file directly or the containing directory; "
+            "dumps accounting metadata from genp/inet/cert/keys tables."
+        ),
+        input_schema={
+            "type": "object",
+            "properties": {
+                "keychain_root": {
+                    "type": "string",
+                    "description": "Path to keychain-2.db or a directory that contains it.",
+                },
+            },
+            "required": ["keychain_root"],
+        },
+        executor=lambda keychain_root: ios.parse_ios_keychain(keychain_root),
+        module="mobile_ios",
+        tags=["ios", "keychain", "credentials"],
+    )
+
+    TOOL_CATALOG["read_idevice_info"] = ToolDefinition(
+        name="read_idevice_info",
+        description=(
+            "Read the iDevice_info.txt summary at the root of an iOS extraction. "
+            "Pass the file path or the extraction root directory."
+        ),
+        input_schema={
+            "type": "object",
+            "properties": {
+                "file_path": {"type": "string", "description": "Path to iDevice_info.txt or extraction root."},
+            },
+            "required": ["file_path"],
+        },
+        executor=lambda file_path: ios.read_idevice_info(file_path),
+        module="mobile_ios",
+        tags=["ios", "device", "metadata"],
+    )
+
+    # ---- Android plugin (DESIGN.md §4.7) ----
+
+    TOOL_CATALOG["probe_android_partitions"] = ToolDefinition(
+        name="probe_android_partitions",
+        description=(
+            "Survey every partition on an Android disk dump (mmls + per-"
+            "partition fsstat). Returns a markdown table with name, native "
+            "and 512-byte sector offsets, filesystem type, and a strategy "
+            "hint per partition. Use this BEFORE deciding which partitions "
+            "to dive into via set_active_partition + list_directory."
+        ),
+        input_schema={"type": "object", "properties": {}},
+        executor=lambda: android.probe_android_partitions(_img()),
+        module="mobile_android",
+        tags=["android", "partition", "survey"],
+    )
+
+    async def _set_active_partition(partition_offset: int) -> str:
+        src = getattr(graph, "active_source", None)
+        if src is None:
+            return "Error: no active evidence source."
+        old = src.partition_offset
+        new = int(partition_offset)
+        src.partition_offset = new
+        # Sync the legacy mirror field so older readers stay consistent.
+        graph.partition_offset = new
+        return (
+            f"Active partition offset: {old} → {new} (512-byte sectors). "
+            f"Subsequent list_directory / extract_file / search_strings "
+            f"calls now target this partition on {src.id} ({src.label})."
+        )
+
+    TOOL_CATALOG["set_active_partition"] = ToolDefinition(
+        name="set_active_partition",
+        description=(
+            "Switch the current partition offset (in 512-byte sectors) on "
+            "the active disk-image source. Use the values from "
+            "probe_android_partitions's '512-sector' column. NOT a "
+            "forensic read — purely repoints the TSK toolset. Mutates "
+            "shared state; call serially within one agent run."
+        ),
+        input_schema={
+            "type": "object",
+            "properties": {
+                "partition_offset": {
+                    "type": "integer",
+                    "description": "Partition start in 512-byte sectors.",
+                },
+            },
+            "required": ["partition_offset"],
+        },
+        executor=_set_active_partition,
+        module="android",
+        tags=["android", "partition", "navigation"],
+    )
+
+    # ---- Media plugin (DESIGN.md §4.7) ----
+
+    TOOL_CATALOG["ocr_image"] = ToolDefinition(
+        name="ocr_image",
+        description=(
+            "Extract text from an image via tesseract. The LLM backend has "
+            "no vision, so this is the only way to read JPEG/PNG evidence "
+            "(screenshots of chats, transactions, IDs). Default lang covers "
+            "English + Simplified & Traditional Chinese; override `lang` "
+            "if you know the artefact's language. Returns 'Error: OCR "
+            "runtime not available' with an install hint when tesseract "
+            "isn't on the host — record that absence as a negative "
+            "finding rather than guessing."
+        ),
+        input_schema={
+            "type": "object",
+            "properties": {
+                "file_path": {"type": "string", "description": "Path to image file."},
+                "lang": {"type": "string", "description": "Tesseract language code(s), e.g. 'eng' or 'eng+chi_sim'."},
+            },
+            "required": ["file_path"],
+        },
+        executor=lambda file_path, lang="eng+chi_sim+chi_tra": med.ocr_image(file_path, lang),
+        module="media",
+        tags=["media", "ocr", "image"],
+    )
+
+    # ---- Wrap every executor with invocation logging (+ cache + auto-record) ----
+    # Must run AFTER all tools are registered. Every tool call now produces
+    # a ToolInvocation entry on the graph (provenance for grounding), and
+    # returns the result prefixed with ``[invocation: inv-xxx]`` so the LLM
+    # can cite the call in add_phenomenon facts.
    _tool_result_cache.clear()
    for tool_name, td in TOOL_CATALOG.items():
-        if tool_name in CACHEABLE_TOOLS:
-            td.executor = _make_cached(tool_name, td.executor)
+        td.executor = _make_invocation_executor(
+            tool_name,
+            td.executor,
+            graph,
+            cacheable=(tool_name in CACHEABLE_TOOLS),
+            auto_record_category=AUTO_RECORD_TOOLS.get(tool_name),
+        )