npm - @datafog/fogclaw - Versions diffs - 0.1.6 → 0.2.0 - Mend

@datafog/fogclaw 0.1.6 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37) hide show

package/CHANGELOG.md +31 -0
package/README.md +39 -0
package/dist/extract.d.ts +28 -0
package/dist/extract.d.ts.map +1 -0
package/dist/extract.js +91 -0
package/dist/extract.js.map +1 -0
package/dist/index.d.ts.map +1 -1
package/dist/index.js +11 -3
package/dist/index.js.map +1 -1
package/dist/message-sending-handler.d.ts +40 -0
package/dist/message-sending-handler.d.ts.map +1 -0
package/dist/message-sending-handler.js +50 -0
package/dist/message-sending-handler.js.map +1 -0
package/dist/tool-result-handler.d.ts +36 -0
package/dist/tool-result-handler.d.ts.map +1 -0
package/dist/tool-result-handler.js +91 -0
package/dist/tool-result-handler.js.map +1 -0
package/dist/types.d.ts +1 -0
package/dist/types.d.ts.map +1 -1
package/dist/types.js +3 -0
package/dist/types.js.map +1 -1
package/docs/OBSERVABILITY.md +22 -15
package/docs/SECURITY.md +6 -4
package/docs/plans/active/2026-02-17-feat-tool-result-pii-scanning-plan.md +293 -0
package/docs/specs/2026-02-17-feat-outbound-message-pii-scanning-spec.md +93 -0
package/docs/specs/2026-02-17-feat-tool-result-pii-scanning-spec.md +122 -0
package/openclaw.plugin.json +1 -1
package/package.json +1 -1
package/src/extract.ts +98 -0
package/src/index.ts +13 -4
package/src/message-sending-handler.ts +87 -0
package/src/tool-result-handler.ts +133 -0
package/src/types.ts +4 -0
package/tests/extract.test.ts +185 -0
package/tests/message-sending-handler.test.ts +244 -0
package/tests/plugin-smoke.test.ts +109 -2
package/tests/tool-result-handler.test.ts +329 -0

package/docs/SECURITY.md CHANGED Viewed

@@ -5,11 +5,13 @@ use_when: "Capturing security expectations for this repo: threat model, auth/aut
 ## Threat Model
-FogClaw processes user-provided prompt text and returns extracted entities with character offsets. The main risk is accidental exposure of sensitive information in logs, crash output, or plugin responses.
+FogClaw processes text from two surfaces: user prompts (`before_agent_start`) and tool results (`tool_result_persist`). Both may contain PII. The main risks are:
-Assume untrusted text arrives from user messages.
-For this repo, a concrete threat is that PII can appear in plain text and be reflected back in a wrong form (for example, redacted text leaking original spans) if redaction logic or logging is incorrect.
+1. **PII leaking through unscanned paths.** Any text surface that FogClaw does not hook into is a gap. Currently covered: user prompts and tool results. Not yet covered: outbound messages (`message_sending`), historical messages, compacted summaries.
+2. **Redaction logic errors.** If redaction produces malformed output (e.g., offset miscalculation), original PII spans could leak through or be partially visible.
+3. **Accidental PII in logs/errors.** Audit entries, error messages, and crash output must never contain raw PII values.
+4. **Regex false negatives.** The synchronous tool result path uses regex-only detection. Edge-case PII formats (international phone numbers, non-standard SSN formatting) may not match.
+5. **GLiNER unavailability.** If the ONNX model fails to load, the prompt-level scanner degrades to regex-only mode silently. Users may not realize unstructured entities (names, organizations) are not being detected.
 ## Auth Model

package/docs/plans/active/2026-02-17-feat-tool-result-pii-scanning-plan.md ADDED Viewed

@@ -0,0 +1,293 @@
+---
+slug: 2026-02-17-feat-tool-result-pii-scanning
+status: active
+phase: plan
+plan_mode: lightweight
+detail_level: more
+priority: high
+owner: sidmohan
+---
+# Add PII scanning to tool results via tool_result_persist hook
+This Plan is a living document. Keep `Progress`, `Surprises & Discoveries`, `Decision Log`, `Outcomes & Retrospective`, and `Revision Notes` current as work proceeds.
+This plan must be maintained in accordance with `docs/PLANS.md`.
+## Purpose / Big Picture
+FogClaw currently scans only the user prompt for PII. When an agent reads a file, fetches a web page, or queries an API, the tool result flows into the session transcript unscanned. After this change, FogClaw will intercept every tool result via OpenClaw's `tool_result_persist` hook and redact PII spans (SSN, email, phone, credit card, IP address, date, zip code) before the content is persisted to the session. The agent will see `[SSN_1]` instead of `123-45-6789`.
+To verify it works: install FogClaw in OpenClaw, ask the agent to read a file that contains a phone number and an SSN, then inspect the session transcript. The raw values should be replaced with redaction tokens.
+## Progress
+- [x] (2026-02-17T17:28:00Z) P1 [M1] Create `src/extract.ts` with `extractText` and `replaceText` functions
+- [x] (2026-02-17T17:28:00Z) P2 [M1] Create `tests/extract.test.ts` covering string content, content block arrays, nested structures, empty/null, and non-text types
+- [x] (2026-02-17T17:28:00Z) P3 [M1] All extract tests pass — 27 tests passed
+- [x] (2026-02-17T17:29:00Z) P4 [M2] Create `src/tool-result-handler.ts` with synchronous `createToolResultHandler` factory
+- [x] (2026-02-17T17:29:00Z) P5 [M2] Create `tests/tool-result-handler.test.ts` covering scanning, redaction, audit logging, allowlist, and edge cases
+- [x] (2026-02-17T17:29:00Z) P6 [M2] Register `tool_result_persist` hook in `src/index.ts`
+- [x] (2026-02-17T17:29:00Z) P7 [M2] All tool-result-handler tests pass — 21 tests passed
+- [x] (2026-02-17T17:30:00Z) P8 [M3] Extend `tests/plugin-smoke.test.ts` with `tool_result_persist` hook registration and transformation tests
+- [x] (2026-02-17T17:30:00Z) P9 [M3] Full test suite passes — 149 tests, 8 files, 0 failures
+- [x] (2026-02-17T17:30:00Z) P10 [M3] Commit all changes — 3b7564f
+## Surprises & Discoveries
+- Observation: The Scanner class's `regexEngine` field is private, so we instantiated a fresh `RegexEngine` directly in `register()` rather than exposing the Scanner's internal instance.
+  Evidence: `const toolResultRegex = new RegexEngine();` in src/index.ts. RegexEngine is stateless (only uses pattern matching), so a separate instance is functionally identical.
+- Observation: The null byte separator approach for multi-block content works cleanly — regex PII patterns never match across `\0` boundaries.
+  Evidence: 27 extract tests pass including multi-block scenarios with mixed text/image blocks.
+## Decision Log
+- Decision: Use RegexEngine and redact() directly instead of going through Scanner
+  Rationale: `Scanner.scan()` is declared `async`, so it always returns a Promise — even when GLiNER is disabled and only regex detection runs. The `tool_result_persist` hook in OpenClaw is synchronous-only — if a handler returns a Promise, OpenClaw logs a warning and ignores the result. `RegexEngine.scan()` and `redact()` are both fully synchronous, so we call them directly.
+  Date/Author: 2026-02-17, sidmohan
+- Decision: All guardrail modes (redact, block, warn) produce span-level redaction in tool results
+  Rationale: Unlike `before_agent_start` where "block" can only prepend a warning context, `tool_result_persist` actually transforms the message. Span-level redaction is the safest behavior — it removes the PII while preserving surrounding context that the agent needs to reason. Replacing the entire tool result would destroy useful non-PII information.
+  Date/Author: 2026-02-17, sidmohan
+- Decision: Reuse existing FogClaw config (guardrail_mode, entityActions, redactStrategy, allowlist)
+  Rationale: Users should have one mental model — "I set SSN to block, and it's blocked everywhere." Adding a separate config section for tool results would create inconsistency and confusion. If a user needs different behavior per-surface, that can be a future initiative.
+  Date/Author: 2026-02-17, sidmohan
+## Outcomes & Retrospective
+All three milestones completed. FogClaw now scans tool results for PII via `tool_result_persist` hook using the regex engine synchronously. 149 tests pass across 8 test files with zero regressions. New modules: `src/extract.ts` (text extraction/replacement), `src/tool-result-handler.ts` (synchronous handler factory). The implementation adds 52 new tests (27 extract + 21 handler + 4 smoke).
+## Context and Orientation
+FogClaw is an OpenClaw plugin that detects and redacts PII in agent conversations. The plugin lives at `/Users/sidmohan/Projects/datafog/fogclaw`.
+Key files relevant to this plan:
+- `src/index.ts` — Plugin entry point. Exports a plugin object with `id`, `name`, and `register(api)`. The `register` function loads config, initializes the Scanner, registers the `before_agent_start` hook, and registers three tools (`fogclaw_scan`, `fogclaw_preview`, `fogclaw_redact`). This is where we will add the `tool_result_persist` hook registration.
+- `src/engines/regex.ts` — The RegexEngine class. Has a `scan(text: string): Entity[]` method that is fully synchronous. Detects 7 PII types: EMAIL, PHONE, SSN, CREDIT_CARD, IP_ADDRESS, DATE, ZIP_CODE. Each match gets confidence 1.0 and source "regex".
+- `src/redactor.ts` — The `redact(text, entities, strategy)` function. Fully synchronous. Takes text, detected entities, and a strategy ("token", "mask", or "hash"). Returns `{ redacted_text, mapping, entities }`. Sorts entities by position descending and replaces from end to start to avoid offset corruption.
+- `src/types.ts` — Type definitions including `Entity`, `RedactStrategy`, `GuardrailAction`, `FogClawConfig`, `ScanResult`, `RedactResult`. Also has `canonicalType()` for normalizing entity labels and `CANONICAL_TYPE_MAP`.
+- `src/config.ts` — `loadConfig(raw)` merges defaults with overrides and validates. The `FogClawConfig` type includes `guardrail_mode`, `entityActions`, `redactStrategy`, `allowlist`, `auditEnabled`, and others.
+- `src/scanner.ts` — The `Scanner` class that orchestrates regex + GLiNER engines. Its `scan()` method is `async` (cannot be used in synchronous hooks). Includes `filterByPolicy()` which applies allowlist filtering — we will need to replicate or extract this logic for the synchronous path.
+- `tests/plugin-smoke.test.ts` — Integration tests for the plugin contract. Creates a mock `api` object with `pluginConfig`, `logger`, `on()`, and `registerTool()`. Tests verify hook registration and tool behavior.
+OpenClaw's `tool_result_persist` hook contract (from OpenClaw's `src/plugins/types.ts`):
+- **Event type**: `{ toolName?: string, toolCallId?: string, message: AgentMessage, isSynthetic?: boolean }`
+- **Context type**: `{ agentId?: string, sessionKey?: string, toolName?: string, toolCallId?: string }`
+- **Result type**: `{ message?: AgentMessage }` — return a modified message, or void to leave it unchanged
+- **Execution**: Synchronous only. If a handler returns a Promise, OpenClaw warns and ignores the result.
+- **Where it runs**: Inside `SessionManager.appendMessage`, via `session-tool-result-guard-wrapper.ts`. Fires on every tool result before it is written to the session transcript.
+The `AgentMessage` type varies by provider and tool, but tool results typically contain text content in one of these shapes:
+- A plain string
+- An array of content blocks, each with `{ type: "text", text: string }` or `{ type: "image", ... }`
+- A structured object with a `content` property that is one of the above
+## Milestones
+### Milestone 1 — Text extraction and replacement utilities
+After this milestone, FogClaw will have a utility module that can defensively extract all text from an `AgentMessage` tool result payload (regardless of its internal shape) and replace text spans within it. This is the foundation for scanning — you need to get text out of the message to scan it, and put redacted text back in.
+The module will be at `src/extract.ts` with two exported functions:
+- `extractText(message: unknown): string` — walks the message structure and concatenates all text content into a single string, with segment boundaries marked so offsets can be mapped back. Returns empty string for non-text content.
+- `replaceText(message: unknown, redactedText: string): unknown` — takes the original message and a redacted version of the extracted text, and returns a new message object with text content replaced. Preserves the original structure (arrays of content blocks stay as arrays, etc.).
+Verification: run `pnpm test tests/extract.test.ts` and see all tests pass, covering: plain string messages, content block arrays with mixed text/image blocks, nested content properties, empty/null messages, and messages with no text content.
+### Milestone 2 — Synchronous tool result handler
+After this milestone, FogClaw will have a handler factory at `src/tool-result-handler.ts` that produces a synchronous `tool_result_persist` handler, and the handler will be registered in `src/index.ts`.
+The factory function `createToolResultHandler(config, regexEngine, logger?)` returns a function with the signature `(event, ctx) => { message } | void`. The handler:
+1. Extracts text from `event.message` using `extractText`
+2. Scans text with `regexEngine.scan(text)` (synchronous)
+3. Filters results through the allowlist (replicating `Scanner.filterByPolicy` logic synchronously)
+4. Determines per-entity action from `config.entityActions` with `config.guardrail_mode` as fallback
+5. Redacts all actionable entities using `redact()` (synchronous)
+6. Replaces text in the message using `replaceText`
+7. Emits an audit log entry if `config.auditEnabled` and entities were found
+8. Returns `{ message: modifiedMessage }` if any redaction occurred, or `void` if no PII found
+The hook will be registered in `src/index.ts` inside the `register(api)` function, alongside the existing `before_agent_start` hook:
+    api.on("tool_result_persist", handler);
+Verification: run `pnpm test tests/tool-result-handler.test.ts` and see all tests pass, covering: SSN redaction in tool results, email/phone detection, allowlist exclusion, audit log emission, no-op when no PII found, and various message shapes.
+### Milestone 3 — Integration smoke test
+After this milestone, the existing plugin smoke test at `tests/plugin-smoke.test.ts` will be extended to verify that FogClaw registers a `tool_result_persist` hook and that invoking it with a tool result containing PII produces a transformed message.
+Verification: run `pnpm test` (full suite) and see all tests pass with no regressions.
+## Plan of Work
+The work proceeds in three sequential steps. Each builds on the previous.
+**Step 1: Text extraction module.** Create `src/extract.ts` with `extractText` and `replaceText`. The `extractText` function should handle these `AgentMessage` shapes: (a) the message itself is a string, (b) the message has a `content` property that is a string, (c) the message has a `content` property that is an array of blocks where each text block has `{ type: "text", text: string }`. For arrays, concatenate text blocks with a null byte (`\0`) separator so `replaceText` can split the redacted text on the same separator and map each segment back to the correct block. Create `tests/extract.test.ts` with tests for each shape plus edge cases (null, undefined, empty string, image-only content blocks, deeply nested content).
+**Step 2: Tool result handler.** Create `src/tool-result-handler.ts`. Import `RegexEngine` from `src/engines/regex.ts`, `redact` from `src/redactor.ts`, `extractText`/`replaceText` from `src/extract.ts`, and types from `src/types.ts`. The factory function `createToolResultHandler` takes `FogClawConfig`, a `RegexEngine` instance, and an optional logger object. It returns a synchronous handler function. Inside the handler: extract text, scan, filter by allowlist (replicate the allowlist filtering logic from `Scanner.filterByPolicy` in `src/scanner.ts` — the filtering checks `config.allowlist.values`, `config.allowlist.patterns`, and `config.allowlist.entities`), determine actions, redact, replace, audit, return. Then update `src/index.ts` to call `createToolResultHandler` during registration and register the returned handler with `api.on("tool_result_persist", handler)`. Create `tests/tool-result-handler.test.ts`.
+**Step 3: Smoke test extension.** In `tests/plugin-smoke.test.ts`, add a test that verifies `tool_result_persist` appears in the registered hooks after `register(api)` is called. Add a second test that invokes the hook handler with a mock tool result message containing an SSN, and asserts the returned message has the SSN replaced with a redaction token like `[SSN_1]`.
+## Concrete Steps
+All commands run from the FogClaw repo root at `/Users/sidmohan/Projects/datafog/fogclaw`.
+After creating `src/extract.ts` and `tests/extract.test.ts`:
+    pnpm test tests/extract.test.ts
+Expected: all extract tests pass (text extraction from various message shapes, replacement, edge cases).
+After creating `src/tool-result-handler.ts` and `tests/tool-result-handler.test.ts` and updating `src/index.ts`:
+    pnpm test tests/tool-result-handler.test.ts
+Expected: all handler tests pass (scanning, redaction, audit, allowlist, no-op cases).
+After extending `tests/plugin-smoke.test.ts`:
+    pnpm test tests/plugin-smoke.test.ts
+Expected: all smoke tests pass, including new `tool_result_persist` tests.
+Full suite validation:
+    pnpm test
+Expected: all tests pass, no regressions in existing `before_agent_start`, scanner, redactor, regex, or config tests.
+Type check:
+    pnpm lint
+Expected: no type errors.
+## Validation and Acceptance
+The feature is complete when:
+1. `pnpm test` passes with all existing tests plus new tests for extract, tool-result-handler, and extended smoke tests.
+2. `pnpm lint` passes with no type errors.
+3. A tool result message containing `"Call 555-123-4567 or email john@example.com"` is passed to the `tool_result_persist` handler and the returned message contains `"Call [PHONE_1] or email [EMAIL_1]"` (with token strategy) and the original values do not appear.
+4. A tool result message containing no PII returns `void` (no modification).
+5. An allowlisted value (e.g., `noreply@example.com`) is not redacted even when detected.
+6. When `auditEnabled: true`, the logger receives an audit entry with `source: "tool_result"`, entity count, and labels but no raw PII values.
+## Idempotence and Recovery
+All changes are additive — new files (`src/extract.ts`, `src/tool-result-handler.ts`) and new tests. No existing files are modified except `src/index.ts` (adding a hook registration) and `tests/plugin-smoke.test.ts` (adding test cases).
+If a step fails partway, delete the partially created files and restart from the milestone. No database migrations, no state files, no destructive operations.
+Running `pnpm test` at any point is safe and idempotent.
+## Artifacts and Notes
+Full test suite output:
+    ✓ tests/extract.test.ts (27 tests) 4ms
+    ✓ tests/config.test.ts (6 tests) 4ms
+    ✓ tests/redactor.test.ts (21 tests) 6ms
+    ✓ tests/regex.test.ts (39 tests) 11ms
+    ✓ tests/tool-result-handler.test.ts (21 tests) 10ms
+    ✓ tests/gliner.test.ts (12 tests) 10ms
+    ✓ tests/plugin-smoke.test.ts (8 tests) 9ms
+    ✓ tests/scanner.test.ts (15 tests) 13ms
+    Test Files  8 passed (8)
+         Tests  149 passed (149)
+Type check: `npx tsc --noEmit` — clean, no errors.
+## Interfaces and Dependencies
+**New module `src/extract.ts`:**
+    export function extractText(message: unknown): string
+    export function replaceText(message: unknown, redactedText: string): unknown
+**New module `src/tool-result-handler.ts`:**
+    import { RegexEngine } from "./engines/regex.js";
+    import { FogClawConfig } from "./types.js";
+    interface Logger {
+      info(msg: string): void;
+      warn(msg: string): void;
+    }
+    interface ToolResultPersistEvent {
+      toolName?: string;
+      toolCallId?: string;
+      message: unknown;
+      isSynthetic?: boolean;
+    }
+    interface ToolResultPersistContext {
+      agentId?: string;
+      sessionKey?: string;
+      toolName?: string;
+      toolCallId?: string;
+    }
+    export function createToolResultHandler(
+      config: FogClawConfig,
+      regexEngine: RegexEngine,
+      logger?: Logger,
+    ): (event: ToolResultPersistEvent, ctx: ToolResultPersistContext) =>
+      { message: unknown } | void
+**Modified `src/index.ts`:**
+Inside the `register(api)` function, after the existing `before_agent_start` registration, add:
+    const toolResultHandler = createToolResultHandler(config, scanner.regexEngine, api.logger);
+    api.on("tool_result_persist", toolResultHandler);
+This requires exposing `regexEngine` from the Scanner class (currently private). Either make it a public property or instantiate a separate RegexEngine in `register()`.
+**No new dependencies.** All imports are from existing FogClaw modules or Node built-ins.
+## Pull Request
+Populated by `he-github`.
+- pr:
+- branch:
+- commit:
+- ci:
+## Review Findings
+Populated by `he-review`.
+## Verify/Release Decision
+Populated by `he-verify-release`.
+- decision:
+- date:
+- open findings by priority (if any):
+- evidence:
+- rollback:
+- post-release checks:
+- owner:
+## Revision Notes
+- 2026-02-17T00:00:00Z: Initialized plan from template. Reason: establish PLANS-compliant execution baseline for tool result PII scanning.
+- 2026-02-17T17:30:00Z: All milestones completed. Updated Progress, Surprises & Discoveries, Outcomes & Retrospective, and Artifacts sections with implementation evidence.

package/docs/specs/2026-02-17-feat-outbound-message-pii-scanning-spec.md ADDED Viewed

@@ -0,0 +1,93 @@
+---
+slug: 2026-02-17-feat-outbound-message-pii-scanning
+status: intake-complete
+date: 2026-02-17T00:00:00Z
+owner: sidmohan
+plan_mode: lightweight
+spike_recommended: no
+priority: high
+---
+# feat: Add PII scanning to outbound messages via message_sending hook
+## Purpose / Big Picture
+FogClaw now scans user prompts (`before_agent_start`) and tool results (`tool_result_persist`), but outbound messages — the agent's final responses delivered to Telegram, Slack, Discord, etc. — are not scanned. If PII slips through into the agent's response (hallucinated, echoed, or reassembled from partial data), it reaches external channels unredacted.
+By hooking into OpenClaw's `message_sending` lifecycle, FogClaw adds a last-chance gate that scans and redacts PII in outbound messages before they are delivered to recipients.
+Note: `message_sending` is defined in OpenClaw's type system but not yet invoked upstream. This handler will activate automatically when OpenClaw wires the hook into its outbound message flow.
+## Scope
+### In Scope
+- Register a `message_sending` hook handler in FogClaw's plugin registration
+- Scan `event.content` (outbound message text) using the **full Scanner** (regex + GLiNER) since this hook is async-capable
+- Apply existing `guardrail_mode`, `entityActions`, `redactStrategy`, and `allowlist` config
+- Redact PII spans in the outbound message content (all modes produce span-level redaction, never cancel)
+- Return `{ content: redactedText }` when PII is found
+- Emit audit log entries when `auditEnabled: true`
+- Add unit tests for the handler
+- Extend plugin smoke test
+### Boundaries
+- **No message cancellation.** FogClaw will never return `cancel: true`. Span-level redaction is always preferred over dropping messages silently.
+- **No new config surface.** Reuse existing FogClaw config.
+- **No changes to OpenClaw upstream.** Handler will activate when OpenClaw wires the hook.
+- **No scanning of `event.metadata`.** Only `event.content` (the text delivered to the recipient).
+## Non-Goals
+- Cancelling message delivery
+- Scanning message metadata or recipient addresses
+- Modifying recipient routing
+## Risks
+- **Hook not invoked upstream.** The handler exists but won't fire until OpenClaw activates `message_sending`. This is accepted — the code is ready and waiting.
+- **GLiNER latency on outbound path.** `Scanner.scan()` is async and may add 50-200ms per message. This is acceptable for outbound messages (which, unlike `tool_result_persist`, are not on a hot path), and it provides coverage for person names and organizations.
+## Requirements
+| ID | Priority | Requirement |
+|---|---|---|
+| R1 | critical | Register a `message_sending` hook handler that scans outbound message content for PII using the full Scanner (regex + GLiNER) |
+| R2 | critical | Redact detected PII spans using the configured `redactStrategy` |
+| R3 | critical | Return `{ content: redactedText }` when PII is found; return void when clean |
+| R4 | high | Apply existing `entityActions`, `guardrail_mode`, and `allowlist` config; all actions produce span-level redaction |
+| R5 | high | Never return `cancel: true` — always deliver the (redacted) message |
+| R6 | medium | Emit audit log entry with `source: "outbound"` when PII is detected and `auditEnabled: true` |
+| R7 | low | Handler may be async (Scanner.scan() returns a Promise) |
+## Success Criteria
+- Unit tests pass for the message sending handler covering PII detection, redaction, allowlist, audit logging, and no-op cases
+- Plugin smoke test verifies `message_sending` hook registration
+- Plugin smoke test verifies PII in outbound content is redacted
+- All existing tests pass (no regression)
+## Constraints
+- Must not introduce new dependencies
+- Must not change the existing `FogClawConfig` type
+- Must reuse the existing Scanner instance (not create a new one)
+## Priority
+- priority: high
+- rationale: This is the last-chance safety net before PII reaches external messaging channels. Even if upstream scanning catches most PII, outbound scanning prevents hallucinated or reassembled PII from leaking.
+## Initial Milestone Candidates
+- M1: Create `src/message-sending-handler.ts` with async handler factory, plus unit tests
+- M2: Register hook in `src/index.ts`, extend plugin smoke test, full suite validation
+## Handoff
+After spec approval, proceed directly to implementation (lightweight plan mode — code mirrors the established `tool-result-handler.ts` pattern).
+## Revision Notes
+- 2026-02-17T00:00:00Z: Initialized spec. message_sending hook is typed but not invoked in OpenClaw; handler ships as future-ready.

package/docs/specs/2026-02-17-feat-tool-result-pii-scanning-spec.md ADDED Viewed

@@ -0,0 +1,122 @@
+---
+slug: 2026-02-17-feat-tool-result-pii-scanning
+status: intake-complete
+date: 2026-02-17T00:00:00Z
+owner: sidmohan
+plan_mode: lightweight
+spike_recommended: no
+priority: high
+---
+# feat: Add PII scanning to tool results via tool_result_persist hook
+## Purpose / Big Picture
+FogClaw currently only scans the user prompt text (`before_agent_start`). The majority of PII entering an agent's context comes from **tool results** — file reads, web fetches, API calls, database queries. This content bypasses FogClaw entirely today.
+By hooking into OpenClaw's `tool_result_persist` lifecycle, FogClaw can scan and redact PII in tool results **before they are persisted to the session transcript**, closing the largest gap in FogClaw's coverage.
+## Scope
+### In Scope
+- Register a `tool_result_persist` hook handler in FogClaw's plugin registration
+- Extract text content from `AgentMessage` tool result payloads
+- Scan extracted text using the **regex engine only** (synchronous constraint)
+- Apply the existing `guardrail_mode`, `entityActions`, `redactStrategy`, and `allowlist` config to detected entities
+- Redact PII spans in tool result text content (all modes — redact, block, warn — produce span-level redaction in tool results)
+- Emit audit log entries for tool result detections when `auditEnabled: true`
+- Add unit tests for the new hook handler
+- Add integration test confirming the hook registers and transforms tool results
+### Boundaries
+- **No GLiNER on this path.** The `tool_result_persist` hook is synchronous-only; async handlers are rejected by OpenClaw. Regex covers structured PII (SSN, email, phone, credit card, IP, date, zip). Unstructured entity detection (person names, organizations) is out of scope for this hook.
+- **No `before_tool_call` hook.** This hook exists in OpenClaw's type system but has zero active invocation sites upstream. Will be addressed in a future initiative once OpenClaw wires it in.
+- **No `message_sending` hook.** Outbound message scanning is a separate priority.
+- **No scanning of `event.messages` history.** Historical message scanning is a separate priority.
+- **No new config surface.** Reuse existing FogClaw config — no `toolResultScanning` sub-object.
+- **No changes to OpenClaw upstream.** This initiative is FogClaw-only.
+## Non-Goals
+- Blocking tool execution (requires `before_tool_call`, which is not wired upstream)
+- Modifying files on disk
+- Scanning binary/image content in tool results
+- Real-time GLiNER inference on tool results
+## Risks
+- **Performance on hot path.** `tool_result_persist` runs synchronously on every tool result. Regex scanning is sub-millisecond for typical payloads, but very large tool results (e.g., reading a 10K-line file) could add measurable latency. Mitigation: benchmark and consider a size cap with configurable threshold.
+- **AgentMessage structure varies.** Tool results are typed as `AgentMessage`, whose internal structure depends on the tool and provider. Text extraction must handle multiple content formats without crashing on unexpected shapes. Mitigation: defensive extraction with fallback to no-op.
+- **Redaction alters tool output semantics.** Replacing `123-45-6789` with `[SSN_1]` in a tool result changes what the model sees. This is the intended behavior, but could cause unexpected downstream effects if the model tries to use the redacted value literally. Mitigation: this is inherent to the feature and matches existing `before_agent_start` behavior.
+## Rollout
+- Ship as part of the next FogClaw release (patch 0.1.7 or minor 0.2.0)
+- Enabled by default when FogClaw is enabled (no separate toggle)
+- Audit logging captures tool result scans for observability
+## Validation and Acceptance Signals
+- Unit tests pass for text extraction from various `AgentMessage` shapes
+- Unit tests pass for regex scanning + redaction of tool result content
+- Integration test confirms `tool_result_persist` hook registers via `api.on()`
+- Integration test confirms a tool result containing PII is transformed before persistence
+- Audit log entries are emitted for tool result detections
+- Existing `before_agent_start` tests continue to pass (no regression)
+- Manual verification: install FogClaw in OpenClaw, have agent read a file with PII, confirm session transcript shows redacted content
+## Requirements
+| ID | Priority | Requirement |
+|---|---|---|
+| R1 | critical | Register a `tool_result_persist` hook handler that scans tool result text for PII using the regex engine |
+| R2 | critical | Redact detected PII spans in tool result messages using the configured `redactStrategy` (token/mask/hash) |
+| R3 | critical | Handler must be synchronous (no Promises returned) — OpenClaw rejects async `tool_result_persist` handlers |
+| R4 | high | Apply existing `entityActions` and `guardrail_mode` config to determine per-entity action; all actions produce span-level redaction in tool results |
+| R5 | high | Respect existing `allowlist` config (global values, patterns, per-entity lists) |
+| R6 | high | Extract text content defensively from `AgentMessage` payloads — handle string content, array-of-content-blocks, and unexpected shapes without throwing |
+| R7 | medium | Emit audit log entry per tool result scan when `auditEnabled: true`, including tool name, entity count, and labels (no raw PII values in logs) |
+| R8 | medium | Skip scanning for tool results with no extractable text content (binary, empty, non-string) |
+| R9 | low | Include `source: "tool_result"` in audit log entries to distinguish from prompt-level scans |
+## Key Decisions
+- **Regex-only on hot path**: GLiNER is async and cannot run in a synchronous hook. Regex covers the 7 structured PII types (SSN, email, phone, credit card, IP, date, zip) at sub-millisecond latency. This is a deliberate tradeoff — unstructured entities (person names, orgs) are not scanned in tool results.
+- **Reuse existing config**: No separate config section for tool result scanning. The same `guardrail_mode`, `entityActions`, `redactStrategy`, and `allowlist` apply everywhere. Simpler mental model for users.
+- **Span-level redaction for all modes**: Even when `entityActions` says `block` for an entity type, the tool result is redacted at the span level (not replaced entirely). This preserves non-PII context for the agent while removing sensitive values.
+## Success Criteria
+- PII in tool results (file reads, web fetches, etc.) is redacted before entering the session transcript
+- Regex engine detects SSN, email, phone, credit card, IP, date, and zip in tool result content
+- No measurable latency impact for typical tool results (<1KB text)
+- Audit log captures tool result scan events with entity counts and labels
+- All existing tests pass; new tests cover the hook handler, text extraction, and edge cases
+## Constraints
+- `tool_result_persist` handler MUST be synchronous (OpenClaw constraint)
+- Must not introduce new dependencies
+- Must not change the existing `FogClawConfig` type (reuse existing fields)
+- Regex engine only — no ONNX/GLiNER on this path
+## Priority
+- priority: high
+- rationale: This closes the single largest gap in FogClaw's PII coverage. Tool results are the primary vector for PII entering agent context, and this hook is the only active interception point OpenClaw provides for that data flow.
+## Initial Milestone Candidates
+- M1: Text extraction utility — defensively extract text from `AgentMessage` tool result payloads, handling string content, content block arrays, and edge cases. Likely files: `src/extract.ts`, `tests/extract.test.ts`.
+- M2: `tool_result_persist` hook handler — register the hook, wire in regex scanning + redaction + audit logging, return transformed message. Likely files: `src/index.ts`, `tests/tool-result-hook.test.ts`.
+- M3: Integration smoke test — end-to-end test confirming a registered FogClaw plugin transforms a tool result containing PII. Likely files: `tests/plugin-smoke.test.ts` (extend existing).
+## Handoff
+After spec approval, proceed to `he-plan` for implementation breakdown. No spike needed — the OpenClaw hook contract is well-documented and the regex engine + redactor already exist in FogClaw.
+## Revision Notes
+- 2026-02-17T00:00:00Z: Initialized spec from template. Reason: establish intake baseline for tool result PII scanning via `tool_result_persist` hook.

package/openclaw.plugin.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "id": "fogclaw",
   "name": "FogClaw",
-  "version": "0.1.6",
+  "version": "0.2.0",
   "description": "PII detection & custom entity redaction plugin powered by DataFog",
   "configSchema": {
     "type": "object",

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@datafog/fogclaw",
-  "version": "0.1.6",
+  "version": "0.2.0",
   "description": "OpenClaw plugin for PII detection & custom entity redaction powered by DataFog",
   "type": "module",
   "main": "dist/index.js",

package/src/extract.ts ADDED Viewed

@@ -0,0 +1,98 @@
/**
 * Utilities for extracting text from AgentMessage tool result payloads
 * and replacing text content after redaction.
 *
 * AgentMessage shapes handled:
 * - Plain string
 * - Object with `content: string`
 * - Object with `content: [{ type: "text", text: "..." }, ...]`
 *
 * When multiple text blocks exist in a content array, extractText joins
 * them with a null byte separator (\0) so the whole payload can be scanned
 * as a single string. replaceText splits the redacted string on the same
 * separator to map the text back onto the individual blocks.
 */

// Separator between text segments from content block arrays.
// A null byte is not expected in PII regex patterns or in normal text
// content; replaceText nevertheless copes with blocks that contain one.
const SEGMENT_SEP = "\0";

/** A content block of the form `{ type: "text", text: string }`. */
type TextBlock = Record<string, unknown> & { type: "text"; text: string };

/** Type guard: true only for non-null objects with `type === "text"` and a string `text`. */
function isTextBlock(block: unknown): block is TextBlock {
  if (block == null || typeof block !== "object") return false;
  const candidate = block as Record<string, unknown>;
  return candidate.type === "text" && typeof candidate.text === "string";
}

/**
 * Extract all text content from an AgentMessage tool result payload.
 *
 * @param message - A plain string, an object with string `content`, or an
 *   object whose `content` is an array of blocks. Any other value is
 *   treated as having no text.
 * @returns The string itself, the string `content`, or the `text` of every
 *   text block joined with the segment separator. Returns an empty string
 *   if no text content is found.
 */
export function extractText(message: unknown): string {
  if (message == null) return "";
  if (typeof message === "string") return message;
  if (typeof message !== "object") return "";

  const content = (message as Record<string, unknown>).content;
  if (typeof content === "string") return content;
  if (!Array.isArray(content)) return "";

  // Non-text blocks (images, malformed entries, null) are skipped; an
  // array without text blocks joins to "".
  return content
    .filter(isTextBlock)
    .map((block) => block.text)
    .join(SEGMENT_SEP);
}

/**
 * Replace text content in an AgentMessage tool result payload with
 * the redacted version. Returns a shallow copy; does not mutate.
 *
 * If the message shape is not recognized or has no text, returns
 * the original message unchanged.
 *
 * @param message - The payload that was passed to extractText.
 * @param redactedText - The redacted form of extractText's output. For
 *   content arrays it is split on the segment separator and the pieces are
 *   assigned to the text blocks in order. This assumes the redaction step
 *   leaves separator characters in place.
 * @returns The redacted string, a copy of the message with replaced
 *   `content`, or the original message when there is nothing to replace.
 */
export function replaceText(message: unknown, redactedText: string): unknown {
  if (message == null) return message;
  if (typeof message === "string") return redactedText;
  if (typeof message !== "object") return message;

  const msg = message as Record<string, unknown>;
  const content = msg.content;
  if (typeof content === "string") {
    return { ...msg, content: redactedText };
  }
  if (!Array.isArray(content)) return message;

  const segments = redactedText.split(SEGMENT_SEP);
  let nextSegment = 0;
  const newContent = content.map((block: unknown) => {
    // Non-text blocks pass through untouched. Text blocks are also left
    // as-is once the redacted segments are exhausted.
    // NOTE(review): in that case the block keeps its original text.
    if (!isTextBlock(block) || nextSegment >= segments.length) return block;

    // A block whose own text contains the separator contributed more than
    // one segment to the extracted string. Consume the same number here
    // and rejoin them, so the following blocks stay aligned with their
    // own text instead of receiving a neighbour's.
    const span = block.text.split(SEGMENT_SEP).length;
    const text = segments.slice(nextSegment, nextSegment + span).join(SEGMENT_SEP);
    nextSegment += span;
    return { ...block, text };
  });
  return { ...msg, content: newContent };
}