npm - delimit-cli - Versions diffs - 4.5.6 → 4.5.8 - Mend

delimit-cli 4.5.6 → 4.5.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (15) hide show

package/gateway/ai/backends/gateway_core.py +62 -1
package/gateway/ai/led193_daemon/__init__.py +61 -0
package/gateway/ai/led193_daemon/audit.py +174 -0
package/gateway/ai/led193_daemon/cost.py +133 -0
package/gateway/ai/led193_daemon/executor.py +683 -0
package/gateway/ai/led193_daemon/gate.py +300 -0
package/gateway/ai/led193_daemon/pause.py +83 -0
package/gateway/ai/led193_daemon/picker.py +236 -0
package/gateway/ai/scan_bridge/__init__.py +39 -0
package/gateway/ai/scan_bridge/bridge.py +473 -0
package/gateway/ai/scan_bridge/dedup.py +335 -0
package/gateway/ai/scan_bridge/digest.py +151 -0
package/gateway/ai/social_capability/current_capabilities.yaml +1 -0
package/gateway/ai/workers/executor.py +18 -9
package/package.json +1 -1

package/gateway/ai/scan_bridge/dedup.py ADDED Viewed

@@ -0,0 +1,335 @@
+"""LED-1264: scan-bridge dedup — fingerprint a signal and check the ledger.
+Two-stage dedup:
+1. Extract a topic fingerprint from the signal — domain/orbit signal
+   terms (reuse ``social_capability.fit_floor._extract_topic_fingerprint``
+   if available), plus the canonical_url host + the first one or two
+   significant path segments, plus the leading bracket-prefixed tag
+   (e.g. ``[COMPETITOR RELEASE]``) which is a strong topic signal in
+   our scan corpus.
+2. Look the fingerprint up against the strategy ledger inside a
+   60-day window (any status — open, done, cancelled, blocked,
+   archived). If ANY active or recently-closed item matches, skip
+   promotion. Per the directive: 60% recall is fine; cost of missing
+   a duplicate is one founder-reviewed P2 item.
+Skipped duplicates are logged to ``~/.delimit/scan_bridge_dedup.jsonl``
+so the founder can audit what the bridge filtered out.
+"""
+from __future__ import annotations
+import json
+import re
+from datetime import datetime, timedelta, timezone
+from pathlib import Path
+from typing import Any, Dict, Iterable, Optional, Set
+from urllib.parse import urlparse
+DEDUP_LOG = Path.home() / ".delimit" / "scan_bridge_dedup.jsonl"
+# Bracket-prefix tags carried by the scanner (e.g. "[COMPETITOR RELEASE]
+# oasdiff …" or "[VENDOR NEWS] …"). These are strong topic signals — when
+# present we lift them into the fingerprint as a single canonical token
+# so two scans of "oasdiff v1.15.1" + "oasdiff v1.15.2" both share the
+# "competitor_release:oasdiff" key.
+# Group 1 is the tag text inside the brackets (1-40 characters, no "]").
+# Group 2 is the head word that follows it (1-80 characters, ending at the
+# first whitespace, ":" or "."), which is why a trailing version number
+# never becomes part of the token.
+_BRACKET_PREFIX_RE = re.compile(r"^\s*\[([^\]]{1,40})\]\s*([^\s:.]{1,80})", re.IGNORECASE)
+# A trivial path-segment splitter; we just want the first non-empty
+# significant chunk (e.g. "oasdiff" from /oasdiff/oasdiff/releases/tag/...).
+# A chunk is one alphanumeric character followed by at least one more
+# character from [A-Za-z0-9_.-], so single-character segments never match.
+_SIGNIFICANT_PATH_RE = re.compile(r"[A-Za-z0-9][A-Za-z0-9_\-.]{1,}")
+def _domain_orbit_terms(text: str) -> Set[str]:
+    """Best-effort import of fit_floor's topic extractor.
+    fit_floor extracts the union of matched Delimit-domain + orbit
+    signal terms. If the import fails for any reason (test isolation,
+    refactor) we fall back to an empty set — the URL/bracket terms
+    below are still load-bearing on their own.
+    """
+    try:
+        from ai.social_capability.fit_floor import _extract_topic_fingerprint
+    except Exception:  # pragma: no cover — tolerant fallback
+        return set()
+    try:
+        return set(_extract_topic_fingerprint(text or ""))
+    except Exception:  # pragma: no cover
+        return set()
+def _bracket_prefix_token(snippet: str) -> Optional[str]:
+    """Extract a "<tag>:<head_word>" canonical token from a bracketed
+    snippet header. Returns None when the snippet doesn't start with
+    a recognisable bracket tag.
+    """
+    if not snippet:
+        return None
+    m = _BRACKET_PREFIX_RE.match(snippet)
+    if not m:
+        return None
+    tag = re.sub(r"\s+", "_", m.group(1).strip().lower())
+    head = m.group(2).strip().lower()
+    if not tag or not head:
+        return None
+    return f"{tag}:{head}"
+def _url_terms(canonical_url: str) -> Set[str]:
+    """Return host + first significant path segment as canonical tokens."""
+    if not canonical_url:
+        return set()
+    try:
+        p = urlparse(canonical_url)
+    except Exception:
+        return set()
+    out: Set[str] = set()
+    host = (p.netloc or "").lower().lstrip("www.")
+    if host:
+        out.add(f"host:{host}")
+    # Pull first 1-2 significant path segments. For github.com the first
+    # is the org and the second is the repo — both useful as dedup keys.
+    segments = [s for s in (p.path or "").split("/") if s]
+    for seg in segments[:2]:
+        m = _SIGNIFICANT_PATH_RE.search(seg)
+        if m:
+            out.add(f"seg:{m.group(0).lower()}")
+    return out
+def extract_topic_fingerprint(signal: Dict[str, Any]) -> Set[str]:
+    """Return the dedup fingerprint set for a single scanned signal.
+    The fingerprint is a SET of canonical tokens. Two signals are
+    considered overlapping when their fingerprint sets share at least
+    one token. Per the directive: don't be too clever; 60% recall is
+    fine.
+    """
+    snippet = signal.get("content_snippet") or ""
+    canonical_url = signal.get("canonical_url") or ""
+    rationale = signal.get("rationale") or ""
+    tokens: Set[str] = set()
+    tokens.update(_domain_orbit_terms(f"{snippet}\n{rationale}"))
+    tokens.update(_url_terms(canonical_url))
+    bracket = _bracket_prefix_token(snippet)
+    if bracket:
+        tokens.add(bracket)
+    return tokens
+# ── Ledger lookup ─────────────────────────────────────────────────────
+def _parse_iso(value: Optional[str]) -> Optional[datetime]:
+    if not value:
+        return None
+    try:
+        dt = datetime.fromisoformat(str(value).replace("Z", "+00:00"))
+    except (TypeError, ValueError):
+        return None
+    if dt.tzinfo is None:
+        dt = dt.replace(tzinfo=timezone.utc)
+    return dt
+def _item_fingerprint_tokens(item: Dict[str, Any]) -> Set[str]:
+    """Recover a fingerprint token set from a stored ledger item.
+    Auto-promoted items carry their fingerprint in
+    ``metadata.signal_ref.fingerprint`` as a serialised list. Older /
+    hand-added items don't, so we fall back to extracting on-the-fly
+    from title + description + tags + context — the same fields a
+    reasonable founder would have written about the same topic.
+    """
+    metadata = item.get("metadata") or {}
+    signal_ref = metadata.get("signal_ref") or {}
+    stored = signal_ref.get("fingerprint")
+    if isinstance(stored, list) and stored:
+        return {str(t).lower() for t in stored if t}
+    if isinstance(stored, str) and stored:
+        # Comma-separated fallback shape.
+        return {p.strip().lower() for p in stored.split(",") if p.strip()}
+    # Fallback: synthesise a fingerprint from the human text in the item.
+    parts = [
+        item.get("title") or "",
+        item.get("description") or "",
+        item.get("context") or "",
+    ]
+    tags = item.get("tags") or []
+    if isinstance(tags, list):
+        parts.append(" ".join(str(t) for t in tags))
+    text = "\n".join(p for p in parts if p)
+    fake_signal = {"content_snippet": text, "canonical_url": "", "rationale": ""}
+    return extract_topic_fingerprint(fake_signal)
+def _within_window(item: Dict[str, Any], window_days: int, now: datetime) -> bool:
+    """Item is in-window if either created_at OR updated_at is within
+    ``window_days`` of ``now``.
+    """
+    cutoff = now - timedelta(days=window_days)
+    for field in ("updated_at", "created_at"):
+        ts = _parse_iso(item.get(field))
+        if ts and ts >= cutoff:
+            return True
+    return False
+def _candidate_strategy_items(window_days: int = 60) -> Iterable[Dict[str, Any]]:
+    """Yield strategy items in the dedup window.
+    Imports ``ai.ledger_manager.list_items`` lazily so test patches
+    targeting that symbol take effect at call time.
+    """
+    try:
+        from ai.ledger_manager import list_items
+    except Exception:  # pragma: no cover
+        return iter(())
+    now = datetime.now(timezone.utc)
+    out: list = []
+    cursor: Optional[str] = None
+    seen_ids: Set[str] = set()
+    # Walk pages defensively — most ledgers have <500 strategy items, but
+    # paginate if needed.
+    for _ in range(20):  # hard cap on pages, prevents accidental infinite loop
+        resp = list_items(
+            ledger="strategy",
+            limit=500,
+            cursor=cursor,
+            sort="updated_at",
+            order="desc",
+        )
+        items = (resp.get("items") or {}).get("strategy") or []
+        if not items:
+            break
+        for item in items:
+            iid = item.get("id") or ""
+            if iid and iid in seen_ids:
+                continue
+            if iid:
+                seen_ids.add(iid)
+            if _within_window(item, window_days, now):
+                out.append(item)
+        cursor = resp.get("next_cursor")
+        if not cursor:
+            break
+    return out
+def _log_dedup(signal: Dict[str, Any], match: Dict[str, Any], reason: str) -> None:
+    try:
+        DEDUP_LOG.parent.mkdir(parents=True, exist_ok=True)
+        with DEDUP_LOG.open("a", encoding="utf-8") as fh:
+            fh.write(json.dumps({
+                "ts": datetime.now(timezone.utc).isoformat(),
+                "signal_fingerprint_id": signal.get("fingerprint"),
+                "platform": signal.get("platform"),
+                "canonical_url": signal.get("canonical_url"),
+                "snippet_head": (signal.get("content_snippet") or "")[:160],
+                "matched_item_id": match.get("id"),
+                "matched_item_title": (match.get("title") or "")[:160],
+                "matched_item_status": match.get("status"),
+                "reason": reason,
+            }) + "\n")
+    except OSError:  # pragma: no cover — best-effort
+        pass
+def _is_strong_match(shared: Set[str], sig_tokens: Set[str]) -> bool:
+    """Return True when the shared-token set is specific enough to
+    claim two signals are about the same topic.
+    Strict rule (chosen after empirical scan-corpus tuning, see
+    LED-1264 memo): a true dedup match requires a SPECIFIC token —
+    either a bracket-prefix token (``competitor_release:oasdiff``,
+    ``vendor_news:cursor``, ``outreach_state_change:logto-io``) or a
+    ``seg:<repo>`` URL path segment. Generic orbit terms ("mcp",
+    "claude code", "cursor"), tech-context words, and bare host tokens
+    are NOT enough on their own. A signal where two of those overlap
+    but neither has a specific identifier is two different things
+    that happen to live in the same ecosystem; we want them as
+    separate ledger items.
+    Per the directive: "don't be too clever — 60% recall on duplicates
+    is fine; the cost of missing a duplicate is one founder-reviewed
+    P2 ledger item, not a catastrophe." This rule errs toward
+    promoting (more recall on the no-dedup decision).
+    """
+    if not shared:
+        return False
+    # Bracket-prefix tokens win — they're tightly scoped (vendor name
+    # baked in). Excludes host: and seg: which use the same `:` syntax
+    # but live in their own buckets below.
+    if any(":" in t and not t.startswith("host:") and not t.startswith("seg:") for t in shared):
+        return True
+    # Specific repo segments win — same repo across two signals is a
+    # real dedup. seg: tokens carry the repo name post-host (e.g. for
+    # github.com/oasdiff/oasdiff we extract seg:oasdiff). When two
+    # signals share that, they're about the same project.
+    if any(t.startswith("seg:") for t in shared):
+        return True
+    return False
+def is_duplicate(
+    signal: Dict[str, Any],
+    *,
+    window_days: int = 60,
+    candidates: Optional[Iterable[Dict[str, Any]]] = None,
+) -> Optional[Dict[str, Any]]:
+    """Return the matching ledger item dict if ``signal`` collides with
+    an existing strategy item inside the window; ``None`` otherwise.
+    The match rule is intentionally specific — sharing only "mcp" or
+    "host:github.com" between two signals isn't enough overlap to call
+    them duplicates (that's most of the scan corpus). See
+    :func:`_is_strong_match` for the exact rule.
+    Parameters
+    ----------
+    signal:
+        Raw scan target dict (the JSONL line shape from
+        ``social_targets.jsonl``).
+    window_days:
+        Age window for "recently closed" items. Default 60 — per the
+        directive, avoid re-raising things we explicitly chose not to act
+        on within the last 60 days.
+    candidates:
+        Optional iterable of strategy items to check against. Tests pass
+        an explicit list. Production callers omit it and we fetch from
+        the live ledger.
+    """
+    sig_tokens = extract_topic_fingerprint(signal)
+    if not sig_tokens:
+        # No tokens at all means we can't make a useful dedup judgement.
+        # Treat as non-duplicate; the tight confidence floor is the main
+        # quality gate.
+        return None
+    items = list(candidates) if candidates is not None else list(
+        _candidate_strategy_items(window_days=window_days)
+    )
+    now = datetime.now(timezone.utc)
+    for item in items:
+        # When candidates were supplied explicitly we still respect the
+        # window so unit tests can assert window behaviour without
+        # re-implementing the date filter.
+        if candidates is not None and not _within_window(item, window_days, now):
+            continue
+        item_tokens = _item_fingerprint_tokens(item)
+        if not item_tokens:
+            continue
+        shared = sig_tokens & item_tokens
+        if not _is_strong_match(shared, sig_tokens):
+            continue
+        reason = "open_match" if (item.get("status") == "open") else "recent_match"
+        _log_dedup(signal, item, reason)
+        return item
+    return None

package/gateway/ai/scan_bridge/digest.py ADDED Viewed

@@ -0,0 +1,151 @@
+"""LED-1264 daily digest assembler.
+Reads ``~/.delimit/scan_bridge_promotions.jsonl`` and assembles ONE
+email-ready digest of the last 24h of promotions. On a zero-signal
+day the digest dict carries an empty subject/body and ``count == 0``
+so the caller can skip sending — silent days are fine per the directive.
+The digest text is intentionally plain — no markdown, no html — so
+the same string can be used as an email body or a Slack message
+without re-formatting.
+"""
+from __future__ import annotations
+import json
+from datetime import datetime, timedelta, timezone
+from pathlib import Path
+from typing import Any, Dict, List, Optional
+PROMOTIONS_LOG = Path.home() / ".delimit" / "scan_bridge_promotions.jsonl"
+def _parse_iso(value: Optional[str]) -> Optional[datetime]:
+    if not value:
+        return None
+    try:
+        dt = datetime.fromisoformat(str(value).replace("Z", "+00:00"))
+    except (TypeError, ValueError):
+        return None
+    if dt.tzinfo is None:
+        dt = dt.replace(tzinfo=timezone.utc)
+    return dt
+def _load_promotions(log_path: Path) -> List[Dict[str, Any]]:
+    if not log_path.exists():
+        return []
+    out: List[Dict[str, Any]] = []
+    try:
+        with log_path.open("r", encoding="utf-8") as fh:
+            for line in fh:
+                line = line.strip()
+                if not line:
+                    continue
+                try:
+                    out.append(json.loads(line))
+                except (ValueError, json.JSONDecodeError):
+                    continue
+    except OSError:
+        return []
+    return out
+def _filter_window(
+    promotions: List[Dict[str, Any]], since: datetime
+) -> List[Dict[str, Any]]:
+    out: List[Dict[str, Any]] = []
+    for p in promotions:
+        ts = _parse_iso(p.get("ts"))
+        if ts and ts >= since:
+            out.append(p)
+    return out
+def build_daily_digest(
+    *,
+    now: Optional[datetime] = None,
+    window_hours: int = 24,
+    log_path: Optional[Path] = None,
+) -> Dict[str, Any]:
+    """Assemble the last-N-hour promotion digest.
+    Returns
+    -------
+    dict::
+        {
+          "subject": "Delimit scan-bridge — N strategic items (last 24h)",
+          "body":    "<plain text body>",
+          "count":   N,
+          "since":   ISO datetime,
+          "items":   [...promotion rows...],
+        }
+    When ``count == 0`` the subject and body are empty strings so the
+    caller can short-circuit ("no email on silent days") without having
+    to re-check ``count``.
+    """
+    now = now or datetime.now(timezone.utc)
+    since = now - timedelta(hours=window_hours)
+    log_path = log_path or PROMOTIONS_LOG
+    promotions = _load_promotions(log_path)
+    items = _filter_window(promotions, since)
+    items.sort(key=lambda p: p.get("ts") or "", reverse=True)
+    if not items:
+        return {
+            "subject": "",
+            "body": "",
+            "count": 0,
+            "since": since.isoformat(),
+            "items": [],
+        }
+    lines: List[str] = []
+    lines.append(
+        f"Delimit scan-bridge auto-promoted {len(items)} strategic signal(s) "
+        f"to the strategy ledger in the last {window_hours}h."
+    )
+    lines.append("")
+    lines.append(
+        "All items are P2 (review, not auto-action). Reply with item id + "
+        "decision (escalate, archive, defer) or open the ledger to triage."
+    )
+    lines.append("")
+    lines.append("─" * 70)
+    for p in items:
+        title = p.get("title") or "(no title)"
+        item_id = p.get("item_id") or "(unassigned)"
+        confidence = p.get("confidence")
+        platform = p.get("platform") or "?"
+        url = p.get("canonical_url") or ""
+        first_seen = p.get("first_seen") or ""
+        try:
+            conf_str = f"{float(confidence):.2f}" if confidence is not None else "?"
+        except (TypeError, ValueError):
+            conf_str = str(confidence)
+        lines.append(f"[{item_id}] {title}")
+        lines.append(f"    platform={platform} confidence={conf_str} first_seen={first_seen}")
+        if url:
+            lines.append(f"    {url}")
+        lines.append("")
+    lines.append("─" * 70)
+    lines.append("")
+    lines.append(
+        "Source: ~/.delimit/scan_bridge_promotions.jsonl. "
+        "Skipped duplicates: ~/.delimit/scan_bridge_dedup.jsonl. "
+        "Tune via DELIMIT_SCAN_PROMO_CONFIDENCE (default 0.85)."
+    )
+    body = "\n".join(lines)
+    subject = f"Delimit scan-bridge — {len(items)} strategic item(s) (last {window_hours}h)"
+    return {
+        "subject": subject,
+        "body": body,
+        "count": len(items),
+        "since": since.isoformat(),
+        "items": items,
+    }

package/gateway/ai/social_capability/current_capabilities.yaml CHANGED Viewed

@@ -59,6 +59,7 @@ allowed_claims:
   - id: diff_engine
     surface_name: "27 breaking-change types"
     description: "Deterministic diff engine for OpenAPI spec changes."
+    evidence_link: https://delimit.ai/docs/changes
   - id: github_action
     surface_name: "delimit-ai/delimit-action GitHub Action"
     description: "On Marketplace, breaking-change detection on PRs."

package/gateway/ai/workers/executor.py CHANGED Viewed

@@ -26,6 +26,7 @@ from __future__ import annotations
 import json
 import logging
+import os
 import shlex
 import subprocess
 import time
@@ -94,16 +95,24 @@ ACTION_SPEC: Dict[str, Dict[str, Any]] = {
 }
-# LED-988: allowlist for propose_pr. Any repo path NOT in this set is
-# rejected at runtime regardless of whether the caller claimed validation
+# LED-988 + LED-1258: allowlist for propose_pr. Any repo path NOT in this set
+# is rejected at runtime regardless of whether the caller claimed validation
 # passed. Path-traversal-safe (resolved then checked against canonical).
-PROPOSE_PR_ALLOWED_REPOS = frozenset({
-    "/home/delimit/delimit-gateway",
-    "/home/delimit/delimit-ui",
-    "/home/delimit/delimit-action",
-    "/home/delimit/npm-delimit",
-    "/root/governance-framework",
-})
+#
+# Loaded from the DELIMIT_PROPOSE_PR_REPOS env var (comma-separated absolute
+# paths), NOT hardcoded — hardcoding developer-machine paths in shipped source
+# both leaks the dev directory layout to customers AND makes the allowlist
+# dead-code on customer machines (their paths won't match). Empty / unset env
+# var = empty allowlist = propose_pr fails closed for all repo paths.
+def _load_propose_pr_allowed_repos() -> frozenset:
+    raw = os.environ.get("DELIMIT_PROPOSE_PR_REPOS", "").strip()
+    if not raw:
+        return frozenset()
+    return frozenset(p.strip() for p in raw.split(",") if p.strip())
+PROPOSE_PR_ALLOWED_REPOS = _load_propose_pr_allowed_repos()
 # Any branch created by propose_pr must carry this prefix so human branches
 # are never clobbered and PRs are obviously agent-authored at a glance.
 PROPOSE_PR_BRANCH_PREFIX = "delimit/"

package/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "delimit-cli",
   "mcpName": "io.github.delimit-ai/delimit-mcp-server",
-  "version": "4.5.6",
+  "version": "4.5.8",
   "description": "Unify Claude Code, Codex, Cursor, and Gemini CLI with persistent context, governance, and multi-model debate.",
   "main": "index.js",
   "files": [