delimit-cli 4.1.43 → 4.1.44

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -26,7 +26,7 @@ logger = logging.getLogger("delimit.ai.reddit_scanner")
26
26
  # ---------------------------------------------------------------------------
27
27
 
28
28
  SCAN_GROUPS: Dict[str, List[str]] = {
29
- "delimit_core": ["ClaudeAI", "vibecoding", "cursor", "AI_Agents"],
29
+ "delimit_core": ["ClaudeAI", "vibecoding", "cursor", "AI_Agents", "ObsidianMD"],
30
30
  "delimit_adjacent": ["devops", "programming", "ContextEngineering", "LocalLLaMA", "MachineLearning"],
31
31
  "domainvested": ["Domains", "Entrepreneur", "SideProject", "flipping"],
32
32
  "wirereport": ["sportsbook", "sportsbetting"],
@@ -560,3 +560,47 @@ def _save_scan(result: Dict[str, Any], scan_time: datetime) -> Path:
560
560
  path.write_text(json.dumps(result, indent=2, default=str))
561
561
  logger.info("Scan saved to %s", path)
562
562
  return path
563
+
564
+
565
def fetch_thread(thread_id: str, *, proxy_url: str = PROXY_URL) -> Optional[Dict[str, Any]]:
    """Fetch a single Reddit thread by ID via the residential proxy.

    Args:
        thread_id: Reddit base-36 post ID (e.g. ``"1abc2d"``).
        proxy_url: Base URL of the fetch proxy; the real Reddit URL is passed
            URL-encoded in the ``url`` query parameter.

    Returns:
        A dict of core post fields, or ``None`` when the post is missing or
        any fetch/parse step fails (failures are logged, never raised).
    """
    import urllib.parse
    import urllib.request

    reddit_url = f"https://www.reddit.com/comments/{thread_id}.json?raw_json=1"
    fetch_url = f"{proxy_url}?url={urllib.parse.quote(reddit_url, safe='')}"

    req = urllib.request.Request(
        fetch_url,
        headers={"User-Agent": "delimit-scanner/1.0", "Accept": "application/json"},
    )

    try:
        with urllib.request.urlopen(req, timeout=15) as resp:
            data = json.loads(resp.read().decode())
        # The comments endpoint returns [post_listing, comment_listing].
        if isinstance(data, list) and data:
            children = data[0].get("data", {}).get("children", [])
            # Guard the empty-children case explicitly: previously an
            # IndexError here was swallowed by the broad except and logged
            # as a spurious "Failed to fetch" warning.
            post_data = children[0].get("data", {}) if children else {}
            if post_data:
                return {
                    "id": post_data.get("id", ""),
                    "title": post_data.get("title", ""),
                    "author": post_data.get("author", ""),
                    "score": post_data.get("score", 0),
                    "num_comments": post_data.get("num_comments", 0),
                    "subreddit": post_data.get("subreddit", ""),
                    "permalink": post_data.get("permalink", ""),
                    "selftext": post_data.get("selftext", ""),
                    "created_utc": post_data.get("created_utc", 0),
                }
    except Exception as exc:
        logger.warning("Failed to fetch thread %s: %s", thread_id, exc)
    return None
597
+
598
+
599
def monitor_user_engagement(username: str = "delimitdev") -> list:
    """Monitor engagement on posts by a Reddit user (LED-300).

    Checks recent posts/comments by the user for new replies, upvotes,
    and engagement signals. Returns a list of alert dicts.
    """
    # Stub — full implementation requires residential proxy + Playwright (LED-248)
    alerts: list = []
    return alerts
@@ -22,7 +22,7 @@ logger = logging.getLogger("delimit.ai.screen_record")
22
22
 
23
23
# ── Constants ────────────────────────────────────────────────────────────

# Prefer the CHROMIUM_PATH env var so deployments stay configurable; fall
# back to the pinned Puppeteer Chrome build used on the production host.
CHROMIUM_PATH = os.environ.get(
    "CHROMIUM_PATH",
    "/root/.cache/puppeteer/chrome/linux-146.0.7680.153/chrome-linux64/chrome",
)
CONTENT_BASE = Path.home() / ".delimit" / "content"
VIDEOS_DIR = CONTENT_BASE / "videos"
GIFS_DIR = CONTENT_BASE / "gifs"
@@ -124,10 +124,14 @@ def list_secrets() -> List[Dict]:
124
124
  return []
125
125
  secrets = []
126
126
  for f in sorted(SECRETS_DIR.glob("*.json")):
127
+ if f.name.startswith("_"):
128
+ continue # skip internal files like _access_log.json
127
129
  try:
128
130
  s = json.loads(f.read_text())
131
+ if not isinstance(s, dict):
132
+ continue
129
133
  secrets.append({
130
- "name": s["name"],
134
+ "name": s.get("name", f.stem),
131
135
  "scope": s.get("scope", "all"),
132
136
  "description": s.get("description", ""),
133
137
  "created_by": s.get("created_by", ""),
@@ -0,0 +1,341 @@
1
+ """SQLite-based caching and dedup layer for social sensing.
2
+
3
+ Provides:
4
+ - seen_posts table: dedup + relevance scoring for Reddit (and future platforms)
5
+ - scan_meta table: per-subreddit scan timestamps and high-water marks
6
+ - Relevance scoring with keyword/subreddit boosting
7
+ - Lazy DB creation on first use (thread-safe)
8
+
9
+ Cache location: ~/.delimit/social_cache.db
10
+ """
11
+
12
+ import logging
13
+ import os
14
+ import re
15
+ import sqlite3
16
+ import threading
17
+ from datetime import datetime, timezone
18
+ from pathlib import Path
19
+ from typing import Any, Dict, List, Optional, Tuple
20
+
21
+ logger = logging.getLogger("delimit.ai.social_cache")
22
+
23
+ CACHE_DB_PATH = Path.home() / ".delimit" / "social_cache.db"
24
+
25
+ # Thread-local storage for SQLite connections (sqlite3 objects are not
26
+ # safe to share across threads).
27
+ _local = threading.local()
28
+ _init_lock = threading.Lock()
29
+ _db_initialized = False
30
+
31
+
32
# ── Relevance keywords and weights ─────────────────────────────────────

# High-value keywords strongly associated with Delimit's core domain.
# Weights are additive; compute_relevance_score clamps the total to [0, 1].
RELEVANCE_KEYWORDS_HIGH: Dict[str, float] = {
    "openapi": 0.35,
    "swagger": 0.30,
    "breaking change": 0.40,
    "breaking changes": 0.40,
    "api governance": 0.45,
    "api contract": 0.40,
    "api contracts": 0.40,
    "api versioning": 0.35,
    "semver": 0.35,
    "mcp server": 0.30,
    "mcp tool": 0.30,
    "model context protocol": 0.30,
}

# Medium-value keywords: AI coding tools, adjacent territory
RELEVANCE_KEYWORDS_MED: Dict[str, float] = {
    "claude code": 0.25,
    "codex": 0.20,
    "gemini cli": 0.25,
    "cursor": 0.15,
    "api diff": 0.30,
    "api lint": 0.30,
    "api migration": 0.25,
    "schema validation": 0.20,
    "backward compatible": 0.25,
    "backwards compatible": 0.25,
    "backward compatibility": 0.25,
    "backwards compatibility": 0.25,
}

# Subreddit relevance boosts.  Keys must be lowercase and carry no "r/"
# prefix — compute_relevance_score normalizes names before lookup.
SUBREDDIT_BOOSTS: Dict[str, float] = {
    "claudeai": 0.20,
    "chatgptcoding": 0.20,
    "devops": 0.15,
    "webdev": 0.10,
    "experienceddevs": 0.15,
    "programming": 0.05,
    "vibecoding": 0.15,
    "ai_agents": 0.15,
    "contextengineering": 0.20,
}

# Subreddits that get penalized unless they mention dev tools
GENERIC_SUBREDDITS: set = {
    "entrepreneur", "startups", "sideproject", "saas",
}

# Substrings whose presence exempts a generic-subreddit post from the penalty
DEV_TOOL_TERMS: set = {
    "api", "developer", "dev tool", "devtool", "sdk", "cli",
    "cicd", "ci/cd", "pipeline", "openapi", "swagger", "github action",
}
88
+
89
+
90
def _get_conn() -> sqlite3.Connection:
    """Get a thread-local SQLite connection, creating the DB lazily.

    sqlite3 connection objects must not be shared across threads, so each
    thread caches its own connection on ``_local``.  Schema creation runs at
    most once per process, guarded by ``_init_lock``.
    """
    conn = getattr(_local, "conn", None)
    if conn is not None:
        return conn  # fast path: this thread already opened a connection

    global _db_initialized
    CACHE_DB_PATH.parent.mkdir(parents=True, exist_ok=True)

    conn = sqlite3.connect(str(CACHE_DB_PATH), timeout=10)
    conn.row_factory = sqlite3.Row  # rows support dict-style access
    # WAL + synchronous=NORMAL: concurrent readers don't block the writer,
    # and durability is relaxed — acceptable for a rebuildable cache.
    conn.execute("PRAGMA journal_mode=WAL")
    conn.execute("PRAGMA synchronous=NORMAL")

    # Lazy schema creation (idempotent; only the first thread does the work)
    with _init_lock:
        if not _db_initialized:
            _create_schema(conn)
            _db_initialized = True

    _local.conn = conn
    return conn
112
+
113
+
114
def _create_schema(conn: sqlite3.Connection) -> None:
    """Create cache tables and indexes if they don't exist.

    Idempotent (every statement uses ``IF NOT EXISTS``), so it is safe to
    run on each process start.

    Args:
        conn: Open SQLite connection; the schema is committed before return.
    """
    conn.executescript("""
        CREATE TABLE IF NOT EXISTS seen_posts (
            post_id TEXT PRIMARY KEY,
            subreddit TEXT NOT NULL DEFAULT '',
            title TEXT NOT NULL DEFAULT '',
            score INTEGER NOT NULL DEFAULT 0,
            num_comments INTEGER NOT NULL DEFAULT 0,
            first_seen TEXT NOT NULL,
            last_seen TEXT NOT NULL,
            relevance_score REAL NOT NULL DEFAULT 0.0,
            actioned INTEGER NOT NULL DEFAULT 0,
            venture TEXT NOT NULL DEFAULT '',
            fingerprint TEXT NOT NULL DEFAULT '',
            canonical_url TEXT NOT NULL DEFAULT ''
        );

        CREATE INDEX IF NOT EXISTS idx_seen_posts_subreddit
            ON seen_posts(subreddit);
        CREATE INDEX IF NOT EXISTS idx_seen_posts_relevance
            ON seen_posts(relevance_score);
        CREATE INDEX IF NOT EXISTS idx_seen_posts_first_seen
            ON seen_posts(first_seen);
        -- get_high_priority_posts and prune_old_posts both filter on
        -- actioned; give that predicate an index too.
        CREATE INDEX IF NOT EXISTS idx_seen_posts_actioned
            ON seen_posts(actioned);

        CREATE TABLE IF NOT EXISTS scan_meta (
            subreddit TEXT PRIMARY KEY,
            last_scan TEXT NOT NULL,
            high_water_mark TEXT NOT NULL DEFAULT '',
            posts_seen INTEGER NOT NULL DEFAULT 0,
            posts_new INTEGER NOT NULL DEFAULT 0
        );
    """)
    conn.commit()
148
+
149
+
150
def compute_relevance_score(
    title: str,
    body: str,
    subreddit: str,
    score: int = 0,
    num_comments: int = 0,
) -> float:
    """Compute a 0.0-1.0 relevance score for a Reddit post.

    Scoring layers:
        1. Keyword matching (high + medium value terms, additive weights)
        2. Subreddit boost, or a -0.20 penalty for generic business
           subreddits that mention no dev-tool term
        3. Engagement signal (mild boost for proven discussion, max +0.10)

    Args:
        title: Post title.
        body: Post selftext (may be empty).
        subreddit: Subreddit name, with or without a leading ``"r/"``.
        score: Reddit upvote score.
        num_comments: Comment count.

    Returns:
        Relevance clamped to [0.0, 1.0].
    """
    text_lower = f"{title} {body}".lower()
    # BUGFIX: the previous .lstrip("r/") strips the *characters* 'r' and '/',
    # mangling names like "rust" -> "ust"; remove the prefix explicitly.
    sub_lower = subreddit.lower()
    if sub_lower.startswith("r/"):
        sub_lower = sub_lower[2:]

    relevance = 0.0

    # Layer 1: keyword matching
    for keyword, weight in RELEVANCE_KEYWORDS_HIGH.items():
        if keyword in text_lower:
            relevance += weight

    for keyword, weight in RELEVANCE_KEYWORDS_MED.items():
        if keyword in text_lower:
            relevance += weight

    # Layer 2: subreddit boost
    relevance += SUBREDDIT_BOOSTS.get(sub_lower, 0.0)

    # Penalty for generic subreddits without dev tool mentions
    if sub_lower in GENERIC_SUBREDDITS:
        if not any(term in text_lower for term in DEV_TOOL_TERMS):
            relevance -= 0.20

    # Layer 3: engagement signal (mild, caps at +0.10)
    if score > 10 or num_comments > 5:
        relevance += 0.05
    if score > 50 or num_comments > 20:
        relevance += 0.05

    # Clamp to [0.0, 1.0]
    return max(0.0, min(1.0, relevance))
196
+
197
+
198
def is_post_seen(post_id: str) -> bool:
    """Return True if *post_id* already exists in the seen_posts cache."""
    hit = _get_conn().execute(
        "SELECT 1 FROM seen_posts WHERE post_id = ?", (post_id,)
    ).fetchone()
    return hit is not None
205
+
206
+
207
def cache_post(
    post_id: str,
    subreddit: str,
    title: str,
    score: int,
    num_comments: int,
    relevance_score: float,
    venture: str = "",
    fingerprint: str = "",
    canonical_url: str = "",
) -> bool:
    """Insert a new post into the cache.

    Returns True when the post was newly inserted; False when it already
    existed, in which case last_seen and the engagement counters are
    refreshed instead.
    """
    conn = _get_conn()
    ts = datetime.now(timezone.utc).isoformat()
    try:
        conn.execute(
            """INSERT INTO seen_posts
               (post_id, subreddit, title, score, num_comments,
                first_seen, last_seen, relevance_score, venture,
                fingerprint, canonical_url)
               VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)""",
            (post_id, subreddit, title, score, num_comments,
             ts, ts, relevance_score, venture, fingerprint, canonical_url),
        )
        conn.commit()
        return True
    except sqlite3.IntegrityError:
        # Duplicate primary key -- post already cached; refresh its counters.
        conn.execute(
            """UPDATE seen_posts
               SET last_seen = ?, score = ?, num_comments = ?
               WHERE post_id = ?""",
            (ts, score, num_comments, post_id),
        )
        conn.commit()
        return False
243
+
244
+
245
def mark_actioned(post_id: str) -> None:
    """Flag a post as actioned so future scans will not return it."""
    conn = _get_conn()
    conn.execute("UPDATE seen_posts SET actioned = 1 WHERE post_id = ?", (post_id,))
    conn.commit()
252
+
253
+
254
def update_scan_meta(subreddit: str, posts_seen: int, posts_new: int, high_water_mark: str = "") -> None:
    """Record scan metadata for a subreddit (upsert keyed on subreddit).

    Passing an empty high_water_mark keeps the previously stored mark.
    """
    ts = datetime.now(timezone.utc).isoformat()
    conn = _get_conn()
    conn.execute(
        """INSERT INTO scan_meta (subreddit, last_scan, high_water_mark, posts_seen, posts_new)
           VALUES (?, ?, ?, ?, ?)
           ON CONFLICT(subreddit) DO UPDATE SET
               last_scan = excluded.last_scan,
               high_water_mark = CASE
                   WHEN excluded.high_water_mark != '' THEN excluded.high_water_mark
                   ELSE scan_meta.high_water_mark
               END,
               posts_seen = excluded.posts_seen,
               posts_new = excluded.posts_new""",
        (subreddit, ts, high_water_mark, posts_seen, posts_new),
    )
    conn.commit()
272
+
273
+
274
def get_scan_stats() -> Dict[str, Any]:
    """Get aggregate cache statistics."""
    conn = _get_conn()

    def _count(sql: str) -> int:
        # One-row COUNT(*) helper; every stats query below fits this shape.
        return conn.execute(sql).fetchone()[0]

    top_subreddits = {
        row["subreddit"]: row["cnt"]
        for row in conn.execute(
            "SELECT subreddit, COUNT(*) as cnt FROM seen_posts GROUP BY subreddit ORDER BY cnt DESC LIMIT 10"
        )
    }

    return {
        "total_cached": _count("SELECT COUNT(*) FROM seen_posts"),
        "actioned": _count("SELECT COUNT(*) FROM seen_posts WHERE actioned = 1"),
        "high_relevance": _count(
            "SELECT COUNT(*) FROM seen_posts WHERE relevance_score > 0.8"
        ),
        "medium_relevance": _count(
            "SELECT COUNT(*) FROM seen_posts WHERE relevance_score > 0.3 AND relevance_score <= 0.8"
        ),
        "low_relevance": _count(
            "SELECT COUNT(*) FROM seen_posts WHERE relevance_score <= 0.3"
        ),
        "top_subreddits": top_subreddits,
    }
303
+
304
+
305
def get_high_priority_posts(min_score: float = 0.8, limit: int = 20) -> List[Dict]:
    """Get high-priority posts that haven't been actioned yet."""
    query = """SELECT post_id, subreddit, title, score, num_comments,
           relevance_score, venture, fingerprint, canonical_url, first_seen
           FROM seen_posts
           WHERE relevance_score >= ? AND actioned = 0
           ORDER BY relevance_score DESC, score DESC
           LIMIT ?"""
    conn = _get_conn()
    # sqlite3.Row supports dict() conversion directly.
    return [dict(row) for row in conn.execute(query, (min_score, limit))]
318
+
319
+
320
def prune_old_posts(days: int = 30) -> int:
    """Remove posts older than N days that were never actioned.

    Returns the number of rows removed.
    """
    from datetime import timedelta

    cutoff_iso = (datetime.now(timezone.utc) - timedelta(days=days)).isoformat()
    conn = _get_conn()
    deleted = conn.execute(
        "DELETE FROM seen_posts WHERE actioned = 0 AND first_seen < ?",
        (cutoff_iso,),
    )
    conn.commit()
    return deleted.rowcount
331
+
332
+
333
def close_connection() -> None:
    """Close the thread-local connection if open."""
    existing = getattr(_local, "conn", None)
    if existing is not None:
        try:
            existing.close()
        except Exception:
            pass  # best-effort: a failed close still clears the slot
    _local.conn = None
@@ -19,6 +19,13 @@ from typing import Any, Dict, List, Optional
19
19
 
20
20
  logger = logging.getLogger("delimit.ai.social_daemon")
21
21
 
22
# ── Vertex AI credentials (prefer ADC from gcloud auth) ─────────────
_adc_path = str(Path.home() / ".config" / "gcloud" / "application_default_credentials.json")
if os.path.exists(_adc_path) and not os.environ.get("GOOGLE_APPLICATION_CREDENTIALS"):
    os.environ["GOOGLE_APPLICATION_CREDENTIALS"] = _adc_path
# Note: os.environ.get treats an empty value as unset, so a blank
# GOOGLE_CLOUD_PROJECT is overwritten with the default project.
if not os.environ.get("GOOGLE_CLOUD_PROJECT"):
    os.environ["GOOGLE_CLOUD_PROJECT"] = "jamsons"
28
+
22
29
  # ── Configuration ────────────────────────────────────────────────────
23
30
  # Default to 15 minutes (900 seconds)
24
31
  SCAN_INTERVAL = int(os.environ.get("DELIMIT_SOCIAL_SCAN_INTERVAL", "900"))
@@ -205,26 +212,50 @@ def _build_compact_summary(targets: List[Dict], processed: Dict) -> Dict[str, An
205
212
  }
206
213
 
207
214
 
215
# Process-local daily rate-limit state for _send_scan_digest; the counter
# resets when the UTC date changes (and implicitly on daemon restart).
_scan_digest_count_today: int = 0  # digests already sent today
_scan_digest_last_date: str = ""  # "YYYY-MM-DD" of the last counter reset
_SCAN_DIGEST_MAX_PER_DAY = 4  # Max scan digest emails per day
218
+
219
+
208
220
  def _send_scan_digest(compact: Dict, processed: Dict) -> None:
209
221
  """Send a digest email summarizing the scan results.
210
222
 
211
- Only sends if there are new high-priority targets, new drafts, or new ledger items.
223
+ Only sends if there are REAL actionable items (ready drafts, not placeholders).
212
224
  Suppresses digest if nothing actionable to avoid email fatigue.
225
+ Capped at 4 per day to prevent inbox flooding.
213
226
  """
227
+ global _scan_digest_count_today, _scan_digest_last_date
214
228
  try:
215
229
  from ai.notify import send_email
216
230
 
217
231
  s = compact.get("summary", {})
218
232
  high = s.get("high_priority", 0)
219
- drafted = s.get("drafted", 0)
220
233
  ledger_items = s.get("ledger_items", 0)
221
234
  total = s.get("total_new_targets", 0)
222
235
  platforms = s.get("platform_breakdown", {})
223
- owner_actions = len(processed.get("owner_actions", []))
224
236
 
225
- # Only send if there's something actionable
226
- if high == 0 and drafted == 0 and ledger_items == 0 and owner_actions == 0:
237
+ # Count only REAL owner actions (not placeholder drafts)
238
+ owner_actions = [a for a in processed.get("owner_actions", []) if a.get("draft_id")]
239
+ real_owner_actions = len(owner_actions)
240
+
241
+ # Count ready drafts only (not placeholders that failed quality check)
242
+ real_drafted = len([d for d in processed.get("drafted", [])
243
+ if not d.get("suppressed_reason") and not d.get("deduped")])
244
+
245
+ # Only send if there's something genuinely actionable
246
+ if high == 0 and real_drafted == 0 and ledger_items == 0 and real_owner_actions == 0:
247
+ return
248
+
249
+ # Daily cap — reset counter at midnight
250
+ today = datetime.now(timezone.utc).strftime("%Y-%m-%d")
251
+ if today != _scan_digest_last_date:
252
+ _scan_digest_count_today = 0
253
+ _scan_digest_last_date = today
254
+ if _scan_digest_count_today >= _SCAN_DIGEST_MAX_PER_DAY:
255
+ logger.info("Scan digest daily cap reached (%d/%d). Suppressing.",
256
+ _scan_digest_count_today, _SCAN_DIGEST_MAX_PER_DAY)
227
257
  return
258
+ _scan_digest_count_today += 1
228
259
 
229
260
  lines = []
230
261
  lines.append(f"Social scan found {total} new targets across {platforms}.")
@@ -241,8 +272,8 @@ def _send_scan_digest(compact: Dict, processed: Dict) -> None:
241
272
  lines.append(f" {url}")
242
273
  lines.append("")
243
274
 
244
- if drafted > 0:
245
- lines.append(f"DRAFTS: {drafted} reply drafts created")
275
+ if real_drafted > 0:
276
+ lines.append(f"DRAFTS: {real_drafted} ready drafts (quality-checked)")
246
277
  lines.append("")
247
278
  # Include actual draft text for ready drafts
248
279
  for action in processed.get("owner_actions", []):
@@ -273,8 +304,8 @@ def _send_scan_digest(compact: Dict, processed: Dict) -> None:
273
304
  lines.append(f"LEDGER: {ledger_items} items added to project ledger")
274
305
  lines.append("")
275
306
 
276
- if owner_actions > 0:
277
- lines.append(f"ACTIONS: {owner_actions} items need your review")
307
+ if real_owner_actions > 0:
308
+ lines.append(f"ACTIONS: {real_owner_actions} items need your review")
278
309
  lines.append("")
279
310
 
280
311
  cache = compact.get("cache_stats", {})
@@ -283,7 +314,7 @@ def _send_scan_digest(compact: Dict, processed: Dict) -> None:
283
314
 
284
315
  send_email(
285
316
  message="\n".join(lines),
286
- subject=f"[SOCIAL] {high} high-pri, {drafted} drafts, {total} targets",
317
+ subject=f"[SOCIAL] {high} high-pri, {real_drafted} ready drafts, {real_owner_actions} actions",
287
318
  event_type="social_digest",
288
319
  )
289
320
  except Exception as e: