npm - @smilintux/skcapstone - Versions diffs - 0.9.0 → 0.12.5 - Mend

@smilintux/skcapstone 0.9.0 → 0.12.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (284) hide show

package/.env.example +10 -4
package/.github/workflows/ci.yml +2 -2
package/.github/workflows/publish.yml +9 -2
package/.openclaw-workspace.json +2 -2
package/CLAUDE.md +37 -0
package/MISSION.md +17 -2
package/README.md +282 -3
package/docker/Dockerfile +7 -7
package/docker/compose-templates/dev-team.yml +12 -12
package/docker/compose-templates/mini-team.yml +9 -9
package/docker/compose-templates/ops-team.yml +10 -10
package/docker/compose-templates/research-team.yml +10 -10
package/docker/entrypoint.sh +4 -4
package/docs/ADR-optional-integration-backbone.md +181 -0
package/docs/ARCHITECTURE.md +186 -43
package/docs/BOND_WITH_GROK.md +6 -6
package/docs/CUSTOM_AGENT.md +278 -1
package/docs/DREAMING.md +70 -0
package/docs/GETTING_STARTED.md +10 -7
package/docs/QUICKSTART.md +10 -6
package/docs/SKJOULE_ARCHITECTURE.md +3 -3
package/docs/SOUL_SWAPPER.md +5 -5
package/docs/hammertime-audit.md +402 -0
package/docs/sk-integration-HANDOFF.md +117 -0
package/docs/skscheduler.md +155 -0
package/docs/superpowers/examples/jobs.yaml +31 -0
package/docs/superpowers/plans/2026-06-08-skscheduler.md +1265 -0
package/docs/superpowers/specs/2026-06-08-skscheduler-design.md +186 -0
package/examples/custom-bond-template.json +1 -1
package/examples/grok-feb.json +1 -1
package/examples/queen-ava-feb.json +1 -1
package/launchd/com.skcapstone.daemon.plist +52 -0
package/launchd/com.skcapstone.memory-compress.plist +45 -0
package/launchd/com.skcapstone.skcomms-heartbeat.plist +33 -0
package/launchd/com.skcapstone.skcomms-queue-drain.plist +34 -0
package/launchd/install-launchd.sh +156 -0
package/{openclaw-plugin → openclaw-plugin.archived-2026-04-23}/src/index.ts +3 -2
package/package.json +1 -1
package/pyproject.toml +16 -10
package/scripts/archive-sessions.sh +95 -0
package/scripts/check-updates.py +4 -4
package/scripts/install-bundle.sh +8 -8
package/scripts/install.ps1 +12 -11
package/scripts/install.sh +196 -11
package/scripts/model-fallback-monitor.sh +102 -0
package/scripts/notion-api.py +259 -0
package/scripts/nvidia-proxy.mjs +908 -0
package/scripts/proxy-monitor.sh +89 -0
package/scripts/refresh-anthropic-token.sh +172 -0
package/scripts/release.sh +98 -0
package/scripts/session-to-memory.py +219 -0
package/scripts/skgateway.mjs +856 -0
package/scripts/telegram-catchup-all.sh +147 -0
package/scripts/verify_install.sh +2 -2
package/scripts/wargov-ufo-capture/README.md +43 -0
package/scripts/wargov-ufo-capture/cdp_capture_release2.py +273 -0
package/scripts/wargov-ufo-capture/cdp_capture_splc_doj.py +246 -0
package/scripts/wargov-ufo-capture/cdp_finish.py +271 -0
package/scripts/wargov-ufo-capture/cdp_probe.py +188 -0
package/scripts/wargov-ufo-capture/cdp_splc_pressrelease.py +101 -0
package/scripts/wargov-ufo-capture/parse_csv.py +95 -0
package/scripts/wargov-ufo-capture/pull_dvids.sh +107 -0
package/scripts/watch-anthropic-token.sh +212 -0
package/scripts/windows/install-tasks.ps1 +7 -7
package/scripts/windows/skcapstone-task.xml +1 -1
package/src/skcapstone/__init__.py +45 -3
package/src/skcapstone/_cli_monolith.py +20 -15
package/src/skcapstone/activity.py +5 -1
package/src/skcapstone/agent_card.py +3 -2
package/src/skcapstone/api.py +41 -40
package/src/skcapstone/auction.py +14 -11
package/src/skcapstone/backup.py +2 -1
package/src/skcapstone/blueprint_registry.py +4 -3
package/src/skcapstone/blueprints/builtins/itil-operations.yaml +40 -0
package/src/skcapstone/brain_first.py +238 -0
package/src/skcapstone/changelog.py +1 -1
package/src/skcapstone/chat.py +22 -17
package/src/skcapstone/cli/__init__.py +9 -1
package/src/skcapstone/cli/_common.py +1 -0
package/src/skcapstone/cli/agents_spawner.py +5 -2
package/src/skcapstone/cli/alerts.py +25 -4
package/src/skcapstone/cli/bench.py +15 -15
package/src/skcapstone/cli/chat.py +7 -4
package/src/skcapstone/cli/consciousness.py +5 -2
package/src/skcapstone/cli/context_cmd.py +18 -4
package/src/skcapstone/cli/daemon.py +121 -42
package/src/skcapstone/cli/gtd.py +26 -1
package/src/skcapstone/cli/housekeeping.py +3 -3
package/src/skcapstone/cli/identity_cmd.py +378 -0
package/src/skcapstone/cli/joule_cmd.py +7 -3
package/src/skcapstone/cli/memory.py +8 -6
package/src/skcapstone/cli/peers_dir.py +1 -1
package/src/skcapstone/cli/register_cmd.py +29 -3
package/src/skcapstone/cli/scheduler_cmd.py +167 -0
package/src/skcapstone/cli/session.py +25 -0
package/src/skcapstone/cli/setup.py +96 -29
package/src/skcapstone/cli/shell_cmd.py +53 -1
package/src/skcapstone/cli/skills_cmd.py +2 -2
package/src/skcapstone/cli/soul.py +8 -5
package/src/skcapstone/cli/status.py +37 -11
package/src/skcapstone/cli/telegram.py +21 -0
package/src/skcapstone/cli/test_cmd.py +5 -5
package/src/skcapstone/cli/test_connection.py +2 -2
package/src/skcapstone/cli/upgrade_cmd.py +23 -14
package/src/skcapstone/cli/version_cmd.py +1 -1
package/src/skcapstone/cli/watch_cmd.py +9 -6
package/src/skcapstone/cloud9_bridge.py +14 -14
package/src/skcapstone/codex_setup.py +255 -0
package/src/skcapstone/config_validator.py +7 -4
package/src/skcapstone/consciousness_config.py +5 -1
package/src/skcapstone/consciousness_loop.py +313 -273
package/src/skcapstone/context_loader.py +121 -0
package/src/skcapstone/coord_federation.py +2 -1
package/src/skcapstone/coordination.py +23 -6
package/src/skcapstone/crush_integration.py +2 -1
package/src/skcapstone/daemon.py +151 -88
package/src/skcapstone/dashboard.py +10 -10
package/src/skcapstone/data/sk-agent-picker.sh +421 -0
package/src/skcapstone/data/systemd/skcapstone-api.socket +9 -0
package/src/skcapstone/data/systemd/skcapstone-memory-compress.service +18 -0
package/src/skcapstone/data/systemd/skcapstone-memory-compress.timer +11 -0
package/src/skcapstone/data/systemd/skcapstone.service +37 -0
package/src/skcapstone/data/systemd/skcapstone@.service +50 -0
package/src/skcapstone/data/systemd/skcomms-heartbeat.service +18 -0
package/{systemd/skcomm-heartbeat.timer → src/skcapstone/data/systemd/skcomms-heartbeat.timer} +2 -2
package/src/skcapstone/data/systemd/skcomms-queue-drain.service +17 -0
package/{systemd/skcomm-queue-drain.timer → src/skcapstone/data/systemd/skcomms-queue-drain.timer} +2 -2
package/src/skcapstone/defaults/claude/CLAUDE.md +67 -0
package/src/skcapstone/defaults/claude/settings.json +74 -0
package/src/skcapstone/defaults/lumina/config/claude-hooks.md +57 -0
package/src/skcapstone/defaults/lumina/config/skgraph.yaml +55 -10
package/src/skcapstone/defaults/lumina/config/skmemory.yaml +79 -13
package/src/skcapstone/defaults/lumina/config/skvector.yaml +60 -9
package/src/skcapstone/defaults/lumina/memory/long-term/18b9c0d1e2f3-cloud9-protocol.json +2 -2
package/src/skcapstone/defaults/lumina/memory/long-term/a1b2c3d4e5f6-ecosystem-overview.json +2 -2
package/src/skcapstone/defaults/lumina/memory/long-term/b2c3d4e5f6a7-five-pillars.json +9 -9
package/src/skcapstone/defaults/lumina/memory/long-term/d4e5f6a7b8c9-site-directory.json +2 -2
package/src/skcapstone/defaults/unhinged.json +13 -0
package/src/skcapstone/discovery.py +43 -20
package/src/skcapstone/doctor.py +941 -22
package/src/skcapstone/dreaming.py +1183 -109
package/src/skcapstone/emotion_tracker.py +2 -2
package/src/skcapstone/export.py +4 -3
package/src/skcapstone/fuse_mount.py +35 -25
package/src/skcapstone/gui_installer.py +2 -2
package/src/skcapstone/heartbeat.py +34 -30
package/src/skcapstone/housekeeping.py +14 -14
package/src/skcapstone/install_wizard.py +209 -7
package/src/skcapstone/itil.py +13 -4
package/src/skcapstone/kms_scheduler.py +10 -8
package/src/skcapstone/launchd.py +426 -0
package/src/skcapstone/mcp_launcher.py +15 -1
package/src/skcapstone/mcp_server.py +341 -49
package/src/skcapstone/mcp_tools/__init__.py +2 -0
package/src/skcapstone/mcp_tools/_helpers.py +2 -2
package/src/skcapstone/mcp_tools/ansible_tools.py +7 -4
package/src/skcapstone/mcp_tools/brain_first_tools.py +90 -0
package/src/skcapstone/mcp_tools/capauth_tools.py +7 -4
package/src/skcapstone/mcp_tools/comm_tools.py +10 -10
package/src/skcapstone/mcp_tools/coord_tools.py +8 -4
package/src/skcapstone/mcp_tools/did_tools.py +11 -8
package/src/skcapstone/mcp_tools/gtd_tools.py +4 -4
package/src/skcapstone/mcp_tools/memory_tools.py +6 -2
package/src/skcapstone/mcp_tools/notification_tools.py +22 -6
package/src/skcapstone/mcp_tools/{skcomm_tools.py → skcomms_tools.py} +14 -14
package/src/skcapstone/mcp_tools/soul_tools.py +8 -2
package/src/skcapstone/mdns_discovery.py +2 -2
package/src/skcapstone/memory_curator.py +1 -1
package/src/skcapstone/memory_engine.py +10 -3
package/src/skcapstone/metrics.py +30 -16
package/src/skcapstone/migrate_memories.py +4 -3
package/src/skcapstone/migrate_multi_agent.py +8 -7
package/src/skcapstone/models.py +47 -5
package/src/skcapstone/notifications.py +42 -18
package/src/skcapstone/onboard.py +1000 -126
package/src/skcapstone/operator_link.py +170 -0
package/src/skcapstone/peer_directory.py +4 -4
package/src/skcapstone/peers.py +19 -19
package/src/skcapstone/pillars/__init__.py +7 -5
package/src/skcapstone/pillars/consciousness.py +191 -0
package/src/skcapstone/pillars/identity.py +51 -7
package/src/skcapstone/pillars/memory.py +9 -3
package/src/skcapstone/pillars/sync.py +2 -2
package/src/skcapstone/preflight.py +3 -3
package/src/skcapstone/providers/docker.py +28 -28
package/src/skcapstone/register.py +6 -6
package/src/skcapstone/registry_client.py +5 -4
package/src/skcapstone/runtime.py +14 -3
package/src/skcapstone/scheduled_tasks.py +254 -19
package/src/skcapstone/scheduler_jobs.py +456 -0
package/src/skcapstone/scheduler_runner.py +239 -0
package/src/skcapstone/scheduler_state.py +162 -0
package/src/skcapstone/sdk.py +310 -0
package/src/skcapstone/service_health.py +279 -39
package/src/skcapstone/session_briefing.py +108 -0
package/src/skcapstone/session_capture.py +1 -1
package/src/skcapstone/shell.py +7 -1
package/src/skcapstone/soul.py +3 -1
package/src/skcapstone/soul_switch.py +3 -1
package/src/skcapstone/summary.py +6 -6
package/src/skcapstone/sync_engine.py +15 -15
package/src/skcapstone/sync_watcher.py +2 -2
package/src/skcapstone/systemd.py +72 -21
package/src/skcapstone/team_comms.py +8 -8
package/src/skcapstone/team_engine.py +1 -1
package/src/skcapstone/testrunner.py +3 -3
package/src/skcapstone/trust_graph.py +40 -5
package/src/skcapstone/unified_search.py +15 -6
package/src/skcapstone/uninstall_wizard.py +11 -3
package/src/skcapstone/version_check.py +8 -4
package/src/skcapstone/warmth_anchor.py +4 -2
package/src/skcapstone/whoami.py +4 -4
package/systemd/skcapstone.service +4 -6
package/systemd/skcapstone@.service +7 -8
package/systemd/skcomms-heartbeat.service +21 -0
package/systemd/skcomms-heartbeat.timer +12 -0
package/systemd/skcomms-queue-drain.service +17 -0
package/systemd/skcomms-queue-drain.timer +12 -0
package/tests/conftest.py +39 -0
package/tests/integration/test_consciousness_e2e.py +39 -39
package/tests/test_agent_card.py +1 -1
package/tests/test_agent_home_scaffold.py +34 -0
package/tests/test_alerts_consumer_topics.py +27 -0
package/tests/test_backup.py +2 -1
package/tests/test_chat.py +6 -6
package/tests/test_claude_md.py +2 -2
package/tests/test_cli_skills.py +10 -10
package/tests/test_cli_test_cmd.py +4 -4
package/tests/test_cli_test_connection.py +1 -1
package/tests/test_cloud9_bridge.py +6 -6
package/tests/test_consciousness_e2e.py +1 -1
package/tests/test_consciousness_loop.py +10 -10
package/tests/test_coordination.py +25 -0
package/tests/test_cross_package.py +21 -21
package/tests/test_daemon.py +4 -4
package/tests/test_daemon_shutdown.py +1 -1
package/tests/test_docker_provider.py +29 -29
package/tests/test_doctor.py +400 -0
package/tests/test_doctor_skscheduler.py +50 -0
package/tests/test_dreaming_engine.py +147 -0
package/tests/test_dreaming_gtd_capture.py +35 -0
package/tests/test_e2e_automated.py +8 -5
package/tests/test_fuse_mount.py +10 -10
package/tests/test_gtd_brief.py +46 -0
package/tests/test_gtd_malformed_tolerance.py +31 -0
package/tests/test_housekeeping.py +15 -15
package/tests/test_identity_migrate.py +251 -0
package/tests/test_integration_backbone.py +598 -0
package/tests/test_itil_gtd_lifecycle.py +37 -0
package/tests/test_jobs_dropins.py +84 -0
package/tests/test_mcp_server.py +82 -37
package/tests/test_models.py +48 -4
package/tests/test_multi_agent.py +31 -29
package/tests/test_notifications.py +122 -32
package/tests/test_onboard.py +63 -75
package/tests/test_operator_link.py +78 -0
package/tests/test_peers.py +14 -14
package/tests/test_pillars.py +98 -0
package/tests/test_preflight.py +3 -3
package/tests/test_runtime.py +21 -0
package/tests/test_scheduled_tasks.py +11 -6
package/tests/test_scheduler_cli.py +47 -0
package/tests/test_scheduler_features.py +133 -0
package/tests/test_scheduler_integration.py +87 -0
package/tests/test_scheduler_jobs.py +155 -0
package/tests/test_scheduler_runner.py +64 -0
package/tests/test_scheduler_state.py +57 -0
package/tests/test_sdk.py +70 -0
package/tests/test_service_health_incidents.py +34 -0
package/tests/test_service_registry.py +52 -0
package/tests/test_session_briefing.py +130 -0
package/tests/test_snapshots.py +4 -4
package/tests/test_sync_pipeline.py +26 -26
package/tests/test_team_comms.py +2 -2
package/tests/test_testrunner.py +2 -2
package/tests/test_trust_graph.py +18 -0
package/tests/test_unified_search.py +2 -2
package/tests/test_version_check.py +10 -0
package/tests/test_version_cmd.py +8 -8
package/tests/test_whoami.py +1 -1
package/systemd/skcomm-heartbeat.service +0 -18
package/systemd/skcomm-queue-drain.service +0 -17
/package/{openclaw-plugin → openclaw-plugin.archived-2026-04-23}/package.json +0 -0
/package/{openclaw-plugin → openclaw-plugin.archived-2026-04-23}/src/openclaw.plugin.json +0 -0

package/scripts/wargov-ufo-capture/cdp_probe.py ADDED Viewed

@@ -0,0 +1,188 @@
+#!/usr/bin/env python3
+"""Probe war.gov/UFO/ via Lumina Chrome CDP (port 9222).
+Steps:
+  1. Open a new tab on war.gov/UFO/
+  2. Wait for Vue mount to load (CSV must be reachable)
+  3. Pull the CSV via in-page fetch
+  4. Inspect inline scripts for any release_2 link patterns
+  5. Save raw CSV + script index to ~/clawd/tmp/wargov-capture/probe-out/
+Output:
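+  probe-out/uap-csv.csv          fresh CSV from the site
+  probe-out/uap-csv-error.json   fetch result, written instead of the CSV when the fetch fails
+  probe-out/inline-scripts.json  inline-script probe (release_2 / fetch / .csv hints)
+  probe-out/link-probe.json      press-release and medialink anchors found on the page
+  probe-out/page-meta.json       URL/title/page render check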
+"""
+from __future__ import annotations
+import json
+import sys
+import time
+import urllib.request
+from pathlib import Path
+import websocket  # websocket-client
+CDP_HTTP = "http://127.0.0.1:9222"
+TARGET = "https://www.war.gov/UFO/"
+OUT_DIR = Path("/home/cbrd21/clawd/tmp/wargov-capture/probe-out")
+OUT_DIR.mkdir(parents=True, exist_ok=True)
+def cdp_get(path: str) -> dict | list:
+    with urllib.request.urlopen(f"{CDP_HTTP}{path}") as r:
+        return json.loads(r.read())
+def open_tab(url: str) -> dict:
+    # Newer Chrome only accepts PUT on /json/new
+    req = urllib.request.Request(f"{CDP_HTTP}/json/new?{url}", method="PUT")
+    with urllib.request.urlopen(req, timeout=10) as r:
+        return json.loads(r.read())
+def close_tab(target_id: str) -> None:
+    try:
+        with urllib.request.urlopen(f"{CDP_HTTP}/json/close/{target_id}", timeout=5):
+            pass
+    except Exception:
+        pass
+class CDP:
+    def __init__(self, ws_url: str):
+        self.ws = websocket.create_connection(ws_url, timeout=60)
+        self.mid = 0
+    def call(self, method: str, params: dict | None = None, timeout: float = 30.0) -> dict:
+        self.mid += 1
+        msg_id = self.mid
+        self.ws.send(json.dumps({"id": msg_id, "method": method, "params": params or {}}))
+        self.ws.settimeout(timeout)
+        while True:
+            raw = self.ws.recv()
+            msg = json.loads(raw)
+            if msg.get("id") == msg_id:
+                if "error" in msg:
+                    raise RuntimeError(f"{method}: {msg['error']}")
+                return msg.get("result", {})
+    def wait_event(self, name: str, timeout: float = 30.0) -> dict:
+        deadline = time.time() + timeout
+        while time.time() < deadline:
+            self.ws.settimeout(max(0.1, deadline - time.time()))
+            try:
+                raw = self.ws.recv()
+            except websocket.WebSocketTimeoutException:
+                continue
+            msg = json.loads(raw)
+            if msg.get("method") == name:
+                return msg.get("params", {})
+        raise TimeoutError(f"event {name} did not fire within {timeout}s")
+    def close(self) -> None:
+        try:
+            self.ws.close()
+        except Exception:
+            pass
+def main() -> int:
+    print(f"[probe] opening tab → {TARGET}", flush=True)
+    tab = open_tab(TARGET)
+    target_id = tab["id"]
+    ws_url = tab["webSocketDebuggerUrl"]
+    print(f"[probe] tab id={target_id}", flush=True)
+    cdp = CDP(ws_url)
+    try:
+        cdp.call("Page.enable")
+        cdp.call("Runtime.enable")
+        cdp.call("Network.enable", {"maxPostDataSize": 0})
+        cdp.call("Page.navigate", {"url": TARGET})
+        try:
+            cdp.wait_event("Page.loadEventFired", timeout=30.0)
+        except TimeoutError:
+            print("[probe] Page.loadEventFired timeout — proceeding anyway", flush=True)
+        # Give the Vue mount a chance to render the CSV view
+        time.sleep(5.0)
+        # Page meta
+        meta_js = (
+            "({"
+            "  url: location.href,"
+            "  title: document.title,"
+            "  hasMainContent: !!document.querySelector('main'),"
+            "  scriptInlineCount: document.querySelectorAll('script:not([src])').length,"
+            "  ufoMentions: (document.body.innerText.match(/UAP|UFO|PURSUE/g) || []).length,"
+            "  releaseDateGuesses: Array.from(new Set((document.body.innerText.match(/\\b\\d{1,2}\\/\\d{1,2}\\/\\d{2,4}\\b/g) || []))),"
+            "  release2HrefCount: document.querySelectorAll('a[href*=\"release_2\"]').length,"
+            "  release2InHtml: (document.documentElement.outerHTML.match(/release_2/gi) || []).length"
+            "})"
+        )
+        meta = cdp.call("Runtime.evaluate", {"expression": meta_js, "returnByValue": True})
+        meta_val = meta.get("result", {}).get("value", {})
+        (OUT_DIR / "page-meta.json").write_text(json.dumps(meta_val, indent=2))
+        print(f"[probe] page-meta: {json.dumps(meta_val)}", flush=True)
+        # Pull the CSV via in-page fetch
+        csv_js = (
+            "(async () => {"
+            "  const u = '/Portals/1/Interactive/2026/UFO/uap-csv.csv';"
+            "  const r = await fetch(u, {credentials: 'include', cache: 'no-store'});"
+            "  return {status: r.status, len: (await r.clone().text()).length, text: await r.text()};"
+            "})()"
+        )
+        csv_res = cdp.call("Runtime.evaluate", {
+            "expression": csv_js,
+            "awaitPromise": True,
+            "returnByValue": True,
+        }, timeout=60)
+        csv_val = csv_res.get("result", {}).get("value", {})
+        if isinstance(csv_val, dict) and csv_val.get("status") == 200:
+            (OUT_DIR / "uap-csv.csv").write_text(csv_val["text"])
+            print(f"[probe] CSV pulled, {csv_val['len']} bytes", flush=True)
+        else:
+            print(f"[probe] CSV fetch failed: {csv_val}", flush=True)
+            (OUT_DIR / "uap-csv-error.json").write_text(json.dumps(csv_val, indent=2, default=str))
+        # Inspect inline scripts for release_2 hints
+        scripts_js = (
+            "(() => {"
+            "  const out = [];"
+            "  document.querySelectorAll('script:not([src])').forEach((s, i) => {"
+            "    const t = s.textContent || '';"
+            "    out.push({idx: i, len: t.length, hasRelease2: /release_2/i.test(t), hasFetch: /fetch\\(/.test(t), hasCsv: /\\.csv/.test(t), preview: t.slice(0, 400)});"
+            "  });"
+            "  return out;"
+            "})()"
+        )
+        scripts_res = cdp.call("Runtime.evaluate", {"expression": scripts_js, "returnByValue": True})
+        scripts_val = scripts_res.get("result", {}).get("value", [])
+        (OUT_DIR / "inline-scripts.json").write_text(json.dumps(scripts_val, indent=2))
+        print(f"[probe] inline scripts: {len(scripts_val)} ({sum(1 for s in scripts_val if s.get('hasRelease2'))} mention release_2)", flush=True)
+        # Probe for press release link
+        pr_js = (
+            "(() => {"
+            "  const links = Array.from(document.querySelectorAll('a[href]')).map(a => a.href);"
+            "  const press = links.filter(h => /News\\/Releases/i.test(h));"
+            "  const medialink = links.filter(h => /medialink\\/ufo/i.test(h));"
+            "  return {pressCount: press.length, press: press.slice(0, 20), medialinkCount: medialink.length, medialinkSample: medialink.slice(0, 20)};"
+            "})()"
+        )
+        pr_res = cdp.call("Runtime.evaluate", {"expression": pr_js, "returnByValue": True})
+        pr_val = pr_res.get("result", {}).get("value", {})
+        (OUT_DIR / "link-probe.json").write_text(json.dumps(pr_val, indent=2))
+        print(f"[probe] link probe: press={pr_val.get('pressCount')} medialink={pr_val.get('medialinkCount')}", flush=True)
+        print("[probe] DONE", flush=True)
+        return 0
+    finally:
+        cdp.close()
+        close_tab(target_id)
+if __name__ == "__main__":
+    sys.exit(main())

package/scripts/wargov-ufo-capture/cdp_splc_pressrelease.py ADDED Viewed

@@ -0,0 +1,101 @@
+#!/usr/bin/env python3
+"""Discover + capture the DOJ SPLC press release by NAVIGATING the search page
+(so JS renders the result list) then reading the rendered DOM. Falls back to
+scraping any /opa/pr/ or /news/ links the rendered page exposes.
+"""
+from __future__ import annotations
+import json, re, sys, time, urllib.request
+from pathlib import Path
+import websocket
+CDP_HTTP = "http://127.0.0.1:9222"
+SEARCH_URL = "https://www.justice.gov/news?search_api_fulltext=Southern%20Poverty%20Law%20Center"
+OUT = Path("/home/cbrd21/clawd/skills/substance-lens/captures/splc-doj-2026-06-03")
+def open_tab(url):
+    req = urllib.request.Request(f"{CDP_HTTP}/json/new?{url}", method="PUT")
+    with urllib.request.urlopen(req, timeout=10) as r:
+        return json.loads(r.read())
+def close_tab(tid):
+    try:
+        urllib.request.urlopen(f"{CDP_HTTP}/json/close/{tid}", timeout=5)
+    except Exception:
+        pass
+class CDP:
+    def __init__(self, ws): self.ws=websocket.create_connection(ws,timeout=120); self.mid=0
+    def call(self, m, p=None, t=60.0):
+        self.mid+=1; i=self.mid
+        self.ws.send(json.dumps({"id":i,"method":m,"params":p or {}})); self.ws.settimeout(t)
+        while True:
+            msg=json.loads(self.ws.recv())
+            if msg.get("id")==i:
+                if "error" in msg: raise RuntimeError(f"{m}: {msg['error']}")
+                return msg.get("result",{})
+    def wait(self, name, t=30.0):
+        end=time.time()+t
+        while time.time()<end:
+            self.ws.settimeout(max(0.1,end-time.time()))
+            try: msg=json.loads(self.ws.recv())
+            except websocket.WebSocketTimeoutException: continue
+            if msg.get("method")==name: return msg.get("params",{})
+        return {}
+    def close(self):
+        try: self.ws.close()
+        except Exception: pass
+def jseval(cdp, expr, t=60):
+    r=cdp.call("Runtime.evaluate",{"expression":expr,"awaitPromise":True,"returnByValue":True},t)
+    return r.get("result",{}).get("value")
+def fetch_text(cdp,url):
+    expr=(f"(async()=>{{try{{const r=await fetch({json.dumps(url)},{{credentials:'include',cache:'no-store'}});"
+          f"return {{status:r.status,text:await r.text()}};}}catch(e){{return{{status:-1,text:String(e)}};}}}})()")
+    v=jseval(cdp,expr,180) or {}
+    return v.get("status",0), v.get("text","")
+def main():
+    tab=open_tab(SEARCH_URL); tid=tab["id"]; cdp=CDP(tab["webSocketDebuggerUrl"])
+    try:
+        cdp.call("Page.enable"); cdp.call("Runtime.enable")
+        cdp.call("Page.navigate",{"url":SEARCH_URL})
+        cdp.wait("Page.loadEventFired",30.0)
+        time.sleep(6.0)  # let result JS render
+        links=jseval(cdp,
+            "JSON.stringify(Array.from(document.querySelectorAll('a[href]'))"
+            ".map(a=>({h:a.getAttribute('href'),t:(a.innerText||'').trim()}))"
+            ".filter(x=>x.h&&(x.h.includes('/opa/pr/')||x.h.includes('/usao-mdal/pr/')||/southern.poverty|law.center|splc/i.test(x.t))))")
+        cands=json.loads(links) if links else []
+        print(f"[pr] rendered candidates: {len(cands)}", flush=True)
+        for c in cands[:15]: print("   ", c["h"], "::", c["t"][:70], flush=True)
+        # pick best
+        pr=None
+        for c in cands:
+            if re.search(r"southern.poverty|law.center|splc|wire.fraud", (c["h"]+c["t"]).lower()):
+                pr=c["h"]; break
+        if not pr and cands: pr=cands[0]["h"]
+        if pr and pr.startswith("/"): pr="https://www.justice.gov"+pr
+        manifest={"search_url":SEARCH_URL,"rendered_candidates":cands[:15],"chosen":pr}
+        if pr:
+            print(f"[pr] fetching -> {pr}", flush=True)
+            st,html=fetch_text(cdp,pr)
+            print(f"[pr] status={st} len={len(html)}", flush=True)
+            if st==200 and html:
+                (OUT/"doj-press-release.html").write_text(html)
+                txt=jseval(cdp,
+                    f"(async()=>{{const r=await fetch({json.dumps(pr)},{{credentials:'include'}});"
+                    f"const h=await r.text();const d=new DOMParser().parseFromString(h,'text/html');"
+                    f"const a=d.querySelector('.field--name-body')||d.querySelector('article')||d.querySelector('main')||d.body;"
+                    f"return a?a.innerText:'';}})()",60) or ""
+                if txt: (OUT/"doj-press-release.txt").write_text(txt); print(f"[pr] {len(txt)} chars text", flush=True)
+                manifest["status"]=st; manifest["txt_chars"]=len(txt)
+        (OUT/"press-release-discovery.json").write_text(json.dumps(manifest,indent=2))
+        print("[pr] done", flush=True)
+        return 0
+    finally:
+        cdp.close(); close_tab(tid)
+if __name__=="__main__":
+    sys.exit(main())

package/scripts/wargov-ufo-capture/parse_csv.py ADDED Viewed

@@ -0,0 +1,95 @@
+#!/usr/bin/env python3
+"""Parse the new uap-data.csv and split Release 01 vs Release 02 records.
+The CSV has multi-line quoted fields (newlines inside Title and Description Blurb),
+so we use Python's csv module rather than naive line counting.
+"""
+from __future__ import annotations
+import csv
+import json
+from collections import Counter, defaultdict
+from pathlib import Path
+CSV_PATH = Path("/home/cbrd21/nextcloud/cbrd21-share/reference/war-gov-UFO-PURSUE-2026/docs/release-02/uap-data.csv")
+OUT_DIR = Path("/home/cbrd21/clawd/tmp/wargov-capture/probe-out")
+OUT_DIR.mkdir(parents=True, exist_ok=True)
+with CSV_PATH.open(newline="", encoding="utf-8") as f:
+    reader = csv.DictReader(f)
+    rows = [r for r in reader]
+print(f"Total records: {len(rows)}")
+date_counter = Counter()
+for r in rows:
+    date_counter[(r.get("Release Date") or "").strip()] += 1
+print("Release dates:")
+for d, c in sorted(date_counter.items(), key=lambda x: -x[1]):
+    print(f"  {d!r:15} → {c}")
+# Filter for Release 02
+release2 = [r for r in rows if (r.get("Release Date") or "").strip() == "5/22/26"]
+print(f"\nRelease 02 records: {len(release2)}")
+# Bucket by type
+type_counter = Counter()
+agency_counter = Counter()
+for r in release2:
+    type_counter[(r.get("Type") or "").strip()] += 1
+    agency_counter[(r.get("Agency") or "").strip()] += 1
+print("Types:")
+for t, c in type_counter.most_common():
+    print(f"  {t!r:15} → {c}")
+print("Agencies:")
+for a, c in agency_counter.most_common():
+    print(f"  {a!r:15} → {c}")
+# Extract download links
+links = []
+for r in release2:
+    pdf_link = (r.get("PDF | Image Link") or "").strip()
+    modal = (r.get("Modal Image") or "").strip()
+    dvids = (r.get("DVIDS Video ID") or "").strip()
+    title = (r.get("Title") or "").strip().replace("\n", " ").replace("\r", "")
+    rtype = (r.get("Type") or "").strip()
+    agency = (r.get("Agency") or "").strip()
+    incident_date = (r.get("Incident Date") or "").strip()
+    incident_loc = (r.get("Incident Location") or "").strip()
+    links.append({
+        "title": title,
+        "type": rtype,
+        "agency": agency,
+        "incident_date": incident_date,
+        "incident_location": incident_loc,
+        "pdf_link": pdf_link,
+        "modal_image": modal,
+        "dvids_id": dvids,
+    })
+# Save full inventory
+(OUT_DIR / "release-02-records.json").write_text(json.dumps(links, indent=2))
+print(f"\nSaved inventory: {OUT_DIR / 'release-02-records.json'}")
+# Unique direct-fetchable URLs
+urls = set()
+for L in links:
+    if L["pdf_link"]:
+        urls.add(L["pdf_link"])
+    if L["modal_image"]:
+        urls.add(L["modal_image"])
+urls_list = sorted(urls)
+print(f"\nUnique direct URLs: {len(urls_list)}")
+for u in urls_list[:15]:
+    print(f"  {u}")
+if len(urls_list) > 15:
+    print(f"  ... and {len(urls_list) - 15} more")
+(OUT_DIR / "release-02-urls.json").write_text(json.dumps(urls_list, indent=2))
+# DVIDS-only records (videos hosted exclusively on DVIDS)
+dvids_only = [L for L in links if L["dvids_id"] and not L["pdf_link"]]
+print(f"\nDVIDS-only video records: {len(dvids_only)}")
+for L in dvids_only[:10]:
+    print(f"  DVIDS {L['dvids_id']}: {L['title'][:80]}")
+(OUT_DIR / "release-02-dvids.json").write_text(json.dumps(dvids_only, indent=2))

package/scripts/wargov-ufo-capture/pull_dvids.sh ADDED Viewed

@@ -0,0 +1,107 @@
+#!/usr/bin/env bash
+# Pull DVIDS media for Release 02 in parallel (up to 4 at a time).
+# Reads inventory from probe-out/release-02-records.json.
+set -u
+OUT_DIR="$HOME/nextcloud/cbrd21-share/reference/war-gov-UFO-PURSUE-2026/release-02"
+INVENTORY="$HOME/clawd/tmp/wargov-capture/probe-out/release-02-records.json"
+LOG="$HOME/clawd/tmp/wargov-capture/probe-out/dvids-pull.log"
+mkdir -p "$OUT_DIR"
+: > "$LOG"
+pull_one() {
+  local dvids_id="$1"
+  local title_slug="$2"
+  local kind="$3"  # video or audio
+  local out_path="$OUT_DIR/dvids-${kind}-${dvids_id}-${title_slug}"
+  # Pick the right URL prefix
+  local page_url
+  if [[ "$kind" == "audio" ]]; then
+    page_url="https://www.dvidshub.net/audio/${dvids_id}"
+  else
+    page_url="https://www.dvidshub.net/video/${dvids_id}"
+  fi
+  local page_html
+  page_html=$(curl -sSL --max-time 60 "$page_url" 2>/dev/null) || {
+    echo "[FAIL fetch page] dvids=$dvids_id" | tee -a "$LOG"
+    return 1
+  }
+  # Extract mp4 (video) or mp3 (audio) CDN URL
+  local media_url ext
+  if [[ "$kind" == "audio" ]]; then
+    media_url=$(echo "$page_html" | grep -oE 'https?://[^"]+\.mp3[^"]*' | head -1)
+    ext="mp3"
+    # DVIDS audio sometimes is .m4a or hosted via a different path; fallback to grepping for asset URL
+    if [[ -z "$media_url" ]]; then
+      media_url=$(echo "$page_html" | grep -oE 'https?://[^"]+\.m4a[^"]*' | head -1)
+      ext="m4a"
+    fi
+    if [[ -z "$media_url" ]]; then
+      media_url=$(echo "$page_html" | grep -oE 'https?://d34w7g4gy10iej\.cloudfront\.net/[^"]+' | head -1)
+      ext="${media_url##*.}"
+    fi
+  else
+    media_url=$(echo "$page_html" | grep -oE 'https?://[^"]+\.mp4[^"]*' | head -1)
+    ext="mp4"
+  fi
+  if [[ -z "$media_url" ]]; then
+    echo "[FAIL no-media-url] dvids=$dvids_id kind=$kind" | tee -a "$LOG"
+    # Save the page HTML for inspection
+    echo "$page_html" > "${out_path}.html"
+    return 1
+  fi
+  local final_path="${out_path}.${ext}"
+  if [[ -f "$final_path" ]] && [[ -s "$final_path" ]]; then
+    echo "[SKIP already-have] $final_path" | tee -a "$LOG"
+    return 0
+  fi
+  curl -sSL --max-time 600 -o "$final_path" "$media_url" 2>/dev/null
+  local size
+  size=$(stat -c '%s' "$final_path" 2>/dev/null || echo 0)
+  if [[ "$size" -lt 1024 ]]; then
+    echo "[FAIL download too-small=$size] dvids=$dvids_id url=$media_url" | tee -a "$LOG"
+    return 1
+  fi
+  echo "[OK] dvids=$dvids_id kind=$kind size=$((size/1024))KB → $(basename "$final_path")" | tee -a "$LOG"
+}
+# Generate worker commands from the inventory using python
+python3 - <<'PY' > /tmp/wargov-dvids-jobs.txt
+import json, re
+with open("/home/cbrd21/clawd/tmp/wargov-capture/probe-out/release-02-records.json") as f:
+    records = json.load(f)
+for r in records:
+    if not r["dvids_id"]:
+        continue
+    kind = "audio" if r["type"] == "AUD" else "video"
+    # Slugify title: strip quotes, collapse non-alnum to dashes, limit length
+    title = r["title"]
+    slug = re.sub(r'[^a-zA-Z0-9]+', '-', title).strip('-').lower()[:60]
+    # Use the DOW-UAP-PR id from the title if available (more durable)
+    m = re.match(r'([A-Z]+-UAP-(?:PR|D)[0-9]+[a-z]?)', title)
+    if m:
+        slug = m.group(1).lower() + "-" + slug[:30]
+    print(f"{r['dvids_id']}\t{slug}\t{kind}")
+PY
+JOB_COUNT=$(wc -l < /tmp/wargov-dvids-jobs.txt)
+echo "[plan] $JOB_COUNT DVIDS jobs queued" | tee -a "$LOG"
+export -f pull_one
+export OUT_DIR LOG
+# Run with xargs -P 4 (parallelism 4)
+cat /tmp/wargov-dvids-jobs.txt | while IFS=$'\t' read -r id slug kind; do
+  echo "$id $slug $kind"
+done | xargs -L 1 -P 4 -I {} bash -c 'set -- {}; pull_one "$1" "$2" "$3"'
+OK_COUNT=$(grep -c '^\[OK\]' "$LOG" || true)
+FAIL_COUNT=$(grep -cE '^\[FAIL' "$LOG" || true)
+SKIP_COUNT=$(grep -c '^\[SKIP' "$LOG" || true)
+echo "[done] OK=$OK_COUNT FAIL=$FAIL_COUNT SKIP=$SKIP_COUNT" | tee -a "$LOG"