@smilintux/skcapstone 0.6.2 → 0.6.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (70) hide show
  1. package/.github/workflows/publish.yml +1 -1
  2. package/CLAUDE.md +17 -0
  3. package/docs/CUSTOM_AGENT.md +40 -28
  4. package/docs/SOUL_SWAPPER.md +5 -5
  5. package/docs/hammertime-audit.md +402 -0
  6. package/openclaw-plugin/src/index.ts +2 -1
  7. package/package.json +1 -1
  8. package/pyproject.toml +2 -1
  9. package/scripts/install.sh +126 -1
  10. package/scripts/model-fallback-monitor.sh +4 -2
  11. package/scripts/refresh-anthropic-token.sh +9 -3
  12. package/scripts/release.sh +98 -0
  13. package/scripts/session-to-memory.py +1 -1
  14. package/scripts/sk-agent-picker.sh +237 -0
  15. package/scripts/telegram-catchup-all.sh +2 -1
  16. package/scripts/watch-anthropic-token.sh +12 -17
  17. package/src/skcapstone/__init__.py +34 -2
  18. package/src/skcapstone/cli/__init__.py +3 -1
  19. package/src/skcapstone/cli/_common.py +1 -0
  20. package/src/skcapstone/cli/context_cmd.py +16 -4
  21. package/src/skcapstone/cli/daemon.py +2 -1
  22. package/src/skcapstone/cli/joule_cmd.py +7 -3
  23. package/src/skcapstone/cli/memory.py +4 -2
  24. package/src/skcapstone/cli/register_cmd.py +19 -3
  25. package/src/skcapstone/cli/session.py +25 -0
  26. package/src/skcapstone/cli/setup.py +96 -30
  27. package/src/skcapstone/cli/soul.py +3 -3
  28. package/src/skcapstone/context_loader.py +9 -0
  29. package/src/skcapstone/coordination.py +9 -2
  30. package/src/skcapstone/daemon.py +22 -12
  31. package/src/skcapstone/defaults/claude/CLAUDE.md +67 -0
  32. package/src/skcapstone/defaults/claude/settings.json +74 -0
  33. package/src/skcapstone/defaults/lumina/config/skgraph.yaml +55 -10
  34. package/src/skcapstone/defaults/lumina/config/skmemory.yaml +79 -13
  35. package/src/skcapstone/defaults/lumina/config/skvector.yaml +60 -9
  36. package/src/skcapstone/defaults/unhinged.json +13 -0
  37. package/src/skcapstone/discovery.py +5 -5
  38. package/src/skcapstone/doctor.py +4 -2
  39. package/src/skcapstone/dreaming.py +3 -1
  40. package/src/skcapstone/fuse_mount.py +3 -1
  41. package/src/skcapstone/housekeeping.py +3 -3
  42. package/src/skcapstone/install_wizard.py +131 -0
  43. package/src/skcapstone/mcp_launcher.py +14 -1
  44. package/src/skcapstone/mcp_server.py +6 -21
  45. package/src/skcapstone/mcp_tools/notification_tools.py +3 -1
  46. package/src/skcapstone/memory_engine.py +10 -3
  47. package/src/skcapstone/migrate_multi_agent.py +7 -6
  48. package/src/skcapstone/notifications.py +6 -2
  49. package/src/skcapstone/onboard.py +19 -8
  50. package/src/skcapstone/operator_link.py +164 -0
  51. package/src/skcapstone/pillars/consciousness.py +2 -1
  52. package/src/skcapstone/pillars/identity.py +51 -7
  53. package/src/skcapstone/pillars/memory.py +9 -3
  54. package/src/skcapstone/runtime.py +13 -3
  55. package/src/skcapstone/service_health.py +23 -10
  56. package/src/skcapstone/session_briefing.py +108 -0
  57. package/src/skcapstone/trust_graph.py +40 -5
  58. package/src/skcapstone/unified_search.py +11 -2
  59. package/systemd/skcapstone.service +4 -6
  60. package/systemd/skcapstone@.service +7 -8
  61. package/systemd/skcomm-heartbeat.service +5 -2
  62. package/tests/conftest.py +21 -0
  63. package/tests/test_agent_home_scaffold.py +34 -0
  64. package/tests/test_backup.py +2 -1
  65. package/tests/test_mcp_server.py +78 -33
  66. package/tests/test_multi_agent.py +31 -29
  67. package/tests/test_operator_link.py +78 -0
  68. package/tests/test_runtime.py +21 -0
  69. package/tests/test_session_briefing.py +130 -0
  70. package/tests/test_trust_graph.py +18 -0
@@ -43,7 +43,7 @@ jobs:
43
43
  fi
44
44
  - run: pip install build twine
45
45
  - run: python -m build
46
- - run: twine upload dist/*
46
+ - run: twine upload --skip-existing dist/*
47
47
  env:
48
48
  TWINE_USERNAME: __token__
49
49
  TWINE_PASSWORD: ${{ secrets.PYPI_API_TOKEN }}
package/CLAUDE.md CHANGED
@@ -15,6 +15,23 @@ skcapstone coord briefing
15
15
  This prints the complete protocol, JSON schemas, rules, and a live snapshot
16
16
  of current tasks and agent assignments. It works in any terminal.
17
17
 
18
+ ## Agent Switching
19
+
20
+ `SKAGENT` is the primary env var for selecting the active agent across all SK*
21
+ packages (skcapstone, skmemory, skcomm, skchat). Legacy vars `SKCAPSTONE_AGENT`
22
+ and `SKMEMORY_AGENT` are still supported as fallbacks.
23
+
24
+ ```bash
25
+ skswitch lumina # Switch active agent for this shell session
26
+ skswitch opus # Sets SKAGENT + SKCAPSTONE_AGENT + SKMEMORY_AGENT
27
+ skswitch # Interactive picker (if multiple agents)
28
+ SKAGENT=jarvis claude # One-shot override for a single command
29
+ ```
30
+
31
+ `skswitch` is installed automatically by `scripts/install.sh` via the agent
32
+ picker (`sk-agent-picker.sh`). It validates the agent directory exists and
33
+ updates all three env vars in one shot.
34
+
18
35
  ## Quick Reference
19
36
 
20
37
  ```bash
@@ -14,7 +14,7 @@ cp -r src/skcapstone/defaults/lumina ~/.skcapstone/agents/myagent
14
14
  $EDITOR ~/.skcapstone/agents/myagent/soul/base.json
15
15
 
16
16
  # 3. Activate your agent
17
- export SKCAPSTONE_AGENT=myagent
17
+ skswitch myagent
18
18
  skcapstone soul status --agent myagent
19
19
  ```
20
20
 
@@ -167,22 +167,32 @@ Once you've created your agent, you need to configure your AI client tools
167
167
  (Claude Code, Claude Desktop, Cursor, OpenClaw, etc.) so they connect MCP
168
168
  servers to the correct agent profile.
169
169
 
170
- ### The Key: `SKCAPSTONE_AGENT` Environment Variable
170
+ ### The Key: `SKAGENT` Environment Variable
171
171
 
172
- All SK\* MCP servers read `SKCAPSTONE_AGENT` from their environment to
173
- determine which agent profile to load. If unset, they default to `lumina`.
172
+ All SK\* MCP servers read `SKAGENT` from their environment to determine
173
+ which agent profile to load. Legacy vars `SKCAPSTONE_AGENT` and
174
+ `SKMEMORY_AGENT` are supported as fallbacks.
174
175
 
175
176
  The priority chain (highest wins):
176
177
 
177
- 1. `SKMEMORY_AGENT` — skmemory-specific override (rarely needed)
178
- 2. `SKCAPSTONE_AGENT` — universal, used by all SK\* packages
179
- 3. Falls back to `"lumina"`
178
+ 1. `SKAGENT` — primary, used by all SK\* packages
179
+ 2. `SKCAPSTONE_AGENT` — legacy fallback
180
+ 3. `SKMEMORY_AGENT` skmemory-specific legacy override
181
+ 4. First non-template agent in `~/.skcapstone/agents/`
182
+
183
+ Use `skswitch` to change the active agent for the current shell (updates
184
+ all three vars in one shot):
185
+
186
+ ```bash
187
+ skswitch lumina # named switch
188
+ skswitch # interactive picker
189
+ ```
180
190
 
181
191
  ### Claude Code (`~/.claude/mcp.json`)
182
192
 
183
193
  **Do NOT hardcode the agent name in the MCP config.** MCP servers inherit
184
194
  environment variables from the parent process, so if you launch Claude Code
185
- with `SKCAPSTONE_AGENT` set, all servers pick it up automatically.
195
+ with `SKAGENT` set, all servers pick it up automatically.
186
196
 
187
197
  ```json
188
198
  {
@@ -207,7 +217,7 @@ with `SKCAPSTONE_AGENT` set, all servers pick it up automatically.
207
217
  }
208
218
  ```
209
219
 
210
- Notice: **no `env` blocks with `SKCAPSTONE_AGENT`**. This is intentional.
220
+ Notice: **no `env` blocks with `SKAGENT`**. This is intentional.
211
221
  The servers inherit the variable from the shell.
212
222
 
213
223
  Then launch as any agent:
@@ -217,10 +227,12 @@ Then launch as any agent:
217
227
  claude
218
228
 
219
229
  # As Jarvis
220
- SKCAPSTONE_AGENT=jarvis claude
230
+ skswitch jarvis && claude
231
+ # or one-shot:
232
+ SKAGENT=jarvis claude
221
233
 
222
234
  # As a custom agent
223
- SKCAPSTONE_AGENT=nova claude
235
+ SKAGENT=nova claude
224
236
  ```
225
237
 
226
238
  **Anti-pattern — do NOT do this:**
@@ -242,7 +254,7 @@ regardless of what you pass on the command line.
242
254
 
243
255
  ### Claude Desktop (`claude_desktop_config.json`)
244
256
 
245
- Same principle — omit `SKCAPSTONE_AGENT` from the `env` block if you want
257
+ Same principle — omit `SKAGENT` from the `env` block if you want
246
258
  it inherited from the parent process. If Claude Desktop doesn't propagate
247
259
  env vars from the shell, you can set it explicitly per config:
248
260
 
@@ -253,7 +265,7 @@ env vars from the shell, you can set it explicitly per config:
253
265
  "command": "skcapstone-mcp",
254
266
  "args": [],
255
267
  "env": {
256
- "SKCAPSTONE_AGENT": "jarvis"
268
+ "SKAGENT": "jarvis"
257
269
  }
258
270
  }
259
271
  }
@@ -282,30 +294,29 @@ Works the same as Claude Code. Place the config at project root or
282
294
 
283
295
  ### OpenClaw (`~/.openclaw/openclaw.json`)
284
296
 
285
- OpenClaw plugins read `SKCAPSTONE_AGENT` from the environment at startup.
297
+ OpenClaw plugins read `SKAGENT` from the environment at startup.
286
298
  Set it before launching:
287
299
 
288
300
  ```bash
289
- SKCAPSTONE_AGENT=nova openclaw
301
+ SKAGENT=nova openclaw
290
302
  ```
291
303
 
292
- Or set it in your shell profile for a persistent default:
304
+ Or use `skswitch` for a persistent default in the current shell:
293
305
 
294
306
  ```bash
295
- # ~/.bashrc or ~/.zshrc
296
- export SKCAPSTONE_AGENT=lumina
307
+ skswitch lumina
308
+ openclaw
297
309
  ```
298
310
 
299
- ### Shell Aliases (Convenience)
311
+ ### Quick Agent Switching with `skswitch`
300
312
 
301
- Add these to `~/.bashrc` or `~/.zshrc` for quick agent switching:
313
+ `skswitch` is installed automatically with skcapstone. It updates `SKAGENT`,
314
+ `SKCAPSTONE_AGENT`, and `SKMEMORY_AGENT` in one shot:
302
315
 
303
316
  ```bash
304
- # Launch Claude Code as different agents
305
- alias claude-lumina='SKCAPSTONE_AGENT=lumina claude'
306
- alias claude-jarvis='SKCAPSTONE_AGENT=jarvis claude'
307
- alias claude-opus='SKCAPSTONE_AGENT=opus claude'
308
- alias claude-nova='SKCAPSTONE_AGENT=nova claude'
317
+ skswitch lumina # Named switch
318
+ skswitch # Interactive picker (if multiple agents)
319
+ SKAGENT=jarvis claude # One-shot override for a single command
309
320
  ```
310
321
 
311
322
  ### systemd Services
@@ -313,7 +324,7 @@ alias claude-nova='SKCAPSTONE_AGENT=nova claude'
313
324
  For background daemons, set the agent via the templated service unit:
314
325
 
315
326
  ```bash
316
- # Uses SKCAPSTONE_AGENT=%i from the unit template
327
+ # Uses SKAGENT=%i + SKCAPSTONE_AGENT=%i from the unit template
317
328
  systemctl --user start skcapstone@jarvis
318
329
  systemctl --user start skcapstone@nova
319
330
  ```
@@ -322,6 +333,7 @@ Or set it in a non-templated service:
322
333
 
323
334
  ```ini
324
335
  [Service]
336
+ Environment=SKAGENT=jarvis
325
337
  Environment=SKCAPSTONE_AGENT=jarvis
326
338
  ```
327
339
 
@@ -331,7 +343,7 @@ After launching, confirm which agent is active:
331
343
 
332
344
  ```bash
333
345
  # In the terminal
334
- echo $SKCAPSTONE_AGENT
346
+ echo $SKAGENT
335
347
 
336
348
  # Via the CLI
337
349
  skcapstone status
@@ -340,7 +352,7 @@ skcapstone status
340
352
  skmemory ritual --dry-run
341
353
  ```
342
354
 
343
- In Claude Code, ask the agent to run `echo $SKCAPSTONE_AGENT` to confirm
355
+ In Claude Code, ask the agent to run `echo $SKAGENT` to confirm
344
356
  the MCP servers loaded the correct profile.
345
357
 
346
358
  ---
@@ -126,7 +126,7 @@ skcapstone soul install-all ~/clawd/soul-blueprints/blueprints/
126
126
 
127
127
  ## 4. CLI Reference
128
128
 
129
- All soul commands live under the `skcapstone soul` group. Every command accepts a `--agent` / `-a` flag to target a specific agent profile (defaults to `SKCAPSTONE_AGENT` env var or `lumina`).
129
+ All soul commands live under the `skcapstone soul` group. Every command accepts a `--agent` / `-a` flag to target a specific agent profile (defaults to `SKAGENT` env var, with fallback to `SKCAPSTONE_AGENT`).
130
130
 
131
131
  ### `soul list`
132
132
 
@@ -488,7 +488,7 @@ Every soul command supports the `--agent` / `-a` flag to target a specific agent
488
488
 
489
489
  ### How it works
490
490
 
491
- When `--agent casey` is passed (or `SKCAPSTONE_AGENT=casey` is set), all soul data is stored under:
491
+ When `--agent casey` is passed (or `SKAGENT=casey` / `skswitch casey` is used), all soul data is stored under:
492
492
 
493
493
  ```
494
494
  ~/.skcapstone/agents/casey/soul/
@@ -520,10 +520,10 @@ skcapstone soul status --agent nova # -> base
520
520
 
521
521
  ### Environment variable
522
522
 
523
- Instead of passing `--agent` every time, set the environment variable:
523
+ Instead of passing `--agent` every time, use `skswitch`:
524
524
 
525
525
  ```bash
526
- export SKCAPSTONE_AGENT=casey
526
+ skswitch casey
527
527
  skcapstone soul swap the-attorney # targets casey automatically
528
528
  ```
529
529
 
@@ -775,7 +775,7 @@ Registers all `skcapstone soul *` commands via Click. Key implementation details
775
775
 
776
776
  - `_find_blueprint_in_repo(slug)` -- Searches `~/clawd/soul-blueprints/blueprints/*/` for a matching file, trying hyphenated, underscored, and uppercased variants
777
777
  - `soul swap` -- The most complex command; searches installed, then repo, auto-installs if needed, records audit events
778
- - All commands use `SoulManager` with the agent name from `--agent` / `SKCAPSTONE_AGENT`
778
+ - All commands use `SoulManager` with the agent name from `--agent` / `SKAGENT`
779
779
 
780
780
  ### `mcp_tools/soul_tools.py` -- MCP Handlers
781
781
 
@@ -0,0 +1,402 @@
1
+ # hammerTime Audit — Backport Analysis
2
+
3
+ **Date:** 2026-04-09
4
+ **Auditor:** Opus (Claude Code subagent)
5
+ **Source repo:** https://skgit.skstack01.douno.it/smilinTux/hammerTime
6
+ **Target repos:** skmemory, skcapstone
7
+
8
+ ---
9
+
10
+ ## File Tree Summary
11
+
12
+ Top-level structure (code-relevant):
13
+
14
+ ```
15
+ scripts/ # All Python pipeline scripts (~55 files)
16
+ context_bridge_lib.py # 2,800+ line unified retrieval library (THE core)
17
+ context-bridge.py # thin wrapper → main()
18
+ issue-pack.py # thin wrapper → main(mode_override="issue-pack")
19
+ decompose.py # L3 decomposition engine
20
+ pipeline.py # 5-layer orchestrator
21
+ import-qdrant-v2.py # L4 vector embed + Qdrant upsert
22
+ import-falkordb-v2.py # L5 graph import
23
+ corpus_release.py # corpus release/alias/promotion model
24
+ distributed-worker.py # multi-GPU SSH coordinator
25
+ rebuild-stores.py # full/incremental corpus rebuild
26
+ research-synthesis.py # synthesis + filing-ready packet builder
27
+ corpus-guardian.py # health validation daemon
28
+ manage-decomposed.py # decomposed artifact state manager
29
+ case_facts.py # case-fact loader (incident/problem/profile)
30
+ ...47 other scripts
31
+ .cursor/skills/ # 37+ skill definitions (trigger-mapped)
32
+ json/decomposed/ # L3 output: slug.json per artifact
33
+ json/state/ # corpus release state machine files
34
+ json/releases/ # release manifests (dev/uat/prod)
35
+ json/schemas/ # JSON schemas
36
+ incidents/ # Case workspace (problem → incident → artifacts)
37
+ knowledge/ # Primary corpus (markdown)
38
+ templates/ # Filing templates
39
+ profiles/ # Person/company YAML profiles
40
+ models/bge-legal-v1/ # Sovereign embedding model (local)
41
+ ```
42
+
43
+ Key infrastructure:
44
+ - **Qdrant** at `skvector.nativeassetmanagement.com` (collection: `hammertime-v3`, 1024-dim cosine, `bge-legal-v1`)
45
+ - **FalkorDB** at `skgraph.nativeassetmanagement.com:6381` (graph: `hammertime-v2`)
46
+ - **7-node GPU cluster** (chiap01–chiap08 + chiwk12) running Ollama with bge-legal-v1
47
+ - **Embedding model**: `chefboyrave21/bge-legal-v1` (1024-dim, sovereign HuggingFace model)
48
+
49
+ ---
50
+
51
+ ## Key Patterns Found
52
+
53
+ ### L3 Decomposition
54
+
55
+ **Script:** `scripts/decompose.py` (standalone) + `skmemory.decompose.decompose_content` (shared library)
56
+
57
+ hammerTime's decomposition is domain-specialized for legal documents but structurally similar to skmemory's `decompose_content`. Key differences:
58
+
59
+ **hammerTime extras skmemory lacks:**
60
+ 1. **6 citation regex types**: UCC sections, UCC forms (UCC-1/3), CFR, USC, case citations (Smith v. Jones, 123 F.2d 456), Public Law, IRS forms — skmemory has a simpler generic citation extractor
61
+ 2. **Trust type extraction**: 9 named trust forms (Express, Constructive, Resulting, Statutory, etc.)
62
+ 3. **Maritime/Admiralty extraction**: dedicated regex for maritime lien patterns
63
+ 4. **Legal principle extraction**: 25 named principles (Holder in Due Course, Quantum Meruit, etc.)
64
+ 5. **Agency/court extraction**: 20+ named agencies (IRS, Fed Reserve, CFPB, OCC, etc.)
65
+ 6. **Claim confidence scoring**: chunks marked `high/medium/low` based on claim indicator phrases
66
+ 7. **Section-title tracking per chunk**: exact heading ancestry embedded in each chunk
67
+ 8. **CHUNK_TARGET = 900 chars / 450 tokens** (calibrated for bge-legal-v1's 512-token hard limit)
68
+ 9. **Relationship extraction**: 6 rel types: CITES, CONTRADICTS, SUPERSEDES, REQUIRES, DEFINES, ESTABLISHES
69
+ 10. **`secondary` / `form` document-type classification** via title term matching
70
+
71
+ **Output schema** (`json/decomposed/{slug}.json`):
72
+ ```json
73
+ {
74
+ "source_file": "knowledge/irs/example.md",
75
+ "decomposed_at": "2026-04-05T14:21:09Z",
76
+ "frontmatter": {},
77
+ "stats": { "chunks": 2, "claims": 12, "citations": 4, "entities": 11, "relationships": 54 },
78
+ "chunks": [{ "chunk_id": "...", "parent_doc": "...", "chunk_index": 0, "total_chunks": 2,
79
+ "section_title": "...", "text": "..." }],
80
+ "claims": [{ "claim_id": "...", "text": "...", "line": 15, "category": "irs", "confidence": "high" }],
81
+ "citations": [{ "citation_id": "...", "raw_text": "UCC 3-301", "parsed_type": "ucc",
82
+ "section": "3-301", "source_file": "...", "line": 22 }],
83
+ "entities": [{ "entity_id": "...", "name": "IRS", "type": "Agency", "context": "..." }],
84
+ "relationships": [{ "relationship_id": "...", "source_entity": "...",
85
+ "relationship_type": "DEFINES", "target_entity": "...", "evidence_text": "..." }]
86
+ }
87
+ ```
88
+
89
+ **Comparison to skmemory:** skmemory's `DecompositionResult` has chunks/citations/entities/claims but lacks: typed citation parsing, relationship extraction, confidence scoring, and entity-type taxonomy.
90
+
91
+ ---
92
+
93
+ ### Context Bridge (context_bridge_lib.py)
94
+
95
+ This is the most important file for backporting. It is a ~2,800-line retrieval fusion library that merges skmemory + hammertime corpus into a single ranked result set.
96
+
97
+ **Architecture of `build_context()`:**
98
+ 1. **Pivot extraction** — calls `skmemory.decompose.decompose_content(task)` to extract entities, citations, claims from the user's query
99
+ 2. **Memory loading** — `_load_memory_context()` runs: `store.load_context()`, `store.search()`, `store.novelty_search()`, `store.build_session_brief()`, and memory graph pivots (`store.graph.search_by_entity()`, `store.graph.search_by_citation()`, `store.graph.related_claims_by_entity()`)
100
+ 3. **Corpus search** — `_search_corpus()` runs query embedding → Qdrant → result grouping by parent doc
101
+ 4. **Jurisdiction overlay** — `_jurisdiction_overlay_hits()` does keyword-based scoring against a local pre-built index of all decomposed JSON (no live Qdrant needed)
102
+ 5. **Suggestions** — `_derive_connections()` counts entity/citation/claim co-occurrence across corpus hits to surface emergent pivots
103
+ 6. **Ranking** — `_build_ranked_candidates()` computes hybrid score:
104
+ ```
105
+ hybrid_score = base_score
106
+ + authority_weight(tier) × 0.5
107
+ + state_boost (0–0.22)
108
+ + domain_boost (−0.18 to +0.28)
109
+ + quality_boost (−0.18 to +0.28)
110
+ + pivot_count × 0.04 (capped at 0.18)
111
+ − 0.24 if weak_authority_reason
112
+ ```
113
+ 7. **Contradiction detection** — `_detect_contradictions()` checks top-10 results for claim conflicts (negation term asymmetry + shared citations/entities) — emits `contradiction_type`, `severity`, `shared_citations`
114
+ 8. **Contradiction penalty** — weak-authority items involved in contradictions get −0.08 × count penalty
115
+ 9. **Dedup** — by `(source_type, origin_path)` key
116
+
117
+ **Three research modes:**
118
+ - `balanced` — default, filters generic secondary material unless state/pivot hits
119
+ - `primary-authority-first` — aggressively suppresses generic secondary if `<2 practical terms`
120
+ - `allow-secondary` — keeps everything (AmJur/VSOF style)
121
+
122
+ **Caching layers:**
123
+ 1. Query embedding cache (SHA256 key, JSON file, LRU 256 entries)
124
+ 2. Corpus result cache (SHA256 key including collection+URL+state, JSON file, configurable TTL, LRU 128 entries)
125
+ 3. Jurisdiction overlay index (snapshot-hash-based invalidation, JSON file)
126
+ 4. Session-level Qdrant client cache (dict keyed on URL+key+timeout)
127
+
128
+ ---
129
+
130
+ ### Issue Pack / Authority Ranking
131
+
132
+ `issue-pack.py` calls `main(mode_override="issue-pack")` which adds extra sections beyond `build_context()`:
133
+
134
+ 1. **`filing_ready` section** — infers filing type from task terms (claim_of_exemption, motion_to_vacate, objection_or_hearing_request, notice_or_affidavit), builds draft skeletons with:
135
+ - Section prompts per filing type
136
+ - Evidence checklist
137
+ - `draft_markdown` — ready-to-edit filing scaffold
138
+ - `timeline_checkpoints` — deadline-sensitive procedural steps
139
+ - `confidence` score per skeleton
140
+ 2. **`reference_bank`** — separate bucket for secondary-tier results, surfaced without displacing primary authorities
141
+ 3. **`fact_gaps`** — structured questions across 4 profiles: enforcement_instrument, timing_and_service, asset_and_funds_profile, attack_paths — cross-checked against ranked results
142
+ 4. **`procedural_timeline`** — inferred checkpoints (judgment posture, enforcement trigger, objection window, attack path) with high/medium urgency
143
+ 5. **Draft bundle writing** — full packet materialized to disk: `preferred-draft.md`, `EXHIBIT-INDEX.md`, `SUBMISSION-CHECKLIST.md`, `FILING-PLAN.md`, `SERVICE-PACKET.md`, `HEARING-PACKET.md`, `CALENDAR.md`, `PREFERRED-PATH.md`, `NEXT-ACTIONS.md`, `packet-progress.json`
144
+
145
+ **Key struct for skmemory backport consideration:** the `reference_bank` pattern — separating primary action authorities from secondary reference material. skmemory's `search()` currently returns a flat ranked list with no tier-aware split.
146
+
147
+ ---
148
+
149
+ ### Graph Edge Model (FalkorDB via import-falkordb-v2.py)
150
+
151
+ **Node labels (15):**
152
+ ```
153
+ Template, Process, CaseStrategy, Knowledge, Skill, Profile, Entity, Case,
154
+ TemplateChain, Phase, Step, Incident, Judge,
155
+ [Lumina additions:] Statute, Principle, Filing, Court, Agency
156
+ ```
157
+
158
+ **Relationship types (18):**
159
+ ```
160
+ [v1:] HAS_PHASE, HAS_STEP, USES_TEMPLATE, REFERENCES, RELATED_TO, INCLUDES, PRESIDED_BY, CHAIN_LINK, TAGGED
161
+ [Lumina additions:] CITES, CONTRADICTS, SUPERSEDES, REQUIRES, DEFINES, ESTABLISHES, EFFECTIVE_DATE, AMENDED_BY, REPEALED_BY
162
+ ```
163
+
164
+ **Entity type mapping** (from decomposed JSON → graph label):
165
+ ```python
166
+ ENTITY_TYPE_MAP = {
167
+ "statute": "Statute", "law": "Statute", "usc": "Statute", "cfr": "Statute",
168
+ "principle": "Principle", "filing": "Filing", "court": "Court", "agency": "Agency",
169
+ "process": "Process", "template": "Template", "knowledge": "Knowledge",
170
+ "entity": "Entity", "person": "Profile", "company": "Entity", "skill": "Skill",
171
+ }
172
+ ```
173
+
174
+ **Unique key per label** (for MERGE deduplication):
175
+ ```python
176
+ { "Statute": "name", "Principle": "name", "Filing": "filing_id", "Court": "name",
177
+ "Agency": "name", "Memory": "memory_id", ... }
178
+ ```
179
+
180
+ **Cross-reference pass:** after node import, scans skills/knowledge files for path references to build edges. Also scans all knowledge/*.md for USC/CFR citation patterns → auto-creates Statute nodes + CITES edges.
181
+
182
+ **skmemory comparison:** skmemory has `graph_queries.py` but currently only stores Memory nodes, not typed Statute/Principle/Court/Agency nodes. The CITES/CONTRADICTS/SUPERSEDES/DEFINES relationship vocabulary is entirely absent from skmemory's graph layer.
183
+
184
+ ---
185
+
186
+ ### Services/Workers
187
+
188
+ **`distributed-worker.py`** — Multi-GPU SSH coordinator:
189
+ - Reads `gpu-inventory.json` (7 nodes, VRAM weights: 16GB RTX 4080, 8GB RX 7600 ×2, 6GB RTX 3060, 8GB RTX 2080S, 12GB RTX 5070 Ti, 4GB Radeon 780M)
190
+ - Splits work in proportion to VRAM capacity
191
+ - SSHes into remote nodes, runs `worker-embed.py` per batch
192
+ - All nodes share NFS at `/mnt/cloud/onedrive/` — no file transfer needed
193
+ - Results upsert directly to Qdrant from each node
194
+ - Coordinator runs FalkorDB graph import centrally after embedding completes
195
+
196
+ **`corpus-guardian.py`** — Health validation daemon:
197
+ - `validate-env --target uat --deep` — validates release manifest, collection health, graph health, source drift
198
+ - `check-envs --targets dev,uat,prod --deep` — validates all env aliases in one pass
199
+ - Installed via `install-corpus-automation.sh` as systemd user timers
200
+
201
+ **`corpus_release.py`** — Release/alias state machine:
202
+ - Three-tier: `dev` (mutable), `uat` (frozen candidate), `prod` (live)
203
+ - `active_runtime()` → resolves current vector_collection + graph_name from runtime aliases
204
+ - `promote_release()` → updates alias to point a target (dev/uat/prod) at a specific release
205
+ - Processing state tracking: SHA256 content hashes, mtime, per-document last_release_id
206
+ - `diff_source_index()` → detects new/changed/deleted docs since last state snapshot
207
+
208
+ **`cron/hammertime-corpus.crontab.example`** — Suggested crontab for incremental corpus updates
209
+
210
+ ---
211
+
212
+ ### Skills (37+ defined)
213
+
214
+ All skills are `.md` files in `.cursor/skills/` — trigger phrases map to skill invocations. Key skills:
215
+
216
+ | Skill | Purpose |
217
+ |-------|---------|
218
+ | `sovereign-ingestion-pipeline.md` | Master SIP reference — all 5 layers, commands, schemas |
219
+ | `ingest-files.md` | L2 — convert raw docs to markdown + JSON artifacts |
220
+ | `ingest-guide.md` | Ingest a complete guide document |
221
+ | `ingest-telegram.md` | Import Telegram chat exports |
222
+ | `research-query.md` | Run context-bridge / issue-pack queries |
223
+ | `analyze-document.md` | Single-document analysis |
224
+ | `generate-document.md` | Legal document generation from templates |
225
+ | `manage-incidents.md` | ITIL-style incident lifecycle for legal cases |
226
+ | `manage-correspondence.md` | Track filings/letters/responses |
227
+ | `sync-knowledge.md` | Sync knowledge base across devices |
228
+ | `study-archive.md` | Archive and index study materials |
229
+ | `docx-to-md/` | DOCX → markdown conversion (with script) |
230
+ | `pdf-to-image/` | PDF → page images (with script) |
231
+ | `pptx-to-md/` | PPTX → markdown conversion (with script) |
232
+
233
+ **skcapstone relevance:** The skill system maps closely to skcapstone's own skills directory at `~/clawd/skills/`. The trigger-phrase-to-skill mapping and the SKILL.md metadata pattern are worth adopting for skill discoverability.
234
+
235
+ ---
236
+
237
+ ## Recommended Backports (Prioritized)
238
+
239
+ ### 1. HIGH: Jurisdiction/Context Overlay Index → skmemory
240
+
241
+ **What:** `_build_overlay_index()` and `_jurisdiction_overlay_hits()` in `context_bridge_lib.py`
242
+
243
+ **What it does:** Builds a local JSON index from all decomposed artifacts containing each artifact's claims, citations, entities, sections, and a pre-built `search_blob`. This enables sub-millisecond keyword/state-based retrieval WITHOUT a live vector query — pure JSON scan. Falls back to this when Qdrant is slow/offline, and merges results with live semantic search.
244
+
245
+ **Why it matters for skmemory:** skmemory has no equivalent offline search. All retrieval hits skmemory's store (SQLite or vector). An overlay index of memory decompositions would let agents get fast, deterministic hits on known high-value memories before the expensive embedding path.
246
+
247
+ **Implementation path:**
248
+ - Add `build_overlay_index()` to `skmemory/store.py` or a new `skmemory/overlay.py`
249
+ - Cache at `~/.skcapstone/agents/{agent}/memory/overlay-index.json`
250
+ - Invalidate when memory file count or newest mtime changes (current snapshot pattern)
251
+ - Expose via `skmemory search --overlay` or as a fast pre-filter in `MemoryStore.search()`
252
+
253
+ ---
254
+
255
+ ### 2. HIGH: Hybrid Scoring with Authority Weights → skmemory + context_bridge_lib port
256
+
257
+ **What:** `_build_ranked_candidates()` + `_quality_adjustment()` + `_detect_contradictions()` in `context_bridge_lib.py`
258
+
259
+ **What it does:** Computes a `hybrid_score` that merges semantic similarity with: authority tier weight, state-specificity boost, domain relevance boost, pivot alignment bonus, and weak-authority penalty. Detects contradictions between top results and applies penalties.
260
+
261
+ **skmemory current state:** `authority_weight()` and `infer_authority_tier()` exist in `skmemory/retrieval.py` but are only used for metadata preparation — they do NOT feed back into ranking scores in `MemoryStore.search()`.
262
+
263
+ **Why it matters:** skmemory's search returns results ranked purely by semantic similarity. hammerTime's hybrid scoring demonstrably promotes actionable primary-authority results and demotes speculative secondary material. This is directly applicable to non-legal memory contexts: skmemory memories already have authority_tier metadata — it just isn't used for ranking.
264
+
265
+ **Implementation path:**
266
+ - Add `hybrid_score()` function to `skmemory/retrieval.py`
267
+ - Accept: `base_score`, `authority_tier`, `pivot_matches` (entity/citation hits in query), `domain_terms`
268
+ - Apply in `MemoryStore.search()` as a post-processing re-rank step
269
+ - Add `_detect_contradictions()` equivalent for flagging conflicting memory results
270
+
271
+ ---
272
+
273
+ ### 3. HIGH: Corpus Release / Processing State Machine → skcapstone
274
+
275
+ **What:** `corpus_release.py` — the full dev/uat/prod release lifecycle for vector+graph stores
276
+
277
+ **What it does:** Tracks per-document SHA256 hashes and mtimes, diffs against previous state, manages runtime aliases (which Qdrant collection + FalkorDB graph are currently "live" per environment), writes release manifests, validates health, and allows promoting releases between tiers without rebuilding.
278
+
279
+ **Why it matters for skcapstone:** skmemory has no concept of corpus release state. Every rebuild wipes and recreates. When `hammertime-v3` grows to thousands of points, incremental state tracking becomes critical. skcapstone also manages multi-agent deployments where different agents may need different corpus versions (dev/uat/prod).
280
+
281
+ **Implementation path:**
282
+ - Port `corpus_release.py` as `skcapstone/src/skcapstone/corpus_release.py`
283
+ - Integrate with `skmemory` so each agent's Qdrant collection has an aliased runtime name
284
+ - Add `skcapstone corpus release` and `skcapstone corpus promote` CLI commands
285
+ - Store release state at `~/.skcapstone/corpus/{agent}/state/`
286
+
287
+ ---
288
+
289
+ ### 4. MEDIUM: Typed Citation Extraction → skmemory/decompose.py
290
+
291
+ **What:** The 9 citation regex types in `decompose.py` (UCC, CFR, USC, case citations, Public Law, IRS forms, trust types, maritime, legal principles)
292
+
293
+ **Why it matters:** skmemory's `_extract_citations()` uses simpler patterns. If SK agents are going to use hammertime-v3 in recall_collections, the same citation normalization should be shared so citations extracted during memory storage match citations extracted during corpus query pivot extraction.
294
+
295
+ **Implementation path:**
296
+ - Extract citation regexes into `skmemory/citation_patterns.py`
297
+ - Update `skmemory/decompose.py` `_extract_citations()` to use shared patterns
298
+ - hammerTime already calls `skmemory.decompose.decompose_content()` for pivot extraction — the shared library already exists, it just needs richer patterns
299
+
300
+ ---
301
+
302
+ ### 5. MEDIUM: Query Expansion + Stale Cache Fallback → skmemory
303
+
304
+ **What:** `_expand_query()` (domain-aware query expansion) + stale cache fallback in `_search_corpus()`
305
+
306
+ **What it does:** When a query contains enforcement/exemption terms, appends related terms ("writ of execution", "judgment debtor", etc.) to the embedding query. When Qdrant fails mid-query, falls back to last cached result for that exact query (keyed by SHA256 of query+collection+state).
307
+
308
+ **Why it matters:** skmemory has no query expansion and no graceful degradation when the vector backend is unavailable. Both patterns would improve skmemory's recall and reliability.
309
+
310
+ ---
311
+
312
+ ### 6. MEDIUM: Graph Relationship Vocabulary → skmemory/graph_queries.py
313
+
314
+ **What:** CITES, CONTRADICTS, SUPERSEDES, REQUIRES, DEFINES, ESTABLISHES, EFFECTIVE_DATE, AMENDED_BY, REPEALED_BY relationships in FalkorDB
315
+
316
+ **Why it matters:** skmemory's graph layer currently uses RELATED_TO as the primary edge type. Adding typed edges would enable structured queries like "which memories CONTRADICT this one" or "which memories SUPERSEDE that prior belief" — directly useful for emotional continuity (FEBs that supersede old beliefs) and knowledge evolution tracking.
317
+
318
+ **Implementation path:**
319
+ - Add typed relationship support to `skmemory/graph_queries.py`
320
+ - Expose `store.graph.search_related_claims_by_type(entity, rel_type)`
321
+ - Use relationship type when saving FEB memories that explicitly contradict or update prior beliefs
322
+
323
+ ---
324
+
325
+ ### 7. MEDIUM: Draft Bundle / Packet Pattern → skcapstone coordination
326
+
327
+ **What:** The filing-ready draft bundle: preferred-draft, exhibit index, submission checklist, filing plan, service/hearing packet, calendar, preferred-path, next-actions, packet-progress.json
328
+
329
+ **Why it matters:** This is structurally equivalent to skcapstone's coordination task/project pattern. The hammerTime "packet" is a self-contained action workspace that survives across sessions. skcapstone's `~/.skcapstone/coordination/tasks/` does something similar but less structured. The packet-progress.json with status fields (preferred_draft_status, service_status, hearing_status, filing_status) maps directly to task state management.
330
+
331
+ ---
332
+
333
+ ### 8. LOW: Distributed Worker Pattern → skcapstone swarm
334
+
335
+ **What:** `distributed-worker.py` — VRAM-weighted work distribution across SSH nodes
336
+
337
+ **Why it matters:** When skmemory or hammerTime corpus needs to be re-embedded across a large document set, the 7-GPU cluster pattern (VRAM-proportional batching, SSH dispatch, NFS shared storage) could be reused. The `gpu-inventory.json` file already exists as shared infrastructure.
338
+
339
+ **Implementation path:** Low priority because skmemory embeddings are per-memory-file (small), not bulk corpus runs. Relevant only if skmemory gains a sovereign embedding model.
340
+
341
+ ---
342
+
343
+ ### 9. LOW: Corpus Guardian / Health Daemon → skcapstone monitoring
344
+
345
+ **What:** `corpus-guardian.py` validates collection health, graph health, source drift, and alias correctness
346
+
347
+ **Why it matters:** skcapstone has no health monitoring for Qdrant or FalkorDB. If these services are used by multiple agents, a guardian daemon would catch drift (source changed but corpus not rebuilt) and surface it proactively.
348
+
349
+ ---
350
+
351
+ ## recall_collections Recommendation
352
+
353
+ `hammertime-v3` (Qdrant at `skvector.nativeassetmanagement.com`, 1024-dim, bge-legal-v1) should be added to `recall_collections` for:
354
+
355
+ | Agent | Justification |
356
+ |-------|---------------|
357
+ | **lumina** | Primary orchestrator — needs legal corpus access for case-related dispatches |
358
+ | **architect** | Handles system design that may intersect legal/compliance domains |
359
+ | **scholar** | Research-focused agent — direct benefit from legal corpus retrieval |
360
+ | **coder** | Lower priority but useful for regulatory/compliance code generation |
361
+
362
+ **Configuration note:** The bge-legal-v1 model is 1024-dim while the default skmemory collection uses a different embedding model. Recall from `hammertime-v3` requires either:
363
+ 1. Using the same bge-legal-v1 model for query embedding (requires the local model at `models/bge-legal-v1/` or via Ollama), OR
364
+ 2. Adding a separate recall path in `context_bridge_lib.py` that hammerTime already implements
365
+
366
+ The cleanest path: add `hammertime-v3` as a read-only recall collection that only `context-bridge.py` / `issue-pack.py` queries, surfacing results back into skmemory's context system through the bridge interface that already exists in `context_bridge_lib.py`.
367
+
368
+ **Do NOT** route skmemory's standard search to hammertime-v3 directly — the embedding dimensions don't match skmemory's default model.
369
+
370
+ ---
371
+
372
+ ## Dependencies hammerTime Uses That skmemory/skcapstone Should Adopt
373
+
374
+ | Library | hammerTime Use | skcapstone/skmemory Status | Recommendation |
375
+ |---------|---------------|--------------------------|----------------|
376
+ | `sentence-transformers` | L4 embedding (bge-legal-v1 via SentenceTransformer) | Used in skmemory | Already adopted |
377
+ | `qdrant-client` | Vector store (hammertime-v3) | Used in skmemory | Already adopted |
378
+ | `redis` (FalkorDB) | Graph DB via GRAPH.QUERY commands | Not in skmemory | Add for graph layer if FalkorDB adopted |
379
+ | `falkordb` | Newer FalkorDB Python client | Not in skmemory | Optional — redis path works |
380
+ | `concurrent.futures` | ThreadPoolExecutor for Qdrant query timeout | Not systematically used | Add for retrieval deadline enforcement |
381
+ | `yaml` | YAML frontmatter in profiles | Already in skcapstone | Already adopted |
382
+
383
+ **No new mandatory dependencies** are required for the highest-priority backports (overlay index, hybrid scoring). They use only stdlib + existing skmemory internals.
384
+
385
+ ---
386
+
387
+ ## Architecture Note: What hammerTime Does Differently From skmemory
388
+
389
+ | Concern | skmemory | hammerTime |
390
+ |---------|----------|------------|
391
+ | Storage unit | `Memory` object (agent-personal) | Document chunk (corpus-shared) |
392
+ | Embedding dimensions | Variable (default model) | 1024 (bge-legal-v1 sovereign) |
393
+ | Graph node | Generic `Memory` node | 15 typed nodes (Statute, Court, Agency, etc.) |
394
+ | Graph relationships | RELATED_TO primarily | 18 typed rels including CITES, CONTRADICTS, SUPERSEDES |
395
+ | Retrieval | Semantic similarity only | Hybrid: semantic + overlay + authority weight + state boost |
396
+ | Authority ranking | Metadata only (not used in ranking) | Fully integrated into hybrid_score |
397
+ | Contradiction detection | None | Top-10 cross-check + penalty |
398
+ | Release lifecycle | None (rebuild = wipe) | dev/uat/prod alias model with SHA256 drift tracking |
399
+ | Query caching | None | Two-level: embedding LRU + corpus result TTL + stale fallback |
400
+ | Offline mode | None | Jurisdiction overlay (pure JSON, no live vector needed) |
401
+
402
+ The two systems are **complementary, not redundant**. hammerTime is the document corpus for legal knowledge; skmemory is the agent's personal experiential memory. The `context_bridge_lib.py` is the correct integration point — it already merges both. The backport work is about lifting hammerTime's superior retrieval patterns (hybrid scoring, caching, overlay index) into skmemory so the memory side is equally capable when the bridge merges results.
@@ -14,7 +14,7 @@ import { emptyPluginConfigSchema } from "openclaw/plugin-sdk";
14
14
 
15
15
  const SKCAPSTONE_BIN = process.env.SKCAPSTONE_BIN || "skcapstone";
16
16
  const SKMEMORY_BIN = process.env.SKMEMORY_BIN || "skmemory";
17
- const SKCAPSTONE_AGENT = process.env.SKCAPSTONE_AGENT || "lumina";
17
+ const SKCAPSTONE_AGENT = process.env.SKAGENT || process.env.SKCAPSTONE_AGENT || "lumina";
18
18
  const EXEC_TIMEOUT = 60_000;
19
19
  const IS_WIN = process.platform === "win32";
20
20
 
@@ -36,6 +36,7 @@ function runCli(bin: string, args: string, agentOverride?: string): { ok: boolea
36
36
  timeout: EXEC_TIMEOUT,
37
37
  env: {
38
38
  ...process.env,
39
+ SKAGENT: agent,
39
40
  SKCAPSTONE_AGENT: agent,
40
41
  PATH: `${skenvPath()}${sep}${process.env.PATH}`,
41
42
  },