npm - @mizyoel/mercury-mesh - Versions diffs - 0.9.4 → 1.0.0 - Mend

@mizyoel/mercury-mesh 0.9.4 → 1.0.0

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (129)

package/.copilot/mcp-config.json +3 -6
package/.copilot/skills/agent-collaboration/SKILL.md +42 -42
package/.copilot/skills/agent-conduct/SKILL.md +24 -24
package/.copilot/skills/architectural-proposals/SKILL.md +151 -151
package/.copilot/skills/ci-validation-gates/SKILL.md +85 -84
package/.copilot/skills/cli-wiring/SKILL.md +47 -47
package/.copilot/skills/client-compatibility/SKILL.md +89 -89
package/.copilot/skills/cross-mesh/SKILL.md +114 -114
package/.copilot/skills/distributed-mesh/SKILL.md +287 -287
package/.copilot/skills/distributed-mesh/mesh.json.example +30 -30
package/.copilot/skills/distributed-mesh/sync-mesh.ps1 +111 -111
package/.copilot/skills/distributed-mesh/sync-mesh.sh +104 -104
package/.copilot/skills/docs-standards/SKILL.md +71 -71
package/.copilot/skills/economy-mode/SKILL.md +101 -101
package/.copilot/skills/external-comms/SKILL.md +331 -331
package/.copilot/skills/gh-auth-isolation/SKILL.md +183 -183
package/.copilot/skills/git-workflow/SKILL.md +206 -206
package/.copilot/skills/github-multi-account/SKILL.md +95 -95
package/.copilot/skills/history-hygiene/SKILL.md +36 -36
package/.copilot/skills/humanizer/SKILL.md +107 -107
package/.copilot/skills/init-mode/SKILL.md +101 -101
package/.copilot/skills/mesh-conventions/SKILL.md +69 -69
package/.copilot/skills/model-selection/SKILL.md +139 -139
package/.copilot/skills/nap/SKILL.md +24 -24
package/.copilot/skills/personal-mesh/SKILL.md +57 -57
package/.copilot/skills/project-conventions/SKILL.md +56 -56
package/.copilot/skills/release-process/SKILL.md +432 -435
package/.copilot/skills/reskill/SKILL.md +92 -92
package/.copilot/skills/reviewer-protocol/SKILL.md +79 -79
package/.copilot/skills/secret-handling/SKILL.md +200 -200
package/.copilot/skills/session-recovery/SKILL.md +155 -155
package/.copilot/skills/test-discipline/SKILL.md +37 -37
package/.copilot/skills/windows-compatibility/SKILL.md +74 -74
package/.github/agents/mercury-mesh.agent.md +1732 -1732
package/.mesh/manifesto.md +66 -66
package/.mesh/templates/casting/Futurama.json +9 -9
package/.mesh/templates/casting-history.json +4 -4
package/.mesh/templates/casting-policy.json +37 -37
package/.mesh/templates/casting-reference.md +104 -104
package/.mesh/templates/casting-registry.json +3 -3
package/.mesh/templates/ceremonies.md +41 -41
package/.mesh/templates/charter.md +56 -56
package/.mesh/templates/constraint-tracking.md +38 -38
package/.mesh/templates/cooperative-rate-limiting.md +229 -229
package/.mesh/templates/copilot-instructions.md +50 -50
package/.mesh/templates/department-backlog.md +15 -15
package/.mesh/templates/department-charter.md +27 -27
package/.mesh/templates/department-state.json +19 -19
package/.mesh/templates/history.md +10 -10
package/.mesh/templates/identity/now.md +9 -9
package/.mesh/templates/identity/wisdom.md +15 -15
package/.mesh/templates/interface-contract.md +26 -26
package/.mesh/templates/issue-lifecycle.md +421 -421
package/.mesh/templates/keda-scaler.md +166 -166
package/.mesh/templates/local.json +5 -0
package/.mesh/templates/machine-capabilities.md +76 -76
package/.mesh/templates/mcp-config.md +87 -90
package/.mesh/templates/mercury-mesh.agent.md +1732 -1732
package/.mesh/templates/multi-agent-format.md +28 -28
package/.mesh/templates/orchestration-log.md +27 -27
package/.mesh/templates/org-autonomy-spec.md +152 -152
package/.mesh/templates/org-backlog-from-triage.js +199 -199
package/.mesh/templates/org-runtime-reconcile.js +364 -364
package/.mesh/templates/org-seed-runtime.js +237 -237
package/.mesh/templates/org-status.js +193 -193
package/.mesh/templates/org-structure.json +38 -38
package/.mesh/templates/package.json +3 -3
package/.mesh/templates/plugin-marketplace.md +49 -49
package/.mesh/templates/ralph-circuit-breaker.md +313 -313
package/.mesh/templates/ralph-triage.js +849 -844
package/.mesh/templates/raw-agent-output.md +37 -37
package/.mesh/templates/roster.md +60 -60
package/.mesh/templates/routing.md +78 -78
package/.mesh/templates/run-output.md +50 -50
package/.mesh/templates/schedule.json +64 -64
package/.mesh/templates/scribe-charter.md +119 -119
package/.mesh/templates/skill.md +24 -24
package/.mesh/templates/skills/agent-collaboration/SKILL.md +42 -42
package/.mesh/templates/skills/agent-conduct/SKILL.md +24 -24
package/.mesh/templates/skills/architectural-proposals/SKILL.md +151 -151
package/.mesh/templates/skills/ci-validation-gates/SKILL.md +85 -84
package/.mesh/templates/skills/cli-wiring/SKILL.md +47 -47
package/.mesh/templates/skills/client-compatibility/SKILL.md +89 -89
package/.mesh/templates/skills/cross-mesh/SKILL.md +114 -114
package/.mesh/templates/skills/distributed-mesh/SKILL.md +287 -287
package/.mesh/templates/skills/distributed-mesh/mesh.json.example +30 -30
package/.mesh/templates/skills/distributed-mesh/sync-mesh.ps1 +111 -111
package/.mesh/templates/skills/distributed-mesh/sync-mesh.sh +104 -104
package/.mesh/templates/skills/docs-standards/SKILL.md +71 -71
package/.mesh/templates/skills/economy-mode/SKILL.md +101 -101
package/.mesh/templates/skills/external-comms/SKILL.md +331 -331
package/.mesh/templates/skills/gh-auth-isolation/SKILL.md +183 -183
package/.mesh/templates/skills/git-workflow/SKILL.md +204 -204
package/.mesh/templates/skills/github-multi-account/SKILL.md +95 -95
package/.mesh/templates/skills/history-hygiene/SKILL.md +36 -36
package/.mesh/templates/skills/humanizer/SKILL.md +107 -107
package/.mesh/templates/skills/init-mode/SKILL.md +101 -101
package/.mesh/templates/skills/mesh-conventions/SKILL.md +69 -69
package/.mesh/templates/skills/model-selection/SKILL.md +139 -139
package/.mesh/templates/skills/nap/SKILL.md +24 -24
package/.mesh/templates/skills/personal-mesh/SKILL.md +57 -57
package/.mesh/templates/skills/project-conventions/SKILL.md +56 -56
package/.mesh/templates/skills/release-process/SKILL.md +432 -435
package/.mesh/templates/skills/reskill/SKILL.md +92 -92
package/.mesh/templates/skills/reviewer-protocol/SKILL.md +79 -79
package/.mesh/templates/skills/secret-handling/SKILL.md +200 -200
package/.mesh/templates/skills/session-recovery/SKILL.md +155 -155
package/.mesh/templates/skills/test-discipline/SKILL.md +37 -37
package/.mesh/templates/skills/windows-compatibility/SKILL.md +74 -74
package/.mesh/templates/workflows/mesh-ci.yml +24 -24
package/.mesh/templates/workflows/mesh-docs.yml +54 -54
package/.mesh/templates/workflows/mesh-heartbeat.yml +237 -237
package/.mesh/templates/workflows/mesh-insider-release.yml +61 -61
package/.mesh/templates/workflows/mesh-issue-assign.yml +243 -243
package/.mesh/templates/workflows/mesh-label-enforce.yml +181 -181
package/.mesh/templates/workflows/mesh-preview.yml +55 -55
package/.mesh/templates/workflows/mesh-promote.yml +120 -120
package/.mesh/templates/workflows/mesh-release.yml +77 -77
package/.mesh/templates/workflows/mesh-triage.yml +383 -383
package/.mesh/templates/workflows/sync-mesh-labels.yml +204 -204
package/README.md +753 -640
package/bin/mercury-mesh.cjs +1804 -317
package/docs/brand-language.md +287 -287
package/docs/commander-onboarding.md +462 -462
package/docs/mercury-mesh-runtime-rename-impact.md +147 -147
package/docs/persona-manifesto.md +114 -114
package/docs/scenarios/client-compatibility.md +59 -59
package/index.cjs +40 -40
package/package.json +68 -43

package/.copilot/mcp-config.json CHANGED Viewed

@@ -3,12 +3,9 @@
     "EXAMPLE-github": {
       "command": "npx",
       "args": [
-        "-y",
-        "@anthropic/github-mcp-server"
-      ],
-      "env": {
-        "GITHUB_TOKEN": "${GITHUB_TOKEN}"
-      }
+        "mercury-mesh",
+        "github-mcp"
+      ]
     }
   }
 }

package/.copilot/skills/agent-collaboration/SKILL.md CHANGED Viewed

@@ -1,42 +1,42 @@
----
-name: "agent-collaboration"
-description: "Standard collaboration patterns for all Mercury Mesh agents — worktree awareness, decisions, cross-agent communication"
-domain: "team-workflow"
-confidence: "high"
-source: "extracted from charter boilerplate — identical content in 18+ agent charters"
----
-## Context
-Every agent on the team follows identical collaboration patterns for worktree awareness, decision recording, and cross-agent communication. These were previously duplicated in every charter's Collaboration section (~300 bytes × 18 agents = ~5.4KB of redundant context). Now centralized here.
-The coordinator's spawn prompt already instructs agents to read decisions.md and their history.md. This skill adds the patterns for WRITING decisions and requesting help.
-## Patterns
-### Worktree Awareness
-Use the `TEAM ROOT` path provided in your spawn prompt. All `.mesh/` paths are relative to this root. If TEAM ROOT is not provided (rare), run `git rev-parse --show-toplevel` as fallback. Never assume CWD is the repo root.
-### Decision Recording
-After making a decision that affects other team members, write it to:
-`.mesh/decisions/inbox/{your-name}-{brief-slug}.md`
-Format:
-```
-### {date}: {decision title}
-**By:** {Your Name}
-**What:** {the decision}
-**Why:** {rationale}
-```
-### Cross-Agent Communication
-If you need another team member's input, say so in your response. The coordinator will establish an Airbridge. Don't try to do work outside your domain.
-### Reviewer Protocol
-If you have reviewer authority and reject work: the original author is locked out from revising that artifact. A different agent must own the revision. State who should revise in your rejection response.
-## Anti-Patterns
-- Don't read all agent charters — you only need your own context + decisions.md
-- Don't write directly to `.mesh/decisions.md` — always use the inbox drop-box
-- Don't modify other agents' history.md files — that's Scribe's job
-- Don't assume CWD is the repo root — always use TEAM ROOT
+---
+name: "agent-collaboration"
+description: "Standard collaboration patterns for all Mercury Mesh agents — worktree awareness, decisions, cross-agent communication"
+domain: "team-workflow"
+confidence: "high"
+source: "extracted from charter boilerplate — identical content in 18+ agent charters"
+---
+## Context
+Every agent on the team follows identical collaboration patterns for worktree awareness, decision recording, and cross-agent communication. These were previously duplicated in every charter's Collaboration section (~300 bytes × 18 agents = ~5.4KB of redundant context). Now centralized here.
+The coordinator's spawn prompt already instructs agents to read decisions.md and their history.md. This skill adds the patterns for WRITING decisions and requesting help.
+## Patterns
+### Worktree Awareness
+Use the `TEAM ROOT` path provided in your spawn prompt. All `.mesh/` paths are relative to this root. If TEAM ROOT is not provided (rare), run `git rev-parse --show-toplevel` as fallback. Never assume CWD is the repo root.
+### Decision Recording
+After making a decision that affects other team members, write it to:
+`.mesh/decisions/inbox/{your-name}-{brief-slug}.md`
+Format:
+```
+### {date}: {decision title}
+**By:** {Your Name}
+**What:** {the decision}
+**Why:** {rationale}
+```
+### Cross-Agent Communication
+If you need another team member's input, say so in your response. The coordinator will establish an Airbridge. Don't try to do work outside your domain.
+### Reviewer Protocol
+If you have reviewer authority and reject work: the original author is locked out from revising that artifact. A different agent must own the revision. State who should revise in your rejection response.
+## Anti-Patterns
+- Don't read all agent charters — you only need your own context + decisions.md
+- Don't write directly to `.mesh/decisions.md` — always use the inbox drop-box
+- Don't modify other agents' history.md files — that's Scribe's job
+- Don't assume CWD is the repo root — always use TEAM ROOT

package/.copilot/skills/agent-conduct/SKILL.md CHANGED Viewed

@@ -1,24 +1,24 @@
----
-name: "agent-conduct"
-description: "Shared hard rules enforced across all Mercury Mesh agents"
-domain: "team-governance"
-confidence: "high"
-source: "reskill extraction — Product Isolation Rule and Peer Quality Check appeared in all 20 agent charters"
----
-## Context
-Every Mercury Mesh agent must follow these two hard rules. They were previously duplicated in every charter. Now they live here as a shared skill, loaded once.
-## Patterns
-### Product Isolation Rule (hard rule)
-Tests, CI workflows, and product code must NEVER depend on specific agent names from any particular Mercury Mesh. "Our Mercury Mesh" must not impact "the Mercury Mesh." No hardcoded references to agent names (Flight, EECOM, FIDO, etc.) in test assertions, CI configs, or product logic. Use generic/parameterized values. If a test needs agent names, use obviously-fake test fixtures (e.g., "test-agent-1", "TestBot").
-### Peer Quality Check (hard rule)
-Before finishing work, verify your changes don't break existing tests. Run the test suite for files you touched. If CI has been failing, check your changes aren't contributing to the problem. When you learn from mistakes, update your history.md.
-## Anti-Patterns
-- Don't hardcode dev team agent names in product code or tests
-- Don't skip test verification before declaring work done
-- Don't ignore pre-existing CI failures that your changes may worsen
+---
+name: "agent-conduct"
+description: "Shared hard rules enforced across all Mercury Mesh agents"
+domain: "team-governance"
+confidence: "high"
+source: "reskill extraction — Product Isolation Rule and Peer Quality Check appeared in all 20 agent charters"
+---
+## Context
+Every Mercury Mesh agent must follow these two hard rules. They were previously duplicated in every charter. Now they live here as a shared skill, loaded once.
+## Patterns
+### Product Isolation Rule (hard rule)
+Tests, CI workflows, and product code must NEVER depend on specific agent names from any particular Mercury Mesh. "Our Mercury Mesh" must not impact "the Mercury Mesh." No hardcoded references to agent names (Flight, EECOM, FIDO, etc.) in test assertions, CI configs, or product logic. Use generic/parameterized values. If a test needs agent names, use obviously-fake test fixtures (e.g., "test-agent-1", "TestBot").
+### Peer Quality Check (hard rule)
+Before finishing work, verify your changes don't break existing tests. Run the test suite for files you touched. If CI has been failing, check your changes aren't contributing to the problem. When you learn from mistakes, update your history.md.
+## Anti-Patterns
+- Don't hardcode dev team agent names in product code or tests
+- Don't skip test verification before declaring work done
+- Don't ignore pre-existing CI failures that your changes may worsen

package/.copilot/skills/architectural-proposals/SKILL.md CHANGED Viewed

@@ -1,151 +1,151 @@
----
-name: "architectural-proposals"
-description: "How to write comprehensive architectural proposals that drive alignment before code is written"
-domain: "architecture, product-direction"
-confidence: "high"
-source: "earned (2026-02-21 interactive shell proposal)"
-tools:
-  - name: "view"
-    description: "Read existing codebase, prior decisions, and team context before proposing changes"
-    when: "Always read .mesh/decisions.md, relevant PRDs, and current architecture docs before writing proposal"
-  - name: "create"
-    description: "Create proposal in docs/proposals/ with structured format"
-    when: "After gathering context, before any implementation work begins"
----
-## Context
-Proposals create alignment before code is written. Cheaper to change a doc than refactor code. Use this pattern when:
-- Architecture shifts invalidate existing assumptions
-- Product direction changes require new foundation
-- Multiple waves/milestones will be affected by a decision
-- External dependencies (Copilot CLI, SDK APIs) change
-## Patterns
-### Proposal Structure (docs/proposals/)
-**Required sections:**
-1. **Problem Statement** — Why current state is broken (specific, measurable evidence)
-2. **Proposed Architecture** — Solution with technical specifics (not hand-waving)
-3. **What Changes** — Impact on existing work (waves, milestones, modules)
-4. **What Stays the Same** — Preserve existing functionality (no regression)
-5. **Key Decisions Needed** — Explicit choices with recommendations
-6. **Risks and Mitigations** — Likelihood + impact + mitigation strategy
-7. **Scope** — What's in v1, what's deferred (timeline clarity)
-**Optional sections:**
-- Implementation Plan (high-level milestones)
-- Success Criteria (measurable outcomes)
-- Open Questions (unresolved items)
-- Appendix (prior art, alternatives considered)
-### Tone Ceiling Enforcement
-**Always:**
-- Cite specific evidence (user reports, performance data, failure modes)
-- Justify recommendations with technical rationale
-- Acknowledge trade-offs (no perfect solutions)
-- Be specific about APIs, libraries, file paths
-**Never:**
-- Hype ("revolutionary", "game-changing")
-- Hand-waving ("we'll figure it out later")
-- Unsubstantiated claims ("users will love this")
-- Vague timelines ("soon", "eventually")
-### Wave Restructuring Pattern
-When a proposal invalidates existing wave structure:
-1. **Acknowledge the shift:** "This becomes Wave 0 (Foundation)"
-2. **Cascade impacts:** Adjust downstream waves (Wave 1, Wave 2, Wave 3)
-3. **Preserve non-blocking work:** Identify what can proceed in parallel
-4. **Update dependencies:** Document new blocking relationships
-**Example (Interactive Shell):**
-- Wave 0 (NEW): Interactive Shell — blocks all other waves
-- Wave 1 (ADJUSTED): npm Distribution — shell bundled in cli.js
-- Wave 2 (DEFERRED): MeshUI — waits for shell foundation
-- Wave 3 (ADJUSTED): Public Docs — now documents shell as primary interface
-### Decision Framing
-**Format:** "Recommendation: X (recommended) or alternatives?"
-**Components:**
-- Recommendation (pick one, justify)
-- Alternatives (what else was considered)
-- Decision rationale (why recommended option wins)
-- Needs sign-off from (which agents/roles must approve)
-**Example:**
-```
-### 1. Terminal UI Library: `ink` (recommended) or alternatives?
-**Recommendation:** `ink`
-**Alternatives:** `blessed`, raw readline
-**Decision rationale:** Component model enables testable UI. Battle-tested ecosystem.
-**Needs sign-off from:** Brady (product direction), Fortier (runtime performance)
-```
-### Risk Documentation
-**Format per risk:**
-- **Risk:** Specific failure mode
-- **Likelihood:** Low / Medium / High (not percentages)
-- **Impact:** Low / Medium / High
-- **Mitigation:** Concrete actions (measurable)
-**Example:**
-```
-### Risk 2: SDK Streaming Reliability
-**Risk:** SDK streaming events might drop messages or arrive out of order.
-**Likelihood:** Low (SDK is production-grade).
-**Impact:** High — broken streaming makes shell unusable.
-**Mitigation:**
-- Add integration test: Send 1000-message stream, verify all deltas arrive in order
-- Implement fallback: If streaming fails, fall back to polling session state
-- Log all SDK events to `.mesh/orchestration-log/sdk-events.jsonl` for debugging
-```
-## Examples
-**File references from interactive shell proposal:**
-- Full proposal: `docs/proposals/Mercury Mesh-interactive-shell.md`
-- User directive: `.mesh/decisions/inbox/copilot-directive-2026-02-21T202535Z.md`
-- Team decisions: `.mesh/decisions.md`
-- Current architecture: `docs/architecture/module-map.md`, `docs/prd-23-release-readiness.md`
-**Key patterns demonstrated:**
-1. Read user directive first (understand the "why")
-2. Survey current architecture (module map, existing waves)
-3. Research SDK APIs (exploration task to validate feasibility)
-4. Document problem with specific evidence (unreliable handoffs, zero visibility, UX mismatch)
-5. Propose solution with technical specifics (ink components, SDK session management, spawn.ts module)
-6. Restructure waves when foundation shifts (Wave 0 becomes blocker)
-7. Preserve backward compatibility (mercury-mesh.agent.md still works, VS Code mode unchanged)
-8. Frame decisions explicitly (5 key decisions with recommendations)
-9. Document risks with mitigations (5 risks, each with concrete actions)
-10. Define scope (what's in v1 vs. deferred)
-## Anti-Patterns
-**Avoid:**
-- ❌ Proposals without problem statements (solution-first thinking)
-- ❌ Vague architecture ("we'll use a shell") — be specific (ink components, session registry, spawn.ts)
-- ❌ Ignoring existing work — always document impact on waves/milestones
-- ❌ No risk analysis — every architecture has risks, document them
-- ❌ Unbounded scope — draw the v1 line explicitly
-- ❌ Missing decision ownership — always say "needs sign-off from X"
-- ❌ No backward compatibility plan — users don't care about your replatform
-- ❌ Hand-waving timelines ("a few weeks") — be specific (2-3 weeks, 1 engineer full-time)
-**Red flags in proposal reviews:**
-- "Users will love this" (citation needed)
-- "We'll figure out X later" (scope creep incoming)
-- "This is revolutionary" (tone ceiling violation)
-- No section on "What Stays the Same" (regression risk)
-- No risks documented (wishful thinking)
+---
+name: "architectural-proposals"
+description: "How to write comprehensive architectural proposals that drive alignment before code is written"
+domain: "architecture, product-direction"
+confidence: "high"
+source: "earned (2026-02-21 interactive shell proposal)"
+tools:
+  - name: "view"
+    description: "Read existing codebase, prior decisions, and team context before proposing changes"
+    when: "Always read .mesh/decisions.md, relevant PRDs, and current architecture docs before writing proposal"
+  - name: "create"
+    description: "Create proposal in docs/proposals/ with structured format"
+    when: "After gathering context, before any implementation work begins"
+---
+## Context
+Proposals create alignment before code is written. Cheaper to change a doc than refactor code. Use this pattern when:
+- Architecture shifts invalidate existing assumptions
+- Product direction changes require new foundation
+- Multiple waves/milestones will be affected by a decision
+- External dependencies (Copilot CLI, SDK APIs) change
+## Patterns
+### Proposal Structure (docs/proposals/)
+**Required sections:**
+1. **Problem Statement** — Why current state is broken (specific, measurable evidence)
+2. **Proposed Architecture** — Solution with technical specifics (not hand-waving)
+3. **What Changes** — Impact on existing work (waves, milestones, modules)
+4. **What Stays the Same** — Preserve existing functionality (no regression)
+5. **Key Decisions Needed** — Explicit choices with recommendations
+6. **Risks and Mitigations** — Likelihood + impact + mitigation strategy
+7. **Scope** — What's in v1, what's deferred (timeline clarity)
+**Optional sections:**
+- Implementation Plan (high-level milestones)
+- Success Criteria (measurable outcomes)
+- Open Questions (unresolved items)
+- Appendix (prior art, alternatives considered)
+### Tone Ceiling Enforcement
+**Always:**
+- Cite specific evidence (user reports, performance data, failure modes)
+- Justify recommendations with technical rationale
+- Acknowledge trade-offs (no perfect solutions)
+- Be specific about APIs, libraries, file paths
+**Never:**
+- Hype ("revolutionary", "game-changing")
+- Hand-waving ("we'll figure it out later")
+- Unsubstantiated claims ("users will love this")
+- Vague timelines ("soon", "eventually")
+### Wave Restructuring Pattern
+When a proposal invalidates existing wave structure:
+1. **Acknowledge the shift:** "This becomes Wave 0 (Foundation)"
+2. **Cascade impacts:** Adjust downstream waves (Wave 1, Wave 2, Wave 3)
+3. **Preserve non-blocking work:** Identify what can proceed in parallel
+4. **Update dependencies:** Document new blocking relationships
+**Example (Interactive Shell):**
+- Wave 0 (NEW): Interactive Shell — blocks all other waves
+- Wave 1 (ADJUSTED): npm Distribution — shell bundled in cli.js
+- Wave 2 (DEFERRED): MeshUI — waits for shell foundation
+- Wave 3 (ADJUSTED): Public Docs — now documents shell as primary interface
+### Decision Framing
+**Format:** "Recommendation: X (recommended) or alternatives?"
+**Components:**
+- Recommendation (pick one, justify)
+- Alternatives (what else was considered)
+- Decision rationale (why recommended option wins)
+- Needs sign-off from (which agents/roles must approve)
+**Example:**
+```
+### 1. Terminal UI Library: `ink` (recommended) or alternatives?
+**Recommendation:** `ink`
+**Alternatives:** `blessed`, raw readline
+**Decision rationale:** Component model enables testable UI. Battle-tested ecosystem.
+**Needs sign-off from:** Brady (product direction), Fortier (runtime performance)
+```
+### Risk Documentation
+**Format per risk:**
+- **Risk:** Specific failure mode
+- **Likelihood:** Low / Medium / High (not percentages)
+- **Impact:** Low / Medium / High
+- **Mitigation:** Concrete actions (measurable)
+**Example:**
+```
+### Risk 2: SDK Streaming Reliability
+**Risk:** SDK streaming events might drop messages or arrive out of order.
+**Likelihood:** Low (SDK is production-grade).
+**Impact:** High — broken streaming makes shell unusable.
+**Mitigation:**
+- Add integration test: Send 1000-message stream, verify all deltas arrive in order
+- Implement fallback: If streaming fails, fall back to polling session state
+- Log all SDK events to `.mesh/orchestration-log/sdk-events.jsonl` for debugging
+```
+## Examples
+**File references from interactive shell proposal:**
+- Full proposal: `docs/proposals/Mercury Mesh-interactive-shell.md`
+- User directive: `.mesh/decisions/inbox/copilot-directive-2026-02-21T202535Z.md`
+- Team decisions: `.mesh/decisions.md`
+- Current architecture: `docs/architecture/module-map.md`, `docs/prd-23-release-readiness.md`
+**Key patterns demonstrated:**
+1. Read user directive first (understand the "why")
+2. Survey current architecture (module map, existing waves)
+3. Research SDK APIs (exploration task to validate feasibility)
+4. Document problem with specific evidence (unreliable handoffs, zero visibility, UX mismatch)
+5. Propose solution with technical specifics (ink components, SDK session management, spawn.ts module)
+6. Restructure waves when foundation shifts (Wave 0 becomes blocker)
+7. Preserve backward compatibility (mercury-mesh.agent.md still works, VS Code mode unchanged)
+8. Frame decisions explicitly (5 key decisions with recommendations)
+9. Document risks with mitigations (5 risks, each with concrete actions)
+10. Define scope (what's in v1 vs. deferred)
+## Anti-Patterns
+**Avoid:**
+- ❌ Proposals without problem statements (solution-first thinking)
+- ❌ Vague architecture ("we'll use a shell") — be specific (ink components, session registry, spawn.ts)
+- ❌ Ignoring existing work — always document impact on waves/milestones
+- ❌ No risk analysis — every architecture has risks, document them
+- ❌ Unbounded scope — draw the v1 line explicitly
+- ❌ Missing decision ownership — always say "needs sign-off from X"
+- ❌ No backward compatibility plan — users don't care about your replatform
+- ❌ Hand-waving timelines ("a few weeks") — be specific (2-3 weeks, 1 engineer full-time)
+**Red flags in proposal reviews:**
+- "Users will love this" (citation needed)
+- "We'll figure out X later" (scope creep incoming)
+- "This is revolutionary" (tone ceiling violation)
+- No section on "What Stays the Same" (regression risk)
+- No risks documented (wishful thinking)

package/.copilot/skills/ci-validation-gates/SKILL.md CHANGED Viewed

@@ -1,84 +1,85 @@
----
-name: "ci-validation-gates"
-description: "Defensive CI/CD patterns: semver validation, token checks, retry logic, draft detection — earned from v0.8.22"
-domain: "ci-cd"
-confidence: "high"
-source: "extracted from Drucker and Trejo charters — earned knowledge from v0.8.22 release incident"
----
-## Context
-CI workflows must be defensive. These patterns were learned from the v0.8.22 release disaster where invalid semver, wrong token types, missing retry logic, and draft releases caused a multi-hour outage. Both Drucker (CI/CD) and Trejo (Release Manager) carried this knowledge in their charters — now centralized here.
-## Patterns
-### Semver Validation Gate
-Every publish workflow MUST validate version format before `npm publish`. 4-part versions (e.g., 0.8.21.4) are NOT valid semver — npm mangles them.
-```yaml
-- name: Validate semver
-  run: |
-    VERSION="${{ github.event.release.tag_name }}"
-    VERSION="${VERSION#v}"
-    if ! npx semver "$VERSION" > /dev/null 2>&1; then
-      echo "❌ Invalid semver: $VERSION"
-      echo "Only 3-part versions (X.Y.Z) or prerelease (X.Y.Z-tag.N) are valid."
-      exit 1
-    fi
-    echo "✅ Valid semver: $VERSION"
-```
-### NPM Token Type Verification
-NPM_TOKEN MUST be an Automation token, not a User token with 2FA:
-- User tokens require OTP — CI can't provide it → EOTP error
-- Create Automation tokens at npmjs.com → Settings → Access Tokens → Automation
-- Verify before first publish in any workflow
-### Retry Logic for npm Registry Propagation
-npm registry uses eventual consistency. After `npm publish` succeeds, the package may not be immediately queryable.
-- Propagation: typically 5-30s, up to 2min in rare cases
-- All verify steps: 5 attempts, 15-second intervals
-- Log each attempt: "Attempt 1/5: Checking package..."
-- Exit loop on success, fail after max attempts
-```yaml
-- name: Verify package (with retry)
-  run: |
-    MAX_ATTEMPTS=5
-    WAIT_SECONDS=15
-    for attempt in $(seq 1 $MAX_ATTEMPTS); do
-      echo "Attempt $attempt/$MAX_ATTEMPTS: Checking $PACKAGE@$VERSION..."
-      if npm view "$PACKAGE@$VERSION" version > /dev/null 2>&1; then
-        echo "✅ Package verified"
-        exit 0
-      fi
-      [ $attempt -lt $MAX_ATTEMPTS ] && sleep $WAIT_SECONDS
-    done
-    echo "❌ Failed to verify after $MAX_ATTEMPTS attempts"
-    exit 1
-```
-### Draft Release Detection
-Draft releases don't emit `release: published` event. Workflows MUST:
-- Trigger on `release: published` (NOT `created`)
-- If using workflow_dispatch: verify release is published via GitHub API before proceeding
-### Build Script Protection
-Set `SKIP_BUILD_BUMP=1` (or `$env:SKIP_BUILD_BUMP = "1"` on Windows) before ANY release build. bump-build.mjs is for dev builds ONLY — it silently mutates versions.
-## Known Failure Modes (v0.8.22 Incident)
-| # | What Happened | Root Cause | Prevention |
-|---|---------------|-----------|------------|
-| 1 | 4-part version published, npm mangled it | No semver validation gate | `npx semver` check before every publish |
-| 2 | CI failed 5+ times with EOTP | User token with 2FA | Automation token only |
-| 3 | Verify returned false 404 | No retry logic for propagation | 5 attempts, 15s intervals |
-| 4 | Workflow never triggered | Draft release doesn't emit event | Never create draft releases |
-| 5 | Version mutated during release | bump-build.mjs ran in release | SKIP_BUILD_BUMP=1 |
-## Anti-Patterns
-- ❌ Publishing without semver validation gate
-- ❌ Single-shot verification without retry
-- ❌ Hard-coded secrets in workflows
-- ❌ Silent CI failures — every error needs actionable output with remediation
-- ❌ Assuming npm publish is instantly queryable
+---
+name: "ci-validation-gates"
+description: "Defensive CI/CD patterns: semver validation, token checks, retry logic, draft detection — earned from v0.8.22"
+domain: "ci-cd"
+confidence: "high"
+source: "extracted from Drucker and Trejo charters — earned knowledge from v0.8.22 release incident"
+---
+## Context
+CI workflows must be defensive. These patterns were learned from the v0.8.22 release disaster where invalid semver, wrong token types, missing retry logic, and draft releases caused a multi-hour outage. Both Drucker (CI/CD) and Trejo (Release Manager) carried this knowledge in their charters — now centralized here.
+## Patterns
+### Semver Validation Gate
+Every publish workflow MUST validate version format before `npm publish`. 4-part versions (e.g., 0.8.21.4) are NOT valid semver — npm mangles them.
+```yaml
+- name: Validate semver
+  run: |
+    VERSION="${{ github.event.release.tag_name }}"
+    VERSION="${VERSION#v}"
+    if ! npx semver "$VERSION" > /dev/null 2>&1; then
+      echo "❌ Invalid semver: $VERSION"
+      echo "Only 3-part versions (X.Y.Z) or prerelease (X.Y.Z-tag.N) are valid."
+      exit 1
+    fi
+    echo "✅ Valid semver: $VERSION"
+```
+### Publish Authentication Verification
+Prefer npm trusted publishing via OIDC for GitHub Actions:
+- Trusted publishing removes long-lived write tokens from CI entirely
+- Configure npm package settings to trust GitHub repo `mizyoel/mercury-mesh` and workflow `publish.yml`
+- If token fallback is required, `NPM_TOKEN` must be a granular write token with bypass 2FA enabled
+- User tokens that still require OTP will fail in CI with `EOTP`
+### Retry Logic for npm Registry Propagation
+npm registry uses eventual consistency. After `npm publish` succeeds, the package may not be immediately queryable.
+- Propagation: typically 5-30s, up to 2min in rare cases
+- All verify steps: 5 attempts, 15-second intervals
+- Log each attempt: "Attempt 1/5: Checking package..."
+- Exit loop on success, fail after max attempts
+```yaml
+- name: Verify package (with retry)
+  run: |
+    MAX_ATTEMPTS=5
+    WAIT_SECONDS=15
+    for attempt in $(seq 1 $MAX_ATTEMPTS); do
+      echo "Attempt $attempt/$MAX_ATTEMPTS: Checking $PACKAGE@$VERSION..."
+      if npm view "$PACKAGE@$VERSION" version > /dev/null 2>&1; then
+        echo "✅ Package verified"
+        exit 0
+      fi
+      [ $attempt -lt $MAX_ATTEMPTS ] && sleep $WAIT_SECONDS
+    done
+    echo "❌ Failed to verify after $MAX_ATTEMPTS attempts"
+    exit 1
+```
+### Draft Release Detection
+Draft releases don't emit `release: published` event. Workflows MUST:
+- Trigger on `release: published` (NOT `created`)
+- If using workflow_dispatch: verify release is published via GitHub API before proceeding
+### Build Script Protection
+Set `SKIP_BUILD_BUMP=1` (or `$env:SKIP_BUILD_BUMP = "1"` on Windows) before ANY release build. bump-build.mjs is for dev builds ONLY — it silently mutates versions.
+## Known Failure Modes (v0.8.22 Incident)
+| # | What Happened | Root Cause | Prevention |
+|---|---------------|-----------|------------|
+| 1 | 4-part version published, npm mangled it | No semver validation gate | `npx semver` check before every publish |
+| 2 | CI failed 5+ times with EOTP | Token required OTP in CI | Trusted publishing or granular token with bypass 2FA |
+| 3 | Verify returned false 404 | No retry logic for propagation | 5 attempts, 15s intervals |
+| 4 | Workflow never triggered | Draft release doesn't emit event | Never create draft releases |
+| 5 | Version mutated during release | bump-build.mjs ran in release | SKIP_BUILD_BUMP=1 |
+## Anti-Patterns
+- ❌ Publishing without semver validation gate
+- ❌ Single-shot verification without retry
+- ❌ Hard-coded secrets in workflows
+- ❌ Silent CI failures — every error needs actionable output with remediation
+- ❌ Assuming npm publish is instantly queryable