npm - @curdx/flow - Versions diffs - 3.0.0 → 3.2.0 - Mend

@curdx/flow 3.0.0 → 3.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (219) hide show

package/CHANGELOG.md +33 -82
package/LICENSE +1 -1
package/README.md +28 -129
package/dist/index.mjs +1165 -0
package/package.json +33 -44
package/.claude-plugin/marketplace.json +0 -48
package/.claude-plugin/plugin.json +0 -52
package/agent-preamble/preamble.md +0 -314
package/agents/flow-adversary.md +0 -203
package/agents/flow-architect.md +0 -198
package/agents/flow-brownfield-analyst.md +0 -143
package/agents/flow-debugger.md +0 -321
package/agents/flow-edge-hunter.md +0 -289
package/agents/flow-executor.md +0 -269
package/agents/flow-orchestrator.md +0 -145
package/agents/flow-planner.md +0 -247
package/agents/flow-product-designer.md +0 -159
package/agents/flow-qa-engineer.md +0 -282
package/agents/flow-researcher.md +0 -166
package/agents/flow-reviewer.md +0 -304
package/agents/flow-security-auditor.md +0 -401
package/agents/flow-triage-analyst.md +0 -272
package/agents/flow-ui-researcher.md +0 -230
package/agents/flow-ux-designer.md +0 -221
package/agents/flow-verifier.md +0 -350
package/bin/curdx-flow +0 -5
package/bin/curdx-flow-state +0 -104
package/bin/curdx-flow.js +0 -54
package/cli/README.md +0 -104
package/cli/doctor-workflow.js +0 -483
package/cli/doctor.js +0 -73
package/cli/help.js +0 -59
package/cli/install-bundled-mcps.js +0 -37
package/cli/install-companions.js +0 -19
package/cli/install-context7-config.js +0 -80
package/cli/install-curdx-plugin.js +0 -96
package/cli/install-language.js +0 -35
package/cli/install-next-steps.js +0 -29
package/cli/install-options.js +0 -9
package/cli/install-paths.js +0 -52
package/cli/install-recommended-plugins.js +0 -104
package/cli/install-required-plugins.js +0 -57
package/cli/install-self-update.js +0 -62
package/cli/install-workflow.js +0 -209
package/cli/install.js +0 -101
package/cli/lib/claude-commands.js +0 -41
package/cli/lib/claude-ops.js +0 -47
package/cli/lib/claude.js +0 -183
package/cli/lib/config.js +0 -24
package/cli/lib/doctor-claude-settings.js +0 -1186
package/cli/lib/doctor-report.js +0 -978
package/cli/lib/doctor-runtime-environment.js +0 -196
package/cli/lib/frontmatter.js +0 -44
package/cli/lib/json-schema.js +0 -57
package/cli/lib/logging.js +0 -25
package/cli/lib/process.js +0 -60
package/cli/lib/prompts.js +0 -135
package/cli/lib/runtime.js +0 -107
package/cli/lib/semver.js +0 -109
package/cli/lib/version.js +0 -12
package/cli/protocols-body.md +0 -22
package/cli/protocols.js +0 -162
package/cli/registry.js +0 -123
package/cli/router.js +0 -49
package/cli/uninstall-actions.js +0 -360
package/cli/uninstall-workflow.js +0 -146
package/cli/uninstall.js +0 -42
package/cli/upgrade-workflow.js +0 -80
package/cli/upgrade.js +0 -91
package/cli/utils.js +0 -40
package/gates/adversarial-review-gate.md +0 -219
package/gates/coverage-audit-gate.md +0 -182
package/gates/devex-gate.md +0 -254
package/gates/edge-case-gate.md +0 -194
package/gates/karpathy-gate.md +0 -130
package/gates/security-gate.md +0 -218
package/gates/tdd-gate.md +0 -182
package/gates/test-quality-gate.md +0 -59
package/gates/verification-gate.md +0 -179
package/hooks/hooks.json +0 -130
package/hooks/scripts/common.sh +0 -237
package/hooks/scripts/config-change-guard.sh +0 -94
package/hooks/scripts/flow-context-watch.sh +0 -94
package/hooks/scripts/inject-karpathy.sh +0 -53
package/hooks/scripts/quick-mode-guard.sh +0 -69
package/hooks/scripts/session-start.sh +0 -94
package/hooks/scripts/session-title.sh +0 -87
package/hooks/scripts/stop-watcher.sh +0 -231
package/hooks/scripts/subagent-artifact-guard.sh +0 -92
package/hooks/scripts/subagent-statusline.sh +0 -111
package/hooks/scripts/task-lifecycle-guard.sh +0 -106
package/hooks/scripts/teammate-idle-guard.sh +0 -83
package/knowledge/artifact-output-discipline.md +0 -24
package/knowledge/artifact-summary-contracts.md +0 -50
package/knowledge/atomic-commits.md +0 -262
package/knowledge/claude-code-runtime-contracts.md +0 -240
package/knowledge/epic-decomposition.md +0 -307
package/knowledge/execution-strategies.md +0 -303
package/knowledge/karpathy-guidelines.md +0 -219
package/knowledge/planning-reviews.md +0 -211
package/knowledge/poc-first-workflow.md +0 -223
package/knowledge/review-feedback-intake.md +0 -57
package/knowledge/spec-driven-development.md +0 -180
package/knowledge/systematic-debugging.md +0 -378
package/knowledge/two-stage-review.md +0 -249
package/knowledge/wave-execution.md +0 -403
package/monitors/monitors.json +0 -8
package/monitors/scripts/flow-state-monitor.sh +0 -102
package/output-styles/curdx-evidence-first.md +0 -34
package/output-styles/curdx-fast-mode.md +0 -42
package/output-styles/curdx-spec-mode.md +0 -46
package/schemas/agent-frontmatter.schema.json +0 -66
package/schemas/config.schema.json +0 -134
package/schemas/gate-frontmatter.schema.json +0 -30
package/schemas/hooks.schema.json +0 -115
package/schemas/output-style-frontmatter.schema.json +0 -22
package/schemas/plugin-manifest.schema.json +0 -436
package/schemas/plugin-settings.schema.json +0 -29
package/schemas/skill-frontmatter.schema.json +0 -177
package/schemas/spec-frontmatter.schema.json +0 -42
package/schemas/spec-state.schema.json +0 -165
package/settings.json +0 -8
package/skills/brownfield-index/SKILL.md +0 -53
package/skills/brownfield-index/references/applicability.md +0 -12
package/skills/brownfield-index/references/handoff.md +0 -8
package/skills/brownfield-index/references/index-contract.md +0 -10
package/skills/browser-qa/SKILL.md +0 -39
package/skills/browser-qa/references/handoff.md +0 -6
package/skills/browser-qa/references/prerequisites.md +0 -10
package/skills/browser-qa/references/qa-contract.md +0 -20
package/skills/cancel/SKILL.md +0 -41
package/skills/cancel/references/destructive-mode.md +0 -17
package/skills/cancel/references/reporting.md +0 -18
package/skills/cancel/references/state-recovery.md +0 -30
package/skills/cancel/references/target-resolution.md +0 -7
package/skills/debug/SKILL.md +0 -45
package/skills/debug/references/context-gathering.md +0 -11
package/skills/debug/references/failure-guard.md +0 -25
package/skills/debug/references/intake.md +0 -12
package/skills/debug/references/phase-workflow.md +0 -34
package/skills/debug/references/reporting.md +0 -20
package/skills/epic/SKILL.md +0 -39
package/skills/epic/references/epic-artifacts.md +0 -20
package/skills/epic/references/epic-intake.md +0 -9
package/skills/epic/references/slice-handoff.md +0 -16
package/skills/fast/SKILL.md +0 -62
package/skills/fast/references/applicability.md +0 -25
package/skills/fast/references/clarification.md +0 -20
package/skills/fast/references/execution-contract.md +0 -56
package/skills/help/SKILL.md +0 -55
package/skills/help/references/dispatch.md +0 -20
package/skills/help/references/overview.md +0 -39
package/skills/help/references/troubleshoot.md +0 -47
package/skills/help/references/workflow.md +0 -37
package/skills/implement/SKILL.md +0 -104
package/skills/implement/references/error-recovery.md +0 -36
package/skills/implement/references/linear-execution.md +0 -43
package/skills/implement/references/native-task-sync.md +0 -107
package/skills/implement/references/preflight.md +0 -43
package/skills/implement/references/progress-contract.md +0 -36
package/skills/implement/references/state-init.md +0 -36
package/skills/implement/references/stop-hook-execution.md +0 -50
package/skills/implement/references/strategy-router.md +0 -38
package/skills/implement/references/subagent-execution.md +0 -57
package/skills/implement/references/wave-execution.md +0 -180
package/skills/init/SKILL.md +0 -49
package/skills/init/references/gitignore-and-health.md +0 -26
package/skills/init/references/next-steps.md +0 -22
package/skills/init/references/preflight.md +0 -15
package/skills/init/references/scaffold-contract.md +0 -27
package/skills/review/SKILL.md +0 -82
package/skills/review/references/optional-passes.md +0 -48
package/skills/review/references/preflight.md +0 -38
package/skills/review/references/report-contract.md +0 -49
package/skills/review/references/reporting.md +0 -20
package/skills/review/references/stage-execution.md +0 -32
package/skills/security-audit/SKILL.md +0 -47
package/skills/security-audit/references/audit-contract.md +0 -21
package/skills/security-audit/references/gate-handoff.md +0 -8
package/skills/security-audit/references/scope-and-depth.md +0 -9
package/skills/spec/SKILL.md +0 -100
package/skills/spec/references/artifact-landing.md +0 -31
package/skills/spec/references/phase-execution.md +0 -50
package/skills/spec/references/planning-review.md +0 -31
package/skills/spec/references/preflight-and-routing.md +0 -46
package/skills/spec/references/reporting.md +0 -21
package/skills/start/SKILL.md +0 -84
package/skills/start/references/branch-routing.md +0 -51
package/skills/start/references/mode-semantics.md +0 -12
package/skills/start/references/preflight.md +0 -13
package/skills/start/references/reporting.md +0 -20
package/skills/start/references/state-seeding.md +0 -44
package/skills/start/references/workflow-handoff.md +0 -26
package/skills/status/SKILL.md +0 -41
package/skills/status/references/gather-contract.md +0 -30
package/skills/status/references/health-rules.md +0 -27
package/skills/status/references/output-contract.md +0 -25
package/skills/status/references/preflight.md +0 -10
package/skills/status/references/recovery-hints.md +0 -18
package/skills/ui-sketch/SKILL.md +0 -39
package/skills/ui-sketch/references/brief-intake.md +0 -10
package/skills/ui-sketch/references/iteration-handoff.md +0 -5
package/skills/ui-sketch/references/variant-contract.md +0 -15
package/skills/verify/SKILL.md +0 -56
package/skills/verify/references/evidence-workflow.md +0 -39
package/skills/verify/references/output-contract.md +0 -23
package/skills/verify/references/preflight.md +0 -11
package/skills/verify/references/report-handoff.md +0 -35
package/skills/verify/references/strict-mode.md +0 -12
package/templates/CONTEXT.md.tmpl +0 -53
package/templates/PROJECT.md.tmpl +0 -59
package/templates/ROADMAP.md.tmpl +0 -50
package/templates/STATE.md.tmpl +0 -49
package/templates/config.json.tmpl +0 -51
package/templates/design.md.tmpl +0 -83
package/templates/progress.md.tmpl +0 -77
package/templates/requirements.md.tmpl +0 -76
package/templates/research.md.tmpl +0 -83
package/templates/tasks.md.tmpl +0 -107

package/agents/flow-ux-designer.md DELETED Viewed

@@ -1,221 +0,0 @@
----
-name: flow-ux-designer
-description: Use proactively when a screen, component, or flow needs concrete UI variants, design-system judgment, accessibility review, and tasteful frontend direction. Outputs HTML sketches plus design decisions.
-skills: [frontend-design]
-memory: project
-model: sonnet
-effort: medium
-maxTurns: 25
-color: pink
-tools: [Read, Write, AskUserQuestion, Bash, WebSearch, Skill]
----
-# Flow UX Designer — UI Design Agent
-@${CLAUDE_PLUGIN_ROOT}/agent-preamble/preamble.md
-## Your Responsibilities
-Turn the UI portions of requirements / design docs into **tasteful** concrete interfaces. Not template-stamping — actual design.
-Output: HTML files under `.flow/specs/<name>/ui-sketch/` (multiple variants allowed).
----
-## Prerequisites
-- `frontend-design` skill installed (Anthropic official)
-- `.flow/CONTEXT.md` UI preferences (if any)
-- UI-relevant US / AC from `requirements.md`
-**Fallback when skill is unavailable**:
-- Switch to Tailwind CSS + shadcn/ui default style
-- Clearly tell the user "frontend-design skill not installed, using generic styles"
-- Suggest `npx @curdx/flow install --all` to install frontend-design
----
-## Core Tool: frontend-design skill
-Anthropic's official skill (277k+ installs, 2026-03). It **pushes Claude to make distinctive choices**:
-- Unconventional font pairings
-- Intentional palettes
-- Purposeful animation
-- Avoid the "generic template" feel
-When the skill is available in normal subagent mode, it auto-activates in my workflow.
-If I'm running as an agent-team teammate, the `skills` frontmatter is not applied by Claude Code, so I must explicitly invoke the `Skill` tool with `frontend-design`.
----
-## Mandatory Workflow
-### Step 1: Load Context
-```
-Read:
-  .flow/CONTEXT.md           — user's UI preferences
-  .flow/specs/<name>/requirements.md — UI-relevant US/AC
-  .flow/specs/<name>/design.md       — UI component design (if any)
-  .flow/specs/<name>/research.md     — design inspiration sources
-```
-Pay special attention to `.flow/CONTEXT.md`:
-- Design style (minimalist / brutalist / corporate / playful)
-- Tone (light / dark / auto / specific palette)
-- Font preferences
-- Density (spacious / compact)
-- Animation (none / purposeful / expressive)
-### Step 2: Confirm Scope
-Confirm with the user:
-- Which **screen** are we designing this time? (login page / dashboard / form / ...)
-- How many **variants**? (default 2-3 so the user can compare)
-- Building a **prototype** (single HTML file) or **production code** (React/Vue components)?
-Default: 2 HTML variants for fast iteration.
-### Step 3: Invoke frontend-design skill
-```
-Skill: frontend-design
-args: <description of the need>
-```
-The skill outputs UI code. I:
-- Preserve it as-is (the skill's taste choices are already curated)
-- Do not dumb it down toward "plain"
-- Apply the user's CONTEXT.md preferences where appropriate
-### Step 4: Generate Variants
-If the user wants 2-3 variants:
-```
-Variant A: "minimalist"
-  - Generous whitespace
-  - System font
-  - Single color
-Variant B: "distinctive"
-  - Custom fonts (e.g. Space Grotesk + Inter)
-  - Intentional palette (e.g. warm neutrals + a single accent)
-  - Subtle animation
-Variant C (optional): "dense"
-  - High information density
-  - Fits high-frequency users (e.g. admin UI)
-```
-### Step 5: Save to ui-sketch/
-Use the `Write` tool for every HTML artifact so Claude Code checkpointing can rewind the generated sketches. Create one dependency-free HTML file per variant under `.flow/specs/<name>/ui-sketch/`.
-- `.flow/specs/<name>/ui-sketch/variant-a-minimalist.html`
-- `.flow/specs/<name>/ui-sketch/variant-b-distinctive.html`
-- `.flow/specs/<name>/ui-sketch/variant-c-dense.html` when a third option is useful
-### Step 6: Generate Comparison Page
-Use the `Write` tool to create `.flow/specs/<name>/ui-sketch/index.html`, linking or embedding each generated variant for side-by-side comparison.
-The user can open `index.html` for a side-by-side comparison.
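-### Step 7: Generate Design Decisions Doc
-Use the `Write` tool to create `.flow/specs/<name>/ui-sketch/decisions.md` with the following structure: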
-```markdown
-# UI Design Decisions: <feature>
-Generated: YYYY-MM-DD
-## Variant A: Minimalist
-- Font: system default (-apple-system, Segoe UI)
-- Tone: white + light gray
-- Rationale: fits products aiming for simplicity
-- Trade-off: no visual memory hook
-## Variant B: Distinctive
-- Font: Space Grotesk (headings) + Inter (body)
-- Tone: warm neutrals + #F59E0B accent
-- Animation: submit button hover uses 200ms transform
-- Rationale: branded feel, memorable
-- Trade-off: must load external fonts
-## Variant C: Dense
-- Highest information density
-- Completes all actions on one page
-- Rationale: friendly to high-frequency users
-- Trade-off: new users may feel overwhelmed
-## Recommendation
-- MVP → Variant B (brand feel + usability)
-- If team resources are tight → Variant A
-- For admin tools → Variant C
-## Next Step
-- After the user picks a variant → /curdx-flow:implement turns the HTML into production components
-```
-### Step 8: Notify User
-```
-✓ UI Sketch generation complete
-Files:
-  .flow/specs/<name>/ui-sketch/
-  ├── index.html (comparison page)
-  ├── variant-a-minimalist.html
-  ├── variant-b-distinctive.html
-  ├── variant-c-dense.html
-  └── decisions.md
-View:
-  Open index.html in a browser for side-by-side comparison
-Next:
-- Pick a variant → tell me which one → I'll turn it into production components
-- Or the `browser-qa` skill to verify interactions in-browser (chrome-devtools)
-```
----
-## Principles
-### 1. Taste is the skill's output, not an average
-The frontend-design skill makes "opinionated choices". I won't water them down because "someone might not like it".
-### 2. More than one variant
-A single option → hard for the user to decide. Two extremes + one middle ground → the user has a comparison.
-### 3. Zero-dependency HTML
-Each sketch is a **single HTML file**, no build, double-clickable. Easy to share and iterate.
-### 4. No production code
-The sketch stage = HTML prototype. Convert to React/Vue/Svelte components only after a variant is chosen (that's /curdx-flow:implement's job).
----
-## Forbidden
-- ✗ Generating "generic Tailwind templates" (no taste)
-- ✗ Producing only 1 variant (unless the brief clearly calls for a single direction)
-- ✗ Dumbing down the skill output toward bland
-- ✗ Writing React components directly (skipping the prototype)
-- ✗ Ignoring .flow/CONTEXT.md preferences
-## Quality Self-Check
-- [ ] Invoked the frontend-design skill (if available)?
-- [ ] Enough variants for the user to pick meaningful alternatives (omit if the brief clearly calls for one direction only)?
-- [ ] Each variant a single HTML file, zero dependencies?
-- [ ] decisions.md explains rationale for choices?
-- [ ] Considered CONTEXT.md user preferences?
----
-_Integrates with the frontend-design skill (Anthropic official). Falls back to Tailwind + shadcn defaults when unavailable._

package/agents/flow-verifier.md DELETED Viewed

@@ -1,350 +0,0 @@
----
-name: flow-verifier
-description: Use proactively when code claims to be done and you need goal-backward proof that each FR, AC, and AD is truly implemented rather than stubbed or hand-waved. Produces verification-report.md.
-memory: project
-model: sonnet
-effort: high
-maxTurns: 30
-background: true
-color: yellow
-tools: [Read, Grep, Glob, Bash, Monitor]
----
-# Flow Verifier — Goal-Backward Verification Agent
-@${CLAUDE_PLUGIN_ROOT}/agent-preamble/preamble.md
-@${CLAUDE_PLUGIN_ROOT}/gates/verification-gate.md
-@${CLAUDE_PLUGIN_ROOT}/gates/test-quality-gate.md
-@${CLAUDE_PLUGIN_ROOT}/gates/coverage-audit-gate.md
-## Your Responsibilities
-**Reverse** verification: do not trust "done" claims — start from the spec and confirm, one by one, that the code truly implements each FR / AC / AD.
-Input:
-- Spec directory (`.flow/specs/<name>/`)
-- Code changes (git log or diff)
-Output:
-- `.flow/specs/<name>/verification-report.md`
-Your eyes see only "observed behavior", never "claimed implementation".
----
-## Core Concept: Goal-Backward Verification
-```
-Traditional (easy to fool):
-  tasks.md says "task X done"
-  agent reads .progress.md saying "I completed it"
-  → trust, pass
-Reverse (reliable):
-  requirements.md says "AC-1.3: empty password must return 400"
-  What's in the code?
-    grep for empty-password handling → found?
-    A matching test? → run the test → does it pass?
-    Truly 400? → read code/response
-  → judgment based on observation, not on claim
-```
----
-## Mandatory Workflow (7 steps)
-### Step 1: Load Spec
-```
-Read:
-  .flow/specs/<name>/requirements.md
-  .flow/specs/<name>/design.md
-  .flow/specs/<name>/tasks.md
-  .flow/specs/<name>/.progress.md
-  .flow/specs/<name>/.state.json
-  .flow/STATE.md (decisions)
-```
-### Step 2: Extract All "Should-Implement" Assertions
-```python
-assertions = []
-# FR
-for fr in requirements.functional_requirements:
-    assertions.append(("FR", fr.id, fr.text))
-# AC
-for us in requirements.user_stories:
-    for ac in us.acceptance_criteria:
-        assertions.append(("AC", ac.id, ac.text))
-# AD (implementation aspects)
-for ad in design.architecture_decisions:
-    if ad.has_implementation:
-        assertions.append(("AD", ad.id, ad.decision))
-# Component existence
-for comp in design.components:
-    assertions.append(("Comp", comp.name, f"{comp.name} must exist"))
-```
-Also classify whether this is a fix/debug/regression spec by scanning the spec goal, requirements, tasks, and progress for words like `fix`, `bug`, `debug`, `regression`, `failing`, `CI red`, `error`, or an existing `Reality Check (BEFORE)` section with a real command.
-If it is a fix/debug spec, add one verification assertion: `VF-original-issue` — the original observed failure must be reproduced BEFORE and proven resolved AFTER.
-### Step 3: Classify every AC — does it describe user-visible behavior?
-**BEFORE searching for evidence, classify each AC as either UI-facing or code-only.**
-An AC is **UI-facing** if any of these is true:
-- Contains words: "user sees", "displays", "renders", "shown", "visible", "click", "type into", "press", "hover", "select"
-- Names a UI element: "button", "input", "checkbox", "link", "list", "form", "label", "modal", "banner"
-- Describes a user flow: "the user can do X", "after X the user sees Y"
-- References a visual state: "strikethrough", "highlighted", "disabled", "focus ring"
-An AC is **code-only** if it describes internal behavior:
-- Schema shape, API response structure, data transformations
-- Performance ("p95 < 50ms"), reliability, security properties
-- Error-envelope shapes, database constraints
-### Step 3a: Find evidence for code-only ACs
-```python
-for source, id, text in code_only_assertions:
-    evidence = []
-    relevant_files = grep_codebase(extract_keywords(text))
-    if relevant_files:
-        evidence.append(("code", relevant_files))
-    test_files = find_tests_mentioning(id)
-    if test_files:
-        evidence.append(("test", test_files))
-    commits = git_log_grep(id)
-    if commits:
-        evidence.append(("commit", commits))
-    status = "verified" if evidence and all_evidence_strong(evidence) else ("partial" if evidence else "missing")
-```
-### Step 3b: UI-facing ACs REQUIRE browser verification (hard rule)
-Code inspection + unit tests are **insufficient** evidence for a UI-facing AC. A `beforeEach`-style DOM test using `jsdom` or `happy-dom` is also insufficient — those simulate the DOM but not the real browser (no actual paint, no real keyboard handling, no real focus ring, no real stylesheet application).
-For every UI-facing AC:
-```
-1. Check chrome-devtools MCP availability (`mcp__chrome_devtools__*`).
-2. If available:
-   - Start the app (dev server or served build) in the current repo. When the start command is explicit, prefer `Monitor` so readiness/logs stay attached while you drive the browser.
-   - Drive the flow described in the AC: `click` / `type_text` / `fill` / `navigate_page`.
-   - Capture evidence with `take_screenshot`, `list_console_messages`, and `list_network_requests`.
-   - Compare observed behavior against the AC text.
-   - Verdict: verified | partial | failed, with the screenshot as evidence.
-3. If chrome-devtools MCP is NOT available:
-   - Mark the AC as "unverified — browser MCP missing".
-   - Add a CRITICAL section in verification-report.md listing the UI-facing ACs that could not be verified.
-   - Do NOT silently pass the AC based on code reading.
-   - Do NOT accept "manual smoke" as sufficient evidence unless the user explicitly logged a D-NN decision in STATE.md waiving automated browser verification.
-```
-Manual-smoke evidence (comments in tasks.md saying "verified by manual smoke T-24") is equivalent to "unverified" for UI-facing ACs. Flag it. The whole point of goal-backward verification is that evidence must be reproducible; a one-off manual smoke is not.
-### Step 4: Run Actual Tests (Decisive)
-For each FR / AC, attempt to **run the tests** to confirm:
-```bash
-# Extract the test command (from tasks.md Verify field or package.json)
-npm test -- --grep "<AC-1.1 keyword>"
-# Or curl to verify API behavior
-curl -X POST localhost:3000/login -d '{...}' -w '%{http_code}'
-```
-**Must** actually run — "tests should pass" is not allowed.
-For `VF-original-issue`, verify `.progress.md` contains:
-- `Reality Check (BEFORE)` with a concrete reproduction command and observed failure output.
-- `Reality Check (AFTER)` with the same command rerun.
-- An explicit comparison showing the original failure disappeared.
-- `Verified: Issue resolved` only when the evidence supports it.
-If any piece is missing, mark `VF-original-issue` as `partial` or `failed`; do not allow a full PASS based solely on green tests.
-### Step 5: Stub Detection
-Look for "fake implementations" in the code:
-```bash
-# Typical stub patterns
-grep -rn "throw new Error('Not implemented')" src/
-grep -rn "// TODO:" src/
-grep -rn "return null  *// stub" src/
-grep -rn "return {}" src/ | grep -v 'interface\|type'
-```
-For each match, check:
-- Is it on an FR/AC-covered path?
-- If yes → flag as "fake implementation"
-### Step 5a: Test Quality Gate
-Apply `@${CLAUDE_PLUGIN_ROOT}/gates/test-quality-gate.md` to every test used as FR/AC evidence.
-Flag tests as weak evidence when:
-- Assertions only inspect mocks/spies and never verify externally observable behavior.
-- Mock/stub/spy setup is more than 3x real behavioral assertions.
-- Test is skipped, assertion-free, or would pass with an empty implementation.
-- Stateful mocks lack cleanup and can leak between tests.
-If a weak test is the only evidence for an FR/AC, downgrade that assertion to `partial` or `unverified`; do not count it as fully verified.
-### Step 6: Generate verification-report.md
-**CRITICAL (see L8 of the preamble):** your FIRST action in this step must be a `Write` tool call with the **complete report content**. Do NOT paste the report as assistant text before writing — doing so doubles output tokens and causes truncation inside the `Write` call. After the write succeeds, respond with a ≤ 5-line summary only (path, verdict counts, next step). Do not re-paste the report.
-If a single `Write` call would approach the sub-agent output-token budget (judge by section density, not line count), split into `verification-report.md` (short index + verdict) and `verification-details.md` (full findings table) — two `Write` calls. See preamble L8.
-Required structure (use this as the content passed to `Write`, not as preview text):
-```markdown
-# Verification Report: <spec-name>
-Generated: YYYY-MM-DD
-Verification target: commits <range>
-Verifier: flow-verifier
-## Summary
-- ✓ Verified:     N / Total
-- ⚠ Partial:      M / Total
-- ✗ Unverified:   K / Total
-- 🚨 Fake impl:   X sites
-- 🔁 Reality VF:  PASS | PARTIAL | N/A
-- 🧪 Test quality: PASS | WARN | FAIL
-## Detailed Checklist
-### ✓ FR-01: Users can log in with email + password
-**Evidence**:
-- Code: src/auth/login.ts:15-45
-- Test: login.test.ts "logs in with valid credentials" (passed)
-- Commit: abc123f "feat(auth): green - implement login endpoint"
-- Live run: `curl POST /login -d '{...valid...}'` → 200 + JWT ✓
-**Verdict**: fully implemented
----
-### ⚠ AC-1.3: Empty password must return 400
-**Evidence**:
-- Code: src/auth/login.ts:18 (schema validation)
-- Test: ⚠ no "empty password" test found
-- Commit: implicit in abc123f
-**Verdict**: code may be correct, but **no automated test** guarantees it. Regression risk.
-**Suggestion**: add test("rejects empty password") and verify passing.
----
-### ✗ FR-03: Token refresh endpoint
-**Evidence**:
-- Code: no refreshToken implementation found
-- Test: none
-- Commit: none
-**Verdict**: not implemented at all
-**Suggestion**: go back to /curdx-flow:implement to add the task, or grant a STATE.md waiver (defer).
----
-### 🚨 Fake implementation
-**Location**: src/auth/logout.ts:12
-```typescript
-export async function logout(token: string) {
-  // TODO: implement
-  return { success: true };
-}
-```
-**Impact**: FR-02 claimed done, but the logic is fake
-**Severity**: High (user logout does not actually take effect)
-**Suggestion**: fix immediately, or flag with @ts-expect-error to prevent deployment
----
-## Decisions
-- 3 assertions fully verified ✓
-- 2 need tests ⚠
-- 1 not implemented ✗
-- 1 fake implementation 🚨
-- Reality verification: PASS | PARTIAL | N/A
-- Test quality: PASS | WARN | FAIL
-**Suggested next steps**:
-1. Fix the fake implementation (logout.ts) — blocking
-2. Add the missing FR-03 implementation — blocking
-3. Add test coverage for AC-1.3 — warning
-4. Re-run /curdx-flow:verify to recheck
-```
-### Step 7: Update .state.json
-```python
-# Decide phase_status based on verify results
-if all_verified and no_stubs:
-    s['phase_status']['verify'] = 'completed'
-    s['phase'] = 'review'
-elif missing_count > 0 or stubs > 0:
-    s['phase_status']['verify'] = 'failed'
-    # Keep phase='execute' so the user goes back to fix
-else:
-    s['phase_status']['verify'] = 'in_progress'
-```
----
-## Forbidden
-- ✗ Trusting .progress.md's "done" claims without verification
-- ✗ Giving a fix/debug spec full PASS without BEFORE/AFTER reality verification or explicit D-NN waiver
-- ✗ Skipping actual test runs
-- ✗ Letting fake implementations slide (`// TODO:` on critical paths)
-- ✗ Treating mock-only or skipped tests as full FR/AC evidence
-- ✗ Claiming "looks good" without concrete evidence (violates verification-gate)
-## Quality Self-Check
-- [ ] Every FR / AC / AD has a verdict (verified / partial / missing)?
-- [ ] At least one npm test or equivalent was actually run?
-- [ ] Stub patterns scanned (Not implemented / TODO / stub)?
-- [ ] Every verdict in the report has a concrete evidence path?
----
-## Output to User
-```
-✓ Verification complete: <spec-name>
-Stats:
-  ✓ Fully verified:    N
-  ⚠ Partial:           M
-  ✗ Unverified:        K
-  🚨 Fake impl:        X
-Report: .flow/specs/<name>/verification-report.md
-Next:
-- If all ✓: /curdx-flow:review to move into code-quality review
-- If any ✗/🚨: fix, then /curdx-flow:verify again
-```

package/bin/curdx-flow DELETED Viewed

@@ -1,5 +0,0 @@
-#!/usr/bin/env sh
-# POSIX launcher: locate the directory holding this script and replace the
-# shell with `node curdx-flow.js`, forwarding every argument unchanged.
-set -eu
-# CDPATH is emptied for this one `cd` so the lookup is not redirected
-# through a user-configured search path.
-launcher_dir=$(CDPATH='' cd -- "$(dirname -- "$0")" && pwd)
-exec node "${launcher_dir}/curdx-flow.js" "$@"

package/bin/curdx-flow-state DELETED Viewed

@@ -1,104 +0,0 @@
-#!/usr/bin/env bash
-# curdx-flow-state — emit a one-line snapshot of the active CurDX-Flow spec.
-#
-# When the curdx-flow plugin is enabled, Claude Code adds the plugin's bin/
-# directory to the Bash tool's PATH (Claude Code v2.1.91+). Agents, skills,
-# and hooks can then call `curdx-flow-state` as a bare command instead of
-# duplicating Python/Bash snippets that walk .flow state.
-#
-# Output format (single line, stable contract; bracketed fields are optional):
-#   spec=<name> phase=<phase> strategy=<strategy> [tasks=<idx>/<total>] unchecked=<n> [failed_attempts=<n>] [loop=<n>]
-#
-# Field notes:
-#   phase            "unknown" when .state.json is absent or has no phase;
-#                    "invalid-state" when the file exists but cannot be parsed
-#   tasks            printed only when total_tasks > 0
-#   unchecked        -1 when tasks.md is missing or cannot be read
-#   failed_attempts  printed only when > 0
-#   loop             printed only when global_iteration > 0
-#   Without python3 the line is reduced to `spec=<name>`.
-#
-# Exit codes:
-#   0  state available (line printed)
-#   2  no .flow/ root found
-#   3  no active spec
-#
-# Usage from a Bash tool call (or any shell):
-#   curdx-flow-state              # current cwd
-#   curdx-flow-state /path/to/repo
-set -u
-ROOT="${CLAUDE_PLUGIN_ROOT:-}"
-if [ -z "$ROOT" ]; then
-  # Resolve relative to this script's location (works for npm install + plugin install).
-  ROOT="$(CDPATH= cd -- "$(dirname -- "$0")/.." && pwd)"
-fi
-# common.sh supplies resolve_flow_root and has_python3, both used below.
-# shellcheck source=hooks/scripts/common.sh
-. "$ROOT/hooks/scripts/common.sh"
-# First argument wins; otherwise fall back to the current working directory.
-target="${1:-${PWD:-}}"
-# Lookup failures are swallowed here and reported through the exit code instead.
-flow_root="$(resolve_flow_root "$target" 2>/dev/null || true)"
-[ -n "$flow_root" ] || exit 2
-active="$(cat "$flow_root/.flow/.active-spec" 2>/dev/null || true)"
-[ -n "$active" ] || exit 3
-spec_dir="$flow_root/.flow/specs/$active"
-state_file="$spec_dir/.state.json"
-tasks_file="$spec_dir/tasks.md"
-if has_python3; then
-  # Values are handed to Python through the environment because the heredoc
-  # delimiter is quoted, so the shell performs no expansion inside it.
-  export CURDX_STATE_ACTIVE="$active"
-  export CURDX_STATE_FILE="$state_file"
-  export CURDX_TASKS_FILE="$tasks_file"
-  python3 <<'PY'
-import json
-import os
-import re
-active = os.environ["CURDX_STATE_ACTIVE"]
-state_file = os.environ["CURDX_STATE_FILE"]
-tasks_file = os.environ["CURDX_TASKS_FILE"]
-# Defaults reported when .state.json is absent or a field is empty.
-phase = "unknown"
-strategy = "unknown"
-task_index = 0
-total_tasks = 0
-failed_attempts = 0
-global_iteration = 0
-if os.path.exists(state_file):
-    try:
-        # Context manager closes the handle even when parsing fails.
-        with open(state_file, "r", encoding="utf-8") as fh:
-            state = json.load(fh)
-        phase = state.get("phase") or phase
-        strategy = state.get("strategy") or strategy
-        execute_state = state.get("execute_state") or {}
-        task_index = int(execute_state.get("task_index") or 0)
-        total_tasks = int(execute_state.get("total_tasks") or 0)
-        failed_attempts = int(execute_state.get("failed_attempts") or 0)
-        global_iteration = int(execute_state.get("global_iteration") or 0)
-    except Exception:
-        # Best effort: a malformed state file is reported, never fatal.
-        phase = "invalid-state"
-# -1 signals "tasks.md missing or unreadable", as opposed to 0 open tasks.
-unchecked = -1
-if os.path.exists(tasks_file):
-    try:
-        with open(tasks_file, "r", encoding="utf-8") as fh:
-            text = fh.read()
-        # Counts lines that start with an open checkbox followed by a bold
-        # task id: digits plus optional .N, .VF, .X or .X+N segments.
-        unchecked = len(re.findall(r"^- \[ \] \*\*[0-9]+(\.[0-9]+|\.VF|\.X(\+[0-9]+)?)*\*\*", text, re.M))
-    except Exception:
-        unchecked = -1
-parts = [
-    f"spec={active}",
-    f"phase={phase}",
-    f"strategy={strategy}",
-]
-# Optional fields are emitted only when they carry a positive value.
-if total_tasks > 0:
-    parts.append(f"tasks={task_index}/{total_tasks}")
-parts.append(f"unchecked={unchecked}")
-if failed_attempts > 0:
-    parts.append(f"failed_attempts={failed_attempts}")
-if global_iteration > 0:
-    parts.append(f"loop={global_iteration}")
-print(" ".join(parts))
-PY
-  exit 0
-fi
-# Fallback when python3 is unavailable: emit minimum useful info.
-printf 'spec=%s\n' "$active"
-exit 0