npm - @mainahq/core - Versions diffs - 0.2.0 - Mend

@mainahq/core 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (156) hide show

package/README.md +31 -0
package/package.json +37 -0
package/src/ai/__tests__/ai.test.ts +207 -0
package/src/ai/__tests__/design-approaches.test.ts +192 -0
package/src/ai/__tests__/spec-questions.test.ts +191 -0
package/src/ai/__tests__/tiers.test.ts +110 -0
package/src/ai/commit-msg.ts +28 -0
package/src/ai/design-approaches.ts +76 -0
package/src/ai/index.ts +205 -0
package/src/ai/pr-summary.ts +60 -0
package/src/ai/spec-questions.ts +74 -0
package/src/ai/tiers.ts +52 -0
package/src/ai/try-generate.ts +89 -0
package/src/ai/validate.ts +66 -0
package/src/benchmark/__tests__/reporter.test.ts +525 -0
package/src/benchmark/__tests__/runner.test.ts +113 -0
package/src/benchmark/__tests__/story-loader.test.ts +152 -0
package/src/benchmark/reporter.ts +332 -0
package/src/benchmark/runner.ts +91 -0
package/src/benchmark/story-loader.ts +88 -0
package/src/benchmark/types.ts +95 -0
package/src/cache/__tests__/keys.test.ts +97 -0
package/src/cache/__tests__/manager.test.ts +312 -0
package/src/cache/__tests__/ttl.test.ts +94 -0
package/src/cache/keys.ts +44 -0
package/src/cache/manager.ts +231 -0
package/src/cache/ttl.ts +77 -0
package/src/config/__tests__/config.test.ts +376 -0
package/src/config/index.ts +198 -0
package/src/context/__tests__/budget.test.ts +179 -0
package/src/context/__tests__/engine.test.ts +163 -0
package/src/context/__tests__/episodic.test.ts +291 -0
package/src/context/__tests__/relevance.test.ts +323 -0
package/src/context/__tests__/retrieval.test.ts +143 -0
package/src/context/__tests__/selector.test.ts +174 -0
package/src/context/__tests__/semantic.test.ts +252 -0
package/src/context/__tests__/treesitter.test.ts +229 -0
package/src/context/__tests__/working.test.ts +236 -0
package/src/context/budget.ts +130 -0
package/src/context/engine.ts +394 -0
package/src/context/episodic.ts +251 -0
package/src/context/relevance.ts +325 -0
package/src/context/retrieval.ts +325 -0
package/src/context/selector.ts +93 -0
package/src/context/semantic.ts +331 -0
package/src/context/treesitter.ts +216 -0
package/src/context/working.ts +192 -0
package/src/db/__tests__/db.test.ts +151 -0
package/src/db/index.ts +211 -0
package/src/db/schema.ts +84 -0
package/src/design/__tests__/design.test.ts +310 -0
package/src/design/__tests__/generate-hld-lld.test.ts +109 -0
package/src/design/__tests__/review.test.ts +561 -0
package/src/design/index.ts +297 -0
package/src/design/review.ts +327 -0
package/src/explain/__tests__/explain.test.ts +173 -0
package/src/explain/index.ts +181 -0
package/src/features/__tests__/analyzer.test.ts +358 -0
package/src/features/__tests__/checklist.test.ts +454 -0
package/src/features/__tests__/numbering.test.ts +319 -0
package/src/features/__tests__/quality.test.ts +295 -0
package/src/features/__tests__/traceability.test.ts +147 -0
package/src/features/analyzer.ts +445 -0
package/src/features/checklist.ts +366 -0
package/src/features/index.ts +18 -0
package/src/features/numbering.ts +404 -0
package/src/features/quality.ts +349 -0
package/src/features/test-stubs.ts +157 -0
package/src/features/traceability.ts +260 -0
package/src/feedback/__tests__/async-feedback.test.ts +52 -0
package/src/feedback/__tests__/collector.test.ts +219 -0
package/src/feedback/__tests__/compress.test.ts +150 -0
package/src/feedback/__tests__/preferences.test.ts +169 -0
package/src/feedback/collector.ts +135 -0
package/src/feedback/compress.ts +92 -0
package/src/feedback/preferences.ts +108 -0
package/src/git/__tests__/git.test.ts +62 -0
package/src/git/index.ts +110 -0
package/src/hooks/__tests__/runner.test.ts +266 -0
package/src/hooks/index.ts +8 -0
package/src/hooks/runner.ts +130 -0
package/src/index.ts +356 -0
package/src/init/__tests__/init.test.ts +228 -0
package/src/init/index.ts +364 -0
package/src/language/__tests__/detect.test.ts +77 -0
package/src/language/__tests__/profile.test.ts +51 -0
package/src/language/detect.ts +70 -0
package/src/language/profile.ts +110 -0
package/src/prompts/__tests__/defaults.test.ts +52 -0
package/src/prompts/__tests__/engine.test.ts +183 -0
package/src/prompts/__tests__/evolution-resolve.test.ts +169 -0
package/src/prompts/__tests__/evolution.test.ts +187 -0
package/src/prompts/__tests__/loader.test.ts +105 -0
package/src/prompts/candidates/review-v2.md +55 -0
package/src/prompts/defaults/ai-review.md +49 -0
package/src/prompts/defaults/commit.md +30 -0
package/src/prompts/defaults/context.md +26 -0
package/src/prompts/defaults/design-approaches.md +57 -0
package/src/prompts/defaults/design-hld-lld.md +55 -0
package/src/prompts/defaults/design.md +53 -0
package/src/prompts/defaults/explain.md +31 -0
package/src/prompts/defaults/fix.md +32 -0
package/src/prompts/defaults/index.ts +38 -0
package/src/prompts/defaults/review.md +41 -0
package/src/prompts/defaults/spec-questions.md +59 -0
package/src/prompts/defaults/tests.md +72 -0
package/src/prompts/engine.ts +137 -0
package/src/prompts/evolution.ts +409 -0
package/src/prompts/loader.ts +71 -0
package/src/review/__tests__/review.test.ts +288 -0
package/src/review/comprehensive.ts +362 -0
package/src/review/index.ts +417 -0
package/src/stats/__tests__/tracker.test.ts +323 -0
package/src/stats/index.ts +11 -0
package/src/stats/tracker.ts +492 -0
package/src/ticket/__tests__/ticket.test.ts +273 -0
package/src/ticket/index.ts +185 -0
package/src/utils.ts +87 -0
package/src/verify/__tests__/ai-review.test.ts +242 -0
package/src/verify/__tests__/coverage.test.ts +83 -0
package/src/verify/__tests__/detect.test.ts +175 -0
package/src/verify/__tests__/diff-filter.test.ts +338 -0
package/src/verify/__tests__/fix.test.ts +478 -0
package/src/verify/__tests__/linters/clippy.test.ts +45 -0
package/src/verify/__tests__/linters/go-vet.test.ts +27 -0
package/src/verify/__tests__/linters/ruff.test.ts +64 -0
package/src/verify/__tests__/mutation.test.ts +141 -0
package/src/verify/__tests__/pipeline.test.ts +553 -0
package/src/verify/__tests__/proof.test.ts +97 -0
package/src/verify/__tests__/secretlint.test.ts +190 -0
package/src/verify/__tests__/semgrep.test.ts +217 -0
package/src/verify/__tests__/slop.test.ts +366 -0
package/src/verify/__tests__/sonar.test.ts +113 -0
package/src/verify/__tests__/syntax-guard.test.ts +227 -0
package/src/verify/__tests__/trivy.test.ts +191 -0
package/src/verify/__tests__/visual.test.ts +139 -0
package/src/verify/ai-review.ts +276 -0
package/src/verify/coverage.ts +134 -0
package/src/verify/detect.ts +171 -0
package/src/verify/diff-filter.ts +183 -0
package/src/verify/fix.ts +317 -0
package/src/verify/linters/clippy.ts +52 -0
package/src/verify/linters/go-vet.ts +32 -0
package/src/verify/linters/ruff.ts +47 -0
package/src/verify/mutation.ts +143 -0
package/src/verify/pipeline.ts +328 -0
package/src/verify/proof.ts +277 -0
package/src/verify/secretlint.ts +168 -0
package/src/verify/semgrep.ts +170 -0
package/src/verify/slop.ts +493 -0
package/src/verify/sonar.ts +146 -0
package/src/verify/syntax-guard.ts +251 -0
package/src/verify/trivy.ts +161 -0
package/src/verify/visual.ts +460 -0
package/src/workflow/__tests__/context.test.ts +110 -0
package/src/workflow/context.ts +81 -0

package/src/prompts/candidates/review-v2.md ADDED Viewed

@@ -0,0 +1,55 @@
+You are reviewing code changes in a {{language}} codebase.
+## Constitution (non-negotiable)
+{{constitution}}
+## Team conventions
+{{conventions}}
+## Instructions
+Review ONLY the added/modified lines (lines starting with '+').
+### Priority 1 — Correctness
+1. Security vulnerabilities (injection, XSS, auth bypass)
+2. Business logic errors (wrong conditions, missing edge cases)
+3. Missing error handling (unhandled promises, uncaught exceptions)
+4. Violations of constitution or team conventions
+### Priority 2 — Integration
+5. Hardcoded paths or environment-specific values (must use process.cwd(), env vars, or config)
+6. Framework conventions violated (e.g., Astro BASE_URL needs trailing slash, Starlight slug resolution)
+7. CSS cascade/specificity issues (especially with third-party themes — check if overrides actually win)
+8. Accessibility: color contrast ratios below WCAG AA (4.5:1 for normal text, 3:1 for large text)
+### Priority 3 — Consistency
+9. Dark mode: if light mode styles exist, dark mode must also be handled
+10. Links: verify all internal hrefs resolve to actual pages (no 404s)
+11. Assets: verify all src/href paths include correct base URL prefix
+Do NOT comment on:
+- Style issues (handled by Biome)
+- Naming conventions (handled by linter)
+- Minor refactoring suggestions
+- Lock files (bun.lock, package-lock.json)
+If anything is ambiguous, use [NEEDS CLARIFICATION: specific question] instead of guessing.
+For each issue found, respond in this exact format:
+```yaml
+issues:
+  - file: "path/to/file.ts"
+    line: 42
+    severity: "critical|major|minor"
+    issue: "Brief description"
+    suggestion: "How to fix it"
+```
+If no issues found:
+```yaml
+issues: []
+summary: "No issues found."
+```
+## Diff to review
+{{diff}}

package/src/prompts/defaults/ai-review.md ADDED Viewed

@@ -0,0 +1,49 @@
+You are reviewing code changes for semantic issues that static analysis cannot catch.
+## Constitution (non-negotiable)
+{{constitution}}
+## Review Mode
+{{reviewMode}}
+## Instructions
+Analyze the diff and referenced function bodies below. Report ONLY issues that are:
+1. Cross-function consistency violations (caller passes wrong args, mismatched types, wrong order)
+2. Missing edge cases (null/undefined not handled, empty arrays, boundary values)
+3. Dead branches (conditions that can never be true given the data flow)
+4. API contract violations (return type doesn't match declared interface, missing required fields)
+{{#if specContext}}
+Also check:
+5. Spec compliance — does the implementation match the requirements in the spec?
+6. Architecture — does the structure follow the design described in the plan?
+7. Test coverage gaps — are there untested paths in the changed code?
+{{/if}}
+Severity rules:
+- mechanical mode: ALL findings are "warning" severity (never "error")
+- deep mode: findings may be "warning" or "error"
+Respond in this exact JSON format (no markdown fences, no extra text):
+{"findings":[{"file":"path","line":42,"message":"description","severity":"warning","ruleId":"ai-review/cross-function"}]}
+Valid ruleIds: ai-review/cross-function, ai-review/edge-case, ai-review/dead-code, ai-review/contract, ai-review/spec-compliance, ai-review/architecture, ai-review/coverage-gap
+If no issues found: {"findings":[]}
+## Diff
+{{diff}}
+## Referenced Functions
+{{referencedFunctions}}
+{{#if specContext}}
+## Spec
+{{specContext}}
+{{/if}}
+{{#if planContext}}
+## Plan
+{{planContext}}
+{{/if}}

package/src/prompts/defaults/commit.md ADDED Viewed

@@ -0,0 +1,30 @@
+You are generating a conventional commit message from staged changes.
+## Constitution (non-negotiable)
+{{constitution}}
+## Team conventions
+{{conventions}}
+## Instructions
+Analyze the diff below and produce a single conventional commit message.
+Rules:
+- Format: `<type>(<scope>): <short description>`
+- Types: feat, fix, refactor, test, docs, chore, ci, perf
+- Scope: the package or module affected (e.g. core, cli, cache, prompts)
+- Subject line: imperative mood, max 72 characters, no period at end
+- Body (optional): explain WHY, not WHAT — include if the change is non-obvious
+- Footer (optional): reference issues with `Closes #123` or `Refs #456`
+Do NOT:
+- Generate multiple commits for one diff
+- Use vague messages like "fix stuff" or "updates"
+- Include style-only changes as feat or fix
+If the intent of the change is ambiguous, use [NEEDS CLARIFICATION: what is the business purpose of this change?] before generating.
+Otherwise, respond with ONLY the commit message, no explanation.
+## Diff to commit
+{{diff}}

package/src/prompts/defaults/context.md ADDED Viewed

@@ -0,0 +1,26 @@
+You are generating a focused context summary for an AI coding session.
+## Constitution (non-negotiable)
+{{constitution}}
+## Instructions
+Given the raw context below (files, git log, recent changes), produce a concise summary that helps an AI assistant understand the current state of the codebase.
+Output structure:
+1. **Current task** — what is being worked on right now?
+2. **Relevant files** — list the files most relevant to the task with one-line descriptions
+3. **Recent changes** — summary of recent commits and what changed
+4. **Dependencies** — key external dependencies and their versions relevant to the task
+5. **Known issues** — open TODOs, failing tests, or known blockers
+Rules:
+- Keep the total output under {{budget}} tokens
+- Prioritize information that changes frequently (recent commits, open issues) over stable facts
+- Omit boilerplate files (lock files, generated code, config files) unless they are the focus
+- Use bullet points, not prose paragraphs
+- Include file paths relative to the repo root
+If the task context is missing or ambiguous, use [NEEDS CLARIFICATION: what is the current task or goal?] before summarizing.
+## Raw context
+{{raw_context}}

package/src/prompts/defaults/design-approaches.md ADDED Viewed

@@ -0,0 +1,57 @@
+You are proposing architectural approaches for a design decision, with tradeoffs and a recommendation.
+## Constitution (non-negotiable)
+{{constitution}}
+## Team conventions
+{{conventions}}
+## Instructions
+Given the design context below, propose 2-3 distinct approaches to the architectural decision.
+For each approach, provide:
+1. **Name** — a short descriptive label (2-4 words)
+2. **Description** — how this approach works (2-3 sentences)
+3. **Pros** — concrete advantages (2-3 bullet points)
+4. **Cons** — concrete disadvantages (2-3 bullet points)
+5. **Recommendation** — boolean, true for exactly one approach and false for the others
+Rules:
+- Approaches must be genuinely different, not minor variations
+- Pros and cons must be specific to this decision, not generic
+- Exactly one approach should be recommended with reasoning
+- Consider: complexity, performance, maintainability, alignment with existing architecture
+- If the context is too vague to propose meaningful approaches, return an empty array
+Output format: valid JSON array. Each approach object has:
+- `name` (string): short label
+- `description` (string): how it works
+- `pros` (string[]): advantages
+- `cons` (string[]): disadvantages
+- `recommended` (boolean): true for the recommended approach
+Example:
+```json
+[
+  {
+    "name": "Event-driven pipeline",
+    "description": "Each verification step emits events consumed by the next. Steps run independently and communicate through an event bus.",
+    "pros": ["Easy to add new steps", "Steps can run in parallel", "Clear separation of concerns"],
+    "cons": ["Harder to debug event flow", "Event ordering complexity", "More infrastructure code"],
+    "recommended": true
+  },
+  {
+    "name": "Sequential middleware chain",
+    "description": "Steps are chained as middleware functions. Each step receives input, processes it, and passes to the next.",
+    "pros": ["Simple mental model", "Easy to debug", "Familiar pattern"],
+    "cons": ["Cannot parallelize", "Adding steps requires chain modification", "Tight coupling"],
+    "recommended": false
+  }
+]
+```
+Output ONLY the JSON array, no surrounding text or markdown fences.
+## Design context
+{{context}}

package/src/prompts/defaults/design-hld-lld.md ADDED Viewed

@@ -0,0 +1,55 @@
+You are generating High-Level Design (HLD) and Low-Level Design (LLD) sections for an Architecture Decision Record.
+## Constitution (non-negotiable)
+{{constitution}}
+## Instructions
+Given the spec below, generate HLD and LLD sections in markdown. Use concrete details from the spec — never invent requirements.
+For any section where the spec does not provide enough information, write `[NEEDS CLARIFICATION]` instead of guessing.
+Output ONLY the markdown sections below (no preamble, no fences):
+## High-Level Design
+### System Overview
+(2-3 sentences describing what this change does at a system level)
+### Component Boundaries
+(List each component/module affected and its responsibility)
+### Data Flow
+(Describe how data moves through the components)
+### External Dependencies
+(List any new dependencies, APIs, or services)
+## Low-Level Design
+### Interfaces & Types
+(TypeScript interfaces and types to be created or modified)
+### Function Signatures
+(Key function signatures with parameter and return types)
+### DB Schema Changes
+(Any database table or column changes, or "None")
+### Sequence of Operations
+(Step-by-step order of operations for the main flow)
+### Error Handling
+(How errors are handled at each step)
+### Edge Cases
+(Known edge cases and how they are addressed)
+## Spec
+{{spec}}
+## Project Conventions
+{{conventions}}
+{{#if context}}
+## Codebase Context
+{{context}}
+{{/if}}

package/src/prompts/defaults/design.md ADDED Viewed

@@ -0,0 +1,53 @@
+You are scaffolding an Architecture Decision Record (ADR) for a technical decision.
+## Constitution (non-negotiable)
+{{constitution}}
+## Team conventions
+{{conventions}}
+## Instructions
+Generate a complete ADR markdown document based on the context below.
+ADR structure (follow exactly):
+```markdown
+# ADR-{{number}}: {{title}}
+**Date:** {{date}}
+**Status:** Proposed | Accepted | Deprecated | Superseded
+## Context
+What is the situation that forces us to make this decision?
+## Decision
+What have we decided to do?
+## Consequences
+### Positive
+- ...
+### Negative
+- ...
+### Risks
+- ...
+## Alternatives considered
+| Option | Pros | Cons | Rejected because |
+|--------|------|------|-----------------|
+| ...    | ...  | ...  | ...             |
+## References
+- Links to relevant code, docs, or prior decisions
+```
+Rules:
+- Be specific and concrete — avoid generic statements
+- State consequences honestly, including negative ones
+- Alternatives must be real options that were actually considered
+- The decision section must be unambiguous
+If the decision context is incomplete, use [NEEDS CLARIFICATION: what constraints drove this decision?] before generating.
+## Design context
+{{context}}

package/src/prompts/defaults/explain.md ADDED Viewed

@@ -0,0 +1,31 @@
+You are explaining code to a developer unfamiliar with this module.
+## Constitution (non-negotiable)
+{{constitution}}
+## Instructions
+Explain the code below clearly and concisely. Include a Mermaid diagram where it helps understanding.
+Structure your explanation as:
+1. **Purpose** — what problem does this code solve?
+2. **How it works** — step-by-step walkthrough of the key logic
+3. **Diagram** — a Mermaid flowchart or sequence diagram showing the main flow
+4. **Key decisions** — why important design choices were made (if apparent from the code)
+5. **Gotchas** — non-obvious behaviors, edge cases, or known limitations
+Rules:
+- Write for a senior developer who is new to this codebase
+- Be precise — use actual function/variable names from the code
+- Keep the diagram to the essential flow (5–15 nodes)
+- Do NOT suggest refactoring unless asked
+If the purpose of the code is unclear, use [NEEDS CLARIFICATION: what is the intended behavior of this module?] before explaining.
+Mermaid diagram format:
+```mermaid
+flowchart TD
+    A[Entry point] --> B[Step]
+```
+## Code to explain
+{{code}}

package/src/prompts/defaults/fix.md ADDED Viewed

@@ -0,0 +1,32 @@
+You are generating code fixes for linter errors and security findings.
+## Constitution (non-negotiable)
+{{constitution}}
+## Team conventions
+{{conventions}}
+## Instructions
+Given the findings below, generate the minimal code changes needed to resolve each issue.
+Rules:
+- Fix ONLY what is reported — do not refactor unrelated code
+- Preserve the original logic unless the logic itself is the bug
+- For security findings: prefer safe APIs over disabling rules
+- For linter errors: apply the fix the linter suggests unless it conflicts with the constitution
+- Show each fix as a unified diff or a before/after code block
+- One fix per finding — do not combine unrelated fixes
+Priority order:
+1. Critical security vulnerabilities (fix immediately)
+2. Runtime errors and crashes
+3. Type errors and undefined behavior
+4. Linter warnings
+If a finding is a false positive or requires design changes beyond a line fix, do not generate a fix for it; instead use [NEEDS CLARIFICATION: this finding may be a false positive or may require architectural changes — confirm the intended approach].
+## Findings to fix
+{{findings}}
+## Relevant source
+{{source}}

package/src/prompts/defaults/index.ts ADDED Viewed

@@ -0,0 +1,38 @@
+import { join } from "node:path";
+/**
+ * Names of the prompt tasks that `loadDefault` accepts.
+ *
+ * `loadDefault` turns each name into a file name by appending `.md`
+ * (for example `"ai-review"` becomes `ai-review.md`) and looks for that
+ * file in the directory containing this module.
+ */
+export type PromptTask =
+	| "review"
+	| "commit"
+	| "tests"
+	| "fix"
+	| "explain"
+	| "design"
+	| "context"
+	| "spec-questions"
+	| "design-approaches"
+	| "ai-review"
+	| "design-hld-lld";
+/**
+ * Generic prompt template that `loadDefault` returns when the task's `.md`
+ * file cannot be read.
+ *
+ * The text contains the placeholders `{{task}}`, `{{constitution}}` and
+ * `{{input}}`. Nothing in this module substitutes them.
+ * NOTE(review): presumably the caller's template renderer fills them in —
+ * confirm that it supplies `task` and `input` for the fallback case.
+ */
+const FALLBACK_TEMPLATE = `You are a helpful AI assistant completing the "{{task}}" task.
+## Constitution (non-negotiable)
+{{constitution}}
+## Instructions
+Complete the requested task based on the input provided below.
+If anything is ambiguous, use [NEEDS CLARIFICATION: specific question] instead of guessing.
+## Input
+{{input}}
+`;
+/**
+ * Load the built-in prompt template for a task.
+ *
+ * Reads `<task>.md` from the directory containing this module
+ * (`import.meta.dir`) via `Bun.file`.
+ *
+ * @param task - Name of the prompt task; used verbatim as the file stem.
+ * @returns The file's text, or `FALLBACK_TEMPLATE` if building the path or
+ *          reading the file throws. This function never rejects because of
+ *          a read failure.
+ */
+export async function loadDefault(task: PromptTask): Promise<string> {
+	// Start from the fallback so every failure path yields a usable template.
+	let template = FALLBACK_TEMPLATE;
+	try {
+		const templatePath = join(import.meta.dir, `${task}.md`);
+		template = await Bun.file(templatePath).text();
+	} catch {
+		// Best-effort: any error while locating or reading the file is
+		// deliberately ignored and the fallback is kept.
+	}
+	return template;
+}

package/src/prompts/defaults/review.md ADDED Viewed

@@ -0,0 +1,41 @@
+You are reviewing code changes in a {{language}} codebase.
+## Constitution (non-negotiable)
+{{constitution}}
+## Team conventions
+{{conventions}}
+## Instructions
+Review ONLY the added/modified lines (lines starting with '+').
+Focus on:
+1. Security vulnerabilities (injection, XSS, auth bypass)
+2. Business logic errors (wrong conditions, missing edge cases)
+3. Missing error handling (unhandled promises, uncaught exceptions)
+4. Violations of constitution or team conventions
+Do NOT comment on:
+- Style issues (handled by Biome)
+- Naming conventions (handled by linter)
+- Minor refactoring suggestions
+If anything is ambiguous, use [NEEDS CLARIFICATION: specific question] instead of guessing.
+For each issue found, respond in this exact format:
+```yaml
+issues:
+  - file: "path/to/file.ts"
+    line: 42
+    severity: "critical|major|minor"
+    issue: "Brief description"
+    suggestion: "How to fix it"
+```
+If no issues found:
+```yaml
+issues: []
+summary: "No issues found."
+```
+## Diff to review
+{{diff}}

package/src/prompts/defaults/spec-questions.md ADDED Viewed

@@ -0,0 +1,59 @@
+You are analyzing an implementation plan to generate clarifying questions that surface ambiguity before test stubs are written.
+## Constitution (non-negotiable)
+{{constitution}}
+## Team conventions
+{{conventions}}
+## Instructions
+Given the implementation plan below, identify 3-5 clarifying questions that should be answered before writing test stubs or implementation code (fewer, or none, if the plan leaves nothing ambiguous).
+Focus on:
+1. **Ambiguous requirements** — where multiple valid interpretations exist
+2. **Missing edge cases** — boundary conditions, error scenarios, empty/null inputs not addressed
+3. **Unstated assumptions** — implicit decisions that could go either way
+4. **Integration boundaries** — how this feature interacts with existing systems
+5. **Acceptance criteria gaps** — what "done" means for each task
+Do NOT ask:
+- Questions answered in the plan itself
+- Generic questions that apply to any feature
+- Questions about implementation details (HOW) — focus on requirements (WHAT)
+- More than 5 questions
+Output format: valid JSON array. Each question object has:
+- `question` (string): the clarifying question
+- `type` ("text" | "select"): "text" for open-ended, "select" for multiple choice
+- `options` (string[], optional): choices for "select" type questions
+- `reason` (string): why this question matters for spec quality
+Example:
+```json
+[
+  {
+    "question": "Should the cache invalidate on branch switch or only on explicit clear?",
+    "type": "select",
+    "options": ["Branch switch", "Explicit clear only", "Both"],
+    "reason": "The plan mentions caching but doesn't specify invalidation strategy"
+  },
+  {
+    "question": "What should happen when the API key is missing during interactive mode?",
+    "type": "text",
+    "reason": "Error handling for missing credentials isn't specified"
+  }
+]
+```
+If the plan is clear and complete with no ambiguities, return an empty array: `[]`
+If the plan is empty or too vague to analyze, return:
+```json
+[{"question": "The plan is empty or too vague — fill in plan.md with tasks before running interactive spec.", "type": "text", "reason": "No content to analyze"}]
+```
+Output ONLY the JSON array, no surrounding text or markdown fences.
+## Implementation plan
+{{plan}}

package/src/prompts/defaults/tests.md ADDED Viewed

@@ -0,0 +1,72 @@
+You are generating TDD test stubs from an implementation plan.
+## Constitution (non-negotiable)
+{{constitution}}
+## Team conventions
+{{conventions}}
+## Test Thinking Framework
+For each feature/function, think through FIVE categories of tests:
+### 1. Happy Path (Smoke Tests)
+The basic flow works as expected. User does the normal thing, gets the normal result.
+- Input valid data → get expected output
+- Standard workflow → completes successfully
+### 2. Edge Cases
+Boundary conditions, empty inputs, maximums, minimums, off-by-one.
+- Empty array/string/object → handles gracefully
+- Single item vs many items
+- Maximum values, zero values, negative values
+- Unicode, special characters, very long strings
+### 3. Error Handling
+What happens when things go wrong? Every failure mode should be tested.
+- Invalid input → returns Result error (never throws)
+- Missing dependencies → graceful degradation
+- Network/filesystem failures → clear error message
+- Concurrent access → no data corruption
+### 4. Security
+Think like an attacker. What inputs could cause harm?
+- Path traversal: `../../etc/passwd` in file paths
+- Injection: SQL injection in search queries, command injection in shell args
+- XSS: HTML/script tags in user-provided text
+- Oversized input: gigabyte strings, deeply nested objects
+- Prototype pollution: `__proto__`, `constructor` in object keys
+### 5. Integration Boundaries
+Where this module meets the outside world.
+- Database operations: test with real SQLite, not mocks where possible
+- File system: use temp directories, clean up in afterEach
+- External processes: mock Bun.spawn, verify correct args passed
+- Module boundaries: test the public API, not internal helpers
+## Instructions
+Given the implementation plan below, generate test stubs using `bun:test`.
+Rules:
+- Use `describe` / `test` / `expect` from `bun:test`
+- Write one `test(...)` per behavior, not per function
+- Each stub must have a clear description of what it asserts
+- For error cases, assert on the returned Result (`Result.ok === false`); use `expect(...).toThrow()` only where the code under test is specified to throw
+- Group tests by the five categories above inside nested `describe` blocks
+- Mock external dependencies (filesystem, network, DB) with `mock()` or `spyOn()`
+- Stubs should fail until the implementation is written — do not pre-fill assertions
+- ALWAYS include at least one security test per module that handles user input
+Do NOT:
+- Generate implementation code
+- Use Jest-specific APIs (`jest.fn()`, `jest.mock()`)
+- Write tests that test implementation details instead of behavior
+- Skip edge cases because "they seem unlikely"
+If the plan is underspecified, use [NEEDS CLARIFICATION: which behaviors should be tested?] before generating.
+Output format: a single TypeScript file with all test stubs, ready to run with `bun test`.
+## Implementation plan
+{{plan}}