npm - clavix - Versions diffs - 4.6.0 → 4.8.0 - Mend

clavix 4.6.0 → 4.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (27) hide show

package/dist/cli/commands/execute.js +29 -9
package/dist/cli/commands/verify.d.ts +28 -0
package/dist/cli/commands/verify.js +347 -0
package/dist/core/basic-checklist-generator.d.ts +35 -0
package/dist/core/basic-checklist-generator.js +344 -0
package/dist/core/checklist-parser.d.ts +48 -0
package/dist/core/checklist-parser.js +238 -0
package/dist/core/prompt-manager.d.ts +7 -0
package/dist/core/prompt-manager.js +47 -22
package/dist/core/verification-hooks.d.ts +67 -0
package/dist/core/verification-hooks.js +309 -0
package/dist/core/verification-manager.d.ts +106 -0
package/dist/core/verification-manager.js +422 -0
package/dist/templates/agents/agents.md +14 -7
package/dist/templates/agents/copilot-instructions.md +14 -7
package/dist/templates/agents/octo.md +14 -8
package/dist/templates/agents/warp.md +15 -10
package/dist/templates/slash-commands/_canonical/archive.md +6 -5
package/dist/templates/slash-commands/_canonical/deep.md +72 -11
package/dist/templates/slash-commands/_canonical/execute.md +128 -6
package/dist/templates/slash-commands/_canonical/fast.md +70 -13
package/dist/templates/slash-commands/_canonical/verify.md +292 -0
package/dist/templates/slash-commands/_components/agent-protocols/verification-methods.md +184 -0
package/dist/types/verification.d.ts +204 -0
package/dist/types/verification.js +8 -0
package/package.json +1 -1
package/dist/templates/slash-commands/_canonical/prompts.md +0 -97

package/dist/core/verification-manager.js ADDED Viewed

@@ -0,0 +1,422 @@
+/**
+ * Clavix v4.8: Verification Manager
+ *
+ * Manages verification state, execution flow, and persistence.
+ * Coordinates between checklist parsing, hook execution, and result storage.
+ */
+import fs from 'fs-extra';
+import * as path from 'path';
+import { ChecklistParser } from './checklist-parser.js';
+import { VerificationHooks } from './verification-hooks.js';
+import { PromptManager } from './prompt-manager.js';
+/**
+ * Verification Manager
+ */
+export class VerificationManager {
+    promptManager;
+    checklistParser;
+    verificationHooks;
+    outputDir;
+    constructor(baseDir) {
+        this.outputDir = baseDir || path.join(process.cwd(), '.clavix', 'outputs', 'prompts');
+        this.promptManager = new PromptManager(this.outputDir);
+        this.checklistParser = new ChecklistParser();
+        this.verificationHooks = new VerificationHooks();
+    }
+    /**
+     * Initialize verification for a prompt
+     */
+    async initializeVerification(promptId) {
+        // Load prompt
+        const promptData = await this.promptManager.loadPrompt(promptId);
+        if (!promptData) {
+            throw new Error(`Prompt not found: ${promptId}`);
+        }
+        // Parse checklist from prompt content
+        const checklist = this.checklistParser.parse(promptData.content);
+        // Get all items
+        const items = [...checklist.validationItems, ...checklist.edgeCases, ...checklist.risks];
+        // Detect available hooks
+        const detectedHooks = await this.verificationHooks.detectHooks();
+        // Create initial report
+        const report = {
+            version: '1.0',
+            promptId,
+            source: promptData.metadata.source,
+            startedAt: new Date().toISOString(),
+            status: items.length > 0 ? 'pending' : 'completed',
+            items,
+            results: items.map((item) => ({
+                itemId: item.id,
+                status: 'pending',
+                method: item.verificationType === 'automated' ? 'automated' : 'manual',
+                confidence: 'low',
+                verifiedAt: '',
+            })),
+            summary: this.calculateSummary([]),
+            detectedHooks,
+        };
+        // Save initial report
+        await this.saveReport(report);
+        return report;
+    }
+    /**
+     * Get verification report path for a prompt
+     */
+    getReportPath(promptId, source) {
+        return path.join(this.outputDir, source, `${promptId}.verification.json`);
+    }
+    /**
+     * Load verification report
+     */
+    async loadReport(promptId) {
+        // Try both sources
+        for (const source of ['deep', 'fast']) {
+            const reportPath = this.getReportPath(promptId, source);
+            if (await fs.pathExists(reportPath)) {
+                try {
+                    return await fs.readJson(reportPath);
+                }
+                catch {
+                    // Corrupt file, ignore
+                }
+            }
+        }
+        return null;
+    }
+    /**
+     * Save verification report
+     */
+    async saveReport(report) {
+        const reportPath = this.getReportPath(report.promptId, report.source);
+        await fs.ensureDir(path.dirname(reportPath));
+        await fs.writeJson(reportPath, report, { spaces: 2 });
+    }
+    /**
+     * Mark a single item as verified
+     */
+    async markItemVerified(promptId, itemId, status, options = {}) {
+        let report = await this.loadReport(promptId);
+        if (!report) {
+            // Initialize if doesn't exist
+            report = await this.initializeVerification(promptId);
+        }
+        // Find and update result
+        const resultIndex = report.results.findIndex((r) => r.itemId === itemId);
+        if (resultIndex === -1) {
+            throw new Error(`Item not found: ${itemId}`);
+        }
+        const item = report.items.find((i) => i.id === itemId);
+        report.results[resultIndex] = {
+            itemId,
+            status,
+            method: options.method || (item?.verificationType === 'automated' ? 'automated' : 'manual'),
+            confidence: options.confidence || 'medium',
+            evidence: options.evidence,
+            reason: options.reason,
+            verifiedAt: new Date().toISOString(),
+        };
+        // Recalculate summary and status
+        report.summary = this.calculateSummary(report.results);
+        report.status = this.calculateReportStatus(report.results);
+        if (report.status === 'completed') {
+            report.completedAt = new Date().toISOString();
+        }
+        await this.saveReport(report);
+        return report;
+    }
+    /**
+     * Run automated verification for a prompt
+     */
+    async runAutomatedVerification(promptId) {
+        let report = await this.loadReport(promptId);
+        if (!report) {
+            report = await this.initializeVerification(promptId);
+        }
+        // Find automated items that are pending
+        const automatedItems = report.items.filter((item) => item.verificationType === 'automated' &&
+            report.results.find((r) => r.itemId === item.id)?.status === 'pending');
+        if (automatedItems.length === 0) {
+            return report;
+        }
+        // Detect hooks
+        const detectedHooks = await this.verificationHooks.detectHooks();
+        // Run relevant hooks
+        const hookResults = await this.verificationHooks.runAllHooks();
+        // Map hook results to checklist items
+        for (const item of automatedItems) {
+            const lowerContent = item.content.toLowerCase();
+            // Match item to hook result
+            let matched = false;
+            for (const hookResult of hookResults) {
+                if (this.matchItemToHook(lowerContent, hookResult.hook.name)) {
+                    const resultIndex = report.results.findIndex((r) => r.itemId === item.id);
+                    if (resultIndex !== -1) {
+                        report.results[resultIndex] = {
+                            itemId: item.id,
+                            status: hookResult.success ? 'passed' : 'failed',
+                            method: 'automated',
+                            confidence: hookResult.confidence,
+                            evidence: this.truncateOutput(hookResult.output),
+                            reason: hookResult.success ? undefined : 'Hook failed',
+                            verifiedAt: new Date().toISOString(),
+                        };
+                        matched = true;
+                        break;
+                    }
+                }
+            }
+            // If no hook matched, mark as requiring manual verification
+            if (!matched) {
+                const resultIndex = report.results.findIndex((r) => r.itemId === item.id);
+                if (resultIndex !== -1 && report.results[resultIndex].status === 'pending') {
+                    report.results[resultIndex].method = 'manual';
+                }
+            }
+        }
+        // Update summary and status
+        report.summary = this.calculateSummary(report.results);
+        report.status = this.calculateReportStatus(report.results);
+        report.detectedHooks = detectedHooks;
+        await this.saveReport(report);
+        return report;
+    }
+    /**
+     * Match checklist item content to hook type
+     */
+    matchItemToHook(content, hookName) {
+        const hookKeywords = {
+            test: ['tests pass', 'test pass', 'all tests', 'unit test', 'test coverage'],
+            build: ['compiles', 'builds', 'build succeeds', 'no errors', 'runs without errors'],
+            lint: ['lint', 'no warnings', 'style guide', 'conventions'],
+            typecheck: ['typecheck', 'type check', 'type errors', 'typescript'],
+        };
+        const keywords = hookKeywords[hookName] || [];
+        return keywords.some((kw) => content.includes(kw));
+    }
+    /**
+     * Truncate output for storage
+     */
+    truncateOutput(output, maxLength = 500) {
+        if (output.length <= maxLength) {
+            return output;
+        }
+        return output.substring(0, maxLength) + '... (truncated)';
+    }
+    /**
+     * Calculate summary from results
+     */
+    calculateSummary(results) {
+        const total = results.length;
+        const passed = results.filter((r) => r.status === 'passed').length;
+        const failed = results.filter((r) => r.status === 'failed').length;
+        const skipped = results.filter((r) => r.status === 'skipped').length;
+        const notApplicable = results.filter((r) => r.status === 'not-applicable').length;
+        const automatedChecks = results.filter((r) => r.method === 'automated').length;
+        const manualChecks = results.filter((r) => r.method === 'manual' || r.method === 'semi-automated').length;
+        const denominator = total - skipped - notApplicable;
+        const coveragePercent = denominator > 0 ? Math.round((passed / denominator) * 100) : 0;
+        return {
+            total,
+            passed,
+            failed,
+            skipped,
+            notApplicable,
+            coveragePercent,
+            automatedChecks,
+            manualChecks,
+        };
+    }
+    /**
+     * Calculate overall report status
+     */
+    calculateReportStatus(results) {
+        const pending = results.filter((r) => r.status === 'pending').length;
+        const failed = results.filter((r) => r.status === 'failed').length;
+        if (pending === results.length) {
+            return 'pending';
+        }
+        if (pending > 0) {
+            return 'in-progress';
+        }
+        if (failed > 0) {
+            return 'requires-attention';
+        }
+        return 'completed';
+    }
+    /**
+     * Get pending items from report
+     */
+    getPendingItems(report) {
+        const pendingIds = new Set(report.results.filter((r) => r.status === 'pending').map((r) => r.itemId));
+        return report.items.filter((item) => pendingIds.has(item.id));
+    }
+    /**
+     * Get failed items from report
+     */
+    getFailedItems(report) {
+        return report.results
+            .filter((r) => r.status === 'failed')
+            .map((result) => ({
+            item: report.items.find((i) => i.id === result.itemId),
+            result,
+        }))
+            .filter((r) => r.item);
+    }
+    /**
+     * Check if verification is complete
+     */
+    isComplete(report) {
+        return report.status === 'completed';
+    }
+    /**
+     * Check if verification requires attention (has failures)
+     */
+    requiresAttention(report) {
+        return report.status === 'requires-attention';
+    }
+    /**
+     * Delete verification report
+     */
+    async deleteReport(promptId) {
+        for (const source of ['deep', 'fast']) {
+            const reportPath = this.getReportPath(promptId, source);
+            if (await fs.pathExists(reportPath)) {
+                await fs.remove(reportPath);
+                return true;
+            }
+        }
+        return false;
+    }
+    /**
+     * Get all verification reports
+     */
+    async listReports() {
+        const reports = [];
+        for (const source of ['deep', 'fast']) {
+            const sourceDir = path.join(this.outputDir, source);
+            if (await fs.pathExists(sourceDir)) {
+                const files = await fs.readdir(sourceDir);
+                for (const file of files) {
+                    if (file.endsWith('.verification.json')) {
+                        try {
+                            const report = await fs.readJson(path.join(sourceDir, file));
+                            reports.push(report);
+                        }
+                        catch {
+                            // Ignore corrupt files
+                        }
+                    }
+                }
+            }
+        }
+        return reports;
+    }
+    /**
+     * Get verification status for a prompt
+     */
+    async getVerificationStatus(promptId) {
+        const report = await this.loadReport(promptId);
+        if (!report) {
+            return {
+                hasReport: false,
+                status: null,
+                summary: null,
+            };
+        }
+        return {
+            hasReport: true,
+            status: report.status,
+            summary: report.summary,
+        };
+    }
+    /**
+     * Format verification report for display
+     */
+    formatReportForDisplay(report) {
+        const lines = [];
+        const sep = '═'.repeat(70);
+        lines.push(sep);
+        lines.push('                    VERIFICATION REPORT');
+        lines.push(`                    ${report.promptId}`);
+        lines.push(sep);
+        lines.push('');
+        // Group results by category
+        const byCategory = new Map();
+        for (const item of report.items) {
+            const result = report.results.find((r) => r.itemId === item.id);
+            if (!result)
+                continue;
+            const category = item.category;
+            if (!byCategory.has(category)) {
+                byCategory.set(category, []);
+            }
+            byCategory.get(category).push({ item, result });
+        }
+        // Display each category
+        for (const [category, items] of byCategory.entries()) {
+            const categoryName = category === 'validation'
+                ? 'VALIDATION CHECKLIST'
+                : category === 'edge-case'
+                    ? 'EDGE CASES'
+                    : 'RISKS';
+            lines.push(`📋 ${categoryName} (${items.length} items)`);
+            lines.push('');
+            for (const { item, result } of items) {
+                const statusIcon = this.getStatusIcon(result.status);
+                const method = result.method === 'automated'
+                    ? '[automated]'
+                    : result.method === 'semi-automated'
+                        ? '[semi-auto]'
+                        : '[manual]';
+                lines.push(`${statusIcon} ${method} ${item.content}`);
+                if (result.evidence) {
+                    lines.push(`   Evidence: ${result.evidence.substring(0, 80)}`);
+                }
+                if (result.status === 'failed' && result.reason) {
+                    lines.push(`   Reason: ${result.reason}`);
+                }
+                if (result.confidence) {
+                    lines.push(`   Confidence: ${result.confidence.toUpperCase()}`);
+                }
+                lines.push('');
+            }
+        }
+        // Summary
+        lines.push(sep);
+        lines.push('                         SUMMARY');
+        lines.push(sep);
+        lines.push(`Total:        ${report.summary.total} items`);
+        lines.push(`Passed:       ${report.summary.passed} (${report.summary.coveragePercent}%)`);
+        lines.push(`Failed:       ${report.summary.failed}${report.summary.failed > 0 ? ' (requires attention)' : ''}`);
+        lines.push(`Skipped:      ${report.summary.skipped}`);
+        lines.push('');
+        lines.push(`Automated:    ${report.summary.automatedChecks} checks`);
+        lines.push(`Manual:       ${report.summary.manualChecks} checks`);
+        if (report.summary.failed > 0) {
+            lines.push('');
+            lines.push(`⚠️  ${report.summary.failed} item(s) require attention before marking complete`);
+        }
+        lines.push(sep);
+        return lines.join('\n');
+    }
+    /**
+     * Get status icon for display
+     */
+    getStatusIcon(status) {
+        switch (status) {
+            case 'passed':
+                return '✅';
+            case 'failed':
+                return '❌';
+            case 'skipped':
+                return '⏭️';
+            case 'not-applicable':
+                return '➖';
+            case 'pending':
+            default:
+                return '⏳';
+        }
+    }
+}
+//# sourceMappingURL=verification-manager.js.map

package/dist/templates/agents/agents.md CHANGED Viewed

@@ -4,18 +4,25 @@ This guide is for agents that can only read documentation (no slash-command supp
 ---
-## CLAVIX PLANNING MODE
+## ⛔ CLAVIX MODE ENFORCEMENT (v4.7)
-**You are in Clavix prompt/PRD development mode. You help create planning documents, NOT implement features.**
+**CRITICAL: Know which mode you're in and STOP at the right point.**
-**PLANNING workflows** (requirements & documentation):
-- Conversational mode, requirement extraction, fast/deep optimization, PRD generation
+**OPTIMIZATION workflows** (NO CODE ALLOWED):
+- Fast/deep optimization - Prompt improvement only
+- Your role: Analyze, optimize, show improved prompt, **STOP**
+- ❌ DO NOT implement the prompt's requirements
+- ✅ After showing optimized prompt, tell user: "Run `/clavix:execute --latest` to implement"
+**PLANNING workflows** (NO CODE ALLOWED):
+- Conversational mode, requirement extraction, PRD generation
 - Your role: Ask questions, create PRDs/prompts, extract requirements
-- DO NOT implement features during these workflows
+- ❌ DO NOT implement features during these workflows
-**IMPLEMENTATION workflows** (code execution):
-- Only when user explicitly says: "Now implement this" or "Build the feature"
+**IMPLEMENTATION workflows** (CODE ALLOWED):
+- Only after user runs execute/implement commands
 - Your role: Write code, execute tasks, implement features
+- ✅ DO implement code during these workflows
 **If unsure, ASK:** "Should I implement this now, or continue with planning?"

package/dist/templates/agents/copilot-instructions.md CHANGED Viewed

@@ -4,18 +4,25 @@ These instructions enhance GitHub Copilot's understanding of Clavix Intelligence
 ---
-## CLAVIX PLANNING MODE
+## ⛔ CLAVIX MODE ENFORCEMENT (v4.7)
-**You are in Clavix prompt/PRD development mode. You help create planning documents, NOT implement features.**
+**CRITICAL: Know which mode you're in and STOP at the right point.**
-**PLANNING workflows** (requirements & documentation):
-- Conversational mode, requirement extraction, fast/deep optimization, PRD generation
+**OPTIMIZATION workflows** (NO CODE ALLOWED):
+- Fast/deep optimization - Prompt improvement only
+- Your role: Analyze, optimize, show improved prompt, **STOP**
+- ❌ DO NOT implement the prompt's requirements
+- ✅ After showing optimized prompt, tell user: "Run `/clavix:execute --latest` to implement"
+**PLANNING workflows** (NO CODE ALLOWED):
+- Conversational mode, requirement extraction, PRD generation
 - Your role: Ask questions, create PRDs/prompts, extract requirements
-- DO NOT implement features during these workflows
+- ❌ DO NOT implement features during these workflows
-**IMPLEMENTATION workflows** (code execution):
-- Only when user explicitly says: "Now implement this" or "Build the feature"
+**IMPLEMENTATION workflows** (CODE ALLOWED):
+- Only after user runs execute/implement commands
 - Your role: Write code, execute tasks, implement features
+- ✅ DO implement code during these workflows
 **If unsure, ASK:** "Should I implement this now, or continue with planning?"

package/dist/templates/agents/octo.md CHANGED Viewed

@@ -4,19 +4,25 @@ Clavix workflows optimized for Octofriend's capabilities: model switching, multi
 ---
-## CLAVIX PLANNING MODE
+## ⛔ CLAVIX MODE ENFORCEMENT (v4.7)
-**Know which mode you're in:**
+**CRITICAL: Know which mode you're in and STOP at the right point.**
-**PLANNING workflows** (requirements & documentation):
-- start, summarize, fast, deep, prd, plan
+**OPTIMIZATION workflows** (NO CODE ALLOWED):
+- `/clavix:fast`, `/clavix:deep` - Prompt optimization only
+- Your role: Analyze, optimize, show improved prompt, **STOP**
+- ❌ DO NOT implement the prompt's requirements
+- ✅ After showing optimized prompt, tell user: "Run `/clavix:execute --latest` to implement"
+**PLANNING workflows** (NO CODE ALLOWED):
+- `/clavix:start`, `/clavix:summarize`, `/clavix:prd`, `/clavix:plan`
 - Your role: Ask questions, create PRDs/prompts, extract requirements
-- **DO NOT implement features during these workflows**
+- ❌ DO NOT implement features during these workflows
-**IMPLEMENTATION workflows** (code execution):
-- implement, execute, task-complete
+**IMPLEMENTATION workflows** (CODE ALLOWED):
+- `/clavix:implement`, `/clavix:execute`, `clavix task-complete`
 - Your role: Write code, execute tasks, implement features
-- **DO implement code during these workflows**
+- ✅ DO implement code during these workflows
 See `.clavix/instructions/core/clavix-mode.md` for complete mode documentation.

package/dist/templates/agents/warp.md CHANGED Viewed

@@ -4,20 +4,25 @@ Clavix helps Warp developers turn rough ideas into quality, AI-ready prompts and
 ---
-### ⚠️ CLAVIX MODE: Requirements & Planning Only
+### ⛔ CLAVIX MODE ENFORCEMENT (v4.7)
-**When using Clavix workflows, you are in PLANNING mode, NOT implementation mode.**
+**CRITICAL: Know which mode you're in and STOP at the right point.**
-**YOUR ROLE:**
-- ✓ Generate PRDs and prompts
-- ✓ Extract requirements
-- ✓ Optimize prompt quality
+**OPTIMIZATION workflows** (NO CODE ALLOWED):
+- Fast/deep optimization - Prompt improvement only
+- Your role: Analyze, optimize, show improved prompt, **STOP**
+- ❌ DO NOT implement the prompt's requirements
+- ✅ After showing optimized prompt, tell user: "Run `/clavix:execute --latest` to implement"
-**DO NOT IMPLEMENT. DO NOT IMPLEMENT. DO NOT IMPLEMENT.**
-- ✗ DO NOT write application code during Clavix workflows
-- ✗ DO NOT implement features being planned
+**PLANNING workflows** (NO CODE ALLOWED):
+- Conversational mode, requirement extraction, PRD generation
+- Your role: Ask questions, create PRDs/prompts, extract requirements
+- ❌ DO NOT implement features during these workflows
-**ONLY implement if user explicitly says: "Now implement this"**
+**IMPLEMENTATION workflows** (CODE ALLOWED):
+- Only after user runs execute/implement commands
+- Your role: Write code, execute tasks, implement features
+- ✅ DO implement code during these workflows
 See `.clavix/instructions/core/clavix-mode.md` for complete mode documentation.

package/dist/templates/slash-commands/_canonical/archive.md CHANGED Viewed

@@ -158,21 +158,22 @@ Fast/deep prompts from `/clavix:fast` and `/clavix:deep` are stored separately i
 **Prompts are NOT archived with PRD projects.**
-**Manage prompts separately:**
+**Manage prompts separately (CLI commands):**
 ```bash
 clavix prompts list           # View all prompts
-clavix prompts clear          # Cleanup prompts
-/clavix:prompts               # Full management workflow
+clavix prompts clear          # Interactive cleanup
+clavix prompts clear --executed  # Remove executed only
+clavix prompts clear --stale     # Remove >30 day old
 ```
 **Before archiving, consider cleanup:**
 ```bash
-/clavix:prompts clear --executed
+clavix prompts clear --executed
 ```
 **Prompts lifecycle:**
 - Independent from PRD lifecycle
-- Managed via `/clavix:prompts`
+- Managed via CLI commands
 - Clear manually when project complete
 ## Example Workflows