npm - ruvnet-kb-first - Versions diffs - 6.0.0 → 6.1.0 - Mend

ruvnet-kb-first 6.0.0 → 6.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (2) hide show

package/package.json +1 -1
package/src/mcp-server.js +789 -471

package/src/mcp-server.js CHANGED Viewed

@@ -1,670 +1,988 @@
 /**
- * RuvNet KB-First MCP Server - Score-Driven Architecture
- * Version 6.0.0
+ * RuvNet KB-First MCP Server - Granular Score-Driven Architecture
+ * Version 6.1.0
  *
- * PHILOSOPHY: Scoring IS the enforcement mechanism.
- * - Every operation requires baseline score first
- * - Every operation shows delta (before/after)
- * - Hard gates BLOCK on negative deltas
- * - No shortcuts - rigorous measurement drives quality
+ * PHILOSOPHY: Granular scoring drives discipline.
+ * - Score each KB dimension 0-100 (completeness, depth, comprehensiveness, accuracy, freshness, attribution)
+ * - Score each phase readiness 0-100
+ * - Generate enhancement plan based on gaps
+ * - User confirms before execution
+ * - Post-verify: did we hit predicted scores?
  *
- * 4 Tools (not 7):
- *   1. kb_first_assess  - Calculate baseline scores (KB + App + Process)
- *   2. kb_first_phase   - Execute phase work with delta tracking
- *   3. kb_first_delta   - Explicit before/after comparison
- *   4. kb_first_gate    - Hard gate that blocks on negative delta
+ * 5 Tools:
+ *   1. kb_first_assess   - Score ALL dimensions (KB quality + phase readiness)
+ *   2. kb_first_plan     - Generate enhancement plan with predicted improvements
+ *   3. kb_first_confirm  - User confirms readiness, locks in plan
+ *   4. kb_first_execute  - Execute plan phase by phase
+ *   5. kb_first_verify   - Post-verification: predicted vs actual, identify gaps
  *
  * Usage:
  *   npx ruvnet-kb-first mcp
- *   node src/mcp-server.js
  */
 import { existsSync, readFileSync, writeFileSync, mkdirSync, readdirSync, statSync } from 'fs';
 import { join } from 'path';
 import { globSync } from 'glob';
-// MCP Protocol Constants
 const MCP_VERSION = '0.1.0';
 const SERVER_NAME = 'ruvnet-kb-first';
-const SERVER_VERSION = '6.0.0';
+const SERVER_VERSION = '6.1.0';
 /**
- * Score Categories (total 100 points)
- * These are the ONLY metrics that matter
+ * KB Quality Dimensions (each scored 0-100)
  */
-const SCORE_WEIGHTS = {
-  kb: {
-    weight: 40,
-    components: {
-      entries: 10,        // KB has content
-      coverage: 10,       // Domain coverage completeness
-      embeddings: 10,     // Vectors generated
-      freshness: 10       // Recent updates
-    }
+const KB_DIMENSIONS = {
+  completeness: {
+    name: 'Completeness',
+    description: 'Does the KB cover all necessary domain topics?',
+    weight: 20
   },
-  app: {
-    weight: 40,
-    components: {
-      kbCitations: 15,    // Code files cite KB sources
-      gapResolution: 10,  // Gaps identified and resolved
-      testCoverage: 10,   // Tests exist and pass
-      security: 5         // Security basics in place
-    }
+  depth: {
+    name: 'Depth',
+    description: 'Is each topic covered with sufficient detail?',
+    weight: 20
   },
-  process: {
-    weight: 20,
-    components: {
-      phaseCompletion: 10, // Phases properly completed
-      gatesPassed: 5,      // Hard gates verified
-      documentation: 5     // Docs exist
-    }
+  comprehensiveness: {
+    name: 'Comprehensiveness',
+    description: 'Are edge cases, exceptions, and nuances included?',
+    weight: 20
+  },
+  accuracy: {
+    name: 'Accuracy',
+    description: 'Is the information correct and up-to-date?',
+    weight: 20
+  },
+  freshness: {
+    name: 'Freshness',
+    description: 'How recently was the KB updated?',
+    weight: 10
+  },
+  attribution: {
+    name: 'Attribution',
+    description: 'Are sources and experts properly cited?',
+    weight: 10
   }
 };
 /**
- * Phase definitions
+ * Phase Definitions with readiness criteria
  */
 const PHASES = {
-  0:    { name: 'Assessment', gate: 'assessment_documented' },
-  1:    { name: 'KB Design', gate: 'schema_designed' },
-  1.5:  { name: 'Hooks Setup', gate: 'hooks_verified' },
-  2:    { name: 'Schema Definition', gate: 'schema_created' },
-  3:    { name: 'KB Population', gate: 'kb_score_50' },
-  4:    { name: 'Scoring & Gaps', gate: 'kb_score_80' },
-  5:    { name: 'Integration', gate: 'integration_tested' },
-  6:    { name: 'Testing', gate: 'tests_passing' },
-  7:    { name: 'Optimization', gate: 'performance_met' },
-  7.5:  { name: 'Testing Gate', gate: 'coverage_80' },
-  8:    { name: 'Verification', gate: 'all_checks_pass' },
-  9:    { name: 'Security', gate: 'security_audit_passed' },
-  10:   { name: 'Documentation', gate: 'docs_complete' },
-  11:   { name: 'Deployment', gate: 'deployed' },
-  11.5: { name: 'Observability', gate: 'monitoring_active' },
-  12:   { name: 'KB Operations', gate: 'operations_ready' }
+  0: {
+    name: 'Assessment',
+    criteria: ['Project scope documented', 'Domain complexity identified', 'KB-First suitability confirmed', 'Resources estimated']
+  },
+  1: {
+    name: 'KB Design',
+    criteria: ['Domain concepts mapped', 'Taxonomy designed', 'Relationships defined', 'Query patterns planned']
+  },
+  1.5: {
+    name: 'Hooks Setup',
+    criteria: ['Hooks installed', 'Configuration complete', 'Patterns trained', 'Verification passing']
+  },
+  2: {
+    name: 'Schema Definition',
+    criteria: ['Tables created', 'Vector columns added', 'Indexes designed', 'Migrations written']
+  },
+  3: {
+    name: 'KB Population',
+    criteria: ['Content collected', 'Data cleaned', 'Embeddings generated', 'Import validated']
+  },
+  4: {
+    name: 'Scoring & Gaps',
+    criteria: ['Coverage analyzed', 'Quality scored', 'Gaps identified', 'Remediation planned']
+  },
+  5: {
+    name: 'Integration',
+    criteria: ['Search API built', 'Code generation working', 'Citation system active', 'Gap logging enabled']
+  },
+  6: {
+    name: 'Testing',
+    criteria: ['Unit tests written', 'Integration tests passing', 'Accuracy validated', 'Edge cases covered']
+  },
+  7: {
+    name: 'Optimization',
+    criteria: ['Queries optimized', 'Indexes tuned', 'Caching implemented', 'Benchmarks passing']
+  },
+  8: {
+    name: 'Verification',
+    criteria: ['Code scan clean', 'Imports verified', 'Sources return', 'Startup working', 'Fallbacks tested', 'Attribution valid', 'Confidence scores present', 'Gap logging active']
+  },
+  9: {
+    name: 'Security',
+    criteria: ['Dependencies audited', 'OWASP checked', 'SQL injection tested', 'Auth reviewed', 'Secrets secured', 'APIs protected']
+  },
+  10: {
+    name: 'Documentation',
+    criteria: ['README complete', 'API documented', 'Schema documented', 'Architecture documented', 'Operator guide written']
+  },
+  11: {
+    name: 'Deployment',
+    criteria: ['Infrastructure ready', 'Environments configured', 'CI/CD built', 'Migrations run', 'Monitoring active', 'Go-live complete']
+  }
 };
 /**
- * MCP Tools - Score-Driven Architecture
+ * MCP Tools
  */
 const TOOLS = [
   {
     name: 'kb_first_assess',
-    description: `Calculate comprehensive baseline scores for KB, App, and Process.
-ALWAYS RUN THIS FIRST before any work. Returns:
-- KB Score (40 points): entries, coverage, embeddings, freshness
-- App Score (40 points): citations, gap resolution, tests, security
-- Process Score (20 points): phases, gates, documentation
-- Total (100 points)
-This becomes your BASELINE for delta comparison.`,
+    description: `Score ALL dimensions of KB quality and phase readiness (each 1-100).
+KB Quality Dimensions:
+- Completeness: Does KB cover all domain topics?
+- Depth: Is each topic detailed enough?
+- Comprehensiveness: Are edge cases included?
+- Accuracy: Is information correct?
+- Freshness: How recently updated?
+- Attribution: Are sources cited?
+Phase Readiness:
+- Each of 12 phases scored 1-100 based on criteria completion
+Returns granular scores that reveal exactly where gaps exist.
+This is your BASELINE for planning.`,
     inputSchema: {
       type: 'object',
       properties: {
-        detailed: { type: 'boolean', description: 'Show component breakdown', default: true },
-        saveBaseline: { type: 'boolean', description: 'Save as baseline for delta comparison', default: true }
+        projectPath: { type: 'string', description: 'Path to project (default: current directory)' }
       }
     }
   },
   {
-    name: 'kb_first_phase',
-    description: `Execute a phase with automatic delta tracking.
-REQUIRES: kb_first_assess must be run first to establish baseline.
+    name: 'kb_first_plan',
+    description: `Generate enhancement plan based on assessment scores.
-Workflow:
-1. Loads baseline score from last kb_first_assess
-2. Shows phase requirements and sub-phases
-3. Returns guidance for completing the phase
-4. REMINDS you to run kb_first_delta when done
+Analyzes gaps (scores below threshold) and creates:
+- Prioritized list of enhancements
+- Predicted score improvements for each
+- Estimated effort
+- Execution order
-Will WARN if baseline is stale (>1 hour old).`,
+The plan gives you a concrete game plan so you don't lose the thread.
+Returns the plan for user review before execution.`,
     inputSchema: {
       type: 'object',
       properties: {
-        phase: { type: 'number', description: 'Phase number (0-12, including 1.5, 7.5, 11.5)' }
+        threshold: { type: 'number', description: 'Minimum acceptable score (default: 80)', default: 80 },
+        focusArea: { type: 'string', enum: ['kb', 'phases', 'all'], description: 'What to focus on', default: 'all' }
+      }
+    }
+  },
+  {
+    name: 'kb_first_confirm',
+    description: `User confirms readiness to execute enhancement plan.
+Shows the plan summary and asks for confirmation.
+Once confirmed, the plan is locked and execution can begin.
+This ensures user consent before making changes.`,
+    inputSchema: {
+      type: 'object',
+      properties: {
+        confirmed: { type: 'boolean', description: 'User confirms readiness to proceed' }
       },
-      required: ['phase']
+      required: ['confirmed']
     }
   },
   {
-    name: 'kb_first_delta',
-    description: `Compare current scores against baseline. THE ENFORCEMENT MECHANISM.
-Shows:
-- Baseline score (from kb_first_assess)
-- Current score (calculated now)
-- Delta (+ improvement or - regression)
-- VERDICT: PASS (positive delta) or FAIL (negative delta)
-If delta is negative, you CANNOT proceed to next phase.
-This prevents shortcuts and enforces rigor.`,
+    name: 'kb_first_execute',
+    description: `Execute the confirmed enhancement plan.
+Works through the plan systematically:
+- Shows current task
+- Provides guidance for completion
+- Tracks progress
+- Updates predicted scores
+Call repeatedly to work through each enhancement.`,
     inputSchema: {
       type: 'object',
       properties: {
-        showBreakdown: { type: 'boolean', description: 'Show which components changed', default: true }
+        taskComplete: { type: 'boolean', description: 'Mark current task as complete' }
       }
     }
   },
   {
-    name: 'kb_first_gate',
-    description: `Hard gate check for phase transition.
-BLOCKS progress if:
-- Delta is negative (score dropped)
-- Required gate condition not met
-- Baseline not established
-Returns:
-- canProceed: boolean
-- blockReason: string (if blocked)
-- nextPhase: number (if can proceed)
-THIS IS THE HARD GATE. No bypassing.`,
+    name: 'kb_first_verify',
+    description: `Post-verification: Compare predicted vs actual scores.
+Re-scores everything and compares to predictions:
+- Which improvements were achieved?
+- Which fell short?
+- What gaps remain?
+- What's the next priority?
+This closes the loop and ensures you delivered what you promised.`,
     inputSchema: {
       type: 'object',
       properties: {
-        phase: { type: 'number', description: 'Phase to verify gate for' }
-      },
-      required: ['phase']
+        detailed: { type: 'boolean', description: 'Show detailed comparison', default: true }
+      }
     }
   }
 ];
 /**
- * Calculate all scores
+ * Score KB Quality Dimensions (0-100 each)
  */
-function calculateScores(cwd) {
-  const scores = {
-    kb: { total: 0, max: 40, components: {} },
-    app: { total: 0, max: 40, components: {} },
-    process: { total: 0, max: 20, components: {} },
-    total: 0,
-    max: 100,
-    grade: 'F',
-    timestamp: new Date().toISOString()
-  };
-  // ===== KB SCORE (40 points) =====
-  const ruvectorDir = join(cwd, '.ruvector');
+function scoreKBDimensions(cwd) {
+  const scores = {};
   const kbDir = join(cwd, 'src', 'kb');
+  const docsDir = join(cwd, 'docs');
+  const ruvectorDir = join(cwd, '.ruvector');
-  // KB Entries (10 points)
+  // Count KB entries and docs
   let kbEntries = 0;
+  let docFiles = 0;
+  let totalContent = 0;
   if (existsSync(kbDir)) {
     try {
       const files = readdirSync(kbDir);
       kbEntries = files.length;
+      for (const f of files) {
+        try {
+          const content = readFileSync(join(kbDir, f), 'utf-8');
+          totalContent += content.length;
+        } catch {}
+      }
     } catch {}
   }
-  scores.kb.components.entries = Math.min(10, Math.floor(kbEntries / 5) * 2);
-  // KB Coverage (10 points) - based on documented domains
-  const docsDir = join(cwd, 'docs');
-  let domainDocs = 0;
   if (existsSync(docsDir)) {
     try {
-      const files = readdirSync(docsDir);
-      domainDocs = files.filter(f => f.endsWith('.md')).length;
+      docFiles = readdirSync(docsDir).filter(f => f.endsWith('.md')).length;
     } catch {}
   }
-  scores.kb.components.coverage = Math.min(10, domainDocs * 2);
-  // KB Embeddings (10 points) - check for vector files or config
-  const configPath = join(ruvectorDir, 'config.json');
-  let hasEmbeddings = false;
-  if (existsSync(configPath)) {
+  // Completeness: Based on number of KB entries and docs
+  // Each KB entry and each docs/*.md file adds 10 points, capped at 100 (e.g. 5 entries + 0 docs = 50)
+  scores.completeness = {
+    score: Math.min(100, Math.max(0, kbEntries * 10 + docFiles * 10)),
+    reason: `${kbEntries} KB entries, ${docFiles} doc files`,
+    improvement: kbEntries < 10 ? `Add ${10 - kbEntries} more KB entries` : 'Adequate coverage'
+  };
+  // Depth: Based on average content length
+  // < 500 chars avg = shallow, > 2000 = deep
+  const avgLength = kbEntries > 0 ? totalContent / kbEntries : 0;
+  scores.depth = {
+    score: Math.min(100, Math.max(0, Math.round(avgLength / 20))),
+    reason: `Average entry length: ${Math.round(avgLength)} chars`,
+    improvement: avgLength < 2000 ? 'Add more detail to KB entries' : 'Good depth'
+  };
+  // Comprehensiveness: Check for edge case documentation
+  let edgeCaseScore = 0;
+  const srcDir = join(cwd, 'src');
+  if (existsSync(srcDir)) {
     try {
-      const config = JSON.parse(readFileSync(configPath, 'utf-8'));
-      hasEmbeddings = config.kbFirst?.embeddings === true || kbEntries > 0;
+      const files = globSync('**/*.{ts,tsx,js,jsx,py}', { cwd: srcDir });
+      for (const f of files) {
+        try {
+          const content = readFileSync(join(srcDir, f), 'utf-8');
+          if (content.includes('edge case') || content.includes('exception') || content.includes('fallback')) {
+            edgeCaseScore += 10;
+          }
+        } catch {}
+      }
     } catch {}
   }
-  scores.kb.components.embeddings = hasEmbeddings ? 10 : 0;
+  scores.comprehensiveness = {
+    score: Math.min(100, edgeCaseScore + (kbEntries * 5)),
+    reason: `Edge case handling detected in ${Math.floor(edgeCaseScore / 10)} files`,
+    improvement: edgeCaseScore < 50 ? 'Document edge cases and exceptions' : 'Good coverage'
+  };
+  // Accuracy: Based on presence of verification/testing
+  let accuracyScore = 50; // Base score
+  if (existsSync(join(cwd, 'tests')) || existsSync(join(cwd, '__tests__'))) accuracyScore += 25;
+  if (existsSync(join(cwd, '.ruvector', 'config.json'))) accuracyScore += 15;
+  if (existsSync(join(cwd, 'CHANGELOG.md'))) accuracyScore += 10;
+  scores.accuracy = {
+    score: Math.min(100, accuracyScore),
+    reason: accuracyScore > 75 ? 'Tests and verification present' : 'Limited verification',
+    improvement: accuracyScore < 80 ? 'Add tests and validation' : 'Good accuracy controls'
+  };
-  // KB Freshness (10 points) - recent updates
-  let freshness = 0;
+  // Freshness: Based on last modification
+  let freshnessScore = 0;
   if (existsSync(ruvectorDir)) {
     try {
       const stat = statSync(ruvectorDir);
-      const daysSinceUpdate = (Date.now() - stat.mtime.getTime()) / (1000 * 60 * 60 * 24);
-      if (daysSinceUpdate < 1) freshness = 10;
-      else if (daysSinceUpdate < 7) freshness = 7;
-      else if (daysSinceUpdate < 30) freshness = 4;
-      else freshness = 0;
+      const daysSince = (Date.now() - stat.mtime.getTime()) / (1000 * 60 * 60 * 24);
+      if (daysSince < 1) freshnessScore = 100;
+      else if (daysSince < 7) freshnessScore = 80;
+      else if (daysSince < 30) freshnessScore = 50;
+      else if (daysSince < 90) freshnessScore = 25;
+      else freshnessScore = 10;
     } catch {}
   }
-  scores.kb.components.freshness = freshness;
-  scores.kb.total = Object.values(scores.kb.components).reduce((a, b) => a + b, 0);
-  // ===== APP SCORE (40 points) =====
-  const srcDir = join(cwd, 'src');
+  scores.freshness = {
+    score: freshnessScore,
+    reason: freshnessScore > 50 ? 'Recently updated' : 'Stale - needs refresh',
+    improvement: freshnessScore < 80 ? 'Update KB content' : 'Fresh'
+  };
-  // KB Citations (15 points)
-  let codeFiles = [];
-  let filesWithCitation = 0;
+  // Attribution: Check for citations in code
+  let attributionScore = 0;
   if (existsSync(srcDir)) {
     try {
-      codeFiles = globSync('**/*.{ts,tsx,js,jsx,py,go,rs}', { cwd: srcDir });
-      for (const file of codeFiles) {
+      const files = globSync('**/*.{ts,tsx,js,jsx,py}', { cwd: srcDir });
+      let filesWithCitation = 0;
+      for (const f of files) {
         try {
-          const content = readFileSync(join(srcDir, file), 'utf-8');
+          const content = readFileSync(join(srcDir, f), 'utf-8');
           if (content.includes('KB-Generated:') || content.includes('Sources:') || content.includes('@kb-source')) {
             filesWithCitation++;
           }
         } catch {}
       }
+      attributionScore = files.length > 0 ? Math.round((filesWithCitation / files.length) * 100) : 100;
     } catch {}
+  } else {
+    attributionScore = 100; // No code = not applicable
   }
-  const citationPercent = codeFiles.length > 0 ? filesWithCitation / codeFiles.length : 1;
-  scores.app.components.kbCitations = Math.round(citationPercent * 15);
+  scores.attribution = {
+    score: attributionScore,
+    reason: `${attributionScore}% of code files have KB citations`,
+    improvement: attributionScore < 80 ? 'Add KB citations to code files' : 'Good attribution'
+  };
+  return scores;
+}
-  // Gap Resolution (10 points)
-  const gapsPath = join(ruvectorDir, 'gaps.jsonl');
-  let gapCount = 0;
-  if (existsSync(gapsPath)) {
+/**
+ * Score Phase Readiness (0-100 each)
+ */
+function scorePhaseReadiness(cwd) {
+  const scores = {};
+  const configPath = join(cwd, '.ruvector', 'config.json');
+  let config = { phases: { completed: [], gates: {} } };
+  if (existsSync(configPath)) {
     try {
-      const content = readFileSync(gapsPath, 'utf-8').trim();
-      gapCount = content ? content.split('\n').length : 0;
+      config = JSON.parse(readFileSync(configPath, 'utf-8'));
     } catch {}
   }
-  scores.app.components.gapResolution = Math.max(0, 10 - gapCount);
-  // Test Coverage (10 points)
-  let hasTests = false;
-  const testDirs = ['tests', 'test', '__tests__', 'src/__tests__'];
-  for (const td of testDirs) {
-    if (existsSync(join(cwd, td))) {
-      hasTests = true;
-      break;
+  const completed = config.phases?.completed || [];
+  const gates = config.phases?.gates || {};
+  for (const [phaseNum, phaseInfo] of Object.entries(PHASES)) {
+    const num = parseFloat(phaseNum);
+    const isCompleted = completed.includes(num);
+    const criteriaCount = phaseInfo.criteria.length;
+    // Check which criteria are met
+    let metCriteria = 0;
+    const unmetCriteria = [];
+    for (const criterion of phaseInfo.criteria) {
+      // Simplified check - in real implementation, this would be more sophisticated
+      if (isCompleted || checkCriterion(cwd, num, criterion)) {
+        metCriteria++;
+      } else {
+        unmetCriteria.push(criterion);
+      }
     }
-  }
-  const testFiles = existsSync(srcDir) ? globSync('**/*.{test,spec}.{ts,tsx,js,jsx}', { cwd: srcDir }) : [];
-  scores.app.components.testCoverage = hasTests ? 5 : 0;
-  scores.app.components.testCoverage += Math.min(5, testFiles.length);
-  // Security (5 points)
-  let secScore = 5;
-  const gitignorePath = join(cwd, '.gitignore');
-  if (existsSync(gitignorePath)) {
-    try {
-      const content = readFileSync(gitignorePath, 'utf-8');
-      if (!content.includes('.env')) secScore -= 2;
-      if (!content.includes('node_modules')) secScore -= 1;
-    } catch {}
-  } else {
-    secScore -= 3;
+    const score = Math.round((metCriteria / criteriaCount) * 100);
+    scores[phaseNum] = {
+      name: phaseInfo.name,
+      score,
+      metCriteria,
+      totalCriteria: criteriaCount,
+      unmet: unmetCriteria,
+      completed: isCompleted
+    };
   }
-  scores.app.components.security = Math.max(0, secScore);
-  scores.app.total = Object.values(scores.app.components).reduce((a, b) => a + b, 0);
+  return scores;
+}
-  // ===== PROCESS SCORE (20 points) =====
+/**
+ * Check if a criterion is met (simplified)
+ */
+function checkCriterion(cwd, phase, criterion) {
+  // Check for common indicators
+  const criterionLower = criterion.toLowerCase();
-  // Phase Completion (10 points)
-  let completedPhases = [];
-  if (existsSync(configPath)) {
-    try {
-      const config = JSON.parse(readFileSync(configPath, 'utf-8'));
-      completedPhases = config.phases?.completed || [];
-    } catch {}
+  if (criterionLower.includes('documented')) {
+    return existsSync(join(cwd, 'docs')) || existsSync(join(cwd, 'README.md'));
   }
-  const totalPhases = Object.keys(PHASES).length;
-  scores.process.components.phaseCompletion = Math.round((completedPhases.length / totalPhases) * 10);
-  // Gates Passed (5 points)
-  let gatesPassed = 0;
-  if (existsSync(configPath)) {
-    try {
-      const config = JSON.parse(readFileSync(configPath, 'utf-8'));
-      gatesPassed = Object.values(config.phases?.gates || {}).filter(v => v === true).length;
-    } catch {}
+  if (criterionLower.includes('tests')) {
+    return existsSync(join(cwd, 'tests')) || existsSync(join(cwd, '__tests__'));
+  }
+  if (criterionLower.includes('config')) {
+    return existsSync(join(cwd, '.ruvector', 'config.json'));
+  }
+  if (criterionLower.includes('hooks')) {
+    return existsSync(join(cwd, '.ruvector', 'hooks'));
+  }
+  if (criterionLower.includes('schema') || criterionLower.includes('tables')) {
+    return existsSync(join(cwd, 'templates', 'schema.sql'));
   }
-  scores.process.components.gatesPassed = Math.min(5, Math.round((gatesPassed / totalPhases) * 5));
-  // Documentation (5 points)
-  let docScore = 0;
-  if (existsSync(join(cwd, 'README.md'))) docScore += 2;
-  if (existsSync(join(cwd, 'docs', 'api.md')) || existsSync(join(cwd, 'docs', 'API.md'))) docScore += 1;
-  if (existsSync(join(cwd, 'docs', 'architecture.md'))) docScore += 1;
-  if (existsSync(join(cwd, 'CHANGELOG.md'))) docScore += 1;
-  scores.process.components.documentation = Math.min(5, docScore);
+  return false;
+}
-  scores.process.total = Object.values(scores.process.components).reduce((a, b) => a + b, 0);
+/**
+ * Calculate overall weighted scores
+ */
+function calculateOverallScores(kbScores, phaseScores) {
+  // KB Overall (weighted average)
+  let kbTotal = 0;
+  let kbWeightTotal = 0;
+  for (const [dim, info] of Object.entries(KB_DIMENSIONS)) {
+    if (kbScores[dim]) {
+      kbTotal += kbScores[dim].score * info.weight;
+      kbWeightTotal += info.weight;
+    }
+  }
+  const kbOverall = kbWeightTotal > 0 ? Math.round(kbTotal / kbWeightTotal) : 0;
-  // ===== TOTAL =====
-  scores.total = scores.kb.total + scores.app.total + scores.process.total;
+  // Phase Overall (average)
+  const phaseValues = Object.values(phaseScores);
+  const phaseOverall = phaseValues.length > 0
+    ? Math.round(phaseValues.reduce((sum, p) => sum + p.score, 0) / phaseValues.length)
+    : 0;
-  // Grade
-  if (scores.total >= 98) scores.grade = 'A+';
-  else if (scores.total >= 93) scores.grade = 'A';
-  else if (scores.total >= 90) scores.grade = 'A-';
-  else if (scores.total >= 87) scores.grade = 'B+';
-  else if (scores.total >= 83) scores.grade = 'B';
-  else if (scores.total >= 80) scores.grade = 'B-';
-  else if (scores.total >= 70) scores.grade = 'C';
-  else if (scores.total >= 60) scores.grade = 'D';
-  else scores.grade = 'F';
+  // Combined Overall
+  const overall = Math.round((kbOverall * 0.5) + (phaseOverall * 0.5));
-  return scores;
+  return { kbOverall, phaseOverall, overall };
 }
 /**
  * Tool Handlers
  */
-async function handleKbFirstAssess(cwd, args) {
-  const scores = calculateScores(cwd);
-  // Save baseline
-  if (args.saveBaseline !== false) {
-    const ruvectorDir = join(cwd, '.ruvector');
-    if (!existsSync(ruvectorDir)) {
-      mkdirSync(ruvectorDir, { recursive: true });
-    }
-    writeFileSync(join(ruvectorDir, 'baseline.json'), JSON.stringify(scores, null, 2));
+async function handleAssess(cwd, args) {
+  const kbScores = scoreKBDimensions(cwd);
+  const phaseScores = scorePhaseReadiness(cwd);
+  const overall = calculateOverallScores(kbScores, phaseScores);
+  // Save assessment
+  const ruvectorDir = join(cwd, '.ruvector');
+  if (!existsSync(ruvectorDir)) {
+    mkdirSync(ruvectorDir, { recursive: true });
   }
-  const result = {
-    action: 'BASELINE_ESTABLISHED',
-    timestamp: scores.timestamp,
-    total: scores.total,
-    max: scores.max,
-    grade: scores.grade,
-    summary: {
-      kb: `${scores.kb.total}/${scores.kb.max}`,
-      app: `${scores.app.total}/${scores.app.max}`,
-      process: `${scores.process.total}/${scores.process.max}`
-    },
-    nextStep: 'Run kb_first_phase to begin work, then kb_first_delta to measure improvement'
+  const assessment = {
+    timestamp: new Date().toISOString(),
+    kb: kbScores,
+    phases: phaseScores,
+    overall
   };
-  if (args.detailed !== false) {
-    result.breakdown = {
-      kb: scores.kb.components,
-      app: scores.app.components,
-      process: scores.process.components
+  writeFileSync(join(ruvectorDir, 'assessment.json'), JSON.stringify(assessment, null, 2));
+  // Format for display
+  const kbSummary = {};
+  for (const [dim, data] of Object.entries(kbScores)) {
+    kbSummary[dim] = {
+      score: data.score,
+      reason: data.reason
     };
   }
-  return result;
+  const phaseSummary = {};
+  for (const [num, data] of Object.entries(phaseScores)) {
+    phaseSummary[`Phase ${num}: ${data.name}`] = {
+      score: data.score,
+      criteria: `${data.metCriteria}/${data.totalCriteria}`,
+      status: data.completed ? 'COMPLETE' : (data.score >= 80 ? 'READY' : 'GAPS')
+    };
+  }
+  return {
+    action: 'ASSESSMENT_COMPLETE',
+    timestamp: assessment.timestamp,
+    overallScores: {
+      kb: `${overall.kbOverall}/100`,
+      phases: `${overall.phaseOverall}/100`,
+      combined: `${overall.overall}/100`
+    },
+    kbQuality: kbSummary,
+    phaseReadiness: phaseSummary,
+    nextStep: 'Run kb_first_plan to generate enhancement plan based on gaps'
+  };
 }
-async function handleKbFirstPhase(cwd, args) {
-  const phase = args.phase;
-  const phaseInfo = PHASES[phase];
+async function handlePlan(cwd, args) {
+  const assessmentPath = join(cwd, '.ruvector', 'assessment.json');
-  if (!phaseInfo) {
+  if (!existsSync(assessmentPath)) {
     return {
-      error: `Unknown phase: ${phase}`,
-      validPhases: Object.entries(PHASES).map(([k, v]) => ({ phase: parseFloat(k), name: v.name }))
+      error: 'NO_ASSESSMENT',
+      message: 'No assessment found. Run kb_first_assess first.',
+      action: 'Run kb_first_assess to score KB and phase readiness'
     };
   }
-  // Check for baseline
-  const baselinePath = join(cwd, '.ruvector', 'baseline.json');
-  let baseline = null;
-  let baselineWarning = null;
+  const assessment = JSON.parse(readFileSync(assessmentPath, 'utf-8'));
+  const threshold = args.threshold || 80;
+  const focusArea = args.focusArea || 'all';
+  const enhancements = [];
+  let taskId = 1;
+  // Find KB gaps
+  if (focusArea === 'all' || focusArea === 'kb') {
+    for (const [dim, data] of Object.entries(assessment.kb)) {
+      if (data.score < threshold) {
+        const gap = threshold - data.score;
+        enhancements.push({
+          id: taskId++,
+          area: 'KB Quality',
+          dimension: KB_DIMENSIONS[dim]?.name || dim,
+          currentScore: data.score,
+          targetScore: threshold,
+          predictedImprovement: gap,
+          task: data.improvement,
+          priority: gap > 30 ? 'HIGH' : (gap > 15 ? 'MEDIUM' : 'LOW'),
+          effort: gap > 30 ? 'Large' : (gap > 15 ? 'Medium' : 'Small')
+        });
+      }
+    }
+  }
-  if (existsSync(baselinePath)) {
-    try {
-      baseline = JSON.parse(readFileSync(baselinePath, 'utf-8'));
-      const baselineAge = (Date.now() - new Date(baseline.timestamp).getTime()) / (1000 * 60);
-      if (baselineAge > 60) {
-        baselineWarning = `Baseline is ${Math.round(baselineAge)} minutes old. Consider running kb_first_assess for fresh baseline.`;
+  // Find Phase gaps
+  if (focusArea === 'all' || focusArea === 'phases') {
+    for (const [num, data] of Object.entries(assessment.phases)) {
+      if (data.score < threshold && !data.completed) {
+        const gap = threshold - data.score;
+        enhancements.push({
+          id: taskId++,
+          area: 'Phase Readiness',
+          dimension: `Phase ${num}: ${data.name}`,
+          currentScore: data.score,
+          targetScore: threshold,
+          predictedImprovement: gap,
+          task: `Complete: ${data.unmet.slice(0, 3).join(', ')}${data.unmet.length > 3 ? '...' : ''}`,
+          priority: gap > 30 ? 'HIGH' : (gap > 15 ? 'MEDIUM' : 'LOW'),
+          effort: gap > 30 ? 'Large' : (gap > 15 ? 'Medium' : 'Small')
+        });
       }
-    } catch {}
+    }
   }
-  // Phase-specific guidance
-  const phaseGuidance = {
-    0: ['Document project scope', 'Identify domain complexity', 'Assess KB-First suitability', 'Estimate resources', 'Make go/no-go decision'],
-    1: ['Map domain concepts', 'Design taxonomy', 'Define relationships', 'Plan query patterns', 'Review with stakeholders'],
-    1.5: ['Install enforcement hooks', 'Configure hook behavior', 'Train on project patterns', 'Verify hooks work'],
-    2: ['Create database tables', 'Add vector columns', 'Design indexes', 'Write migration scripts'],
-    3: ['Collect domain content', 'Process and clean data', 'Generate embeddings', 'Import to KB', 'Validate entries'],
-    4: ['Analyze KB coverage', 'Calculate quality score', 'Identify gaps', 'Prioritize fixes', 'Create remediation plan'],
-    5: ['Build search API', 'Implement code generation', 'Add citation system', 'Enable gap logging'],
-    6: ['Write unit tests', 'Create integration tests', 'Test KB accuracy', 'Performance tests', 'Edge case testing'],
-    7: ['Optimize queries', 'Tune indexes', 'Add caching', 'Run benchmarks'],
-    7.5: ['Verify test coverage ≥80%', 'Run E2E suite', 'Load testing', 'Build regression suite'],
-    8: ['Run code scan', 'Check imports', 'Verify source returns', 'Test startup', 'Check fallbacks', 'Validate attribution', 'Test confidence', 'Review gap logs'],
-    9: ['Audit dependencies', 'Check OWASP Top 10', 'Test SQL injection', 'Review auth', 'Audit secrets', 'Secure APIs'],
-    10: ['Write README', 'Document API', 'Schema documentation', 'Architecture docs', 'Operator guide'],
-    11: ['Setup infrastructure', 'Configure environments', 'Build CI/CD', 'Run migrations', 'Setup monitoring', 'Go live'],
-    11.5: ['Setup OpenTelemetry', 'Build KB dashboard', 'Configure alerts', 'Write runbooks'],
-    12: ['Define gap triage', 'Setup expert review', 'Document KB updates', 'Version control', 'A/B testing']
+  // Sort by priority
+  const priorityOrder = { HIGH: 0, MEDIUM: 1, LOW: 2 };
+  enhancements.sort((a, b) => priorityOrder[a.priority] - priorityOrder[b.priority]);
+  // Calculate predicted totals
+  const predictedKBImprovement = enhancements
+    .filter(e => e.area === 'KB Quality')
+    .reduce((sum, e) => sum + e.predictedImprovement, 0);
+  const predictedPhaseImprovement = enhancements
+    .filter(e => e.area === 'Phase Readiness')
+    .reduce((sum, e) => sum + e.predictedImprovement, 0);
+  const plan = {
+    timestamp: new Date().toISOString(),
+    threshold,
+    baselineScores: assessment.overall,
+    enhancements,
+    predictions: {
+      kbImprovement: `+${Math.round(predictedKBImprovement / 6)}`, // Average across 6 dimensions
+      phaseImprovement: `+${Math.round(predictedPhaseImprovement / Object.keys(PHASES).length)}`,
+      tasksCount: enhancements.length,
+      highPriority: enhancements.filter(e => e.priority === 'HIGH').length,
+      mediumPriority: enhancements.filter(e => e.priority === 'MEDIUM').length,
+      lowPriority: enhancements.filter(e => e.priority === 'LOW').length
+    },
+    confirmed: false,
+    currentTaskIndex: 0
   };
+  writeFileSync(join(cwd, '.ruvector', 'plan.json'), JSON.stringify(plan, null, 2));
   return {
-    phase,
-    name: phaseInfo.name,
-    gate: phaseInfo.gate,
-    baseline: baseline ? {
-      score: baseline.total,
-      grade: baseline.grade,
-      timestamp: baseline.timestamp
-    } : null,
-    baselineWarning,
-    tasks: phaseGuidance[phase] || [],
-    reminder: '⚠️ IMPORTANT: Run kb_first_delta when phase work is complete to measure improvement',
-    gateRequirement: `Gate "${phaseInfo.gate}" must be satisfied to proceed`
+    action: 'PLAN_GENERATED',
+    summary: {
+      totalTasks: enhancements.length,
+      highPriority: plan.predictions.highPriority,
+      mediumPriority: plan.predictions.mediumPriority,
+      lowPriority: plan.predictions.lowPriority
+    },
+    predictedImprovements: {
+      kb: plan.predictions.kbImprovement,
+      phases: plan.predictions.phaseImprovement
+    },
+    enhancements: enhancements.map(e => ({
+      id: e.id,
+      priority: e.priority,
+      area: e.dimension,
+      current: e.currentScore,
+      target: e.targetScore,
+      task: e.task
+    })),
+    nextStep: 'Review the plan above. Run kb_first_confirm with confirmed=true when ready to proceed.'
   };
 }
-async function handleKbFirstDelta(cwd, args) {
-  const baselinePath = join(cwd, '.ruvector', 'baseline.json');
+async function handleConfirm(cwd, args) { // kb_first_confirm handler: marks the saved plan as confirmed and returns its first task; returns an error/prompt object (does not throw) when the plan file is missing or args.confirmed is falsy.
+  const planPath = join(cwd, '.ruvector', 'plan.json'); // plan file lives under <cwd>/.ruvector/
-  if (!existsSync(baselinePath)) {
+  if (!existsSync(planPath)) { // nothing to confirm until a plan file exists
     return {
-      error: 'NO_BASELINE',
-      message: 'No baseline found. Run kb_first_assess first to establish baseline.',
-      action: 'Run kb_first_assess with saveBaseline=true'
+      error: 'NO_PLAN',
+      message: 'No plan found. Run kb_first_plan first.',
+      action: 'Run kb_first_plan to generate enhancement plan'
     };
   }
-  let baseline;
-  try {
-    baseline = JSON.parse(readFileSync(baselinePath, 'utf-8'));
-  } catch {
-    return { error: 'CORRUPT_BASELINE', message: 'Baseline file is corrupt. Run kb_first_assess again.' };
+  if (!args.confirmed) { // any falsy value, including an omitted flag, counts as "not confirmed"
+    return {
+      action: 'CONFIRMATION_REQUIRED',
+      message: 'You must confirm with confirmed=true to proceed.',
+      hint: 'Review the plan from kb_first_plan, then confirm when ready.'
+    };
   }
-  const current = calculateScores(cwd);
+  const plan = JSON.parse(readFileSync(planPath, 'utf-8')); // NOTE(review): no try/catch — a plan file that is not valid JSON makes this throw instead of returning an error object
+  plan.confirmed = true;
+  plan.confirmedAt = new Date().toISOString();
+  plan.currentTaskIndex = 0; // NOTE(review): always rewinds to the first task, even when an already-confirmed plan is confirmed again
-  const delta = {
-    total: current.total - baseline.total,
-    kb: current.kb.total - baseline.kb.total,
-    app: current.app.total - baseline.app.total,
-    process: current.process.total - baseline.process.total
-  };
+  writeFileSync(planPath, JSON.stringify(plan, null, 2)); // persist the confirmed flag and timestamp back to the same file
-  const verdict = delta.total >= 0 ? 'PASS' : 'FAIL';
-  const canProceed = delta.total >= 0;
+  const firstTask = plan.enhancements[0]; // undefined when the plan has no enhancements
-  const result = {
-    verdict,
-    canProceed,
-    baseline: {
-      score: baseline.total,
-      grade: baseline.grade,
-      timestamp: baseline.timestamp
-    },
-    current: {
-      score: current.total,
-      grade: current.grade,
-      timestamp: current.timestamp
-    },
-    delta: {
-      total: delta.total > 0 ? `+${delta.total}` : `${delta.total}`,
-      kb: delta.kb > 0 ? `+${delta.kb}` : `${delta.kb}`,
-      app: delta.app > 0 ? `+${delta.app}` : `${delta.app}`,
-      process: delta.process > 0 ? `+${delta.process}` : `${delta.process}`
-    }
+  return {
+    action: 'PLAN_CONFIRMED',
+    confirmedAt: plan.confirmedAt,
+    totalTasks: plan.enhancements.length,
+    message: 'Plan locked. Ready to execute.',
+    firstTask: firstTask ? { // null when the plan is empty
+      id: firstTask.id,
+      priority: firstTask.priority,
+      area: firstTask.dimension, // the response's "area" carries the enhancement's dimension label, not its area field
+      task: firstTask.task,
+      currentScore: firstTask.currentScore,
+      targetScore: firstTask.targetScore
+    } : null,
+    nextStep: 'Run kb_first_execute to work through the plan'
   };
+}
-  if (!canProceed) {
-    result.blockReason = `Score dropped by ${Math.abs(delta.total)} points. You CANNOT proceed until score improves.`;
-    result.action = 'Fix issues causing score regression, then run kb_first_delta again.';
-  } else {
-    result.action = 'Run kb_first_gate to verify phase completion and proceed.';
-  }
+async function handleExecute(cwd, args) { // kb_first_execute handler: optionally marks the current task done (args.taskComplete), then returns either the next task with guidance or an EXECUTION_COMPLETE summary; returns an error object when the plan is missing or unconfirmed.
+  const planPath = join(cwd, '.ruvector', 'plan.json');
-  if (args.showBreakdown !== false) {
-    result.componentChanges = {
-      kb: {
-        before: baseline.kb.components,
-        after: current.kb.components
-      },
-      app: {
-        before: baseline.app.components,
-        after: current.app.components
-      },
-      process: {
-        before: baseline.process.components,
-        after: current.process.components
-      }
+  if (!existsSync(planPath)) {
+    return {
+      error: 'NO_PLAN',
+      message: 'No plan found. Run kb_first_plan first.'
     };
   }
-  return result;
-}
+  const plan = JSON.parse(readFileSync(planPath, 'utf-8')); // NOTE(review): throws if the plan file is not valid JSON (no try/catch)
-async function handleKbFirstGate(cwd, args) {
-  const phase = args.phase;
-  const phaseInfo = PHASES[phase];
+  if (!plan.confirmed) { // execution is refused until the plan's confirmed flag has been set
+    return {
+      error: 'PLAN_NOT_CONFIRMED',
+      message: 'Plan not confirmed. Run kb_first_confirm first.',
+      action: 'Run kb_first_confirm with confirmed=true'
+    };
+  }
-  if (!phaseInfo) {
-    return { error: `Unknown phase: ${phase}` };
+  // Mark current task complete if requested (skipped when the index is already past the last task)
+  if (args.taskComplete && plan.currentTaskIndex < plan.enhancements.length) {
+    plan.enhancements[plan.currentTaskIndex].completed = true;
+    plan.enhancements[plan.currentTaskIndex].completedAt = new Date().toISOString();
+    plan.currentTaskIndex++; // advance to the next enhancement
+    writeFileSync(planPath, JSON.stringify(plan, null, 2)); // persist progress; each call re-reads the plan from this file
   }
-  // Check baseline exists
-  const baselinePath = join(cwd, '.ruvector', 'baseline.json');
-  if (!existsSync(baselinePath)) {
+  // Check if all done (also true for a plan with zero enhancements)
+  if (plan.currentTaskIndex >= plan.enhancements.length) {
     return {
-      canProceed: false,
-      blockReason: 'GATE_BLOCKED: No baseline established. Run kb_first_assess first.',
-      phase,
-      phaseName: phaseInfo.name
+      action: 'EXECUTION_COMPLETE',
+      message: 'All tasks completed!',
+      completedTasks: plan.enhancements.length,
+      nextStep: 'Run kb_first_verify to compare predicted vs actual improvements'
     };
   }
-  // Check delta
-  let baseline;
-  try {
-    baseline = JSON.parse(readFileSync(baselinePath, 'utf-8'));
-  } catch {
-    return {
-      canProceed: false,
-      blockReason: 'GATE_BLOCKED: Corrupt baseline. Run kb_first_assess again.',
-      phase,
-      phaseName: phaseInfo.name
-    };
+  const currentTask = plan.enhancements[plan.currentTaskIndex];
+  const completedCount = plan.enhancements.filter(e => e.completed).length; // counts entries carrying the completed flag set above
+  return {
+    action: 'EXECUTING',
+    progress: {
+      completed: completedCount,
+      total: plan.enhancements.length,
+      percent: Math.round((completedCount / plan.enhancements.length) * 100) // no divide-by-zero: an empty plan already returned EXECUTION_COMPLETE above
+    },
+    currentTask: {
+      id: currentTask.id,
+      priority: currentTask.priority,
+      area: currentTask.dimension, // the response's "area" carries the dimension label
+      task: currentTask.task,
+      currentScore: currentTask.currentScore,
+      targetScore: currentTask.targetScore,
+      predictedImprovement: `+${currentTask.predictedImprovement}`
+    },
+    guidance: getTaskGuidance(currentTask), // receives the stored enhancement, whose own area/dimension fields drive the hint
+    nextStep: 'Complete the task above, then run kb_first_execute with taskComplete=true'
+  };
+}
+function getTaskGuidance(task) { // Returns a guidance string for a plan enhancement: a fixed hint per known 'KB Quality' dimension, otherwise the enhancement's own task text.
+  // Provide specific guidance based on task type (reads task.area, task.dimension and task.task)
+  if (task.area === 'KB Quality') { // only KB Quality enhancements have canned hints
+    switch (task.dimension) {
+      case 'Completeness':
+        return 'Add more KB entries covering missing domain topics. Each entry should be in src/kb/ directory.';
+      case 'Depth':
+        return 'Expand existing KB entries with more detail. Target 2000+ characters per entry.';
+      case 'Comprehensiveness':
+        return 'Document edge cases, exceptions, and nuances in your KB entries.';
+      case 'Accuracy':
+        return 'Add tests to validate KB content. Create a tests/ directory with validation tests.';
+      case 'Freshness':
+        return 'Update KB content with latest information. Touch .ruvector/ to update timestamps.';
+      case 'Attribution':
+        return 'Add KB-Generated: headers to code files citing their KB sources.';
+      default: // unrecognized KB dimension: fall back to the stored task text
+        return task.task;
+    }
   }
+  return task.task; // any other area simply echoes its task text
+}
-  const current = calculateScores(cwd);
-  const delta = current.total - baseline.total;
+async function handleVerify(cwd, args) { // kb_first_verify handler: re-scores the project, compares it with the saved assessment and plan, writes verification.json, and when the target is not met overwrites assessment.json and plan.json with the next iteration.
+  const planPath = join(cwd, '.ruvector', 'plan.json');
+  const assessmentPath = join(cwd, '.ruvector', 'assessment.json');
+  const TARGET_SCORE = 98; // Recursive loop until we hit 98+
-  if (delta < 0) {
+  if (!existsSync(planPath) || !existsSync(assessmentPath)) { // both files are required; a single MISSING_DATA error covers either one being absent
     return {
-      canProceed: false,
-      blockReason: `GATE_BLOCKED: Score regression detected (${delta} points). Fix issues before proceeding.`,
-      phase,
-      phaseName: phaseInfo.name,
-      baseline: baseline.total,
-      current: current.total,
-      delta
+      error: 'MISSING_DATA',
+      message: 'Missing plan or assessment. Run kb_first_assess and kb_first_plan first.'
     };
   }
-  // Check gate-specific conditions
-  const configPath = join(cwd, '.ruvector', 'config.json');
-  let config = { phases: { current: 0, completed: [], gates: {} } };
-  if (existsSync(configPath)) {
-    try {
-      config = JSON.parse(readFileSync(configPath, 'utf-8'));
-    } catch {}
-  }
+  const plan = JSON.parse(readFileSync(planPath, 'utf-8')); // NOTE(review): throws if the file is not valid JSON (no try/catch)
+  const originalAssessment = JSON.parse(readFileSync(assessmentPath, 'utf-8')); // NOTE(review): same — an invalid assessment file throws here
-  // Phase-specific gate checks
-  let gateConditionMet = false;
-  let gateMessage = '';
-  switch (phaseInfo.gate) {
-    case 'kb_score_50':
-      gateConditionMet = current.kb.total >= 20; // 50% of 40
-      gateMessage = gateConditionMet ? 'KB score ≥50%' : `KB score ${current.kb.total}/40 < 50%`;
-      break;
-    case 'kb_score_80':
-      gateConditionMet = current.kb.total >= 32; // 80% of 40
-      gateMessage = gateConditionMet ? 'KB score ≥80%' : `KB score ${current.kb.total}/40 < 80%`;
-      break;
-    case 'coverage_80':
-      gateConditionMet = current.app.components.testCoverage >= 8; // 80% of 10
-      gateMessage = gateConditionMet ? 'Test coverage ≥80%' : `Test coverage ${current.app.components.testCoverage}/10 < 80%`;
-      break;
-    default:
-      // Default: pass if delta is non-negative
-      gateConditionMet = true;
-      gateMessage = 'Gate condition satisfied (positive delta)';
+  // Re-assess current state
+  const currentKB = scoreKBDimensions(cwd);
+  const currentPhases = scorePhaseReadiness(cwd);
+  const currentOverall = calculateOverallScores(currentKB, currentPhases);
+  // Compare predictions vs actual
+  const comparison = {
+    kb: {},
+    phases: {}
+  };
+  // Compare KB dimensions (iterates the keys of the saved assessment, not of the fresh scores)
+  for (const [dim, original] of Object.entries(originalAssessment.kb)) {
+    const current = currentKB[dim]; // NOTE(review): current.score below throws if the fresh scores lack this key — confirm both always share the same keys
+    const enhancement = plan.enhancements.find(e => e.dimension === KB_DIMENSIONS[dim]?.name); // plan entries are matched by the dimension's display name; undefined when the plan has none for it
+    comparison.kb[dim] = {
+      before: original.score,
+      after: current.score,
+      actual: current.score - original.score,
+      predicted: enhancement?.predictedImprovement || 0, // 0 when the plan had no entry for this dimension
+      hit: current.score >= TARGET_SCORE // "hit" means the score reached TARGET_SCORE, not that it matched the prediction
+    };
   }
-  if (!gateConditionMet) {
-    return {
-      canProceed: false,
-      blockReason: `GATE_BLOCKED: ${gateMessage}`,
-      phase,
-      phaseName: phaseInfo.name,
-      gate: phaseInfo.gate
+  // Compare phases
+  for (const [num, original] of Object.entries(originalAssessment.phases)) {
+    const current = currentPhases[num];
+    const enhancement = plan.enhancements.find(e => e.dimension === `Phase ${num}: ${original.name}`); // matched on the "Phase N: name" label string
+    comparison.phases[num] = {
+      name: original.name,
+      before: original.score,
+      after: current.score,
+      actual: current.score - original.score,
+      predicted: enhancement?.predictedImprovement || 0,
+      hit: current.score >= TARGET_SCORE
     };
   }
-  // Mark phase as completed
-  if (!config.phases.completed.includes(parseFloat(phase))) {
-    config.phases.completed.push(parseFloat(phase));
+  // Calculate summary
+  const kbHits = Object.values(comparison.kb).filter(c => c.hit).length;
+  const kbTotal = Object.keys(comparison.kb).length;
+  const phaseHits = Object.values(comparison.phases).filter(c => c.hit).length;
+  const phaseTotal = Object.keys(comparison.phases).length;
+  // Identify remaining gaps (anything below 98)
+  const remainingGaps = [];
+  for (const [dim, data] of Object.entries(comparison.kb)) {
+    if (data.after < TARGET_SCORE) {
+      remainingGaps.push({
+        area: 'KB Quality',
+        dimension: KB_DIMENSIONS[dim]?.name || dim, // falls back to the raw key when no display name is available
+        currentScore: data.after,
+        targetScore: TARGET_SCORE,
+        gap: TARGET_SCORE - data.after
+      });
+    }
+  }
+  for (const [num, data] of Object.entries(comparison.phases)) {
+    if (data.after < TARGET_SCORE) {
+      remainingGaps.push({
+        area: 'Phase Readiness',
+        dimension: `Phase ${num}: ${data.name}`,
+        currentScore: data.after,
+        targetScore: TARGET_SCORE,
+        gap: TARGET_SCORE - data.after
+      });
+    }
   }
-  config.phases.gates[phaseInfo.gate] = true;
-  // Determine next phase
-  const phaseOrder = [0, 1, 1.5, 2, 3, 4, 5, 6, 7, 7.5, 8, 9, 10, 11, 11.5, 12];
-  const currentIdx = phaseOrder.indexOf(parseFloat(phase));
-  const nextPhase = currentIdx < phaseOrder.length - 1 ? phaseOrder[currentIdx + 1] : null;
+  // Track iteration count
+  let iterationCount = plan.iterationCount || 1; // a plan without an iterationCount field is treated as iteration 1
+  // Save verification
+  const verification = {
+    timestamp: new Date().toISOString(),
+    iteration: iterationCount,
+    original: originalAssessment.overall,
+    current: currentOverall,
+    comparison,
+    remainingGaps,
+    targetScore: TARGET_SCORE,
+    targetMet: currentOverall.overall >= TARGET_SCORE // based on the overall score only; individual gaps may still remain
+  };
+  writeFileSync(join(cwd, '.ruvector', 'verification.json'), JSON.stringify(verification, null, 2));
-  if (nextPhase !== null) {
-    config.phases.current = nextPhase;
+  const result = {
+    action: 'VERIFICATION_COMPLETE',
+    iteration: iterationCount,
+    targetScore: TARGET_SCORE,
+    summary: {
+      kbAt98Plus: `${kbHits}/${kbTotal}`,
+      phasesAt98Plus: `${phaseHits}/${phaseTotal}`,
+      overallImprovement: {
+        kb: `${originalAssessment.overall.kbOverall} → ${currentOverall.kbOverall} (${currentOverall.kbOverall - originalAssessment.overall.kbOverall >= 0 ? '+' : ''}${currentOverall.kbOverall - originalAssessment.overall.kbOverall})`,
+        phases: `${originalAssessment.overall.phaseOverall} → ${currentOverall.phaseOverall} (${currentOverall.phaseOverall - originalAssessment.overall.phaseOverall >= 0 ? '+' : ''}${currentOverall.phaseOverall - originalAssessment.overall.phaseOverall})`,
+        combined: `${originalAssessment.overall.overall} → ${currentOverall.overall} (${currentOverall.overall - originalAssessment.overall.overall >= 0 ? '+' : ''}${currentOverall.overall - originalAssessment.overall.overall})`
+      }
+    }
+  };
+  if (args.detailed) { // per-dimension comparison tables are opt-in
+    result.kbComparison = comparison.kb;
+    result.phaseComparison = comparison.phases;
   }
-  // Save config
-  writeFileSync(configPath, JSON.stringify(config, null, 2));
+  // Check if we've hit the target (needs the overall score AND every individual score at or above the target)
+  if (currentOverall.overall >= TARGET_SCORE && remainingGaps.length === 0) {
+    result.status = 'TARGET_ACHIEVED';
+    result.message = `🎯 All scores at ${TARGET_SCORE}+ after ${iterationCount} iteration(s)!`;
+    result.remainingGaps = 'None - all targets met!';
+    result.nextStep = 'Excellence achieved. Ready for production.';
+  } else {
+    // RECURSIVE: Auto-generate next plan
+    result.status = 'NEEDS_MORE_WORK';
+    result.message = `Score ${currentOverall.overall}/100 - target is ${TARGET_SCORE}. Generating next iteration plan...`;
+    result.remainingGaps = remainingGaps;
+    // Update assessment with current scores for next iteration
+    const newAssessment = {
+      timestamp: new Date().toISOString(),
+      kb: currentKB,
+      phases: currentPhases,
+      overall: currentOverall,
+      previousIteration: iterationCount
+    };
+    writeFileSync(join(cwd, '.ruvector', 'assessment.json'), JSON.stringify(newAssessment, null, 2)); // overwrites the saved assessment, so the next verify call compares against these scores
+    // Auto-generate new plan for remaining gaps
+    const newEnhancements = remainingGaps.map((gap, idx) => ({
+      id: idx + 1, // ids restart at 1 for each regenerated plan
+      area: gap.area,
+      dimension: gap.dimension,
+      currentScore: gap.currentScore,
+      targetScore: TARGET_SCORE,
+      predictedImprovement: gap.gap,
+      task: getImprovementTask(gap),
+      priority: gap.gap > 30 ? 'HIGH' : (gap.gap > 15 ? 'MEDIUM' : 'LOW'),
+      effort: gap.gap > 30 ? 'Large' : (gap.gap > 15 ? 'Medium' : 'Small')
+    }));
+    const newPlan = {
+      timestamp: new Date().toISOString(),
+      threshold: TARGET_SCORE,
+      iterationCount: iterationCount + 1,
+      baselineScores: currentOverall,
+      enhancements: newEnhancements, // kept in remainingGaps order (KB gaps first, then phases); no priority sort is applied here
+      predictions: { // only task counts are recorded; no kbImprovement/phaseImprovement totals are computed for regenerated plans
+        tasksCount: newEnhancements.length,
+        highPriority: newEnhancements.filter(e => e.priority === 'HIGH').length,
+        mediumPriority: newEnhancements.filter(e => e.priority === 'MEDIUM').length,
+        lowPriority: newEnhancements.filter(e => e.priority === 'LOW').length
+      },
+      confirmed: false, // the regenerated plan starts unconfirmed
+      currentTaskIndex: 0
+    };
+    writeFileSync(join(cwd, '.ruvector', 'plan.json'), JSON.stringify(newPlan, null, 2)); // replaces the plan that was just verified
-  // Save current scores as new baseline for next phase
-  writeFileSync(baselinePath, JSON.stringify(current, null, 2));
+    result.newPlan = {
+      iteration: iterationCount + 1,
+      tasks: newEnhancements.length,
+      highPriority: newPlan.predictions.highPriority
+    };
+    result.nextStep = `Iteration ${iterationCount + 1} plan generated. Run kb_first_confirm with confirmed=true to continue.`;
+  }
-  return {
-    canProceed: true,
-    phase,
-    phaseName: phaseInfo.name,
-    gateStatus: 'PASSED',
-    gateMessage,
-    scoreImprovement: delta > 0 ? `+${delta}` : '0',
-    nextPhase,
-    nextPhaseName: nextPhase !== null ? PHASES[nextPhase]?.name : 'PROJECT COMPLETE',
-    action: nextPhase !== null
-      ? `Run kb_first_assess to establish baseline for Phase ${nextPhase}: ${PHASES[nextPhase]?.name}`
-      : 'All phases complete! Project ready for production.'
-  };
+  return result;
+}
+/**
+ * Get improvement task based on gap
+ *
+ * Builds the task text stored on an enhancement of a regenerated plan.
+ *
+ * @param {object} gap - Remaining-gap record; this function reads its
+ *   `area`, `dimension` and `targetScore` fields.
+ * @returns {string} A fixed sentence for each known 'KB Quality' dimension,
+ *   a generic "Improve ..." sentence for an unknown KB dimension, or a
+ *   "Complete remaining criteria ..." sentence for any other area.
+ */
+function getImprovementTask(gap) {
+  if (gap.area === 'KB Quality') { // only KB Quality gaps get dimension-specific wording
+    switch (gap.dimension) {
+      case 'Completeness':
+        return `Add more KB entries to reach ${gap.targetScore}% coverage`;
+      case 'Depth':
+        return `Expand KB entries with more detail (target: 2500+ chars each)`;
+      case 'Comprehensiveness':
+        return `Document additional edge cases and exceptions`;
+      case 'Accuracy':
+        return `Add validation tests and verification`;
+      case 'Freshness':
+        return `Update KB content with latest information`;
+      case 'Attribution':
+        return `Add KB-Generated headers to remaining code files`;
+      default: // KB dimension without canned wording
+        return `Improve ${gap.dimension} to ${gap.targetScore}`;
+    }
+  }
+  return `Complete remaining criteria for ${gap.dimension}`; // every non-KB area, e.g. 'Phase Readiness'
 }
 /**
  * Handle MCP tool calls
+ *
+ * Dispatches a tool invocation to the matching handler and returns that
+ * handler's result object.
+ *
+ * @param {string} toolName - Tool identifier; the five kb_first_* names in the
+ *   switch below are recognized.
+ * @param {object} args - Tool arguments, passed through unchanged to the
+ *   handler; `args.projectPath`, when truthy, is used as the working directory.
+ * @returns {Promise<object>} The handler's result, or `{ error }` for an
+ *   unrecognized tool name.
  */
 async function handleToolCall(toolName, args) {
-  const cwd = process.cwd();
+  const cwd = args.projectPath || process.cwd(); // caller-supplied project path wins over the process working directory; NOTE(review): would throw if args were ever undefined — confirm callers always pass an object
   switch (toolName) {
     case 'kb_first_assess':
-      return await handleKbFirstAssess(cwd, args);
-    case 'kb_first_phase':
-      return await handleKbFirstPhase(cwd, args);
-    case 'kb_first_delta':
-      return await handleKbFirstDelta(cwd, args);
-    case 'kb_first_gate':
-      return await handleKbFirstGate(cwd, args);
+      return await handleAssess(cwd, args);
+    case 'kb_first_plan':
+      return await handlePlan(cwd, args);
+    case 'kb_first_confirm':
+      return await handleConfirm(cwd, args);
+    case 'kb_first_execute':
+      return await handleExecute(cwd, args);
+    case 'kb_first_verify':
+      return await handleVerify(cwd, args);
     default:
       return { error: `Unknown tool: ${toolName}` };
   }
@@ -711,12 +1029,12 @@ async function handleMCPMessage(message) {
 }
 /**
- * Start MCP Server (stdio mode)
+ * Start MCP Server
  */
 export async function startMCPServer(options = {}) {
   console.error(`RuvNet KB-First MCP Server v${SERVER_VERSION}`);
-  console.error('Architecture: Score-Driven | Tools: 4 | Phases: 15');
-  console.error('Philosophy: Scoring IS enforcement. No shortcuts.');
+  console.error('Architecture: Granular Score-Driven | Tools: 5 | Dimensions: 6 KB + 12 Phases');
+  console.error('Workflow: Assess → Plan → Confirm → Execute → Verify');
   let buffer = '';
   process.stdin.setEncoding('utf-8');