npm - @aiready/context-analyzer - Versions diffs - 0.5.1 → 0.6.0 - Mend

@aiready/context-analyzer 0.5.1 → 0.6.0

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (15)

package/.turbo/turbo-build.log +7 -7
package/.turbo/turbo-test.log +10 -27
package/COHESION-IMPROVEMENTS.md +202 -0
package/dist/chunk-DD7UVNE3.mjs +678 -0
package/dist/chunk-EX7HCWAO.mjs +625 -0
package/dist/cli.js +100 -32
package/dist/cli.mjs +1 -1
package/dist/index.js +100 -32
package/dist/index.mjs +1 -1
package/package.json +2 -2
package/src/__tests__/analyzer.test.ts +24 -0
package/src/__tests__/enhanced-cohesion.test.ts +126 -0
package/src/analyzer.ts +178 -40
package/src/index.ts +1 -1
package/src/types.ts +3 -0

package/src/analyzer.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { estimateTokens } from '@aiready/core';
+import { estimateTokens, parseFileExports, calculateImportSimilarity, type ExportWithImports } from '@aiready/core';
 import type {
   ContextAnalysisResult,
   DependencyGraph,
@@ -24,7 +24,10 @@ export function buildDependencyGraph(
   // First pass: Create nodes
   for (const { file, content } of files) {
     const imports = extractImportsFromContent(content);
-    const exports = extractExports(content);
+    // Use AST-based extraction for better accuracy, fallback to regex
+    const exports = extractExportsWithAST(content, file);
     const tokenCost = estimateTokens(content);
     const linesOfCode = content.split('\n').length;
@@ -199,33 +202,28 @@ export function detectCircularDependencies(
 /**
  * Calculate cohesion score (how related are exports in a file)
- * Uses entropy: low entropy = high cohesion
+ * Uses enhanced calculation combining domain-based and import-based analysis
+ * @param exports - Array of export information
+ * @param filePath - Optional file path for context-aware scoring
  */
-export function calculateCohesion(exports: ExportInfo[]): number {
-  if (exports.length === 0) return 1;
-  if (exports.length === 1) return 1; // Single export = perfect cohesion
-  const domains = exports.map((e) => e.inferredDomain || 'unknown');
-  const domainCounts = new Map<string, number>();
-  for (const domain of domains) {
-    domainCounts.set(domain, (domainCounts.get(domain) || 0) + 1);
-  }
-  // Calculate Shannon entropy
-  const total = domains.length;
-  let entropy = 0;
-  for (const count of domainCounts.values()) {
-    const p = count / total;
-    if (p > 0) {
-      entropy -= p * Math.log2(p);
-    }
-  }
+export function calculateCohesion(exports: ExportInfo[], filePath?: string): number {
+  return calculateEnhancedCohesion(exports, filePath);
+}
-  // Normalize to 0-1 (higher = better cohesion)
-  const maxEntropy = Math.log2(total);
-  return maxEntropy > 0 ? 1 - entropy / maxEntropy : 1;
+/**
+ * Check if a file is a test/mock/fixture file
+ */
+function isTestFile(filePath: string): boolean {
+  const lower = filePath.toLowerCase();
+  return (
+    lower.includes('test') ||
+    lower.includes('spec') ||
+    lower.includes('mock') ||
+    lower.includes('fixture') ||
+    lower.includes('__tests__') ||
+    lower.includes('.test.') ||
+    lower.includes('.spec.')
+  );
 }
 /**
@@ -279,7 +277,7 @@ export function detectModuleClusters(
     const avgCohesion =
       files.reduce((sum, file) => {
         const node = graph.nodes.get(file);
-        return sum + (node ? calculateCohesion(node.exports) : 0);
+        return sum + (node ? calculateCohesion(node.exports, file) : 0);
       }, 0) / files.length;
     // Generate consolidation plan
@@ -349,33 +347,45 @@ function extractExports(content: string): ExportInfo[] {
 /**
  * Infer domain from export name
- * Uses common naming patterns
+ * Uses common naming patterns with word boundary matching
  */
 function inferDomain(name: string): string {
   const lower = name.toLowerCase();
-  // Common domain keywords
+  // Domain keywords ordered from most specific to most general
+  // This prevents generic terms like 'util' from matching before specific domains
   const domainKeywords = [
-    'user',
-    'auth',
-    'order',
-    'product',
+    'authentication',
+    'authorization',
     'payment',
-    'cart',
     'invoice',
     'customer',
+    'product',
+    'order',
+    'cart',
+    'user',
     'admin',
-    'api',
-    'util',
-    'helper',
-    'config',
-    'service',
     'repository',
     'controller',
+    'service',
+    'config',
     'model',
     'view',
+    'auth',
+    'api',
+    'helper',
+    'util',
   ];
+  // Try word boundary matching first for more accurate detection
+  for (const keyword of domainKeywords) {
+    const wordBoundaryPattern = new RegExp(`\\b${keyword}\\b`, 'i');
+    if (wordBoundaryPattern.test(name)) {
+      return keyword;
+    }
+  }
+  // Fallback to substring matching for compound words
   for (const keyword of domainKeywords) {
     if (lower.includes(keyword)) {
       return keyword;
@@ -424,3 +434,131 @@ function generateConsolidationPlan(
   return plan;
 }
+/**
+ * Extract exports using AST parsing (enhanced version)
+ * Falls back to regex if AST parsing fails
+ */
+export function extractExportsWithAST(content: string, filePath: string): ExportInfo[] {
+  try {
+    const { exports: astExports } = parseFileExports(content, filePath);
+    return astExports.map(exp => ({
+      name: exp.name,
+      type: exp.type,
+      inferredDomain: inferDomain(exp.name),
+      imports: exp.imports,
+      dependencies: exp.dependencies,
+    }));
+  } catch (error) {
+    // Fallback to regex-based extraction
+    return extractExports(content);
+  }
+}
+/**
+ * Calculate enhanced cohesion score using both domain inference and import similarity
+ *
+ * This combines:
+ * 1. Domain-based cohesion (entropy of inferred domains)
+ * 2. Import-based cohesion (Jaccard similarity of shared imports)
+ *
+ * Weight: 60% import-based, 40% domain-based (import analysis is more reliable)
+ */
+export function calculateEnhancedCohesion(
+  exports: ExportInfo[],
+  filePath?: string
+): number {
+  if (exports.length === 0) return 1;
+  if (exports.length === 1) return 1;
+  // Special case for test files
+  if (filePath && isTestFile(filePath)) {
+    return 1;
+  }
+  // Calculate domain-based cohesion (existing method)
+  const domainCohesion = calculateDomainCohesion(exports);
+  // Calculate import-based cohesion if imports are available
+  const hasImportData = exports.some(e => e.imports && e.imports.length > 0);
+  if (!hasImportData) {
+    // No import data available, use domain-based only
+    return domainCohesion;
+  }
+  const importCohesion = calculateImportBasedCohesion(exports);
+  // Weighted combination: 60% import-based, 40% domain-based
+  return importCohesion * 0.6 + domainCohesion * 0.4;
+}
+/**
+ * Calculate cohesion based on shared imports (Jaccard similarity)
+ */
+function calculateImportBasedCohesion(exports: ExportInfo[]): number {
+  const exportsWithImports = exports.filter(e => e.imports && e.imports.length > 0);
+  if (exportsWithImports.length < 2) {
+    return 1; // Not enough data
+  }
+  // Calculate pairwise import similarity
+  let totalSimilarity = 0;
+  let comparisons = 0;
+  for (let i = 0; i < exportsWithImports.length; i++) {
+    for (let j = i + 1; j < exportsWithImports.length; j++) {
+      const exp1 = exportsWithImports[i] as ExportInfo & { imports: string[] };
+      const exp2 = exportsWithImports[j] as ExportInfo & { imports: string[] };
+      const similarity = calculateJaccardSimilarity(exp1.imports, exp2.imports);
+      totalSimilarity += similarity;
+      comparisons++;
+    }
+  }
+  return comparisons > 0 ? totalSimilarity / comparisons : 1;
+}
+/**
+ * Calculate Jaccard similarity between two arrays
+ */
+function calculateJaccardSimilarity(arr1: string[], arr2: string[]): number {
+  if (arr1.length === 0 && arr2.length === 0) return 1;
+  if (arr1.length === 0 || arr2.length === 0) return 0;
+  const set1 = new Set(arr1);
+  const set2 = new Set(arr2);
+  const intersection = new Set([...set1].filter(x => set2.has(x)));
+  const union = new Set([...set1, ...set2]);
+  return intersection.size / union.size;
+}
+/**
+ * Calculate domain-based cohesion (existing entropy method)
+ */
+function calculateDomainCohesion(exports: ExportInfo[]): number {
+  const domains = exports.map((e) => e.inferredDomain || 'unknown');
+  const domainCounts = new Map<string, number>();
+  for (const domain of domains) {
+    domainCounts.set(domain, (domainCounts.get(domain) || 0) + 1);
+  }
+  const total = domains.length;
+  let entropy = 0;
+  for (const count of domainCounts.values()) {
+    const p = count / total;
+    if (p > 0) {
+      entropy -= p * Math.log2(p);
+    }
+  }
+  const maxEntropy = Math.log2(total);
+  return maxEntropy > 0 ? 1 - entropy / maxEntropy : 1;
+}

package/src/index.ts CHANGED Viewed

@@ -157,7 +157,7 @@ export async function analyzeContext(
     const cohesionScore =
       focus === 'cohesion' || focus === 'all'
-        ? calculateCohesion(node.exports)
+        ? calculateCohesion(node.exports, file)
         : 1;
     const fragmentationScore = fragmentationMap.get(file) || 0;

package/src/types.ts CHANGED Viewed

@@ -101,4 +101,7 @@ export interface ExportInfo {
   name: string;
   type: 'function' | 'class' | 'const' | 'type' | 'interface' | 'default';
   inferredDomain?: string; // Inferred from name/usage
+  imports?: string[]; // Imports used by this export (for import-based cohesion)
+  dependencies?: string[]; // Other exports from same file this depends on
 }