npm - codecritique - Versions diffs - 1.2.2 → 1.2.4 - Mend

codecritique 1.2.2 → 1.2.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (14) hide show

package/package.json +1 -1
package/src/content-retrieval.js +93 -153
package/src/content-retrieval.test.js +49 -9
package/src/custom-documents.js +17 -17
package/src/feedback-loader.js +31 -31
package/src/index.js +71 -94
package/src/llm.js +4 -3
package/src/project-analyzer.js +73 -41
package/src/project-analyzer.test.js +3 -5
package/src/rag-analyzer.js +189 -169
package/src/rag-analyzer.test.js +55 -0
package/src/rag-review.js +105 -74
package/src/rag-review.test.js +115 -3
package/src/zero-shot-classifier-open.js +3 -2

package/src/project-analyzer.js CHANGED Viewed

@@ -13,6 +13,7 @@ import { getDefaultEmbeddingsSystem } from './embeddings/factory.js';
 import * as llm from './llm.js';
 import { FILE_SELECTION_SYSTEM_PROMPT, PROJECT_SUMMARY_SYSTEM_PROMPT } from './prompt-cache.js';
 import { isDocumentationFile, isTestFile } from './utils/file-validation.js';
+import { verboseLog } from './utils/logging.js';
 // Consolidated file classification configuration
 const FILE_PATTERNS = {
@@ -198,9 +199,7 @@ export class ProjectAnalyzer {
     const { verbose = false, forceAnalysis = false } = options;
     try {
-      if (verbose) {
-        console.log(chalk.cyan('🔍 Starting project architecture analysis...'));
-      }
+      verboseLog(verbose, chalk.cyan('🔍 Starting project architecture analysis...'));
       // Initialize LLM client
       if (!this.llm) {
@@ -210,18 +209,20 @@ export class ProjectAnalyzer {
       // Check for existing analysis
       const existingSummary = forceAnalysis ? null : await this.loadExistingAnalysis(projectPath);
       if (existingSummary && !forceAnalysis) {
-        const currentHash = await this.calculateKeyFilesHash(existingSummary.keyFiles);
-        if (existingSummary.keyFilesHash === currentHash) {
-          if (verbose) {
-            console.log(chalk.green('✅ Project analysis up-to-date (no key file changes detected)'));
+        const currentEmbeddingInventoryHash = await this.calculateEmbeddingInventoryHash(projectPath);
+        if (existingSummary.embeddingInventoryHash !== currentEmbeddingInventoryHash) {
+          verboseLog(verbose, chalk.yellow('🔄 Embedding inventory changed, regenerating analysis...'));
+        } else {
+          const currentHash = await this.calculateKeyFilesHash(existingSummary.keyFiles);
+          if (existingSummary.keyFilesHash === currentHash) {
+            verboseLog(verbose, chalk.green('✅ Project analysis up-to-date (no key file changes detected)'));
+            return existingSummary;
           }
-          return existingSummary;
-        }
-        if (verbose) {
-          console.log(chalk.yellow('🔄 Key files changed, regenerating analysis...'));
+          verboseLog(verbose, chalk.yellow('🔄 Key files changed, regenerating analysis...'));
         }
-      } else if (verbose) {
-        console.log(
+      } else {
+        verboseLog(
+          verbose,
           chalk.cyan(
             forceAnalysis
               ? '🔄 Force analysis requested - regenerating from scratch...'
@@ -235,10 +236,8 @@ export class ProjectAnalyzer {
         ? await this.validateAndUpdateKeyFiles(existingSummary.keyFiles, projectPath)
         : await this.discoverKeyFilesWithLLM(projectPath);
-      if (verbose) {
-        console.log(chalk.gray(`   Found ${keyFiles.length} key architectural files`));
-        console.log(chalk.cyan('🧠 Generating LLM-based project analysis...'));
-      }
+      verboseLog(verbose, chalk.gray(`   Found ${keyFiles.length} key architectural files`));
+      verboseLog(verbose, chalk.cyan('🧠 Generating LLM-based project analysis...'));
       // Generate summary
       const projectSummary = await this.generateProjectSummary(keyFiles, projectPath);
@@ -247,6 +246,7 @@ export class ProjectAnalyzer {
       const currentHash = await this.calculateKeyFilesHash(keyFiles);
       projectSummary.keyFiles = keyFiles;
       projectSummary.keyFilesHash = currentHash;
+      projectSummary.embeddingInventoryHash = await this.calculateEmbeddingInventoryHash(projectPath);
       await this.storeAnalysis(projectPath, projectSummary);
@@ -254,12 +254,10 @@ export class ProjectAnalyzer {
       this.keyFiles = keyFiles;
       this.lastAnalysisHash = currentHash;
-      if (verbose) {
-        console.log(chalk.green('✅ Project analysis complete'));
-        console.log(chalk.gray(`   Technologies: ${(projectSummary.technologies || []).join(', ')}`));
-        console.log(chalk.gray(`   Key patterns: ${(projectSummary.keyPatterns || []).length} identified`));
-        console.log(chalk.gray(`   Key files tracked: ${keyFiles.length}`));
-      }
+      verboseLog(verbose, chalk.green('✅ Project analysis complete'));
+      verboseLog(verbose, chalk.gray(`   Technologies: ${(projectSummary.technologies || []).join(', ')}`));
+      verboseLog(verbose, chalk.gray(`   Key patterns: ${(projectSummary.keyPatterns || []).length} identified`));
+      verboseLog(verbose, chalk.gray(`   Key files tracked: ${keyFiles.length}`));
       return projectSummary;
     } catch (error) {
@@ -300,7 +298,7 @@ export class ProjectAnalyzer {
     try {
       const embeddingsSystem = getDefaultEmbeddingsSystem();
       await embeddingsSystem.storeProjectSummary(projectPath, projectSummary);
-      console.log(chalk.green('✅ Project analysis stored in database'));
+      verboseLog({}, chalk.green('✅ Project analysis stored in database'));
     } catch (error) {
       console.error(chalk.yellow('Warning: Could not store analysis:'), error.message);
     }
@@ -328,7 +326,7 @@ export class ProjectAnalyzer {
     // If we lost more than 30% of key files, trigger fresh discovery
     if (validatedFiles.length < existingKeyFiles.length * 0.7) {
-      console.log(chalk.yellow('⚠️ Many key files missing, performing fresh discovery...'));
+      verboseLog({}, chalk.yellow('⚠️ Many key files missing, performing fresh discovery...'));
       return await this.discoverKeyFilesWithLLM(projectPath);
     }
@@ -339,10 +337,10 @@ export class ProjectAnalyzer {
    * Discover key architectural files using LanceDB hybrid search
    */
   async discoverKeyFilesWithLLM(projectPath) {
-    console.log(chalk.cyan('🔍 Mining codebase embeddings with LanceDB hybrid search...'));
+    verboseLog({}, chalk.cyan('🔍 Mining codebase embeddings with LanceDB hybrid search...'));
     const keyFilesByCategory = await this.mineKeyFilesFromEmbeddings(projectPath);
-    console.log(chalk.cyan(`🧠 LLM analyzing ${keyFilesByCategory.length} candidates from embedding search...`));
+    verboseLog({}, chalk.cyan(`🧠 LLM analyzing ${keyFilesByCategory.length} candidates from embedding search...`));
     const keyFiles = await this.selectFinalKeyFiles(keyFilesByCategory, projectPath);
     return keyFiles;
@@ -362,7 +360,7 @@ export class ProjectAnalyzer {
       await table.optimize();
     } catch (optimizeError) {
       if (optimizeError.message && optimizeError.message.includes('legacy format')) {
-        console.log(chalk.yellow(`Skipping optimization due to legacy index format - will be auto-upgraded during normal operations`));
+        console.warn(chalk.yellow(`Skipping optimization due to legacy index format - will be auto-upgraded during normal operations`));
       } else {
         console.warn(chalk.yellow(`Warning: Failed to optimize file embeddings table: ${optimizeError.message}`));
       }
@@ -371,7 +369,7 @@ export class ProjectAnalyzer {
     const keyFiles = new Map();
     try {
-      console.log(chalk.gray(`   📊 Using LanceDB hybrid search for project: ${projectPath}`));
+      verboseLog({}, chalk.gray(`   📊 Using LanceDB hybrid search for project: ${projectPath}`));
       // Unified query function
       const queryFiles = async (config) => {
@@ -414,17 +412,17 @@ export class ProjectAnalyzer {
           return await query.limit(config.limit || 30).toArray();
         } catch (error) {
-          console.log(chalk.yellow(`     ⚠️ Query failed for ${config.category}: ${error.message}`));
+          verboseLog({}, chalk.yellow(`     ⚠️ Query failed for ${config.category}: ${error.message}`));
           return [];
         }
       };
       // Execute all searches
       for (const config of DB_SEARCH_CONFIGS) {
-        console.log(chalk.gray(`   🔍 Searching for ${config.category} files...`));
+        verboseLog({}, chalk.gray(`   🔍 Searching for ${config.category} files...`));
         const results = await queryFiles(config);
-        console.log(chalk.gray(`   📦 Found ${results.length} ${config.category} file candidates`));
+        verboseLog({}, chalk.gray(`   📦 Found ${results.length} ${config.category} file candidates`));
         results.forEach((result) => {
           if (this.matchesFileType(result.path, result.name, config.matcher)) {
@@ -438,7 +436,7 @@ export class ProjectAnalyzer {
     }
     const results = Array.from(keyFiles.values());
-    console.log(chalk.cyan(`🗃️ Found ${results.length} key files from embeddings database`));
+    verboseLog({}, chalk.cyan(`🗃️ Found ${results.length} key files from embeddings database`));
     return results;
   }
@@ -475,11 +473,11 @@ export class ProjectAnalyzer {
    */
   async selectFinalKeyFiles(candidates, projectPath) {
     if (candidates.length === 0) {
-      console.log(chalk.yellow('⚠️ No candidates found from embeddings search'));
+      verboseLog({}, chalk.yellow('⚠️ No candidates found from embeddings search'));
       return [];
     }
-    console.log(chalk.cyan(`🤖 LLM analyzing ${candidates.length} candidates...`));
+    verboseLog({}, chalk.cyan(`🤖 LLM analyzing ${candidates.length} candidates...`));
     const candidatesSummary = candidates
       .map((file, index) => {
@@ -520,7 +518,7 @@ Select files following the criteria in the system instructions.`;
         jsonSchema: fileSelectionSchema,
       });
-      console.log(chalk.gray('   📄 LLM Response preview:'), response.content.substring(0, 200));
+      verboseLog({}, chalk.gray('   📄 LLM Response preview:'), response.content.substring(0, 200));
       const selectedPaths = response.json.selectedFiles;
@@ -546,14 +544,14 @@ Select files following the criteria in the system instructions.`;
           })
           .filter(Boolean);
-        console.log(chalk.cyan(`🎯 LLM selected ${keyFiles.length} final key files`));
+        verboseLog({}, chalk.cyan(`🎯 LLM selected ${keyFiles.length} final key files`));
         return keyFiles;
       } else {
         throw new Error(`Failed to extract valid JSON array from LLM response`);
       }
     } catch (error) {
       console.error(chalk.red('Error in LLM selection:'), error.message);
-      console.log(chalk.yellow('   🔄 Falling back to automatic selection...'));
+      verboseLog({}, chalk.yellow('   🔄 Falling back to automatic selection...'));
       return this.fallbackFileSelection(candidates, projectPath);
     }
   }
@@ -588,7 +586,7 @@ Select files following the criteria in the system instructions.`;
       }
     }
-    console.log(chalk.yellow(`⚠️ Used fallback selection: ${fallbackFiles.length} files`));
+    verboseLog({}, chalk.yellow(`⚠️ Used fallback selection: ${fallbackFiles.length} files`));
     return fallbackFiles;
   }
@@ -621,6 +619,39 @@ Select files following the criteria in the system instructions.`;
     return hash.digest('hex');
   }
+  /**
+   * Calculate a project-scoped hash of the current embedding inventory.
+   *
+   * Initializes the default embeddings system, looks up the file-embeddings
+   * table through its database manager, and selects the `type`, `path`,
+   * `content_hash` and `project_path` columns of the rows whose `project_path`
+   * equals `projectPath`. Single quotes in `projectPath` are doubled before the
+   * value is embedded in the filter string.
+   *
+   * Each record is reduced to the string `type:path:content_hash`, where a
+   * missing `type` falls back to 'file' and a missing `path` or `content_hash`
+   * falls back to an empty string. The strings are sorted so the digest does
+   * not depend on the order in which the query returns rows, then fed one by
+   * one into a SHA-256 hash.
+   *
+   * NOTE(review): rows are passed to `hash.update` back to back with no
+   * delimiter between them, so the digest is computed over their plain
+   * concatenation.
+   *
+   * This method does not throw: failures are caught and reported through
+   * `verboseLog`, and a fixed sentinel string is returned instead.
+   *
+   * @param {string} projectPath - Value matched against the `project_path` column.
+   * @returns {Promise<string>} Hex-encoded SHA-256 digest of the sorted rows;
+   *   'no-file-embeddings-table' when the table lookup returns a falsy value;
+   *   'embedding-inventory-unavailable' when any step throws.
+   */
+  async calculateEmbeddingInventoryHash(projectPath) {
+    try {
+      const embeddingsSystem = getDefaultEmbeddingsSystem();
+      await embeddingsSystem.initialize();
+      const table = await embeddingsSystem.databaseManager.getTable(embeddingsSystem.databaseManager.fileEmbeddingsTable);
+      if (!table) {
+        return 'no-file-embeddings-table';
+      }
+      const records = await table
+        .query()
+        .select(['type', 'path', 'content_hash', 'project_path'])
+        .where(`project_path = '${projectPath.replace(/'/g, "''")}'`)
+        .toArray();
+      const hash = crypto.createHash('sha256');
+      const normalizedRows = records.map((record) => `${record.type || 'file'}:${record.path || ''}:${record.content_hash || ''}`).sort();
+      for (const row of normalizedRows) {
+        hash.update(row);
+      }
+      return hash.digest('hex');
+    } catch (error) {
+      verboseLog({}, chalk.yellow(`Warning: Could not calculate embedding inventory hash: ${error.message}`));
+      return 'embedding-inventory-unavailable';
+    }
+  }
   /**
    * Generate comprehensive project summary using LLM analysis (SINGLE CALL)
    */
@@ -793,7 +824,7 @@ Follow the analysis guidelines from the system instructions to identify custom i
     } catch (error) {
       console.error(chalk.red('Error generating project summary:'), error.message);
       const fallback = this.createFallbackSummary(projectPath, keyFiles);
-      console.log(chalk.yellow('Using fallback summary with technologies:'), fallback.technologies);
+      verboseLog({}, chalk.yellow('Using fallback summary with technologies:'), fallback.technologies);
       return fallback;
     }
   }
@@ -857,7 +888,8 @@ Follow the analysis guidelines from the system instructions to identify custom i
       };
     }
-    console.log(
+    verboseLog(
+      {},
       chalk.cyan(
         `✅ Project summary validated - Technologies: ${validatedSummary.technologies.length}, Frameworks: ${validatedSummary.mainFrameworks.length}`
       )

package/src/project-analyzer.test.js CHANGED Viewed

@@ -272,7 +272,6 @@ describe('ProjectAnalyzer', () => {
       await analyzer.storeAnalysis(mockProjectPath, summary);
       expect(mockEmbeddingsSystem.storeProjectSummary).toHaveBeenCalledWith(mockProjectPath, summary);
-      expect(console.log).toHaveBeenCalledWith(expect.stringContaining('Project analysis stored'));
     });
     it('should handle storage errors gracefully', async () => {
@@ -319,7 +318,7 @@ describe('ProjectAnalyzer', () => {
       await analyzer.validateAndUpdateKeyFiles(existingFiles, mockProjectPath);
       // With 1 of 3 files found (33%), it should trigger fresh discovery
-      expect(console.log).toHaveBeenCalledWith(expect.stringContaining('Many key files missing'));
+      expect(mockEmbeddingsSystem.initialize).toHaveBeenCalled();
     });
     it('should filter out missing files and keep existing ones', async () => {
@@ -366,7 +365,7 @@ describe('ProjectAnalyzer', () => {
       await analyzer.validateAndUpdateKeyFiles(existingFiles, mockProjectPath);
       // Should trigger discoverKeyFilesWithLLM
-      expect(console.log).toHaveBeenCalledWith(expect.stringContaining('Many key files missing'));
+      expect(mockEmbeddingsSystem.initialize).toHaveBeenCalled();
     });
   });
@@ -410,7 +409,7 @@ describe('ProjectAnalyzer', () => {
       const result = await analyzer.mineKeyFilesFromEmbeddings(mockProjectPath);
       expect(result).toEqual([]);
-      expect(console.log).toHaveBeenCalledWith(expect.stringContaining('Skipping optimization'));
+      expect(console.warn).toHaveBeenCalledWith(expect.stringContaining('legacy index format'));
     });
     it('should return empty array on query error', async () => {
@@ -496,7 +495,6 @@ describe('ProjectAnalyzer', () => {
       await analyzer.selectFinalKeyFiles(candidates, mockProjectPath);
       expect(console.error).toHaveBeenCalled();
-      expect(console.log).toHaveBeenCalledWith(expect.stringContaining('Falling back to automatic selection'));
     });
     it('should fallback if LLM returns invalid response', async () => {