prjct-cli 0.45.0 → 0.45.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (207) hide show
  1. package/CHANGELOG.md +82 -0
  2. package/bin/prjct.ts +117 -10
  3. package/core/__tests__/agentic/memory-system.test.ts +39 -26
  4. package/core/__tests__/agentic/plan-mode.test.ts +64 -46
  5. package/core/__tests__/agentic/prompt-builder.test.ts +14 -14
  6. package/core/__tests__/services/project-index.test.ts +353 -0
  7. package/core/__tests__/types/fs.test.ts +3 -3
  8. package/core/__tests__/utils/date-helper.test.ts +10 -10
  9. package/core/__tests__/utils/output.test.ts +9 -6
  10. package/core/__tests__/utils/project-commands.test.ts +5 -6
  11. package/core/agentic/agent-router.ts +9 -10
  12. package/core/agentic/chain-of-thought.ts +16 -4
  13. package/core/agentic/command-executor.ts +66 -40
  14. package/core/agentic/context-builder.ts +8 -5
  15. package/core/agentic/ground-truth.ts +15 -9
  16. package/core/agentic/index.ts +145 -152
  17. package/core/agentic/loop-detector.ts +40 -11
  18. package/core/agentic/memory-system.ts +98 -35
  19. package/core/agentic/orchestrator-executor.ts +135 -71
  20. package/core/agentic/plan-mode.ts +46 -16
  21. package/core/agentic/prompt-builder.ts +108 -42
  22. package/core/agentic/services.ts +10 -9
  23. package/core/agentic/skill-loader.ts +9 -15
  24. package/core/agentic/smart-context.ts +129 -79
  25. package/core/agentic/template-executor.ts +13 -12
  26. package/core/agentic/template-loader.ts +7 -4
  27. package/core/agentic/tool-registry.ts +16 -13
  28. package/core/agents/index.ts +1 -1
  29. package/core/agents/performance.ts +10 -27
  30. package/core/ai-tools/formatters.ts +8 -6
  31. package/core/ai-tools/generator.ts +4 -4
  32. package/core/ai-tools/index.ts +1 -1
  33. package/core/ai-tools/registry.ts +21 -11
  34. package/core/bus/bus.ts +23 -16
  35. package/core/bus/index.ts +2 -2
  36. package/core/cli/linear.ts +3 -5
  37. package/core/cli/start.ts +28 -25
  38. package/core/commands/analysis.ts +58 -39
  39. package/core/commands/analytics.ts +52 -44
  40. package/core/commands/base.ts +15 -13
  41. package/core/commands/cleanup.ts +6 -13
  42. package/core/commands/command-data.ts +28 -4
  43. package/core/commands/commands.ts +57 -24
  44. package/core/commands/context.ts +4 -4
  45. package/core/commands/design.ts +3 -10
  46. package/core/commands/index.ts +5 -8
  47. package/core/commands/maintenance.ts +7 -4
  48. package/core/commands/planning.ts +179 -56
  49. package/core/commands/register.ts +13 -9
  50. package/core/commands/registry.ts +15 -14
  51. package/core/commands/setup.ts +26 -14
  52. package/core/commands/shipping.ts +11 -16
  53. package/core/commands/snapshots.ts +16 -32
  54. package/core/commands/uninstall.ts +541 -0
  55. package/core/commands/workflow.ts +24 -28
  56. package/core/constants/index.ts +10 -22
  57. package/core/context/generator.ts +82 -33
  58. package/core/context-tools/files-tool.ts +18 -19
  59. package/core/context-tools/imports-tool.ts +13 -33
  60. package/core/context-tools/index.ts +29 -54
  61. package/core/context-tools/recent-tool.ts +16 -22
  62. package/core/context-tools/signatures-tool.ts +17 -26
  63. package/core/context-tools/summary-tool.ts +20 -22
  64. package/core/context-tools/token-counter.ts +25 -20
  65. package/core/context-tools/types.ts +5 -5
  66. package/core/domain/agent-generator.ts +7 -5
  67. package/core/domain/agent-loader.ts +2 -2
  68. package/core/domain/analyzer.ts +19 -16
  69. package/core/domain/architecture-generator.ts +6 -3
  70. package/core/domain/context-estimator.ts +3 -4
  71. package/core/domain/snapshot-manager.ts +25 -22
  72. package/core/domain/task-stack.ts +24 -14
  73. package/core/errors.ts +1 -1
  74. package/core/events/events.ts +2 -4
  75. package/core/events/index.ts +1 -2
  76. package/core/index.ts +28 -16
  77. package/core/infrastructure/agent-detector.ts +3 -3
  78. package/core/infrastructure/ai-provider.ts +23 -20
  79. package/core/infrastructure/author-detector.ts +16 -10
  80. package/core/infrastructure/capability-installer.ts +2 -2
  81. package/core/infrastructure/claude-agent.ts +6 -6
  82. package/core/infrastructure/command-installer.ts +22 -17
  83. package/core/infrastructure/config-manager.ts +18 -14
  84. package/core/infrastructure/editors-config.ts +8 -4
  85. package/core/infrastructure/path-manager.ts +8 -6
  86. package/core/infrastructure/permission-manager.ts +20 -17
  87. package/core/infrastructure/setup.ts +42 -38
  88. package/core/infrastructure/update-checker.ts +5 -5
  89. package/core/integrations/issue-tracker/enricher.ts +8 -19
  90. package/core/integrations/issue-tracker/index.ts +2 -2
  91. package/core/integrations/issue-tracker/manager.ts +15 -15
  92. package/core/integrations/issue-tracker/types.ts +5 -22
  93. package/core/integrations/jira/client.ts +67 -59
  94. package/core/integrations/jira/index.ts +11 -14
  95. package/core/integrations/jira/mcp-adapter.ts +5 -10
  96. package/core/integrations/jira/service.ts +10 -10
  97. package/core/integrations/linear/client.ts +27 -18
  98. package/core/integrations/linear/index.ts +9 -12
  99. package/core/integrations/linear/service.ts +11 -11
  100. package/core/integrations/linear/sync.ts +8 -8
  101. package/core/outcomes/analyzer.ts +5 -18
  102. package/core/outcomes/index.ts +2 -2
  103. package/core/outcomes/recorder.ts +3 -3
  104. package/core/plugin/builtin/webhook.ts +19 -15
  105. package/core/plugin/hooks.ts +29 -21
  106. package/core/plugin/index.ts +7 -7
  107. package/core/plugin/loader.ts +19 -19
  108. package/core/plugin/registry.ts +12 -23
  109. package/core/schemas/agents.ts +1 -1
  110. package/core/schemas/analysis.ts +1 -1
  111. package/core/schemas/enriched-task.ts +62 -49
  112. package/core/schemas/ideas.ts +13 -13
  113. package/core/schemas/index.ts +17 -27
  114. package/core/schemas/issues.ts +40 -25
  115. package/core/schemas/metrics.ts +25 -25
  116. package/core/schemas/outcomes.ts +70 -62
  117. package/core/schemas/permissions.ts +15 -12
  118. package/core/schemas/prd.ts +27 -14
  119. package/core/schemas/project.ts +3 -3
  120. package/core/schemas/roadmap.ts +47 -34
  121. package/core/schemas/schemas.ts +3 -4
  122. package/core/schemas/shipped.ts +3 -3
  123. package/core/schemas/state.ts +43 -29
  124. package/core/server/index.ts +5 -6
  125. package/core/server/routes-extended.ts +68 -72
  126. package/core/server/routes.ts +3 -3
  127. package/core/server/server.ts +31 -26
  128. package/core/services/agent-generator.ts +237 -0
  129. package/core/services/agent-service.ts +2 -2
  130. package/core/services/breakdown-service.ts +2 -4
  131. package/core/services/context-generator.ts +299 -0
  132. package/core/services/context-selector.ts +420 -0
  133. package/core/services/doctor-service.ts +426 -0
  134. package/core/services/file-categorizer.ts +448 -0
  135. package/core/services/file-scorer.ts +270 -0
  136. package/core/services/git-analyzer.ts +267 -0
  137. package/core/services/index.ts +27 -10
  138. package/core/services/memory-service.ts +3 -4
  139. package/core/services/project-index.ts +911 -0
  140. package/core/services/project-service.ts +4 -4
  141. package/core/services/skill-installer.ts +14 -17
  142. package/core/services/skill-lock.ts +3 -3
  143. package/core/services/skill-service.ts +12 -6
  144. package/core/services/stack-detector.ts +245 -0
  145. package/core/services/sync-service.ts +87 -345
  146. package/core/services/watch-service.ts +294 -0
  147. package/core/session/compaction.ts +23 -31
  148. package/core/session/index.ts +11 -5
  149. package/core/session/log-migration.ts +3 -3
  150. package/core/session/metrics.ts +19 -14
  151. package/core/session/session-log-manager.ts +12 -17
  152. package/core/session/task-session-manager.ts +25 -25
  153. package/core/session/utils.ts +1 -1
  154. package/core/storage/ideas-storage.ts +41 -57
  155. package/core/storage/index-storage.ts +514 -0
  156. package/core/storage/index.ts +41 -17
  157. package/core/storage/metrics-storage.ts +39 -34
  158. package/core/storage/queue-storage.ts +35 -45
  159. package/core/storage/shipped-storage.ts +17 -20
  160. package/core/storage/state-storage.ts +50 -30
  161. package/core/storage/storage-manager.ts +6 -6
  162. package/core/storage/storage.ts +18 -15
  163. package/core/sync/auth-config.ts +3 -3
  164. package/core/sync/index.ts +13 -19
  165. package/core/sync/oauth-handler.ts +3 -3
  166. package/core/sync/sync-client.ts +4 -9
  167. package/core/sync/sync-manager.ts +12 -14
  168. package/core/types/commands.ts +42 -7
  169. package/core/types/index.ts +284 -305
  170. package/core/types/integrations.ts +3 -3
  171. package/core/types/storage.ts +14 -14
  172. package/core/types/utils.ts +3 -3
  173. package/core/utils/agent-stream.ts +3 -1
  174. package/core/utils/animations.ts +14 -11
  175. package/core/utils/branding.ts +7 -7
  176. package/core/utils/cache.ts +1 -3
  177. package/core/utils/collection-filters.ts +3 -15
  178. package/core/utils/date-helper.ts +2 -7
  179. package/core/utils/file-helper.ts +13 -8
  180. package/core/utils/jsonl-helper.ts +13 -10
  181. package/core/utils/keychain.ts +4 -8
  182. package/core/utils/logger.ts +1 -1
  183. package/core/utils/next-steps.ts +3 -3
  184. package/core/utils/output.ts +58 -11
  185. package/core/utils/project-commands.ts +6 -6
  186. package/core/utils/project-credentials.ts +5 -12
  187. package/core/utils/runtime.ts +2 -2
  188. package/core/utils/session-helper.ts +3 -4
  189. package/core/utils/version.ts +3 -3
  190. package/core/wizard/index.ts +13 -0
  191. package/core/wizard/onboarding.ts +633 -0
  192. package/core/workflow/state-machine.ts +7 -7
  193. package/dist/bin/prjct.mjs +18755 -15574
  194. package/dist/core/infrastructure/command-installer.js +86 -79
  195. package/dist/core/infrastructure/editors-config.js +6 -6
  196. package/dist/core/infrastructure/setup.js +246 -225
  197. package/dist/core/utils/version.js +9 -9
  198. package/package.json +11 -12
  199. package/scripts/build.js +3 -3
  200. package/scripts/postinstall.js +2 -2
  201. package/templates/mcp-config.json +6 -1
  202. package/templates/permissions/permissive.jsonc +1 -1
  203. package/templates/permissions/strict.jsonc +5 -9
  204. package/templates/global/docs/agents.md +0 -88
  205. package/templates/global/docs/architecture.md +0 -103
  206. package/templates/global/docs/commands.md +0 -96
  207. package/templates/global/docs/validation.md +0 -95
@@ -0,0 +1,448 @@
1
+ /**
2
+ * FileCategorizer - LLM-based file categorization for Smart Context Selection
3
+ *
4
+ * Two-phase process:
5
+ * 1. DISCOVER DOMAINS: LLM analyzes project structure to identify functional domains
6
+ * 2. CATEGORIZE FILES: LLM assigns files to discovered domains
7
+ *
8
+ * Features:
9
+ * - Dynamic domain discovery (no hardcoded domains)
10
+ * - Batch processing (20 files per LLM call)
11
+ * - Heuristic fallback when LLM unavailable
12
+ * - Caching for efficiency
13
+ */
14
+
15
+ import path from 'node:path'
16
+ import {
17
+ type CategoriesCache,
18
+ type DiscoveredDomains,
19
+ type DomainDefinition,
20
+ type FileCategory,
21
+ INDEX_VERSION,
22
+ indexStorage,
23
+ type ScoredFile,
24
+ } from '../storage/index-storage'
25
+ import { getTimestamp } from '../utils/date-helper'
26
+
27
+ // ============================================================================
28
+ // TYPES
29
+ // ============================================================================
30
+
31
+ export interface CategorizationResult {
32
+ domains: DomainDefinition[]
33
+ categories: FileCategory[]
34
+ metrics: {
35
+ totalFiles: number
36
+ categorizedFiles: number
37
+ domainsDiscovered: number
38
+ llmCalls: number
39
+ usedHeuristics: boolean
40
+ }
41
+ }
42
+
43
+ export interface CategorizationOptions {
44
+ batchSize?: number // Files per LLM call (default: 20)
45
+ maxDomains?: number // Max domains to discover (default: 15)
46
+ useLLM?: boolean // Use LLM or heuristics only (default: true)
47
+ projectId?: string // For caching
48
+ }
49
+
50
+ // ============================================================================
51
+ // HEURISTIC PATTERNS
52
+ // ============================================================================
53
+
54
+ /**
55
+ * Fallback heuristic patterns for when LLM is unavailable
56
+ * Maps directory/filename patterns to domain names
57
+ */
58
+ const HEURISTIC_PATTERNS: { pattern: RegExp; domain: string }[] = [
59
+ // Payment-related
60
+ { pattern: /\b(payment|stripe|billing|checkout|invoice)/i, domain: 'payments' },
61
+
62
+ // User/Auth
63
+ { pattern: /\b(auth|login|signup|user|session|password|oauth)/i, domain: 'auth' },
64
+
65
+ // API
66
+ { pattern: /\b(api|endpoint|route|controller)/i, domain: 'api' },
67
+
68
+ // Database
69
+ { pattern: /\b(model|schema|migration|database|db|prisma|drizzle)/i, domain: 'database' },
70
+
71
+ // Frontend
72
+ { pattern: /\b(component|page|view|layout|ui|button|form|modal)/i, domain: 'frontend' },
73
+
74
+ // Testing
75
+ { pattern: /\b(test|spec|__tests__|e2e|cypress)/i, domain: 'testing' },
76
+
77
+ // Configuration
78
+ { pattern: /\b(config|setting|env)/i, domain: 'config' },
79
+
80
+ // Utilities
81
+ { pattern: /\b(util|helper|lib|common|shared)/i, domain: 'utilities' },
82
+
83
+ // Services/Business Logic
84
+ { pattern: /\b(service|handler|processor|worker)/i, domain: 'services' },
85
+
86
+ // Types/Interfaces
87
+ { pattern: /\b(type|interface|dto)/i, domain: 'types' },
88
+ ]
89
+
90
+ // ============================================================================
91
+ // FILE CATEGORIZER CLASS
92
+ // ============================================================================
93
+
94
+ export class FileCategorizer {
95
+ private batchSize: number
96
+ private maxDomains: number
97
+
98
+ constructor(options: CategorizationOptions = {}) {
99
+ this.batchSize = options.batchSize || 20
100
+ this.maxDomains = options.maxDomains || 15
101
+ }
102
+
103
+ // ==========================================================================
104
+ // MAIN METHODS
105
+ // ==========================================================================
106
+
107
+ /**
108
+ * Full analysis: discover domains + categorize files
109
+ */
110
+ async analyzeProject(
111
+ projectPath: string,
112
+ files: ScoredFile[],
113
+ options: CategorizationOptions = {}
114
+ ): Promise<CategorizationResult> {
115
+ const useLLM = options.useLLM !== false
116
+
117
+ // Phase 1: Discover domains
118
+ const domains = useLLM
119
+ ? await this.discoverDomainsWithLLM(projectPath, files)
120
+ : this.discoverDomainsHeuristic(files)
121
+
122
+ // Phase 2: Categorize files
123
+ const categories = useLLM
124
+ ? await this.categorizeFilesWithLLM(files, domains)
125
+ : this.categorizeFilesHeuristic(files, domains)
126
+
127
+ // Update domain file counts
128
+ for (const domain of domains) {
129
+ domain.fileCount = categories.filter((c) => c.primaryDomain === domain.name).length
130
+ }
131
+
132
+ // Save to cache if projectId provided
133
+ if (options.projectId) {
134
+ await this.saveToCache(options.projectId, domains, categories)
135
+ }
136
+
137
+ return {
138
+ domains,
139
+ categories,
140
+ metrics: {
141
+ totalFiles: files.length,
142
+ categorizedFiles: categories.length,
143
+ domainsDiscovered: domains.length,
144
+ llmCalls: useLLM ? Math.ceil(files.length / this.batchSize) + 1 : 0,
145
+ usedHeuristics: !useLLM,
146
+ },
147
+ }
148
+ }
149
+
150
+ /**
151
+ * Discover domains from project structure (LLM)
152
+ */
153
+ async discoverDomainsWithLLM(
154
+ _projectPath: string,
155
+ files: ScoredFile[]
156
+ ): Promise<DomainDefinition[]> {
157
+ // For now, fall back to heuristics
158
+ // TODO: Implement LLM call when LLM service is available
159
+ // The prompt would analyze directory structure and file names
160
+ // to identify functional domains unique to this project
161
+ return this.discoverDomainsHeuristic(files)
162
+ }
163
+
164
+ /**
165
+ * Categorize files using discovered domains (LLM)
166
+ */
167
+ async categorizeFilesWithLLM(
168
+ files: ScoredFile[],
169
+ domains: DomainDefinition[]
170
+ ): Promise<FileCategory[]> {
171
+ // For now, fall back to heuristics
172
+ // TODO: Implement LLM batch processing when LLM service is available
173
+ // The prompt would ask LLM to categorize batches of files using
174
+ // the discovered domain definitions
175
+ return this.categorizeFilesHeuristic(files, domains)
176
+ }
177
+
178
+ // ==========================================================================
179
+ // HEURISTIC METHODS (Fallback)
180
+ // ==========================================================================
181
+
182
+ /**
183
+ * Discover domains using heuristics (fallback)
184
+ */
185
+ discoverDomainsHeuristic(files: ScoredFile[]): DomainDefinition[] {
186
+ const domainCounts = new Map<string, number>()
187
+ const domainPatterns = new Map<string, Set<string>>()
188
+
189
+ // Count files matching each heuristic pattern
190
+ for (const file of files) {
191
+ const filePath = file.path.toLowerCase()
192
+ for (const { pattern, domain } of HEURISTIC_PATTERNS) {
193
+ if (pattern.test(filePath)) {
194
+ domainCounts.set(domain, (domainCounts.get(domain) || 0) + 1)
195
+ if (!domainPatterns.has(domain)) {
196
+ domainPatterns.set(domain, new Set())
197
+ }
198
+ // Extract the matched directory as a pattern
199
+ const dir = path.dirname(file.path)
200
+ domainPatterns.get(domain)!.add(`**/${path.basename(dir)}/**`)
201
+ }
202
+ }
203
+ }
204
+
205
+ // Also detect domains from common directory names
206
+ const dirDomains = this.extractDirectoryDomains(files)
207
+ for (const [domain, count] of dirDomains) {
208
+ domainCounts.set(domain, (domainCounts.get(domain) || 0) + count)
209
+ }
210
+
211
+ // Build domain definitions for domains with at least 2 files
212
+ const domains: DomainDefinition[] = []
213
+ for (const [name, count] of domainCounts) {
214
+ if (count >= 2) {
215
+ const heuristic = HEURISTIC_PATTERNS.find((h) => h.domain === name)
216
+ domains.push({
217
+ name,
218
+ description: `Files related to ${name}`,
219
+ keywords: heuristic ? [name] : [name],
220
+ filePatterns: Array.from(domainPatterns.get(name) || []),
221
+ fileCount: count,
222
+ })
223
+ }
224
+ }
225
+
226
+ // Sort by file count (most files first) and limit
227
+ return domains.sort((a, b) => b.fileCount - a.fileCount).slice(0, this.maxDomains)
228
+ }
229
+
230
+ /**
231
+ * Extract domains from directory structure
232
+ */
233
+ private extractDirectoryDomains(files: ScoredFile[]): Map<string, number> {
234
+ const dirCounts = new Map<string, number>()
235
+
236
+ for (const file of files) {
237
+ const parts = file.path.split('/')
238
+ // Look at immediate parent directories
239
+ for (const part of parts.slice(0, -1)) {
240
+ const normalizedDir = part.toLowerCase()
241
+ // Skip generic directories
242
+ if (['src', 'lib', 'app', 'core', 'dist', 'build'].includes(normalizedDir)) {
243
+ continue
244
+ }
245
+ // Count meaningful directory names
246
+ if (normalizedDir.length > 2 && !normalizedDir.startsWith('.')) {
247
+ dirCounts.set(normalizedDir, (dirCounts.get(normalizedDir) || 0) + 1)
248
+ }
249
+ }
250
+ }
251
+
252
+ return dirCounts
253
+ }
254
+
255
+ /**
256
+ * Categorize files using heuristics (fallback)
257
+ */
258
+ categorizeFilesHeuristic(files: ScoredFile[], domains: DomainDefinition[]): FileCategory[] {
259
+ const categories: FileCategory[] = []
260
+ const now = getTimestamp()
261
+
262
+ for (const file of files) {
263
+ const matchedDomains: { domain: string; score: number }[] = []
264
+ const filePath = file.path.toLowerCase()
265
+
266
+ // Check against each domain's keywords and patterns
267
+ for (const domain of domains) {
268
+ let score = 0
269
+
270
+ // Check keywords
271
+ for (const keyword of domain.keywords) {
272
+ if (filePath.includes(keyword.toLowerCase())) {
273
+ score += 1
274
+ }
275
+ }
276
+
277
+ // Check heuristic patterns
278
+ for (const { pattern, domain: patternDomain } of HEURISTIC_PATTERNS) {
279
+ if (patternDomain === domain.name && pattern.test(filePath)) {
280
+ score += 2
281
+ }
282
+ }
283
+
284
+ // Check directory patterns
285
+ for (const pattern of domain.filePatterns) {
286
+ const patternBase = pattern.replace(/\*\*/g, '').replace(/\//g, '')
287
+ if (filePath.includes(patternBase.toLowerCase())) {
288
+ score += 1
289
+ }
290
+ }
291
+
292
+ if (score > 0) {
293
+ matchedDomains.push({ domain: domain.name, score })
294
+ }
295
+ }
296
+
297
+ // Sort by score and take top matches
298
+ matchedDomains.sort((a, b) => b.score - a.score)
299
+
300
+ const fileCategories =
301
+ matchedDomains.length > 0 ? matchedDomains.slice(0, 3).map((m) => m.domain) : ['general']
302
+
303
+ const primaryDomain = fileCategories[0]
304
+ const confidence = matchedDomains.length > 0 ? Math.min(1, matchedDomains[0].score / 5) : 0.1
305
+
306
+ categories.push({
307
+ path: file.path,
308
+ categories: fileCategories,
309
+ primaryDomain,
310
+ confidence,
311
+ categorizedAt: now,
312
+ method: 'heuristic',
313
+ })
314
+ }
315
+
316
+ return categories
317
+ }
318
+
319
+ // ==========================================================================
320
+ // CACHING
321
+ // ==========================================================================
322
+
323
+ /**
324
+ * Save domains and categories to cache
325
+ */
326
+ async saveToCache(
327
+ projectId: string,
328
+ domains: DomainDefinition[],
329
+ categories: FileCategory[]
330
+ ): Promise<void> {
331
+ const now = getTimestamp()
332
+
333
+ // Save domains
334
+ const domainsData: DiscoveredDomains = {
335
+ version: INDEX_VERSION,
336
+ projectId,
337
+ domains,
338
+ discoveredAt: now,
339
+ }
340
+ await indexStorage.writeDomains(projectId, domainsData)
341
+
342
+ // Build domain index (domain -> file paths)
343
+ const domainIndex: Record<string, string[]> = {}
344
+ for (const cat of categories) {
345
+ for (const domain of cat.categories) {
346
+ if (!domainIndex[domain]) {
347
+ domainIndex[domain] = []
348
+ }
349
+ domainIndex[domain].push(cat.path)
350
+ }
351
+ }
352
+
353
+ // Save categories
354
+ const cacheData: CategoriesCache = {
355
+ version: INDEX_VERSION,
356
+ lastUpdate: now,
357
+ fileCategories: categories,
358
+ domainIndex,
359
+ }
360
+ await indexStorage.writeCategories(projectId, cacheData)
361
+ }
362
+
363
+ /**
364
+ * Load cached categorization
365
+ */
366
+ async loadFromCache(projectId: string): Promise<CategorizationResult | null> {
367
+ const [domainsData, cacheData] = await Promise.all([
368
+ indexStorage.readDomains(projectId),
369
+ indexStorage.readCategories(projectId),
370
+ ])
371
+
372
+ if (!domainsData || !cacheData) {
373
+ return null
374
+ }
375
+
376
+ return {
377
+ domains: domainsData.domains,
378
+ categories: cacheData.fileCategories,
379
+ metrics: {
380
+ totalFiles: cacheData.fileCategories.length,
381
+ categorizedFiles: cacheData.fileCategories.length,
382
+ domainsDiscovered: domainsData.domains.length,
383
+ llmCalls: 0,
384
+ usedHeuristics: cacheData.fileCategories[0]?.method === 'heuristic',
385
+ },
386
+ }
387
+ }
388
+
389
+ /**
390
+ * Update categories for specific files (incremental)
391
+ */
392
+ async updateFilesCategories(
393
+ projectId: string,
394
+ files: ScoredFile[],
395
+ options: CategorizationOptions = {}
396
+ ): Promise<FileCategory[]> {
397
+ // Load existing domains
398
+ const domainsData = await indexStorage.readDomains(projectId)
399
+ if (!domainsData) {
400
+ // No domains yet, need full analysis
401
+ const result = await this.analyzeProject('', files, { ...options, projectId })
402
+ return result.categories
403
+ }
404
+
405
+ // Categorize just the new/changed files
406
+ const newCategories =
407
+ options.useLLM !== false
408
+ ? await this.categorizeFilesWithLLM(files, domainsData.domains)
409
+ : this.categorizeFilesHeuristic(files, domainsData.domains)
410
+
411
+ // Load existing cache and merge
412
+ const existingCache = await indexStorage.readCategories(projectId)
413
+ if (existingCache) {
414
+ // Remove old entries for updated files
415
+ const updatedPaths = new Set(files.map((f) => f.path))
416
+ const existingCategories = existingCache.fileCategories.filter(
417
+ (c) => !updatedPaths.has(c.path)
418
+ )
419
+
420
+ // Merge and save
421
+ const allCategories = [...existingCategories, ...newCategories]
422
+
423
+ // Rebuild domain index
424
+ const domainIndex: Record<string, string[]> = {}
425
+ for (const cat of allCategories) {
426
+ for (const domain of cat.categories) {
427
+ if (!domainIndex[domain]) {
428
+ domainIndex[domain] = []
429
+ }
430
+ domainIndex[domain].push(cat.path)
431
+ }
432
+ }
433
+
434
+ const cacheData: CategoriesCache = {
435
+ version: INDEX_VERSION,
436
+ lastUpdate: getTimestamp(),
437
+ fileCategories: allCategories,
438
+ domainIndex,
439
+ }
440
+ await indexStorage.writeCategories(projectId, cacheData)
441
+ }
442
+
443
+ return newCategories
444
+ }
445
+ }
446
+
447
+ export const fileCategorizer = new FileCategorizer()
448
+ export default FileCategorizer
@@ -0,0 +1,270 @@
1
+ /**
2
+ * FileScorer - Calculates relevance scores for files
3
+ *
4
+ * Scoring factors:
5
+ * - recency: Modified recently? (0-20)
6
+ * - centrality: Imported by many files? (0-25)
7
+ * - configRelevance: Is config file? (0-20)
8
+ * - nameRelevance: Name indicates importance? (0-15)
9
+ * - sizeOptimal: Useful size (not too large)? (0-10)
10
+ * - gitActivity: Recent commits? (0-10)
11
+ *
12
+ * Total score: 0-100
13
+ * Files with score > 30 are considered relevant
14
+ */
15
+
16
+ import path from 'node:path'
17
+
18
+ // ============================================================================
19
+ // TYPES
20
+ // ============================================================================
21
+
22
+ export interface FileScore {
23
+ path: string
24
+ score: number
25
+ factors: {
26
+ recency: number // 0-20
27
+ centrality: number // 0-25
28
+ configRelevance: number // 0-20
29
+ nameRelevance: number // 0-15
30
+ sizeOptimal: number // 0-10
31
+ gitActivity: number // 0-10
32
+ }
33
+ }
34
+
35
+ export interface FileStats {
36
+ path: string
37
+ size: number // bytes
38
+ mtime: Date // modification time
39
+ lines?: number // line count
40
+ imports?: string[] // files this imports
41
+ importedBy?: string[] // files that import this
42
+ recentCommits?: number // commits in last 30 days
43
+ }
44
+
45
+ export interface ScoringContext {
46
+ allFiles: Map<string, FileStats>
47
+ configFiles: Set<string>
48
+ maxFileSize: number
49
+ maxRecentCommits: number
50
+ now: Date
51
+ }
52
+
53
+ // ============================================================================
54
+ // CONSTANTS
55
+ // ============================================================================
56
+
57
+ export const RELEVANCE_THRESHOLD = 30
58
+
59
+ // Config file patterns (high importance)
60
+ const CONFIG_PATTERNS = [
61
+ /^package\.json$/,
62
+ /^tsconfig.*\.json$/,
63
+ /^\.env(\..*)?$/,
64
+ /^\.eslintrc.*$/,
65
+ /^\.prettierrc.*$/,
66
+ /^vite\.config\.\w+$/,
67
+ /^next\.config\.\w+$/,
68
+ /^webpack\.config\.\w+$/,
69
+ /^rollup\.config\.\w+$/,
70
+ /^jest\.config\.\w+$/,
71
+ /^vitest\.config\.\w+$/,
72
+ /^tailwind\.config\.\w+$/,
73
+ /^postcss\.config\.\w+$/,
74
+ /^Cargo\.toml$/,
75
+ /^go\.mod$/,
76
+ /^pyproject\.toml$/,
77
+ /^requirements\.txt$/,
78
+ /^Dockerfile$/,
79
+ /^docker-compose\.ya?ml$/,
80
+ /^\.github\/workflows\/.*\.ya?ml$/,
81
+ ]
82
+
83
+ // Important filename patterns
84
+ const IMPORTANT_NAME_PATTERNS = [
85
+ /^index\.\w+$/, // Entry points
86
+ /^main\.\w+$/, // Main files
87
+ /^app\.\w+$/, // App files
88
+ /^server\.\w+$/, // Server files
89
+ /^router\.\w+$/, // Router files
90
+ /^routes\.\w+$/, // Routes
91
+ /^api\.\w+$/, // API files
92
+ /^schema\.\w+$/, // Schema files
93
+ /^types?\.\w+$/, // Type definitions
94
+ /^constants?\.\w+$/, // Constants
95
+ /^config\.\w+$/, // Config files
96
+ /^utils?\.\w+$/, // Utilities
97
+ /^helpers?\.\w+$/, // Helpers
98
+ /README\.md$/i, // Documentation
99
+ /CHANGELOG\.md$/i, // Changelog
100
+ ]
101
+
102
+ // ============================================================================
103
+ // FILE SCORER
104
+ // ============================================================================
105
+
106
+ export class FileScorer {
107
+ /**
108
+ * Score a single file
109
+ */
110
+ scoreFile(stats: FileStats, context: ScoringContext): FileScore {
111
+ const factors = {
112
+ recency: this.calculateRecency(stats, context),
113
+ centrality: this.calculateCentrality(stats, context),
114
+ configRelevance: this.calculateConfigRelevance(stats),
115
+ nameRelevance: this.calculateNameRelevance(stats),
116
+ sizeOptimal: this.calculateSizeOptimal(stats, context),
117
+ gitActivity: this.calculateGitActivity(stats, context),
118
+ }
119
+
120
+ const score = Object.values(factors).reduce((sum, v) => sum + v, 0)
121
+
122
+ return {
123
+ path: stats.path,
124
+ score: Math.min(100, Math.max(0, score)),
125
+ factors,
126
+ }
127
+ }
128
+
129
+ /**
130
+ * Score all files and return sorted by score
131
+ */
132
+ scoreAll(context: ScoringContext): FileScore[] {
133
+ const scores: FileScore[] = []
134
+
135
+ for (const stats of context.allFiles.values()) {
136
+ scores.push(this.scoreFile(stats, context))
137
+ }
138
+
139
+ return scores.sort((a, b) => b.score - a.score)
140
+ }
141
+
142
+ /**
143
+ * Get relevant files (score > threshold)
144
+ */
145
+ getRelevantFiles(context: ScoringContext, threshold: number = RELEVANCE_THRESHOLD): FileScore[] {
146
+ return this.scoreAll(context).filter((f) => f.score >= threshold)
147
+ }
148
+
149
+ // ==========================================================================
150
+ // FACTOR CALCULATIONS
151
+ // ==========================================================================
152
+
153
+ /**
154
+ * Recency factor (0-20)
155
+ * Files modified recently get higher scores
156
+ */
157
+ private calculateRecency(stats: FileStats, context: ScoringContext): number {
158
+ const daysSinceModified =
159
+ (context.now.getTime() - stats.mtime.getTime()) / (1000 * 60 * 60 * 24)
160
+
161
+ if (daysSinceModified < 1) return 20 // Today
162
+ if (daysSinceModified < 7) return 15 // This week
163
+ if (daysSinceModified < 30) return 10 // This month
164
+ if (daysSinceModified < 90) return 5 // Last 3 months
165
+ return 0 // Older
166
+ }
167
+
168
+ /**
169
+ * Centrality factor (0-25)
170
+ * Files imported by many others are more important
171
+ */
172
+ private calculateCentrality(stats: FileStats, context: ScoringContext): number {
173
+ const importedByCount = stats.importedBy?.length || 0
174
+ const totalFiles = context.allFiles.size
175
+
176
+ if (totalFiles === 0) return 0
177
+
178
+ // Normalize: files imported by 20%+ of codebase get max score
179
+ const ratio = importedByCount / totalFiles
180
+ if (ratio >= 0.2) return 25
181
+ if (ratio >= 0.1) return 20
182
+ if (ratio >= 0.05) return 15
183
+ if (importedByCount >= 5) return 10
184
+ if (importedByCount >= 2) return 5
185
+ return 0
186
+ }
187
+
188
+ /**
189
+ * Config relevance factor (0-20)
190
+ * Config files are always important
191
+ */
192
+ private calculateConfigRelevance(stats: FileStats): number {
193
+ const filename = path.basename(stats.path)
194
+
195
+ for (const pattern of CONFIG_PATTERNS) {
196
+ if (pattern.test(filename) || pattern.test(stats.path)) {
197
+ return 20
198
+ }
199
+ }
200
+
201
+ return 0
202
+ }
203
+
204
+ /**
205
+ * Name relevance factor (0-15)
206
+ * Certain filenames indicate importance
207
+ */
208
+ private calculateNameRelevance(stats: FileStats): number {
209
+ const filename = path.basename(stats.path)
210
+
211
+ for (const pattern of IMPORTANT_NAME_PATTERNS) {
212
+ if (pattern.test(filename)) {
213
+ return 15
214
+ }
215
+ }
216
+
217
+ // Directories that suggest importance
218
+ const dir = path.dirname(stats.path)
219
+ if (dir.includes('/api/') || dir.includes('/routes/')) return 10
220
+ if (dir.includes('/components/') && filename.startsWith('index')) return 10
221
+ if (dir.includes('/pages/') || dir.includes('/app/')) return 8
222
+
223
+ return 0
224
+ }
225
+
226
+ /**
227
+ * Size optimal factor (0-10)
228
+ * Files that are neither too small nor too large
229
+ */
230
+ private calculateSizeOptimal(stats: FileStats, _context: ScoringContext): number {
231
+ const size = stats.size
232
+
233
+ // Too small (likely stub or barrel export)
234
+ if (size < 100) return 2
235
+
236
+ // Optimal range: 500 bytes to 50KB
237
+ if (size >= 500 && size <= 50_000) return 10
238
+
239
+ // Large but not huge (50KB - 200KB)
240
+ if (size > 50_000 && size <= 200_000) return 5
241
+
242
+ // Very large files are less useful as context
243
+ if (size > 200_000) return 0
244
+
245
+ // Small files (100-500 bytes)
246
+ return 5
247
+ }
248
+
249
+ /**
250
+ * Git activity factor (0-10)
251
+ * Files with recent commits are more actively developed
252
+ */
253
+ private calculateGitActivity(stats: FileStats, context: ScoringContext): number {
254
+ const commits = stats.recentCommits || 0
255
+
256
+ if (context.maxRecentCommits === 0) return 0
257
+
258
+ // Normalize against max
259
+ const ratio = commits / context.maxRecentCommits
260
+
261
+ if (ratio >= 0.5) return 10 // Among most active
262
+ if (ratio >= 0.25) return 7
263
+ if (ratio >= 0.1) return 5
264
+ if (commits > 0) return 2
265
+ return 0
266
+ }
267
+ }
268
+
269
+ export const fileScorer = new FileScorer()
270
+ export default FileScorer