claude-memory-layer 1.0.31 → 1.0.32

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (313)
  1. package/README.md +9 -2
  2. package/dist/cli/index.js +1 -1
  3. package/package.json +11 -2
  4. package/scripts/postinstall-embedding-backend.cjs +16 -12
  5. package/AGENTS.md +0 -71
  6. package/CLAUDE.md +0 -30
  7. package/HANDOFF.md +0 -92
  8. package/Memo.txt +0 -558
  9. package/benchmarks/replay/anonymized-real-sessions.json +0 -48
  10. package/config/kpi-thresholds.json +0 -7
  11. package/context.md +0 -636
  12. package/docs/ARCHITECTURE_COMPARISON_AND_RECOMMENDATIONS.md +0 -627
  13. package/docs/HERMES_MEMORY_INGESTION_ANALYSIS.md +0 -440
  14. package/docs/MCP_MEMORY_SERVICE_COMPARATIVE_REVIEW.md +0 -271
  15. package/docs/MEMORY_USEFULNESS_AUDIT.md +0 -371
  16. package/docs/MEMORY_USEFULNESS_AUDIT_RAW.json +0 -80
  17. package/docs/MEMSEARCH_PROJECT_STRUCTURE_ANALYSIS.md +0 -333
  18. package/docs/MEMU_ADOPTION.md +0 -40
  19. package/docs/OPERATIONS.md +0 -18
  20. package/docs/PRODUCT_VALIDATION_MATRIX.md +0 -82
  21. package/docs/PROJECT_STRUCTURE_ANALYSIS.md +0 -421
  22. package/docs/REFACTORING_MILESTONES_AND_ISSUES.md +0 -501
  23. package/docs/REFACTORING_PLAN_THIN_CORE.md +0 -414
  24. package/docs/REFERENCE_PROJECT_ANALYSES.md +0 -25
  25. package/docs/SUPERLOCALMEMORY_PROJECT_STRUCTURE_ANALYSIS.md +0 -452
  26. package/docs/TARGET_ARCHITECTURE_AND_FOLDER_STRUCTURE.md +0 -446
  27. package/docs/architecture/comparison-index.md +0 -47
  28. package/docs/reports/codex-real-data-validation-20260505T040447Z.md +0 -46
  29. package/plan.md +0 -1642
  30. package/scripts/build.ts +0 -159
  31. package/scripts/bump-patch-version.sh +0 -18
  32. package/scripts/delete-unknown-projects.js +0 -154
  33. package/scripts/fix-sync-gap.js +0 -32
  34. package/scripts/generate-session-qrels.ts +0 -126
  35. package/scripts/heartbeat-memory-orchestrator.sh +0 -28
  36. package/scripts/replay-retrieval-benchmark.ts +0 -69
  37. package/scripts/report-sync-gap.js +0 -26
  38. package/scripts/review-queue-auto-resolve.js +0 -21
  39. package/scripts/sync-gap-auto-heal.sh +0 -17
  40. package/spec.md +0 -624
  41. package/specs/20260207-dashboard-upgrade/context.md +0 -38
  42. package/specs/20260207-dashboard-upgrade/spec.md +0 -96
  43. package/specs/citations-system/context.md +0 -243
  44. package/specs/citations-system/plan.md +0 -495
  45. package/specs/citations-system/spec.md +0 -371
  46. package/specs/endless-mode/context.md +0 -305
  47. package/specs/endless-mode/plan.md +0 -620
  48. package/specs/endless-mode/spec.md +0 -455
  49. package/specs/entity-edge-model/context.md +0 -401
  50. package/specs/entity-edge-model/plan.md +0 -459
  51. package/specs/entity-edge-model/spec.md +0 -391
  52. package/specs/evidence-aligner-v2/context.md +0 -401
  53. package/specs/evidence-aligner-v2/plan.md +0 -303
  54. package/specs/evidence-aligner-v2/spec.md +0 -312
  55. package/specs/mcp-desktop-integration/context.md +0 -278
  56. package/specs/mcp-desktop-integration/plan.md +0 -550
  57. package/specs/mcp-desktop-integration/spec.md +0 -494
  58. package/specs/memory-utilization-improvements/context.md +0 -145
  59. package/specs/memory-utilization-improvements/plan.md +0 -361
  60. package/specs/memory-utilization-improvements/spec.md +0 -361
  61. package/specs/post-tool-use-hook/context.md +0 -319
  62. package/specs/post-tool-use-hook/plan.md +0 -469
  63. package/specs/post-tool-use-hook/spec.md +0 -364
  64. package/specs/private-tags/context.md +0 -288
  65. package/specs/private-tags/plan.md +0 -412
  66. package/specs/private-tags/spec.md +0 -345
  67. package/specs/progressive-disclosure/context.md +0 -346
  68. package/specs/progressive-disclosure/plan.md +0 -663
  69. package/specs/progressive-disclosure/spec.md +0 -415
  70. package/specs/selective-tool-observation/context.md +0 -100
  71. package/specs/selective-tool-observation/plan.md +0 -158
  72. package/specs/selective-tool-observation/spec.md +0 -127
  73. package/specs/task-entity-system/context.md +0 -297
  74. package/specs/task-entity-system/plan.md +0 -301
  75. package/specs/task-entity-system/spec.md +0 -314
  76. package/specs/thin-core-refactor/context.md +0 -275
  77. package/specs/thin-core-refactor/plan.md +0 -536
  78. package/specs/thin-core-refactor/spec.md +0 -465
  79. package/specs/vector-outbox-v2/context.md +0 -470
  80. package/specs/vector-outbox-v2/plan.md +0 -562
  81. package/specs/vector-outbox-v2/spec.md +0 -466
  82. package/specs/web-viewer-ui/context.md +0 -384
  83. package/specs/web-viewer-ui/plan.md +0 -797
  84. package/specs/web-viewer-ui/spec.md +0 -516
  85. package/src/adapters/claude/capture/index.ts +0 -3
  86. package/src/adapters/claude/context/index.ts +0 -3
  87. package/src/adapters/claude/hooks/index.ts +0 -21
  88. package/src/adapters/claude/hooks/post-tool-use.ts +0 -239
  89. package/src/adapters/claude/hooks/prompt-injection-policy.ts +0 -104
  90. package/src/adapters/claude/hooks/semantic-daemon-client.ts +0 -209
  91. package/src/adapters/claude/hooks/semantic-daemon.ts +0 -283
  92. package/src/adapters/claude/hooks/session-end.ts +0 -59
  93. package/src/adapters/claude/hooks/session-start.ts +0 -73
  94. package/src/adapters/claude/hooks/stop.ts +0 -128
  95. package/src/adapters/claude/hooks/user-prompt-submit.ts +0 -361
  96. package/src/adapters/claude/index.ts +0 -4
  97. package/src/adapters/claude/transcript/index.ts +0 -4
  98. package/src/adapters/claude/transcript/transcript-reader.ts +0 -57
  99. package/src/adapters/claude/transcript/turn-reconstructor.ts +0 -65
  100. package/src/apps/cli/claude-settings-hooks.ts +0 -138
  101. package/src/apps/cli/codex-import-runner.ts +0 -125
  102. package/src/apps/cli/codex-validation-output.ts +0 -95
  103. package/src/apps/cli/hermes-import-runner.ts +0 -130
  104. package/src/apps/cli/hermes-validation-output.ts +0 -91
  105. package/src/apps/cli/index.ts +0 -1735
  106. package/src/apps/cli/mcp-install.ts +0 -106
  107. package/src/apps/cli/retrieval-disclosure-output.ts +0 -196
  108. package/src/apps/dashboard/assets/js/bootstrap.js +0 -244
  109. package/src/apps/dashboard/assets/js/chat.js +0 -373
  110. package/src/apps/dashboard/assets/js/disclosure.js +0 -232
  111. package/src/apps/dashboard/assets/js/modals.js +0 -298
  112. package/src/apps/dashboard/assets/js/overview.js +0 -655
  113. package/src/apps/dashboard/assets/js/state.js +0 -72
  114. package/src/apps/dashboard/assets/js/views.js +0 -468
  115. package/src/apps/dashboard/index.html +0 -543
  116. package/src/apps/dashboard/index.ts +0 -3
  117. package/src/apps/dashboard/style.css +0 -1750
  118. package/src/apps/index.ts +0 -5
  119. package/src/apps/server/api/chat.ts +0 -244
  120. package/src/apps/server/api/citations.ts +0 -105
  121. package/src/apps/server/api/events.ts +0 -137
  122. package/src/apps/server/api/health.ts +0 -53
  123. package/src/apps/server/api/index.ts +0 -26
  124. package/src/apps/server/api/projects.ts +0 -74
  125. package/src/apps/server/api/search.ts +0 -184
  126. package/src/apps/server/api/sessions.ts +0 -115
  127. package/src/apps/server/api/stats.ts +0 -723
  128. package/src/apps/server/api/turns.ts +0 -143
  129. package/src/apps/server/api/utils.ts +0 -65
  130. package/src/apps/server/index.ts +0 -111
  131. package/src/cli/index.ts +0 -3
  132. package/src/cli/retrieval-disclosure-output.ts +0 -2
  133. package/src/compat/index.ts +0 -5
  134. package/src/core/canonical-key.ts +0 -186
  135. package/src/core/citation-generator.ts +0 -63
  136. package/src/core/consolidated-store.ts +0 -356
  137. package/src/core/consolidation-worker.ts +0 -493
  138. package/src/core/context-formatter.ts +0 -276
  139. package/src/core/continuity-manager.ts +0 -341
  140. package/src/core/db-wrapper.ts +0 -64
  141. package/src/core/derive/fact-deriver.ts +0 -170
  142. package/src/core/derive/index.ts +0 -2
  143. package/src/core/derive/summary-deriver.ts +0 -76
  144. package/src/core/edge-repo.ts +0 -333
  145. package/src/core/embedder.ts +0 -4
  146. package/src/core/engine/embedding-maintenance-service.ts +0 -187
  147. package/src/core/engine/endless-memory-services.ts +0 -4
  148. package/src/core/engine/index.ts +0 -19
  149. package/src/core/engine/memory-engine-services.ts +0 -170
  150. package/src/core/engine/memory-ingest-service.ts +0 -317
  151. package/src/core/engine/memory-query-service.ts +0 -173
  152. package/src/core/engine/memory-runtime-service.ts +0 -162
  153. package/src/core/engine/memory-service-composition.ts +0 -231
  154. package/src/core/engine/retrieval-analytics-service.ts +0 -181
  155. package/src/core/engine/retrieval-disclosure-service.ts +0 -420
  156. package/src/core/engine/retrieval-orchestrator.ts +0 -377
  157. package/src/core/engine/retrieval-services.ts +0 -176
  158. package/src/core/engine/shared-memory-services.ts +0 -4
  159. package/src/core/entity-repo.ts +0 -349
  160. package/src/core/event-store.ts +0 -779
  161. package/src/core/evidence-aligner.ts +0 -635
  162. package/src/core/external-market-context.ts +0 -582
  163. package/src/core/graduation-worker.ts +0 -171
  164. package/src/core/graduation.ts +0 -377
  165. package/src/core/index.ts +0 -64
  166. package/src/core/ingest-interceptor.ts +0 -80
  167. package/src/core/markdown-mirror.ts +0 -70
  168. package/src/core/matcher.ts +0 -208
  169. package/src/core/md-mirror.ts +0 -92
  170. package/src/core/metadata-extractor.ts +0 -203
  171. package/src/core/model/memory-fact.ts +0 -30
  172. package/src/core/model/memory-rule.ts +0 -14
  173. package/src/core/model/memory-summary.ts +0 -21
  174. package/src/core/model/raw-event.ts +0 -28
  175. package/src/core/model/retrieval-result.ts +0 -35
  176. package/src/core/mongo-sync-config.ts +0 -165
  177. package/src/core/mongo-sync-worker.ts +0 -381
  178. package/src/core/privacy/filter.ts +0 -190
  179. package/src/core/privacy/index.ts +0 -20
  180. package/src/core/privacy/tag-parser.ts +0 -145
  181. package/src/core/product-validation-matrix.ts +0 -314
  182. package/src/core/progressive-retriever.ts +0 -414
  183. package/src/core/registry/project-path.ts +0 -54
  184. package/src/core/registry/session-registry.ts +0 -69
  185. package/src/core/replay-evaluator.ts +0 -625
  186. package/src/core/retrieval-benchmark.ts +0 -117
  187. package/src/core/retrieval-quality.ts +0 -109
  188. package/src/core/retriever.ts +0 -800
  189. package/src/core/session-qrels.ts +0 -360
  190. package/src/core/shared-event-store.ts +0 -114
  191. package/src/core/shared-promoter.ts +0 -249
  192. package/src/core/shared-store.ts +0 -289
  193. package/src/core/shared-vector-store.ts +0 -203
  194. package/src/core/sqlite-event-store.ts +0 -1846
  195. package/src/core/sqlite-wrapper.ts +0 -116
  196. package/src/core/sync-worker.ts +0 -228
  197. package/src/core/tag-taxonomy.ts +0 -51
  198. package/src/core/task/blocker-resolver.ts +0 -333
  199. package/src/core/task/index.ts +0 -9
  200. package/src/core/task/task-matcher.ts +0 -240
  201. package/src/core/task/task-projector.ts +0 -358
  202. package/src/core/task/task-resolver.ts +0 -421
  203. package/src/core/turn-state.ts +0 -207
  204. package/src/core/types.ts +0 -952
  205. package/src/core/vector-outbox.ts +0 -299
  206. package/src/core/vector-store.ts +0 -231
  207. package/src/core/vector-worker.ts +0 -521
  208. package/src/core/working-set-store.ts +0 -257
  209. package/src/extensions/endless-memory/endless-memory-services.ts +0 -350
  210. package/src/extensions/endless-memory/index.ts +0 -1
  211. package/src/extensions/index.ts +0 -5
  212. package/src/extensions/mcp/handlers.ts +0 -960
  213. package/src/extensions/mcp/index.ts +0 -48
  214. package/src/extensions/mcp/tools.ts +0 -252
  215. package/src/extensions/shared-memory/index.ts +0 -1
  216. package/src/extensions/shared-memory/shared-memory-services.ts +0 -211
  217. package/src/extensions/vector/embedder.ts +0 -234
  218. package/src/extensions/vector/index.ts +0 -1
  219. package/src/hooks/post-tool-use.ts +0 -9
  220. package/src/hooks/semantic-daemon-client.ts +0 -1
  221. package/src/hooks/semantic-daemon.ts +0 -11
  222. package/src/hooks/session-end.ts +0 -9
  223. package/src/hooks/session-start.ts +0 -9
  224. package/src/hooks/stop.ts +0 -9
  225. package/src/hooks/user-prompt-submit.ts +0 -9
  226. package/src/index.ts +0 -13
  227. package/src/mcp/handlers.ts +0 -2
  228. package/src/mcp/index.ts +0 -4
  229. package/src/mcp/tools.ts +0 -2
  230. package/src/server/api/chat.ts +0 -2
  231. package/src/server/api/citations.ts +0 -2
  232. package/src/server/api/events.ts +0 -2
  233. package/src/server/api/health.ts +0 -2
  234. package/src/server/api/index.ts +0 -2
  235. package/src/server/api/projects.ts +0 -2
  236. package/src/server/api/search.ts +0 -2
  237. package/src/server/api/sessions.ts +0 -2
  238. package/src/server/api/stats.ts +0 -2
  239. package/src/server/api/turns.ts +0 -2
  240. package/src/server/api/utils.ts +0 -2
  241. package/src/server/index.ts +0 -2
  242. package/src/services/bootstrap-organizer.ts +0 -463
  243. package/src/services/codex-session-history-importer.ts +0 -966
  244. package/src/services/hermes-session-history-importer.ts +0 -733
  245. package/src/services/memory-service-config.ts +0 -36
  246. package/src/services/memory-service-registry.ts +0 -150
  247. package/src/services/memory-service.ts +0 -688
  248. package/src/services/session-history-importer.ts +0 -629
  249. package/tests/README.md +0 -23
  250. package/tests/adapters/claude/claude-semantic-daemon-adapter.test.ts +0 -54
  251. package/tests/adapters/claude/claude-transcript-reconstructor.test.ts +0 -98
  252. package/tests/adapters/claude-hook-prompt-injection-policy.test.ts +0 -99
  253. package/tests/apps/app-layer-boundary.test.ts +0 -48
  254. package/tests/apps/claude-settings-hooks.test.ts +0 -107
  255. package/tests/apps/cli-disclosure-output.test.ts +0 -212
  256. package/tests/apps/codex-import-runner.test.ts +0 -99
  257. package/tests/apps/codex-validation-output.test.ts +0 -100
  258. package/tests/apps/hermes-import-runner.test.ts +0 -99
  259. package/tests/apps/mcp-install-command.test.ts +0 -59
  260. package/tests/apps/package-build-entrypoints.test.ts +0 -30
  261. package/tests/apps/postinstall-embedding-backend.test.ts +0 -185
  262. package/tests/apps/search-api-disclosure.test.ts +0 -162
  263. package/tests/apps/stats-api-lightweight.test.ts +0 -67
  264. package/tests/apps/ui-disclosure-output.test.ts +0 -140
  265. package/tests/core/bootstrap-organizer.test.ts +0 -111
  266. package/tests/core/canonical-key.test.ts +0 -101
  267. package/tests/core/codex-session-history-importer-validation.test.ts +0 -185
  268. package/tests/core/consolidation-worker.test.ts +0 -75
  269. package/tests/core/embedding-maintenance-service.test.ts +0 -282
  270. package/tests/core/evidence-aligner.test.ts +0 -152
  271. package/tests/core/external-market-context.test.ts +0 -209
  272. package/tests/core/fact-deriver.test.ts +0 -79
  273. package/tests/core/hermes-session-history-importer-validation.test.ts +0 -609
  274. package/tests/core/ingest-interceptor.test.ts +0 -38
  275. package/tests/core/markdown-mirror.test.ts +0 -85
  276. package/tests/core/matcher.test.ts +0 -112
  277. package/tests/core/md-mirror.test.ts +0 -50
  278. package/tests/core/memory-engine-services.test.ts +0 -240
  279. package/tests/core/memory-ingest-service.test.ts +0 -296
  280. package/tests/core/memory-query-service.test.ts +0 -129
  281. package/tests/core/memory-runtime-service.test.ts +0 -201
  282. package/tests/core/memory-service-composition.test.ts +0 -192
  283. package/tests/core/memory-service-config.test.ts +0 -41
  284. package/tests/core/memory-service-facade.test.ts +0 -30
  285. package/tests/core/memory-service-registry.test.ts +0 -206
  286. package/tests/core/product-validation-matrix.test.ts +0 -61
  287. package/tests/core/project-registry.test.ts +0 -78
  288. package/tests/core/replay-evaluator.test.ts +0 -181
  289. package/tests/core/retrieval-analytics-service.test.ts +0 -210
  290. package/tests/core/retrieval-benchmark.test.ts +0 -93
  291. package/tests/core/retrieval-disclosure-service.test.ts +0 -264
  292. package/tests/core/retrieval-orchestrator.test.ts +0 -403
  293. package/tests/core/retrieval-quality.test.ts +0 -31
  294. package/tests/core/retrieval-services.test.ts +0 -185
  295. package/tests/core/retriever-fallback-chain.test.ts +0 -223
  296. package/tests/core/retriever-strategy-scope.test.ts +0 -164
  297. package/tests/core/retriever.memu-adoption.test.ts +0 -122
  298. package/tests/core/session-history-importer-filter.test.ts +0 -78
  299. package/tests/core/session-qrels.test.ts +0 -250
  300. package/tests/core/sqlite-event-store-replication.test.ts +0 -127
  301. package/tests/core/summary-deriver.test.ts +0 -66
  302. package/tests/extensions/embedder-warning-suppression.test.ts +0 -84
  303. package/tests/extensions/endless-memory-extension-boundary.test.ts +0 -17
  304. package/tests/extensions/endless-memory-services.test.ts +0 -325
  305. package/tests/extensions/mcp-context-tools.test.ts +0 -905
  306. package/tests/extensions/mcp-extension-boundary.test.ts +0 -21
  307. package/tests/extensions/mcp-package-build.test.ts +0 -22
  308. package/tests/extensions/mcp-project-aware-tools.test.ts +0 -102
  309. package/tests/extensions/shared-memory-extension-boundary.test.ts +0 -24
  310. package/tests/extensions/shared-memory-services.test.ts +0 -309
  311. package/tests/extensions/vector-extension-boundary.test.ts +0 -21
  312. package/tsconfig.json +0 -24
  313. package/vitest.config.ts +0 -15
@@ -1,463 +0,0 @@
1
import * as fs from 'node:fs';
import * as path from 'node:path';
import { execFileSync, execSync } from 'node:child_process';
4
-
5
- export interface BootstrapKnowledgeOptions { // Input options accepted by bootstrapKnowledgeBase.
6
- repoPath: string; // Repository to scan; resolved to an absolute path before use.
7
- outDir: string; // Directory that receives the generated files; resolved to an absolute path before use.
8
- since?: string; // Value for `git log --since`; falls back to the manifest's last commit date / generatedAt, then '180 days ago'.
9
- maxCommits?: number; // Upper bound on commits read from git; defaults to 1000.
10
- incremental?: boolean; // When true, an existing sources/manifest.json is consulted to narrow the commit range and the modules rewritten.
11
- }
12
-
13
- interface CommitInfo { // One commit as parsed from the tab-separated `git log` output.
14
- hash: string; // Full commit hash (%H).
15
- date: string; // Author date as printed by --date=short (%ad).
16
- author: string; // Author name (%an).
17
- subject: string; // Commit subject line (%s); embedded tabs are preserved.
18
- files: string[]; // Paths listed by --name-only for this commit.
19
- }
20
-
21
- interface ModuleSummary { // Aggregate description of one top-level path segment of the repository.
22
- name: string; // First path segment of the files in this group ('root' if that segment is empty).
23
- root: string; // Currently always identical to `name`.
24
- fileCount: number; // Number of scanned files in this group.
25
- languages: string[]; // Up to five language labels, most frequent first.
26
- entryCandidates: string[]; // Up to ten files whose basename contains index./main./app./server./cli. (case-insensitive).
27
- }
28
-
29
- const EXCLUDED_DIRS = new Set(['.git', 'node_modules', 'dist', 'build', 'coverage', '.next', '.turbo', 'memory']); // Directory names never descended into by walkCodeFiles (matched on the bare name at any depth).
30
- const CODE_EXTENSIONS = new Set([ // Lower-cased file extensions that walkCodeFiles collects; everything else is ignored.
31
- '.ts', '.tsx', '.js', '.jsx', '.mjs', '.cjs', '.py', '.go', '.rs', '.java', '.kt', '.swift', '.rb', '.php', '.cs',
32
- '.scala', '.sh', '.zsh', '.yaml', '.yml', '.json', '.sql', '.md'
33
- ]);
34
-
35
/**
 * Expresses `target` relative to `base` using forward slashes only.
 *
 * @param base Directory the result is relative to.
 * @param target Path to convert.
 * @returns The relative path with every backslash replaced by `/`.
 */
function safeRel(base: string, target: string): string {
  const relative = path.relative(base, target);
  // Splitting and re-joining swaps every backslash, so Windows-style
  // separators come out as forward slashes.
  return relative.split('\\').join('/');
}
38
-
39
/**
 * Creates `dir` together with any missing parent directories.
 * Does nothing if the directory already exists.
 *
 * @param dir Directory path to create.
 */
function mkdirp(dir: string): void {
  const options = { recursive: true };
  fs.mkdirSync(dir, options);
}
42
-
43
/**
 * Recursively collects every regular file under `root` whose lower-cased
 * extension is in CODE_EXTENSIONS, skipping directories named in EXCLUDED_DIRS.
 *
 * @param root Directory to start from.
 * @returns The matching paths (each joined onto `root`), sorted with the default string ordering.
 */
function walkCodeFiles(root: string): string[] {
  const collected: string[] = [];

  const visit = (directory: string): void => {
    const children = fs.readdirSync(directory, { withFileTypes: true });
    children.sort((left, right) => left.name.localeCompare(right.name));

    for (const child of children) {
      const childPath = path.join(directory, child.name);

      if (child.isDirectory()) {
        if (EXCLUDED_DIRS.has(child.name)) continue;
        visit(childPath);
        continue;
      }

      // Entries that are neither directories nor regular files are ignored.
      if (!child.isFile()) continue;

      const extension = path.extname(child.name).toLowerCase();
      if (CODE_EXTENSIONS.has(extension)) {
        collected.push(childPath);
      }
    }
  };

  visit(root);
  return collected.sort();
}
63
-
64
/**
 * Maps a file name to a human-readable language label based on its extension.
 *
 * @param file File name or path; only the (case-insensitive) extension is inspected.
 * @returns The language label, or 'Other' for an unrecognised or missing extension.
 */
function detectLanguage(file: string): string {
  switch (path.extname(file).toLowerCase()) {
    case '.ts':
    case '.tsx':
      return 'TypeScript';
    case '.js':
    case '.jsx':
    case '.mjs':
    case '.cjs':
      return 'JavaScript';
    case '.py':
      return 'Python';
    case '.go':
      return 'Go';
    case '.rs':
      return 'Rust';
    case '.java':
      return 'Java';
    case '.kt':
      return 'Kotlin';
    case '.swift':
      return 'Swift';
    case '.rb':
      return 'Ruby';
    case '.php':
      return 'PHP';
    case '.cs':
      return 'C#';
    case '.scala':
      return 'Scala';
    case '.sh':
    case '.zsh':
      return 'Shell';
    case '.yaml':
    case '.yml':
      return 'YAML';
    case '.json':
      return 'JSON';
    case '.sql':
      return 'SQL';
    case '.md':
      return 'Markdown';
    default:
      return 'Other';
  }
}
73
-
74
/**
 * Groups the scanned files by their first path segment (relative to the
 * repository) and produces one summary per group.
 *
 * @param repoPath Repository root the file paths are made relative to.
 * @param files Paths of the scanned files.
 * @returns Summaries ordered by descending file count, ties broken by name.
 */
function summarizeModules(repoPath: string, files: string[]): ModuleSummary[] {
  const entryNamePattern = /(index|main|app|server|cli)\./i;
  const groups = new Map<string, { files: string[]; langs: Map<string, number> }>();

  files.forEach((absolutePath) => {
    const relativePath = safeRel(repoPath, absolutePath);
    const [firstSegment] = relativePath.split('/').filter(Boolean);
    const groupName = firstSegment || 'root';

    let group = groups.get(groupName);
    if (!group) {
      group = { files: [], langs: new Map() };
      groups.set(groupName, group);
    }
    group.files.push(relativePath);

    const language = detectLanguage(absolutePath);
    group.langs.set(language, (group.langs.get(language) || 0) + 1);
  });

  const summaries: ModuleSummary[] = [];
  for (const [name, group] of groups) {
    // Most frequent language first; only the top five labels are kept.
    const rankedLanguages = [...group.langs.entries()].sort((x, y) => y[1] - x[1]);
    const entryFiles = group.files.filter((file) => entryNamePattern.test(path.basename(file)));

    summaries.push({
      name,
      root: name,
      fileCount: group.files.length,
      languages: rankedLanguages.slice(0, 5).map(([language]) => language),
      entryCandidates: entryFiles.slice(0, 10)
    });
  }

  summaries.sort((x, y) => y.fileCount - x.fileCount || x.name.localeCompare(y.name));
  return summaries;
}
101
-
102
/** Output-shaping flags shared by every `git log` call; parseGitLog depends on this exact layout. */
const GIT_LOG_OUTPUT_ARGS: readonly string[] = [
  '--date=short',
  '--pretty=format:%H%x09%ad%x09%an%x09%s',
  '--name-only',
  '--reverse'
];

/**
 * Cap on captured git output. The child_process default (1 MiB) is easily
 * exceeded by a long `--name-only` log, which would surface as an exception
 * and, in the callers below, as a silently empty history.
 */
const GIT_MAX_BUFFER_BYTES = 64 * 1024 * 1024;

/**
 * Runs `git -C <repoPath> <args...>` and returns its stdout as UTF-8 text.
 *
 * git is spawned directly (no shell), so no argument is ever interpreted by a
 * shell: paths, dates, and revisions containing `$`, backticks, or quotes are
 * passed through literally.
 *
 * @param repoPath Repository directory handed to `git -C`.
 * @param command Argument list. A plain string is still accepted and is split
 *   on whitespace; it receives no shell interpretation or quote handling.
 * @returns Captured stdout.
 * @throws If git cannot be started, exits non-zero, or exceeds the output cap.
 */
function runGit(repoPath: string, command: string | readonly string[]): string {
  const args = typeof command === 'string' ? command.trim().split(/\s+/).filter(Boolean) : command;
  return execFileSync('git', ['-C', repoPath, ...args], {
    encoding: 'utf8',
    stdio: ['ignore', 'pipe', 'ignore'],
    maxBuffer: GIT_MAX_BUFFER_BYTES
  });
}

/**
 * Converts a caller-supplied commit limit into a valid `-n` value:
 * a whole number of at least 1, or 1000 when the input is not finite.
 */
function toCommitLimit(maxCommits: number): string {
  const whole = Number.isFinite(maxCommits) ? Math.floor(maxCommits) : 1000;
  return String(Math.max(1, whole));
}

/**
 * Parses the output of `git log` produced with GIT_LOG_OUTPUT_ARGS.
 *
 * A line with at least four tab-separated fields starts a new commit
 * (hash, date, author, subject; extra tabs belong to the subject). Every
 * other non-blank line is recorded as a file of the current commit, and a
 * blank line closes the current commit.
 *
 * @param raw Raw stdout of the git command.
 * @returns Commits in the order they appear in `raw`.
 */
function parseGitLog(raw: string): CommitInfo[] {
  const commits: CommitInfo[] = [];
  let current: CommitInfo | null = null;

  for (const line of raw.split(/\r?\n/)) {
    if (!line.trim()) {
      if (current) {
        commits.push(current);
        current = null;
      }
      continue;
    }

    const fields = line.split('\t');
    if (fields.length >= 4) {
      if (current) commits.push(current);
      const [hash, date, author, ...subjectRest] = fields;
      current = { hash, date, author, subject: subjectRest.join('\t').trim(), files: [] };
    } else if (current) {
      // File lines seen before any header are dropped.
      current.files.push(line.trim());
    }
  }

  if (current) commits.push(current);
  return commits;
}

/**
 * Reads commits newer than `since`, oldest first.
 *
 * @param repoPath Repository to query.
 * @param since Value for `git log --since` (default '180 days ago').
 * @param maxCommits Maximum number of commits to read (default 1000).
 * @returns Parsed commits, or an empty list if git fails for any reason
 *   (deliberate best-effort: e.g. the path is not a repository).
 */
function getGitCommits(repoPath: string, since = '180 days ago', maxCommits = 1000): CommitInfo[] {
  try {
    const raw = runGit(repoPath, [
      'log',
      `--since=${since}`,
      '-n',
      toCommitLimit(maxCommits),
      ...GIT_LOG_OUTPUT_ARGS
    ]);
    return parseGitLog(raw);
  } catch {
    return [];
  }
}

/**
 * Reads the commits in `<hash>..HEAD`, oldest first.
 *
 * @param repoPath Repository to query.
 * @param hash Commit hash to start after. It typically comes from a manifest
 *   file on disk, so anything that is not a plain hex object name is rejected
 *   rather than handed to git, where it could be read as an option.
 * @param maxCommits Maximum number of commits to read (default 1000).
 * @returns Parsed commits, or an empty list if the hash is malformed or git fails.
 */
function getGitCommitsAfterHash(repoPath: string, hash: string, maxCommits = 1000): CommitInfo[] {
  if (typeof hash !== 'string' || !/^[0-9a-f]{4,64}$/i.test(hash)) {
    return [];
  }

  try {
    const raw = runGit(repoPath, [
      'log',
      `${hash}..HEAD`,
      '-n',
      toCommitLimit(maxCommits),
      ...GIT_LOG_OUTPUT_ARGS
    ]);
    return parseGitLog(raw);
  } catch {
    return [];
  }
}
156
-
157
/**
 * Selects the commits whose subject contains a decision-like keyword
 * (case-insensitive substring match, e.g. "refactor", "migrate", "feat", "fix").
 *
 * @param commits Commits to inspect.
 * @returns The matching commits, in their original order.
 */
function extractDecisions(commits: CommitInfo[]): CommitInfo[] {
  const keywordPattern = /(refactor|migrate|deprecat|remove|replace|introduce|adopt|switch|upgrade|breaking|architecture|feat|fix)/i;
  const selected: CommitInfo[] = [];

  for (const commit of commits) {
    if (keywordPattern.test(commit.subject)) {
      selected.push(commit);
    }
  }

  return selected;
}
161
-
162
/**
 * Buckets commits by the first seven characters of their date (the `YYYY-MM`
 * part of a short date); commits with no date go under 'unknown'.
 *
 * @param commits Commits to group.
 * @returns A map whose keys are in ascending `localeCompare` order; commits
 *   keep their input order within each bucket.
 */
function buildTimeline(commits: CommitInfo[]): Map<string, CommitInfo[]> {
  const buckets = new Map<string, CommitInfo[]>();

  commits.forEach((commit) => {
    const prefix = commit.date ? commit.date.slice(0, 7) : '';
    const month = prefix === '' ? 'unknown' : prefix;

    const bucket = buckets.get(month);
    if (bucket) {
      bucket.push(commit);
    } else {
      buckets.set(month, [commit]);
    }
  });

  const ordered = new Map<string, CommitInfo[]>();
  const months = [...buckets.keys()].sort((x, y) => x.localeCompare(y));
  for (const month of months) {
    ordered.set(month, buckets.get(month)!);
  }
  return ordered;
}
171
-
172
/**
 * Derives candidate glossary terms from file names.
 *
 * Each base name (extension removed) is split on non-alphanumeric characters
 * and before every upper-case letter. The lower-cased pieces of three or more
 * characters that are not generic stop words are then counted.
 *
 * @param files File paths to mine for terms.
 * @returns At most 80 terms that occur at least twice, most frequent first,
 *   ties broken alphabetically.
 */
function buildGlossary(files: string[]): string[] {
  const ignored = new Set(['src', 'test', 'dist', 'lib', 'core', 'index', 'main', 'app', 'server', 'client', 'utils']);
  const counts = new Map<string, number>();

  for (const file of files) {
    const stem = path.basename(file, path.extname(file));

    for (const chunk of stem.split(/[^a-zA-Z0-9]+/)) {
      // The lookahead split breaks camelCase / PascalCase into words.
      for (const piece of chunk.split(/(?=[A-Z])/)) {
        const term = piece.toLowerCase();
        if (term.length < 3 || ignored.has(term)) continue;
        counts.set(term, (counts.get(term) || 0) + 1);
      }
    }
  }

  const ranked = [...counts.entries()].filter((entry) => entry[1] >= 2);
  ranked.sort((x, y) => y[1] - x[1] || x[0].localeCompare(y[0]));
  return ranked.slice(0, 80).map((entry) => entry[0]);
}
193
-
194
/**
 * Writes `content` to `filePath` as UTF-8, creating the parent directory
 * (and any missing ancestors) first. An existing file is overwritten.
 *
 * @param filePath Destination file.
 * @param content Text to write.
 */
function writeFile(filePath: string, content: string): void {
  const parentDir = path.dirname(filePath);
  fs.mkdirSync(parentDir, { recursive: true });
  fs.writeFileSync(filePath, content, 'utf8');
}
198
-
199
/**
 * Translates a number of supporting sources into a confidence label.
 *
 * @param sourceCount Number of sources backing a statement.
 * @returns 'high' for three or more, 'mid' for one or two, 'low' otherwise.
 */
function confidenceByEvidence(sourceCount: number): 'high' | 'mid' | 'low' {
  return sourceCount >= 3 ? 'high' : sourceCount >= 1 ? 'mid' : 'low';
}
204
-
205
/**
 * Formats one markdown bullet naming a source reference.
 *
 * @param source Reference text, e.g. a commit or path descriptor.
 * @returns The bullet line `- source: <source>`.
 */
function sourceLine(source: string): string {
  return ['- source:', source].join(' ');
}
208
-
209
- interface ExistingManifest { // Subset of a previously written sources/manifest.json that an incremental run reads back.
210
- generatedAt?: string; // ISO timestamp of the previous run; last-resort fallback for the `since` value.
211
- lastCommitDate?: string; // Date of the newest commit the previous run analyzed; preferred fallback for `since`.
212
- lastCommitHash?: string; // Hash of that commit; when present, incremental runs read `<hash>..HEAD` instead of using `since`.
213
- }
214
-
215
/**
 * Reads `<outDir>/sources/manifest.json` left behind by an earlier run.
 *
 * @param outDir Output directory of the knowledge base.
 * @returns The parsed manifest, or null when the file does not exist, cannot
 *   be read, or is not valid JSON (best-effort: errors are not reported).
 */
function loadExistingManifest(outDir: string): ExistingManifest | null {
  try {
    const manifestPath = path.join(outDir, 'sources', 'manifest.json');
    if (fs.existsSync(manifestPath)) {
      const text = fs.readFileSync(manifestPath, 'utf8');
      return JSON.parse(text) as ExistingManifest;
    }
    return null;
  } catch {
    return null;
  }
}
225
-
226
/**
 * Finds every `.md` file anywhere below `outDir`.
 *
 * @param outDir Directory to search; it must exist.
 * @returns The file paths (each joined onto `outDir`), sorted with `localeCompare`.
 */
function listMarkdownOutputs(outDir: string): string[] {
  const found: string[] = [];

  const visit = (directory: string): void => {
    for (const child of fs.readdirSync(directory, { withFileTypes: true })) {
      const childPath = path.join(directory, child.name);
      if (child.isDirectory()) {
        visit(childPath);
        continue;
      }
      if (child.isFile() && child.name.endsWith('.md')) {
        found.push(childPath);
      }
    }
  };

  visit(outDir);
  // The final sort fixes the order, so traversal order is irrelevant.
  found.sort((x, y) => x.localeCompare(y));
  return found;
}
239
-
240
/**
 * Scans a repository and its git history and writes a markdown knowledge base
 * (overview, per-module pages, decisions, timeline, glossary) plus a
 * JSON/markdown manifest under `options.outDir`.
 *
 * In incremental mode the previous `sources/manifest.json` is read back. If it
 * records a last commit hash, only commits after that hash are read, and only
 * the modules those commits touched are rewritten (all modules if there are no
 * new commits). The overview, decisions, timeline, and glossary pages are
 * always rewritten from the commits read in this run.
 *
 * @param options Repository path, output directory, and range controls.
 * @returns The resolved output directory, scan counts, and the sorted list of
 *   files written by this run.
 * @throws If the repository cannot be scanned or an output file cannot be
 *   written. Git failures do not throw; they yield an empty commit list.
 */
export async function bootstrapKnowledgeBase(options: BootstrapKnowledgeOptions): Promise<{
  outDir: string;
  fileCount: number;
  moduleCount: number;
  commitCount: number;
  generatedFiles: string[];
}> {
  const repoPath = path.resolve(options.repoPath);
  const outDir = path.resolve(options.outDir);
  const maxCommits = options.maxCommits ?? 1000;

  // The previous manifest is only consulted in incremental mode.
  const existingManifest = options.incremental ? loadExistingManifest(outDir) : null;
  const incrementalSince = existingManifest?.lastCommitDate || existingManifest?.generatedAt;
  const since = options.since || incrementalSince || '180 days ago';

  const codeFiles = walkCodeFiles(repoPath);
  const modules = summarizeModules(repoPath, codeFiles);

  // existingManifest is null outside incremental mode, so a resume hash
  // implies an incremental run.
  const resumeHash = existingManifest?.lastCommitHash;
  const commits = resumeHash
    ? getGitCommitsAfterHash(repoPath, resumeHash, maxCommits)
    : getGitCommits(repoPath, since, maxCommits);

  // Provenance label for the generated pages. It must describe the query that
  // actually ran: a hash range when resuming, otherwise the --since window.
  const gitLogSource = resumeHash
    ? `git-log:range=${resumeHash}..HEAD;max=${maxCommits}`
    : `git-log:since=${since};max=${maxCommits}`;

  const decisions = extractDecisions(commits);
  const timeline = buildTimeline(commits);
  const glossary = buildGlossary(codeFiles);

  const generatedFiles: string[] = [];

  const sections = {
    overview: path.join(outDir, 'overview'),
    modules: path.join(outDir, 'modules'),
    decisions: path.join(outDir, 'decisions'),
    timeline: path.join(outDir, 'timeline'),
    glossary: path.join(outDir, 'glossary'),
    sources: path.join(outDir, 'sources')
  };

  for (const sectionDir of Object.values(sections)) {
    mkdirp(sectionDir);
  }

  // ---- overview/overview.md ----
  const overviewPath = path.join(sections.overview, 'overview.md');
  const overview = [
    '# Codebase Overview',
    '',
    `- generatedAt: ${new Date().toISOString()}`,
    '- deterministicPipeline: true',
    `- repo: ${repoPath}`,
    `- filesAnalyzed: ${codeFiles.length}`,
    `- commitsAnalyzed: ${commits.length}`,
    `- confidence: ${confidenceByEvidence(modules.length > 0 ? 3 : 0)}`,
    '',
    '## Directory / Module Map',
    ...modules.slice(0, 50).map((m) => `- ${m.name}: ${m.fileCount} files (${m.languages.join(', ') || 'n/a'})`),
    '',
    '## Fact',
    '- Generated from deterministic file scan and git history parsing.',
    '',
    '## Inference',
    '- Module responsibilities should be reviewed by maintainers for nuanced boundaries.',
    '',
    '## Sources',
    sourceLine(`repo-scan:${repoPath}`),
    sourceLine(gitLogSource),
    ''
  ].join('\n');
  writeFile(overviewPath, overview);
  generatedFiles.push(overviewPath);

  // ---- modules/<name>.md ----
  // First path segment of every file touched by the commits read in this run.
  const touchedRoots = new Set(
    commits
      .flatMap((c) => c.files)
      .map((f) => f.split('/').filter(Boolean)[0])
      .filter(Boolean)
  );
  // Incremental runs rewrite only the touched modules; with no touched roots
  // (or in full mode) every module is rewritten. At most 200 either way.
  const moduleTargets = options.incremental && touchedRoots.size > 0
    ? modules.filter((m) => touchedRoots.has(m.root)).slice(0, 200)
    : modules.slice(0, 200);

  for (const m of moduleTargets) {
    const relatedCommits = commits.filter((c) => c.files.some((f) => f.startsWith(`${m.root}/`))).slice(0, 15);
    const content = [
      `# Module: ${m.name}`,
      '',
      `- responsibility: inferred from top-level path \`${m.root}/\``,
      `- files: ${m.fileCount}`,
      `- languages: ${m.languages.join(', ') || 'n/a'}`,
      `- confidence: ${confidenceByEvidence(relatedCommits.length)}`,
      '',
      '## Entry Candidates',
      ...(m.entryCandidates.length > 0 ? m.entryCandidates.map((f) => `- ${f}`) : ['- none detected']),
      '',
      '## Related Commits (recent sample)',
      ...(relatedCommits.length > 0
        ? relatedCommits.map((c) => `- ${c.date} ${c.hash.slice(0, 8)} ${c.subject}`)
        : ['- none in selected range']),
      '',
      '## Sources',
      sourceLine(`repo-path:${m.root}/**`),
      ...relatedCommits.map((c) => sourceLine(`commit:${c.hash}`)),
      ''
    ].join('\n');

    // The module name is reduced to a lower-case, filesystem-safe file name.
    const modulePath = path.join(sections.modules, `${m.name.replace(/[^a-z0-9._-]+/gi, '-').toLowerCase()}.md`);
    writeFile(modulePath, content);
    generatedFiles.push(modulePath);
  }

  // ---- decisions/decisions.md ----
  const decisionsPath = path.join(sections.decisions, 'decisions.md');
  const decisionsMd = [
    '# Decisions (extracted)',
    '',
    `- confidence: ${confidenceByEvidence(decisions.length)}`,
    '',
    ...(decisions.length > 0
      ? decisions.slice(0, 500).map((d) => [
          `## ${d.date} | ${d.subject}`,
          '- status: active (inferred)',
          sourceLine(`commit:${d.hash}`),
          `- author: ${d.author}`,
          `- changedFiles: ${d.files.length}`,
          `- confidence: ${confidenceByEvidence(d.files.length > 0 ? 2 : 1)}`,
          ''
        ].join('\n'))
      : ['- No decision-like commits found in selected range.', '']),
    '## Sources',
    sourceLine(gitLogSource),
    ''
  ].join('\n');
  writeFile(decisionsPath, decisionsMd);
  generatedFiles.push(decisionsPath);

  // ---- timeline/timeline.md ----
  const timelinePath = path.join(sections.timeline, 'timeline.md');
  const timelineMd = [
    '# Timeline',
    '',
    `- confidence: ${confidenceByEvidence(commits.length > 0 ? 2 : 0)}`,
    '',
    ...[...timeline.entries()].flatMap(([month, list]) => [
      `## ${month}`,
      ...list.slice(0, 40).map((c) => `- ${c.date} ${c.hash.slice(0, 8)} ${c.subject}`),
      ''
    ]),
    '## Sources',
    sourceLine(gitLogSource),
    ''
  ].join('\n');
  writeFile(timelinePath, timelineMd);
  generatedFiles.push(timelinePath);

  // ---- glossary/glossary.md ----
  const glossaryPath = path.join(sections.glossary, 'glossary.md');
  const glossaryMd = [
    '# Glossary (auto-extracted)',
    '',
    `- confidence: ${confidenceByEvidence(glossary.length > 0 ? 1 : 0)}`,
    '',
    ...glossary.map((t) => `- ${t}`),
    '',
    '## Sources',
    sourceLine(`repo-scan:${repoPath}`),
    ''
  ].join('\n');
  writeFile(glossaryPath, glossaryMd);
  generatedFiles.push(glossaryPath);

  // ---- sources/manifest.{json,md} ----
  // `outputs` lists the content pages written by this run (the manifest files
  // are not included). `allOutputs` lists every markdown file under outDir at
  // this point, i.e. before manifest.md is (re)written by this run.
  const outputs = generatedFiles.map((f) => safeRel(outDir, f)).sort((a, b) => a.localeCompare(b));
  const allOutputs = listMarkdownOutputs(outDir).map((f) => safeRel(outDir, f));

  const sourceItems = [
    ...codeFiles.slice(0, 200).map((f) => ({ type: 'file', ref: safeRel(repoPath, f) })),
    ...commits.slice(0, 400).map((c) => ({ type: 'commit', ref: c.hash, date: c.date, subject: c.subject }))
  ];

  // Commits are read oldest-first, so the last one is the newest. With no new
  // commits the previous manifest's marker is carried forward.
  const latestCommitDate = commits.length > 0 ? commits[commits.length - 1].date : existingManifest?.lastCommitDate;
  const latestCommitHash = commits.length > 0 ? commits[commits.length - 1].hash : existingManifest?.lastCommitHash;
  const manifest = {
    generatedAt: new Date().toISOString(),
    deterministicPipeline: true,
    mode: options.incremental ? 'incremental' : 'full',
    repoPath,
    options: { since, maxCommits, incremental: Boolean(options.incremental) },
    stats: {
      filesAnalyzed: codeFiles.length,
      modules: modules.length,
      modulesGenerated: moduleTargets.length,
      commits: commits.length,
      decisions: decisions.length,
      glossaryTerms: glossary.length
    },
    lastCommitDate: latestCommitDate,
    lastCommitHash: latestCommitHash,
    outputs,
    allOutputs,
    sources: sourceItems
  };

  const manifestJsonPath = path.join(sections.sources, 'manifest.json');
  writeFile(manifestJsonPath, `${JSON.stringify(manifest, null, 2)}\n`);
  generatedFiles.push(manifestJsonPath);

  const manifestMdPath = path.join(sections.sources, 'manifest.md');
  const manifestMd = [
    '# Sources Manifest',
    '',
    '- deterministicPipeline: true',
    `- mode: ${options.incremental ? 'incremental' : 'full'}`,
    `- sourceCount: ${sourceItems.length}`,
    '',
    '## Outputs',
    ...outputs.map((o) => `- ${o}`),
    '',
    '## Sources (sample)',
    ...sourceItems.slice(0, 300).map((s) => `- ${s.type}:${s.ref}`),
    ''
  ].join('\n');
  writeFile(manifestMdPath, manifestMd);
  generatedFiles.push(manifestMdPath);

  return {
    outDir,
    fileCount: codeFiles.length,
    moduleCount: modules.length,
    commitCount: commits.length,
    generatedFiles: generatedFiles.sort((a, b) => a.localeCompare(b))
  };
}