claude-brain 0.14.2 → 0.14.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (246) hide show
  1. package/README.md +191 -191
  2. package/VERSION +1 -1
  3. package/assets/CLAUDE-unified.md +11 -11
  4. package/assets/CLAUDE.md +11 -11
  5. package/bunfig.toml +8 -8
  6. package/package.json +80 -80
  7. package/packs/backend/node.json +173 -173
  8. package/packs/core/javascript.json +176 -176
  9. package/packs/core/typescript.json +222 -222
  10. package/packs/frontend/react.json +254 -254
  11. package/packs/meta/testing.json +172 -172
  12. package/src/automation/auto-context.ts +240 -240
  13. package/src/automation/decision-detector.ts +452 -452
  14. package/src/automation/index.ts +11 -11
  15. package/src/automation/phase12-manager.ts +456 -456
  16. package/src/automation/proactive-recall.ts +373 -373
  17. package/src/automation/project-detector.ts +310 -310
  18. package/src/automation/repo-scanner.ts +205 -205
  19. package/src/cli/auto-setup.ts +82 -82
  20. package/src/cli/bin.ts +202 -202
  21. package/src/cli/commands/chroma.ts +573 -573
  22. package/src/cli/commands/git-hook.ts +189 -189
  23. package/src/cli/commands/hooks.ts +213 -213
  24. package/src/cli/commands/init.ts +122 -122
  25. package/src/cli/commands/install-mcp.ts +92 -92
  26. package/src/cli/commands/pack.ts +197 -197
  27. package/src/cli/commands/serve.ts +167 -167
  28. package/src/cli/commands/start.ts +42 -42
  29. package/src/cli/commands/uninstall-mcp.ts +41 -41
  30. package/src/cli/commands/update.ts +121 -121
  31. package/src/cli/diagnose.ts +4 -4
  32. package/src/cli/health-check.ts +4 -4
  33. package/src/cli/migrate-chroma.ts +106 -106
  34. package/src/cli/setup.ts +4 -4
  35. package/src/cli/ui/animations.ts +80 -80
  36. package/src/cli/ui/components.ts +82 -82
  37. package/src/cli/ui/index.ts +4 -4
  38. package/src/cli/ui/logo.ts +36 -36
  39. package/src/cli/ui/theme.ts +55 -55
  40. package/src/config/defaults.ts +50 -50
  41. package/src/config/home.ts +55 -55
  42. package/src/config/index.ts +7 -7
  43. package/src/config/loader.ts +166 -166
  44. package/src/config/migration.ts +76 -76
  45. package/src/config/schema.ts +360 -360
  46. package/src/config/validator.ts +184 -184
  47. package/src/config/watcher.ts +86 -86
  48. package/src/context/assembler.ts +398 -398
  49. package/src/context/cache-manager.ts +101 -101
  50. package/src/context/formatter.ts +84 -84
  51. package/src/context/hierarchy.ts +85 -85
  52. package/src/context/index.ts +83 -83
  53. package/src/context/progress-tracker.ts +174 -174
  54. package/src/context/standards-manager.ts +287 -287
  55. package/src/context/types.ts +252 -252
  56. package/src/context/validator.ts +58 -58
  57. package/src/diagnostics/index.ts +123 -123
  58. package/src/health/index.ts +229 -229
  59. package/src/hooks/brain-hook.ts +112 -112
  60. package/src/hooks/capture.ts +168 -168
  61. package/src/hooks/deduplicator.ts +72 -72
  62. package/src/hooks/git-capture.ts +109 -109
  63. package/src/hooks/git-hook-installer.ts +207 -207
  64. package/src/hooks/index.ts +20 -20
  65. package/src/hooks/installer.ts +191 -194
  66. package/src/hooks/passive-classifier.ts +366 -366
  67. package/src/hooks/queue.ts +129 -129
  68. package/src/hooks/session-tracker.ts +275 -275
  69. package/src/hooks/types.ts +47 -47
  70. package/src/index.ts +7 -7
  71. package/src/intelligence/cross-project/affinity.ts +162 -162
  72. package/src/intelligence/cross-project/generalizer.ts +283 -283
  73. package/src/intelligence/cross-project/index.ts +13 -13
  74. package/src/intelligence/cross-project/transfer.ts +201 -201
  75. package/src/intelligence/index.ts +24 -24
  76. package/src/intelligence/optimization/index.ts +10 -10
  77. package/src/intelligence/optimization/precompute.ts +202 -202
  78. package/src/intelligence/optimization/semantic-cache.ts +207 -207
  79. package/src/intelligence/prediction/context-anticipator.ts +198 -198
  80. package/src/intelligence/prediction/decision-predictor.ts +184 -184
  81. package/src/intelligence/prediction/index.ts +13 -13
  82. package/src/intelligence/prediction/recommender.ts +268 -268
  83. package/src/intelligence/reasoning/chain-retrieval.ts +247 -247
  84. package/src/intelligence/reasoning/counterfactual.ts +248 -248
  85. package/src/intelligence/reasoning/index.ts +13 -13
  86. package/src/intelligence/reasoning/synthesizer.ts +169 -169
  87. package/src/intelligence/temporal/evolution.ts +197 -197
  88. package/src/intelligence/temporal/index.ts +16 -16
  89. package/src/intelligence/temporal/query-processor.ts +190 -190
  90. package/src/intelligence/temporal/timeline.ts +259 -259
  91. package/src/intelligence/temporal/trends.ts +263 -263
  92. package/src/knowledge/entity-extractor.ts +416 -416
  93. package/src/knowledge/graph/builder.ts +185 -185
  94. package/src/knowledge/graph/linker.ts +201 -201
  95. package/src/knowledge/graph/memory-graph.ts +359 -359
  96. package/src/knowledge/graph/schema.ts +99 -99
  97. package/src/knowledge/graph/search.ts +168 -168
  98. package/src/knowledge/relationship-extractor.ts +108 -108
  99. package/src/memory/chroma/client.ts +174 -174
  100. package/src/memory/chroma/collection-manager.ts +94 -94
  101. package/src/memory/chroma/config.ts +57 -57
  102. package/src/memory/chroma/embeddings.ts +153 -153
  103. package/src/memory/chroma/index.ts +82 -82
  104. package/src/memory/chroma/migration.ts +270 -270
  105. package/src/memory/chroma/schemas.ts +69 -69
  106. package/src/memory/chroma/search.ts +315 -315
  107. package/src/memory/chroma/store.ts +741 -741
  108. package/src/memory/consolidation/archiver.ts +164 -164
  109. package/src/memory/consolidation/merger.ts +186 -186
  110. package/src/memory/consolidation/scorer.ts +138 -138
  111. package/src/memory/context-builder.ts +236 -236
  112. package/src/memory/database.ts +169 -169
  113. package/src/memory/embedding-utils.ts +156 -156
  114. package/src/memory/embeddings.ts +226 -226
  115. package/src/memory/episodic/detector.ts +108 -108
  116. package/src/memory/episodic/manager.ts +351 -351
  117. package/src/memory/episodic/summarizer.ts +179 -179
  118. package/src/memory/episodic/types.ts +52 -52
  119. package/src/memory/index.ts +582 -582
  120. package/src/memory/knowledge-extractor.ts +455 -455
  121. package/src/memory/learning.ts +378 -378
  122. package/src/memory/patterns.ts +396 -396
  123. package/src/memory/schema.ts +88 -88
  124. package/src/memory/search.ts +309 -309
  125. package/src/memory/store.ts +787 -787
  126. package/src/memory/types.ts +121 -121
  127. package/src/orchestrator/coordinator.ts +272 -272
  128. package/src/orchestrator/decision-logger.ts +228 -228
  129. package/src/orchestrator/event-emitter.ts +198 -198
  130. package/src/orchestrator/event-queue.ts +184 -184
  131. package/src/orchestrator/handlers/base-handler.ts +70 -70
  132. package/src/orchestrator/handlers/context-handler.ts +73 -73
  133. package/src/orchestrator/handlers/decision-handler.ts +204 -204
  134. package/src/orchestrator/handlers/index.ts +10 -10
  135. package/src/orchestrator/handlers/status-handler.ts +131 -131
  136. package/src/orchestrator/handlers/task-handler.ts +171 -171
  137. package/src/orchestrator/index.ts +275 -275
  138. package/src/orchestrator/task-parser.ts +284 -284
  139. package/src/orchestrator/types.ts +98 -98
  140. package/src/packs/index.ts +9 -9
  141. package/src/packs/loader.ts +134 -134
  142. package/src/packs/manager.ts +204 -204
  143. package/src/packs/ranker.ts +78 -78
  144. package/src/packs/types.ts +81 -81
  145. package/src/phase12/index.ts +5 -5
  146. package/src/retrieval/bm25/index.ts +300 -300
  147. package/src/retrieval/bm25/tokenizer.ts +184 -184
  148. package/src/retrieval/feedback/adaptive.ts +223 -223
  149. package/src/retrieval/feedback/index.ts +16 -16
  150. package/src/retrieval/feedback/metrics.ts +223 -223
  151. package/src/retrieval/feedback/store.ts +283 -283
  152. package/src/retrieval/fusion/index.ts +194 -194
  153. package/src/retrieval/fusion/rrf.ts +163 -163
  154. package/src/retrieval/index.ts +12 -12
  155. package/src/retrieval/pipeline.ts +375 -375
  156. package/src/retrieval/query/expander.ts +198 -198
  157. package/src/retrieval/query/index.ts +27 -27
  158. package/src/retrieval/query/intent-classifier.ts +236 -236
  159. package/src/retrieval/query/temporal-parser.ts +295 -295
  160. package/src/retrieval/reranker/index.ts +188 -188
  161. package/src/retrieval/reranker/model.ts +95 -95
  162. package/src/retrieval/service.ts +125 -125
  163. package/src/retrieval/types.ts +162 -162
  164. package/src/routing/entity-extractor.ts +428 -428
  165. package/src/routing/intent-classifier.ts +436 -436
  166. package/src/routing/response-filter.ts +258 -254
  167. package/src/routing/router.ts +1322 -1314
  168. package/src/routing/search-engine.ts +475 -475
  169. package/src/routing/types.ts +94 -84
  170. package/src/scripts/health-check.ts +118 -118
  171. package/src/scripts/setup.ts +122 -122
  172. package/src/server/handlers/call-tool.ts +156 -156
  173. package/src/server/handlers/index.ts +9 -9
  174. package/src/server/handlers/list-tools.ts +35 -35
  175. package/src/server/handlers/tools/analyze-decision-evolution.ts +151 -151
  176. package/src/server/handlers/tools/auto-remember.ts +200 -200
  177. package/src/server/handlers/tools/brain.ts +85 -85
  178. package/src/server/handlers/tools/create-project.ts +135 -135
  179. package/src/server/handlers/tools/detect-trends.ts +144 -144
  180. package/src/server/handlers/tools/find-cross-project-patterns.ts +168 -168
  181. package/src/server/handlers/tools/get-activity-log.ts +194 -194
  182. package/src/server/handlers/tools/get-code-standards.ts +124 -124
  183. package/src/server/handlers/tools/get-corrections.ts +154 -154
  184. package/src/server/handlers/tools/get-decision-timeline.ts +172 -172
  185. package/src/server/handlers/tools/get-episode.ts +103 -103
  186. package/src/server/handlers/tools/get-patterns.ts +158 -158
  187. package/src/server/handlers/tools/get-phase12-status.ts +63 -63
  188. package/src/server/handlers/tools/get-project-context.ts +75 -75
  189. package/src/server/handlers/tools/get-recommendations.ts +145 -145
  190. package/src/server/handlers/tools/index.ts +31 -31
  191. package/src/server/handlers/tools/init-project.ts +757 -757
  192. package/src/server/handlers/tools/list-episodes.ts +90 -90
  193. package/src/server/handlers/tools/list-projects.ts +125 -125
  194. package/src/server/handlers/tools/rate-memory.ts +101 -101
  195. package/src/server/handlers/tools/recall-similar.ts +87 -87
  196. package/src/server/handlers/tools/recognize-pattern.ts +126 -126
  197. package/src/server/handlers/tools/record-correction.ts +125 -125
  198. package/src/server/handlers/tools/remember-decision.ts +153 -153
  199. package/src/server/handlers/tools/schemas.ts +253 -253
  200. package/src/server/handlers/tools/search-knowledge-graph.ts +102 -102
  201. package/src/server/handlers/tools/smart-context.ts +146 -146
  202. package/src/server/handlers/tools/update-progress.ts +131 -131
  203. package/src/server/handlers/tools/what-if-analysis.ts +135 -135
  204. package/src/server/http-api.ts +693 -693
  205. package/src/server/index.ts +40 -40
  206. package/src/server/mcp-server.ts +283 -283
  207. package/src/server/providers/index.ts +7 -7
  208. package/src/server/providers/prompts.ts +327 -327
  209. package/src/server/providers/resources.ts +622 -622
  210. package/src/server/services.ts +468 -468
  211. package/src/server/types.ts +39 -39
  212. package/src/server/utils/error-handler.ts +155 -155
  213. package/src/server/utils/index.ts +13 -13
  214. package/src/server/utils/memory-indicator.ts +83 -83
  215. package/src/server/utils/request-context.ts +122 -122
  216. package/src/server/utils/response-formatter.ts +129 -124
  217. package/src/server/utils/validators.ts +210 -210
  218. package/src/setup/index.ts +48 -48
  219. package/src/setup/wizard.ts +461 -461
  220. package/src/tools/index.ts +24 -24
  221. package/src/tools/registry.ts +115 -115
  222. package/src/tools/schemas.test.ts +30 -30
  223. package/src/tools/schemas.ts +617 -617
  224. package/src/tools/types.ts +412 -412
  225. package/src/utils/circuit-breaker.ts +130 -130
  226. package/src/utils/cleanup.ts +34 -34
  227. package/src/utils/error-handler.ts +132 -132
  228. package/src/utils/error-messages.ts +60 -60
  229. package/src/utils/fallback.ts +45 -45
  230. package/src/utils/index.ts +54 -54
  231. package/src/utils/logger-utils.ts +80 -80
  232. package/src/utils/logger.ts +88 -88
  233. package/src/utils/phase12-helper.ts +56 -56
  234. package/src/utils/retry.ts +94 -94
  235. package/src/utils/timing.ts +47 -47
  236. package/src/utils/transaction.ts +63 -63
  237. package/src/vault/frontmatter.ts +264 -264
  238. package/src/vault/index.ts +318 -318
  239. package/src/vault/paths.ts +106 -106
  240. package/src/vault/query.ts +422 -422
  241. package/src/vault/reader.ts +264 -264
  242. package/src/vault/templates.ts +186 -186
  243. package/src/vault/types.ts +73 -73
  244. package/src/vault/watcher.ts +277 -277
  245. package/src/vault/writer.ts +413 -413
  246. package/tsconfig.json +30 -30
@@ -1,188 +1,188 @@
1
- /**
2
- * Cross-Encoder Reranker
3
- * Uses a cross-encoder model to rerank search results for improved relevance
4
- */
5
-
6
- import type { Logger } from 'pino'
7
- import { loadRerankerModel, isModelLoaded, unloadModel } from './model'
8
- import type { HybridSearchResult } from '../types'
9
-
10
- export interface RerankerConfig {
11
- /** Model to use for reranking */
12
- model: string
13
- /** Number of top results to rerank */
14
- topK: number
15
- /** Batch size for inference */
16
- batchSize?: number
17
- }
18
-
19
- export class Reranker {
20
- private logger: Logger
21
- private config: RerankerConfig
22
- private model: any | null = null
23
-
24
- constructor(logger: Logger, config: Partial<RerankerConfig> = {}) {
25
- this.logger = logger.child({ component: 'reranker' })
26
- this.config = {
27
- model: config.model || 'cross-encoder/ms-marco-MiniLM-L-6-v2',
28
- topK: config.topK || 10,
29
- batchSize: config.batchSize || 8
30
- }
31
- }
32
-
33
- /**
34
- * Initialize the reranker (loads model)
35
- */
36
- async initialize(): Promise<void> {
37
- if (this.model) {
38
- return
39
- }
40
-
41
- this.logger.info('Initializing reranker')
42
- const { model } = await loadRerankerModel(this.logger, this.config.model)
43
- this.model = model
44
- this.logger.info('Reranker initialized')
45
- }
46
-
47
- /**
48
- * Rerank search results using cross-encoder
49
- *
50
- * @param query - The search query
51
- * @param results - Results to rerank
52
- * @returns Reranked results with updated scores
53
- */
54
- async rerank(
55
- query: string,
56
- results: HybridSearchResult[]
57
- ): Promise<HybridSearchResult[]> {
58
- if (!this.model) {
59
- await this.initialize()
60
- }
61
-
62
- if (results.length === 0) {
63
- return []
64
- }
65
-
66
- // Only rerank top K results
67
- const toRerank = results.slice(0, this.config.topK)
68
- const remainder = results.slice(this.config.topK)
69
-
70
- this.logger.debug({
71
- query: query.slice(0, 50),
72
- resultsCount: toRerank.length
73
- }, 'Reranking results')
74
-
75
- try {
76
- // Create query-document pairs for cross-encoder
77
- const pairs = toRerank.map(result => ({
78
- text: query,
79
- text_pair: result.content
80
- }))
81
-
82
- // Process in batches
83
- const scores: number[] = []
84
- for (let i = 0; i < pairs.length; i += this.config.batchSize!) {
85
- const batch = pairs.slice(i, i + this.config.batchSize!)
86
-
87
- // Run inference
88
- const batchScores = await Promise.all(
89
- batch.map(async (pair) => {
90
- const output = await this.model(`${pair.text} [SEP] ${pair.text_pair}`)
91
- // Cross-encoder outputs score indicating relevance
92
- // Higher score = more relevant
93
- return this.extractScore(output)
94
- })
95
- )
96
-
97
- scores.push(...batchScores)
98
- }
99
-
100
- // Normalize scores to 0-1 range
101
- const normalizedScores = this.normalizeScores(scores)
102
-
103
- // Update results with reranked scores
104
- const rerankedResults = toRerank.map((result, index) => ({
105
- ...result,
106
- scores: {
107
- ...result.scores,
108
- reranked: normalizedScores[index],
109
- final: normalizedScores[index] // Reranked score becomes final
110
- }
111
- }))
112
-
113
- // Sort by reranked score
114
- rerankedResults.sort((a, b) => b.scores.final - a.scores.final)
115
-
116
- // Append non-reranked results
117
- return [...rerankedResults, ...remainder]
118
-
119
- } catch (error) {
120
- this.logger.error({ error }, 'Reranking failed, returning original order')
121
- return results
122
- }
123
- }
124
-
125
- /**
126
- * Extract score from model output
127
- */
128
- private extractScore(output: any): number {
129
- // Handle different output formats from transformers.js
130
- if (Array.isArray(output) && output.length > 0) {
131
- // Classification output format
132
- if (typeof output[0] === 'object' && 'score' in output[0]) {
133
- return output[0].score
134
- }
135
- // Raw logits format
136
- if (typeof output[0] === 'number') {
137
- return output[0]
138
- }
139
- }
140
- // Single score
141
- if (typeof output === 'number') {
142
- return output
143
- }
144
- // Object with score
145
- if (typeof output === 'object' && 'score' in output) {
146
- return output.score
147
- }
148
-
149
- this.logger.warn({ output }, 'Unexpected reranker output format')
150
- return 0
151
- }
152
-
153
- /**
154
- * Normalize scores to 0-1 range using min-max normalization
155
- */
156
- private normalizeScores(scores: number[]): number[] {
157
- if (scores.length === 0) return []
158
- if (scores.length === 1) return [1.0]
159
-
160
- const min = Math.min(...scores)
161
- const max = Math.max(...scores)
162
- const range = max - min
163
-
164
- if (range === 0) {
165
- return scores.map(() => 0.5)
166
- }
167
-
168
- return scores.map(score => (score - min) / range)
169
- }
170
-
171
- /**
172
- * Check if reranker is ready
173
- */
174
- isReady(): boolean {
175
- return isModelLoaded()
176
- }
177
-
178
- /**
179
- * Cleanup model from memory
180
- */
181
- cleanup(): void {
182
- unloadModel()
183
- this.model = null
184
- this.logger.info('Reranker model unloaded')
185
- }
186
- }
187
-
188
- export { loadRerankerModel, isModelLoaded, unloadModel } from './model'
1
+ /**
2
+ * Cross-Encoder Reranker
3
+ * Uses a cross-encoder model to rerank search results for improved relevance
4
+ */
5
+
6
+ import type { Logger } from 'pino'
7
+ import { loadRerankerModel, isModelLoaded, unloadModel } from './model'
8
+ import type { HybridSearchResult } from '../types'
9
+
10
+ export interface RerankerConfig {
11
+ /** Model to use for reranking */
12
+ model: string
13
+ /** Number of top results to rerank */
14
+ topK: number
15
+ /** Batch size for inference */
16
+ batchSize?: number
17
+ }
18
+
19
+ export class Reranker {
20
+ private logger: Logger
21
+ private config: RerankerConfig
22
+ private model: any | null = null
23
+
24
+ constructor(logger: Logger, config: Partial<RerankerConfig> = {}) {
25
+ this.logger = logger.child({ component: 'reranker' })
26
+ this.config = {
27
+ model: config.model || 'cross-encoder/ms-marco-MiniLM-L-6-v2',
28
+ topK: config.topK || 10,
29
+ batchSize: config.batchSize || 8
30
+ }
31
+ }
32
+
33
+ /**
34
+ * Initialize the reranker (loads model)
35
+ */
36
+ async initialize(): Promise<void> {
37
+ if (this.model) {
38
+ return
39
+ }
40
+
41
+ this.logger.info('Initializing reranker')
42
+ const { model } = await loadRerankerModel(this.logger, this.config.model)
43
+ this.model = model
44
+ this.logger.info('Reranker initialized')
45
+ }
46
+
47
+ /**
48
+ * Rerank search results using cross-encoder
49
+ *
50
+ * @param query - The search query
51
+ * @param results - Results to rerank
52
+ * @returns Reranked results with updated scores
53
+ */
54
+ async rerank(
55
+ query: string,
56
+ results: HybridSearchResult[]
57
+ ): Promise<HybridSearchResult[]> {
58
+ if (!this.model) {
59
+ await this.initialize()
60
+ }
61
+
62
+ if (results.length === 0) {
63
+ return []
64
+ }
65
+
66
+ // Only rerank top K results
67
+ const toRerank = results.slice(0, this.config.topK)
68
+ const remainder = results.slice(this.config.topK)
69
+
70
+ this.logger.debug({
71
+ query: query.slice(0, 50),
72
+ resultsCount: toRerank.length
73
+ }, 'Reranking results')
74
+
75
+ try {
76
+ // Create query-document pairs for cross-encoder
77
+ const pairs = toRerank.map(result => ({
78
+ text: query,
79
+ text_pair: result.content
80
+ }))
81
+
82
+ // Process in batches
83
+ const scores: number[] = []
84
+ for (let i = 0; i < pairs.length; i += this.config.batchSize!) {
85
+ const batch = pairs.slice(i, i + this.config.batchSize!)
86
+
87
+ // Run inference
88
+ const batchScores = await Promise.all(
89
+ batch.map(async (pair) => {
90
+ const output = await this.model(`${pair.text} [SEP] ${pair.text_pair}`)
91
+ // Cross-encoder outputs score indicating relevance
92
+ // Higher score = more relevant
93
+ return this.extractScore(output)
94
+ })
95
+ )
96
+
97
+ scores.push(...batchScores)
98
+ }
99
+
100
+ // Normalize scores to 0-1 range
101
+ const normalizedScores = this.normalizeScores(scores)
102
+
103
+ // Update results with reranked scores
104
+ const rerankedResults = toRerank.map((result, index) => ({
105
+ ...result,
106
+ scores: {
107
+ ...result.scores,
108
+ reranked: normalizedScores[index],
109
+ final: normalizedScores[index] // Reranked score becomes final
110
+ }
111
+ }))
112
+
113
+ // Sort by reranked score
114
+ rerankedResults.sort((a, b) => b.scores.final - a.scores.final)
115
+
116
+ // Append non-reranked results
117
+ return [...rerankedResults, ...remainder]
118
+
119
+ } catch (error) {
120
+ this.logger.error({ error }, 'Reranking failed, returning original order')
121
+ return results
122
+ }
123
+ }
124
+
125
+ /**
126
+ * Extract score from model output
127
+ */
128
+ private extractScore(output: any): number {
129
+ // Handle different output formats from transformers.js
130
+ if (Array.isArray(output) && output.length > 0) {
131
+ // Classification output format
132
+ if (typeof output[0] === 'object' && 'score' in output[0]) {
133
+ return output[0].score
134
+ }
135
+ // Raw logits format
136
+ if (typeof output[0] === 'number') {
137
+ return output[0]
138
+ }
139
+ }
140
+ // Single score
141
+ if (typeof output === 'number') {
142
+ return output
143
+ }
144
+ // Object with score
145
+ if (typeof output === 'object' && 'score' in output) {
146
+ return output.score
147
+ }
148
+
149
+ this.logger.warn({ output }, 'Unexpected reranker output format')
150
+ return 0
151
+ }
152
+
153
+ /**
154
+ * Normalize scores to 0-1 range using min-max normalization
155
+ */
156
+ private normalizeScores(scores: number[]): number[] {
157
+ if (scores.length === 0) return []
158
+ if (scores.length === 1) return [1.0]
159
+
160
+ const min = Math.min(...scores)
161
+ const max = Math.max(...scores)
162
+ const range = max - min
163
+
164
+ if (range === 0) {
165
+ return scores.map(() => 0.5)
166
+ }
167
+
168
+ return scores.map(score => (score - min) / range)
169
+ }
170
+
171
+ /**
172
+ * Check if reranker is ready
173
+ */
174
+ isReady(): boolean {
175
+ return isModelLoaded()
176
+ }
177
+
178
+ /**
179
+ * Cleanup model from memory
180
+ */
181
+ cleanup(): void {
182
+ unloadModel()
183
+ this.model = null
184
+ this.logger.info('Reranker model unloaded')
185
+ }
186
+ }
187
+
188
+ export { loadRerankerModel, isModelLoaded, unloadModel } from './model'
@@ -1,95 +1,95 @@
1
- /**
2
- * Reranker Model Loader
3
- * Handles loading and caching of the cross-encoder model
4
- */
5
-
6
- import type { Logger } from 'pino'
7
-
8
- // Dynamic import for transformers to avoid bundling issues
9
- let pipeline: any
10
- let AutoTokenizer: any
11
-
12
- interface RerankerModel {
13
- tokenizer: any
14
- model: any
15
- }
16
-
17
- let modelInstance: RerankerModel | null = null
18
- let loadingPromise: Promise<RerankerModel> | null = null
19
-
20
- /**
21
- * Load the cross-encoder model
22
- * Uses singleton pattern to avoid loading multiple times
23
- */
24
- export async function loadRerankerModel(
25
- logger: Logger,
26
- modelName: string = 'cross-encoder/ms-marco-MiniLM-L-6-v2'
27
- ): Promise<RerankerModel> {
28
- // Return existing instance if loaded
29
- if (modelInstance) {
30
- return modelInstance
31
- }
32
-
33
- // Wait for in-progress loading
34
- if (loadingPromise) {
35
- return loadingPromise
36
- }
37
-
38
- // Start loading
39
- loadingPromise = (async () => {
40
- logger.info({ modelName }, 'Loading cross-encoder reranker model')
41
-
42
- try {
43
- // Dynamic import to avoid issues if transformers.js not available
44
- const transformers = await import('@xenova/transformers')
45
- pipeline = transformers.pipeline
46
- AutoTokenizer = transformers.AutoTokenizer
47
-
48
- // Load text-classification pipeline for cross-encoder
49
- // Cross-encoders score query-document pairs
50
- const classifier = await pipeline('text-classification', modelName, {
51
- quantized: true // Use quantized model for faster inference
52
- })
53
-
54
- const tokenizer = await AutoTokenizer.from_pretrained(modelName)
55
-
56
- modelInstance = {
57
- tokenizer,
58
- model: classifier
59
- }
60
-
61
- logger.info({ modelName }, 'Cross-encoder model loaded successfully')
62
- return modelInstance
63
-
64
- } catch (error) {
65
- logger.error({ error, modelName }, 'Failed to load cross-encoder model')
66
- loadingPromise = null
67
- throw error
68
- }
69
- })()
70
-
71
- return loadingPromise
72
- }
73
-
74
- /**
75
- * Check if model is loaded
76
- */
77
- export function isModelLoaded(): boolean {
78
- return modelInstance !== null
79
- }
80
-
81
- /**
82
- * Unload model to free memory
83
- */
84
- export function unloadModel(): void {
85
- modelInstance = null
86
- loadingPromise = null
87
- }
88
-
89
- /**
90
- * Get model memory usage estimate
91
- */
92
- export function getModelMemoryEstimate(): number {
93
- // ms-marco-MiniLM-L-6-v2 quantized is roughly 22MB
94
- return isModelLoaded() ? 22 * 1024 * 1024 : 0
95
- }
1
+ /**
2
+ * Reranker Model Loader
3
+ * Handles loading and caching of the cross-encoder model
4
+ */
5
+
6
+ import type { Logger } from 'pino'
7
+
8
+ // Dynamic import for transformers to avoid bundling issues
9
+ let pipeline: any
10
+ let AutoTokenizer: any
11
+
12
+ interface RerankerModel {
13
+ tokenizer: any
14
+ model: any
15
+ }
16
+
17
+ let modelInstance: RerankerModel | null = null
18
+ let loadingPromise: Promise<RerankerModel> | null = null
19
+
20
+ /**
21
+ * Load the cross-encoder model
22
+ * Uses singleton pattern to avoid loading multiple times
23
+ */
24
+ export async function loadRerankerModel(
25
+ logger: Logger,
26
+ modelName: string = 'cross-encoder/ms-marco-MiniLM-L-6-v2'
27
+ ): Promise<RerankerModel> {
28
+ // Return existing instance if loaded
29
+ if (modelInstance) {
30
+ return modelInstance
31
+ }
32
+
33
+ // Wait for in-progress loading
34
+ if (loadingPromise) {
35
+ return loadingPromise
36
+ }
37
+
38
+ // Start loading
39
+ loadingPromise = (async () => {
40
+ logger.info({ modelName }, 'Loading cross-encoder reranker model')
41
+
42
+ try {
43
+ // Dynamic import to avoid issues if transformers.js not available
44
+ const transformers = await import('@xenova/transformers')
45
+ pipeline = transformers.pipeline
46
+ AutoTokenizer = transformers.AutoTokenizer
47
+
48
+ // Load text-classification pipeline for cross-encoder
49
+ // Cross-encoders score query-document pairs
50
+ const classifier = await pipeline('text-classification', modelName, {
51
+ quantized: true // Use quantized model for faster inference
52
+ })
53
+
54
+ const tokenizer = await AutoTokenizer.from_pretrained(modelName)
55
+
56
+ modelInstance = {
57
+ tokenizer,
58
+ model: classifier
59
+ }
60
+
61
+ logger.info({ modelName }, 'Cross-encoder model loaded successfully')
62
+ return modelInstance
63
+
64
+ } catch (error) {
65
+ logger.error({ error, modelName }, 'Failed to load cross-encoder model')
66
+ loadingPromise = null
67
+ throw error
68
+ }
69
+ })()
70
+
71
+ return loadingPromise
72
+ }
73
+
74
+ /**
75
+ * Check if model is loaded
76
+ */
77
+ export function isModelLoaded(): boolean {
78
+ return modelInstance !== null
79
+ }
80
+
81
+ /**
82
+ * Unload model to free memory
83
+ */
84
+ export function unloadModel(): void {
85
+ modelInstance = null
86
+ loadingPromise = null
87
+ }
88
+
89
+ /**
90
+ * Get model memory usage estimate
91
+ */
92
+ export function getModelMemoryEstimate(): number {
93
+ // ms-marco-MiniLM-L-6-v2 quantized is roughly 22MB
94
+ return isModelLoaded() ? 22 * 1024 * 1024 : 0
95
+ }