lynkr 7.2.5 → 8.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (124)
  1. package/README.md +3 -3
  2. package/config/model-tiers.json +89 -0
  3. package/install.sh +6 -1
  4. package/package.json +4 -2
  5. package/scripts/setup.js +0 -1
  6. package/src/agents/executor.js +14 -6
  7. package/src/api/middleware/session.js +15 -2
  8. package/src/api/openai-router.js +162 -37
  9. package/src/api/providers-handler.js +15 -1
  10. package/src/api/router.js +107 -2
  11. package/src/budget/index.js +4 -3
  12. package/src/clients/databricks.js +431 -234
  13. package/src/clients/gpt-utils.js +181 -0
  14. package/src/clients/ollama-utils.js +66 -140
  15. package/src/clients/routing.js +0 -1
  16. package/src/clients/standard-tools.js +99 -3
  17. package/src/config/index.js +133 -35
  18. package/src/context/toon.js +173 -0
  19. package/src/logger/index.js +23 -0
  20. package/src/orchestrator/index.js +688 -213
  21. package/src/routing/agentic-detector.js +320 -0
  22. package/src/routing/complexity-analyzer.js +202 -2
  23. package/src/routing/cost-optimizer.js +305 -0
  24. package/src/routing/index.js +168 -159
  25. package/src/routing/model-tiers.js +365 -0
  26. package/src/server.js +4 -14
  27. package/src/sessions/cleanup.js +3 -3
  28. package/src/sessions/record.js +10 -1
  29. package/src/sessions/store.js +7 -2
  30. package/src/tools/agent-task.js +48 -1
  31. package/src/tools/index.js +19 -2
  32. package/src/tools/lazy-loader.js +7 -0
  33. package/src/tools/tinyfish.js +358 -0
  34. package/src/tools/truncate.js +1 -0
  35. package/.github/FUNDING.yml +0 -15
  36. package/.github/workflows/README.md +0 -215
  37. package/.github/workflows/ci.yml +0 -69
  38. package/.github/workflows/index.yml +0 -62
  39. package/.github/workflows/web-tools-tests.yml +0 -56
  40. package/CITATIONS.bib +0 -6
  41. package/CLAWROUTER_ROUTING_PLAN.md +0 -910
  42. package/DEPLOYMENT.md +0 -1001
  43. package/LYNKR-TUI-PLAN.md +0 -984
  44. package/PERFORMANCE-REPORT.md +0 -866
  45. package/PLAN-per-client-model-routing.md +0 -252
  46. package/ROUTER_COMPARISON.md +0 -173
  47. package/TIER_ROUTING_PLAN.md +0 -771
  48. package/docs/42642f749da6234f41b6b425c3bb07c9.txt +0 -1
  49. package/docs/BingSiteAuth.xml +0 -4
  50. package/docs/docs-style.css +0 -478
  51. package/docs/docs.html +0 -197
  52. package/docs/google5be250e608e6da39.html +0 -1
  53. package/docs/index.html +0 -577
  54. package/docs/index.md +0 -577
  55. package/docs/robots.txt +0 -4
  56. package/docs/sitemap.xml +0 -44
  57. package/docs/style.css +0 -1223
  58. package/documentation/README.md +0 -100
  59. package/documentation/api.md +0 -806
  60. package/documentation/claude-code-cli.md +0 -672
  61. package/documentation/codex-cli.md +0 -397
  62. package/documentation/contributing.md +0 -571
  63. package/documentation/cursor-integration.md +0 -731
  64. package/documentation/docker.md +0 -867
  65. package/documentation/embeddings.md +0 -760
  66. package/documentation/faq.md +0 -659
  67. package/documentation/features.md +0 -396
  68. package/documentation/headroom.md +0 -519
  69. package/documentation/installation.md +0 -706
  70. package/documentation/memory-system.md +0 -476
  71. package/documentation/production.md +0 -601
  72. package/documentation/providers.md +0 -906
  73. package/documentation/testing.md +0 -629
  74. package/documentation/token-optimization.md +0 -323
  75. package/documentation/tools.md +0 -697
  76. package/documentation/troubleshooting.md +0 -893
  77. package/final-test.js +0 -33
  78. package/headroom-sidecar/config.py +0 -93
  79. package/headroom-sidecar/requirements.txt +0 -14
  80. package/headroom-sidecar/server.py +0 -451
  81. package/monitor-agents.sh +0 -31
  82. package/scripts/audit-log-reader.js +0 -399
  83. package/scripts/compact-dictionary.js +0 -204
  84. package/scripts/test-deduplication.js +0 -448
  85. package/src/db/database.sqlite +0 -0
  86. package/test/README.md +0 -212
  87. package/test/azure-openai-config.test.js +0 -204
  88. package/test/azure-openai-error-resilience.test.js +0 -238
  89. package/test/azure-openai-format-conversion.test.js +0 -354
  90. package/test/azure-openai-integration.test.js +0 -281
  91. package/test/azure-openai-routing.test.js +0 -177
  92. package/test/azure-openai-streaming.test.js +0 -171
  93. package/test/bedrock-integration.test.js +0 -471
  94. package/test/comprehensive-test-suite.js +0 -928
  95. package/test/config-validation.test.js +0 -207
  96. package/test/cursor-integration.test.js +0 -484
  97. package/test/format-conversion.test.js +0 -578
  98. package/test/hybrid-routing-integration.test.js +0 -254
  99. package/test/hybrid-routing-performance.test.js +0 -418
  100. package/test/llamacpp-integration.test.js +0 -863
  101. package/test/lmstudio-integration.test.js +0 -335
  102. package/test/memory/extractor.test.js +0 -398
  103. package/test/memory/retriever.test.js +0 -613
  104. package/test/memory/retriever.test.js.bak +0 -585
  105. package/test/memory/search.test.js +0 -537
  106. package/test/memory/search.test.js.bak +0 -389
  107. package/test/memory/store.test.js +0 -344
  108. package/test/memory/store.test.js.bak +0 -312
  109. package/test/memory/surprise.test.js +0 -300
  110. package/test/memory-performance.test.js +0 -472
  111. package/test/openai-integration.test.js +0 -686
  112. package/test/openrouter-error-resilience.test.js +0 -418
  113. package/test/passthrough-mode.test.js +0 -385
  114. package/test/performance-benchmark.js +0 -351
  115. package/test/performance-tests.js +0 -528
  116. package/test/routing.test.js +0 -219
  117. package/test/web-tools.test.js +0 -329
  118. package/test-agents-simple.js +0 -43
  119. package/test-cli-connection.sh +0 -33
  120. package/test-learning-unit.js +0 -126
  121. package/test-learning.js +0 -112
  122. package/test-parallel-agents.sh +0 -124
  123. package/test-parallel-direct.js +0 -155
  124. package/test-subagents.sh +0 -117
@@ -0,0 +1,305 @@
1
+ /**
2
+ * Cost Optimizer Module
3
+ * Tracks and optimizes LLM costs across providers
4
+ * Uses ModelRegistry for dynamic pricing data
5
+ */
6
+
7
+ const logger = require('../logger');
8
+ const config = require('../config');
9
+ const { getModelRegistry, getModelRegistrySync } = require('./model-registry');
10
+ const { getModelTierSelector, TIER_DEFINITIONS } = require('./model-tiers');
11
+
12
+ // Per-session cost accumulators, kept in memory only: written by recordCost(), removed by clearSession()/resetStats()
13
+ const sessionCosts = new Map(); // sessionId -> { total, requests, byModel, byProvider, byTier }
14
+
15
+ // Running totals across all sessions; shared by every CostOptimizer instance and zeroed by resetStats()
16
+ const globalStats = {
17
+ totalCost: 0,
18
+ totalSavings: 0,
19
+ requestCount: 0,
20
+ byProvider: {},
21
+ byTier: {},
22
+ };
23
+
24
/**
 * Estimates and records LLM spend, and picks the cheapest model for a tier.
 *
 * Prices come from the model registry (`getCost(model)`); preferred models
 * come from the tier selector (`getPreferredModels(tier, provider)`). Both are
 * resolved lazily, so the class also works without calling `initialize()`.
 *
 * Cost totals are kept in the module-level `sessionCosts` map and
 * `globalStats` object, so every instance reads and writes the same numbers.
 */
class CostOptimizer {
  constructor() {
    this.registry = null;
    this.tierSelector = null;
  }

  /**
   * Resolve the registry through the async loader and cache it together with
   * the tier selector.
   * @returns {Promise<void>}
   */
  async initialize() {
    this.registry = await getModelRegistry();
    this.tierSelector = getModelTierSelector();
  }

  /**
   * Return the cached registry, falling back to the synchronous loader when
   * `initialize()` has not run yet.
   */
  _getRegistry() {
    if (!this.registry) {
      this.registry = getModelRegistrySync();
    }
    return this.registry;
  }

  /**
   * Return the cached tier selector, creating it on first use.
   */
  _getTierSelector() {
    if (!this.tierSelector) {
      this.tierSelector = getModelTierSelector();
    }
    return this.tierSelector;
  }

  /**
   * Estimate cost for a request before sending.
   * @param {string} model - Model name
   * @param {number} inputTokens - Estimated input tokens
   * @param {number|null} [outputTokens] - Expected output tokens; when omitted
   *   (null/undefined) half the input is assumed, capped at 4096
   * @returns {Object} Cost estimate (costs rounded to 6 decimal places)
   */
  estimateCost(model, inputTokens, outputTokens = null) {
    const costs = this._getRegistry().getCost(model);
    const roundToMicros = (amount) => Math.round(amount * 1_000_000) / 1_000_000;

    // `??` rather than `||`: an explicit 0 means "no output expected" and must
    // not be replaced by the heuristic.
    const estimatedOutputTokens = outputTokens ?? Math.min(inputTokens * 0.5, 4096);

    const inputCost = (inputTokens / 1_000_000) * costs.input;
    const outputCost = (estimatedOutputTokens / 1_000_000) * costs.output;

    return {
      inputCost: roundToMicros(inputCost),
      outputCost: roundToMicros(outputCost),
      totalEstimate: roundToMicros(inputCost + outputCost),
      model,
      inputTokens,
      outputTokens: estimatedOutputTokens,
      pricePerMillion: {
        input: costs.input,
        output: costs.output,
      },
      source: costs.source,
    };
  }

  /**
   * Find the cheapest model capable of handling a complexity tier.
   *
   * Every tier at or above `requiredTier` is considered, so a model listed
   * under a higher tier can win when it is cheaper.
   * @param {string} requiredTier - Minimum tier (SIMPLE, MEDIUM, COMPLEX, REASONING)
   * @param {string[]} availableProviders - Providers to consider
   * @returns {Object|null} Cheapest candidate, or null when the tier is
   *   unknown or no provider offers a model
   */
  findCheapestForTier(requiredTier, availableProviders) {
    const registry = this._getRegistry();
    const tierSelector = this._getTierSelector();

    const tierOrder = ['SIMPLE', 'MEDIUM', 'COMPLEX', 'REASONING'];
    const minTierIndex = tierOrder.indexOf(requiredTier);

    if (minTierIndex === -1) {
      logger.warn({ tier: requiredTier }, '[CostOptimizer] Unknown tier');
      return null;
    }

    // A missing provider list means "nothing to choose from", not a crash.
    const providers = availableProviders ?? [];
    const candidates = [];

    // Collect models from all capable tiers (>= required tier)
    for (let i = minTierIndex; i < tierOrder.length; i++) {
      const tier = tierOrder[i];

      for (const provider of providers) {
        // Tolerate a selector that returns nothing for an unknown provider.
        const models = tierSelector.getPreferredModels(tier, provider) ?? [];

        for (const model of models) {
          const cost = registry.getCost(model);

          candidates.push({
            model,
            provider,
            tier,
            inputCost: cost.input,
            outputCost: cost.output,
            totalCost: cost.input + cost.output, // Simple cost metric
            context: cost.context,
            source: cost.source,
          });
        }
      }
    }

    if (candidates.length === 0) {
      return null;
    }

    // Sort by total cost (input + output per 1M tokens); the sort is stable,
    // so ties keep discovery order (lowest tier, then provider order).
    candidates.sort((a, b) => a.totalCost - b.totalCost);

    const cheapest = candidates[0];

    logger.debug({
      requiredTier,
      selectedModel: cheapest.model,
      selectedProvider: cheapest.provider,
      cost: cheapest.totalCost,
      candidateCount: candidates.length,
    }, '[CostOptimizer] Found cheapest model');

    return cheapest;
  }

  /**
   * Record actual cost after a response.
   * @param {string} sessionId - Session identifier; falsy skips per-session tracking
   * @param {string} provider - Provider used
   * @param {string} model - Model used
   * @param {number} inputTokens - Actual input tokens
   * @param {number} outputTokens - Actual output tokens
   * @param {string} tier - Complexity tier
   * @returns {number} Actual cost
   */
  recordCost(sessionId, provider, model, inputTokens, outputTokens, tier = 'MEDIUM') {
    const costs = this._getRegistry().getCost(model);

    // Missing or malformed usage counts as 0 tokens. Otherwise a single NaN
    // would stick in the running totals, since NaN + x stays NaN.
    const toTokenCount = (value) => {
      const count = Number(value);
      return Number.isFinite(count) && count > 0 ? count : 0;
    };

    const inputCost = (toTokenCount(inputTokens) / 1_000_000) * costs.input;
    const outputCost = (toTokenCount(outputTokens) / 1_000_000) * costs.output;
    const actualCost = inputCost + outputCost;

    // Update session costs
    if (sessionId) {
      if (!sessionCosts.has(sessionId)) {
        sessionCosts.set(sessionId, {
          total: 0,
          requests: 0,
          byModel: {},
          byProvider: {},
          byTier: {},
        });
      }

      const session = sessionCosts.get(sessionId);
      session.total += actualCost;
      session.requests++;
      session.byModel[model] = (session.byModel[model] || 0) + actualCost;
      session.byProvider[provider] = (session.byProvider[provider] || 0) + actualCost;
      session.byTier[tier] = (session.byTier[tier] || 0) + actualCost;
    }

    // Update global stats
    globalStats.totalCost += actualCost;
    globalStats.requestCount++;
    globalStats.byProvider[provider] = (globalStats.byProvider[provider] || 0) + actualCost;
    globalStats.byTier[tier] = (globalStats.byTier[tier] || 0) + actualCost;

    logger.debug({
      sessionId,
      provider,
      model,
      inputTokens,
      outputTokens,
      cost: actualCost.toFixed(6),
      tier,
    }, '[CostOptimizer] Recorded cost');

    return actualCost;
  }

  /**
   * Calculate potential savings from routing optimization.
   *
   * The same `tokens` figure is priced at each model's combined input+output
   * rate. Positive savings are also added to the global savings total.
   * @param {string} originalModel - Model that would have been used
   * @param {string} optimizedModel - Model actually selected
   * @param {number} tokens - Token count to price
   * @returns {{originalCost: number, optimizedCost: number, savings: number, percentSaved: number}}
   *   `savings` and `percentSaved` are both 0 when the optimized model is not cheaper
   */
  calculateSavings(originalModel, optimizedModel, tokens) {
    const registry = this._getRegistry();

    const originalCost = registry.getCost(originalModel);
    const optimizedCost = registry.getCost(optimizedModel);

    const originalTotal = (tokens / 1_000_000) * (originalCost.input + originalCost.output);
    const optimizedTotal = (tokens / 1_000_000) * (optimizedCost.input + optimizedCost.output);

    // Clamp once so the amount and the percentage always agree.
    const savings = Math.max(0, originalTotal - optimizedTotal);

    if (savings > 0) {
      globalStats.totalSavings += savings;
    }

    return {
      originalCost: originalTotal,
      optimizedCost: optimizedTotal,
      savings,
      percentSaved: originalTotal > 0 ? (savings / originalTotal) * 100 : 0,
    };
  }

  /**
   * Get session cost summary.
   * @param {string} sessionId - Session identifier
   * @returns {Object} The stored (live) record for the session, or a fresh
   *   zeroed record when nothing has been recorded for it
   */
  getSessionCost(sessionId) {
    return sessionCosts.get(sessionId) || {
      total: 0,
      requests: 0,
      byModel: {},
      byProvider: {},
      byTier: {},
    };
  }

  /**
   * Get global stats.
   * @returns {Object} Copy of the global totals plus the session count, the
   *   average cost per request (string, 6 decimals) and dollar-formatted
   *   totals (4 decimals)
   */
  getStats() {
    return {
      ...globalStats,
      sessionCount: sessionCosts.size,
      avgCostPerRequest: globalStats.requestCount > 0
        ? (globalStats.totalCost / globalStats.requestCount).toFixed(6)
        : '0',
      totalCostFormatted: `$${globalStats.totalCost.toFixed(4)}`,
      totalSavingsFormatted: `$${globalStats.totalSavings.toFixed(4)}`,
    };
  }

  /**
   * Clear session data (for cleanup). Global totals are left untouched.
   * @param {string} sessionId - Session identifier
   */
  clearSession(sessionId) {
    sessionCosts.delete(sessionId);
  }

  /**
   * Reset all stats (for testing): drops every session record and zeroes the
   * global totals.
   */
  resetStats() {
    sessionCosts.clear();
    globalStats.totalCost = 0;
    globalStats.totalSavings = 0;
    globalStats.requestCount = 0;
    globalStats.byProvider = {};
    globalStats.byTier = {};
  }
}
284
+
285
// Shared CostOptimizer, created on the first getCostOptimizer() call.
let instance = null;

/**
 * Return the shared CostOptimizer, constructing it on first use.
 *
 * No registry is preloaded here; the instance resolves one lazily when a
 * method first needs pricing data.
 * @returns {CostOptimizer} The shared instance
 */
function getCostOptimizer() {
  if (instance) {
    return instance;
  }

  instance = new CostOptimizer();
  return instance;
}
294
+
295
/**
 * Return the shared CostOptimizer once its `initialize()` has completed.
 *
 * `initialize()` is awaited on every call, not only the first one.
 * @returns {Promise<CostOptimizer>} The shared, initialized instance
 */
async function getCostOptimizerAsync() {
  const shared = getCostOptimizer();

  await shared.initialize();

  return shared;
}
300
+
301
+ module.exports = {
302
+ CostOptimizer, // the class; every instance shares the module-level sessionCosts/globalStats
303
+ getCostOptimizer, // lazily created shared instance, without awaiting initialize()
304
+ getCostOptimizerAsync, // same shared instance, returned after awaiting initialize()
305
+ };