adaptive-memory-multi-model-router 1.2.2 → 1.3.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (195) hide show
  1. package/LICENSE +21 -0
  2. package/README.md +146 -66
  3. package/dist/index.d.ts +1 -1
  4. package/dist/index.js +1 -1
  5. package/dist/integrations/airtable.js +20 -0
  6. package/dist/integrations/discord.js +18 -0
  7. package/dist/integrations/github.js +23 -0
  8. package/dist/integrations/gmail.js +19 -0
  9. package/dist/integrations/google-calendar.js +18 -0
  10. package/dist/integrations/index.js +61 -0
  11. package/dist/integrations/jira.js +21 -0
  12. package/dist/integrations/linear.js +19 -0
  13. package/dist/integrations/notion.js +19 -0
  14. package/dist/integrations/slack.js +18 -0
  15. package/dist/integrations/telegram.js +19 -0
  16. package/dist/providers/registry.js +7 -3
  17. package/docs/ARCHITECTURAL-IMPROVEMENTS-2025.md +1391 -0
  18. package/docs/ARCHITECTURAL-IMPROVEMENTS-REVISED-2025.md +1051 -0
  19. package/docs/CONFIGURATION.md +476 -0
  20. package/docs/COUNCIL_DECISION.json +308 -0
  21. package/docs/COUNCIL_SUMMARY.md +265 -0
  22. package/docs/COUNCIL_V2.2_DECISION.md +416 -0
  23. package/docs/IMPROVEMENT_ROADMAP.md +515 -0
  24. package/docs/LLM_COUNCIL_DECISION.md +508 -0
  25. package/docs/QUICK_START_VISIBILITY.md +782 -0
  26. package/docs/REDDIT_GAP_ANALYSIS.md +299 -0
  27. package/docs/RESEARCH_BACKED_IMPROVEMENTS.md +1180 -0
  28. package/docs/TMLPD_QNA.md +751 -0
  29. package/docs/TMLPD_V2.1_COMPLETE.md +763 -0
  30. package/docs/TMLPD_V2.2_RESEARCH_ROADMAP.md +754 -0
  31. package/docs/V2.2_IMPLEMENTATION_COMPLETE.md +446 -0
  32. package/docs/V2_IMPLEMENTATION_GUIDE.md +388 -0
  33. package/docs/VISIBILITY_ADOPTION_PLAN.md +1005 -0
  34. package/docs/launch-content/LAUNCH_EXECUTION_CHECKLIST.md +421 -0
  35. package/docs/launch-content/README.md +457 -0
  36. package/docs/launch-content/assets/cost_comparison_100_tasks.png +0 -0
  37. package/docs/launch-content/assets/cumulative_savings.png +0 -0
  38. package/docs/launch-content/assets/parallel_speedup.png +0 -0
  39. package/docs/launch-content/assets/provider_pricing_comparison.png +0 -0
  40. package/docs/launch-content/assets/task_breakdown_comparison.png +0 -0
  41. package/docs/launch-content/generate_charts.py +313 -0
  42. package/docs/launch-content/hn_show_post.md +139 -0
  43. package/docs/launch-content/partner_outreach_templates.md +745 -0
  44. package/docs/launch-content/reddit_posts.md +467 -0
  45. package/docs/launch-content/twitter_thread.txt +460 -0
  46. package/examples/QUICKSTART.md +1 -1
  47. package/openclaw-alexa-bridge/ALL_REMAINING_FIXES_PLAN.md +313 -0
  48. package/openclaw-alexa-bridge/REMAINING_FIXES_SUMMARY.md +277 -0
  49. package/openclaw-alexa-bridge/src/alexa_handler_no_tmlpd.js +1234 -0
  50. package/openclaw-alexa-bridge/test_fixes.js +77 -0
  51. package/package.json +120 -29
  52. package/package.json.tmp +0 -0
  53. package/qna/TMLPD_QNA.md +3 -3
  54. package/skill/SKILL.md +2 -2
  55. package/src/__tests__/integration/tmpld_integration.test.py +540 -0
  56. package/src/agents/skill_enhanced_agent.py +318 -0
  57. package/src/memory/__init__.py +15 -0
  58. package/src/memory/agentic_memory.py +353 -0
  59. package/src/memory/semantic_memory.py +444 -0
  60. package/src/memory/simple_memory.py +466 -0
  61. package/src/memory/working_memory.py +447 -0
  62. package/src/orchestration/__init__.py +52 -0
  63. package/src/orchestration/execution_engine.py +353 -0
  64. package/src/orchestration/halo_orchestrator.py +367 -0
  65. package/src/orchestration/mcts_workflow.py +498 -0
  66. package/src/orchestration/role_assigner.py +473 -0
  67. package/src/orchestration/task_planner.py +522 -0
  68. package/src/providers/__init__.py +67 -0
  69. package/src/providers/anthropic.py +304 -0
  70. package/src/providers/base.py +241 -0
  71. package/src/providers/cerebras.py +373 -0
  72. package/src/providers/registry.py +476 -0
  73. package/src/routing/__init__.py +30 -0
  74. package/src/routing/universal_router.py +621 -0
  75. package/src/skills/TMLPD-QUICKREF.md +210 -0
  76. package/src/skills/TMLPD-SETUP-SUMMARY.md +157 -0
  77. package/src/skills/TMLPD.md +540 -0
  78. package/src/skills/__tests__/skill_manager.test.ts +328 -0
  79. package/src/skills/skill_manager.py +385 -0
  80. package/src/skills/test-tmlpd.sh +108 -0
  81. package/src/skills/tmlpd-category.yaml +67 -0
  82. package/src/skills/tmlpd-monitoring.yaml +188 -0
  83. package/src/skills/tmlpd-phase.yaml +132 -0
  84. package/src/state/__init__.py +17 -0
  85. package/src/state/simple_checkpoint.py +508 -0
  86. package/src/tmlpd_agent.py +464 -0
  87. package/src/tmpld_v2.py +427 -0
  88. package/src/workflows/__init__.py +18 -0
  89. package/src/workflows/advanced_difficulty_classifier.py +377 -0
  90. package/src/workflows/chaining_executor.py +417 -0
  91. package/src/workflows/difficulty_integration.py +209 -0
  92. package/src/workflows/orchestrator.py +469 -0
  93. package/src/workflows/orchestrator_executor.py +456 -0
  94. package/src/workflows/parallelization_executor.py +382 -0
  95. package/src/workflows/router.py +311 -0
  96. package/test_integration_simple.py +86 -0
  97. package/test_mcts_workflow.py +150 -0
  98. package/test_templd_integration.py +262 -0
  99. package/test_universal_router.py +275 -0
  100. package/tmlpd-pi-extension/README.md +36 -0
  101. package/tmlpd-pi-extension/dist/cache/prefixCache.d.ts +114 -0
  102. package/tmlpd-pi-extension/dist/cache/prefixCache.d.ts.map +1 -0
  103. package/tmlpd-pi-extension/dist/cache/prefixCache.js +285 -0
  104. package/tmlpd-pi-extension/dist/cache/prefixCache.js.map +1 -0
  105. package/tmlpd-pi-extension/dist/cache/responseCache.d.ts +58 -0
  106. package/tmlpd-pi-extension/dist/cache/responseCache.d.ts.map +1 -0
  107. package/tmlpd-pi-extension/dist/cache/responseCache.js +153 -0
  108. package/tmlpd-pi-extension/dist/cache/responseCache.js.map +1 -0
  109. package/tmlpd-pi-extension/dist/cli.js +59 -0
  110. package/tmlpd-pi-extension/dist/cost/costTracker.d.ts +95 -0
  111. package/tmlpd-pi-extension/dist/cost/costTracker.d.ts.map +1 -0
  112. package/tmlpd-pi-extension/dist/cost/costTracker.js +240 -0
  113. package/tmlpd-pi-extension/dist/cost/costTracker.js.map +1 -0
  114. package/tmlpd-pi-extension/dist/index.d.ts +723 -0
  115. package/tmlpd-pi-extension/dist/index.d.ts.map +1 -0
  116. package/tmlpd-pi-extension/dist/index.js +239 -0
  117. package/tmlpd-pi-extension/dist/index.js.map +1 -0
  118. package/tmlpd-pi-extension/dist/memory/episodicMemory.d.ts +82 -0
  119. package/tmlpd-pi-extension/dist/memory/episodicMemory.d.ts.map +1 -0
  120. package/tmlpd-pi-extension/dist/memory/episodicMemory.js +145 -0
  121. package/tmlpd-pi-extension/dist/memory/episodicMemory.js.map +1 -0
  122. package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.d.ts +102 -0
  123. package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.d.ts.map +1 -0
  124. package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.js +207 -0
  125. package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.js.map +1 -0
  126. package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.d.ts +85 -0
  127. package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.d.ts.map +1 -0
  128. package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.js +210 -0
  129. package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.js.map +1 -0
  130. package/tmlpd-pi-extension/dist/providers/localProvider.d.ts +102 -0
  131. package/tmlpd-pi-extension/dist/providers/localProvider.d.ts.map +1 -0
  132. package/tmlpd-pi-extension/dist/providers/localProvider.js +338 -0
  133. package/tmlpd-pi-extension/dist/providers/localProvider.js.map +1 -0
  134. package/tmlpd-pi-extension/dist/providers/registry.d.ts +55 -0
  135. package/tmlpd-pi-extension/dist/providers/registry.d.ts.map +1 -0
  136. package/tmlpd-pi-extension/dist/providers/registry.js +138 -0
  137. package/tmlpd-pi-extension/dist/providers/registry.js.map +1 -0
  138. package/tmlpd-pi-extension/dist/routing/advancedRouter.d.ts +68 -0
  139. package/tmlpd-pi-extension/dist/routing/advancedRouter.d.ts.map +1 -0
  140. package/tmlpd-pi-extension/dist/routing/advancedRouter.js +332 -0
  141. package/tmlpd-pi-extension/dist/routing/advancedRouter.js.map +1 -0
  142. package/tmlpd-pi-extension/dist/tools/tmlpdTools.d.ts +101 -0
  143. package/tmlpd-pi-extension/dist/tools/tmlpdTools.d.ts.map +1 -0
  144. package/tmlpd-pi-extension/dist/tools/tmlpdTools.js +368 -0
  145. package/tmlpd-pi-extension/dist/tools/tmlpdTools.js.map +1 -0
  146. package/tmlpd-pi-extension/dist/utils/batchProcessor.d.ts +96 -0
  147. package/tmlpd-pi-extension/dist/utils/batchProcessor.d.ts.map +1 -0
  148. package/tmlpd-pi-extension/dist/utils/batchProcessor.js +170 -0
  149. package/tmlpd-pi-extension/dist/utils/batchProcessor.js.map +1 -0
  150. package/tmlpd-pi-extension/dist/utils/compression.d.ts +61 -0
  151. package/tmlpd-pi-extension/dist/utils/compression.d.ts.map +1 -0
  152. package/tmlpd-pi-extension/dist/utils/compression.js +281 -0
  153. package/tmlpd-pi-extension/dist/utils/compression.js.map +1 -0
  154. package/tmlpd-pi-extension/dist/utils/reliability.d.ts +74 -0
  155. package/tmlpd-pi-extension/dist/utils/reliability.d.ts.map +1 -0
  156. package/tmlpd-pi-extension/dist/utils/reliability.js +177 -0
  157. package/tmlpd-pi-extension/dist/utils/reliability.js.map +1 -0
  158. package/tmlpd-pi-extension/dist/utils/speculativeDecoding.d.ts +117 -0
  159. package/tmlpd-pi-extension/dist/utils/speculativeDecoding.d.ts.map +1 -0
  160. package/tmlpd-pi-extension/dist/utils/speculativeDecoding.js +246 -0
  161. package/tmlpd-pi-extension/dist/utils/speculativeDecoding.js.map +1 -0
  162. package/tmlpd-pi-extension/dist/utils/tokenUtils.d.ts +50 -0
  163. package/tmlpd-pi-extension/dist/utils/tokenUtils.d.ts.map +1 -0
  164. package/tmlpd-pi-extension/dist/utils/tokenUtils.js +124 -0
  165. package/tmlpd-pi-extension/dist/utils/tokenUtils.js.map +1 -0
  166. package/tmlpd-pi-extension/examples/QUICKSTART.md +183 -0
  167. package/tmlpd-pi-extension/package-lock.json +75 -0
  168. package/tmlpd-pi-extension/package.json +172 -0
  169. package/tmlpd-pi-extension/python/examples.py +53 -0
  170. package/tmlpd-pi-extension/python/integrations.py +330 -0
  171. package/tmlpd-pi-extension/python/setup.py +28 -0
  172. package/tmlpd-pi-extension/python/tmlpd.py +369 -0
  173. package/tmlpd-pi-extension/qna/REDDIT_GAP_ANALYSIS.md +299 -0
  174. package/tmlpd-pi-extension/qna/TMLPD_QNA.md +751 -0
  175. package/tmlpd-pi-extension/skill/SKILL.md +238 -0
  176. package/{src → tmlpd-pi-extension/src}/index.ts +1 -1
  177. package/tmlpd-pi-extension/tsconfig.json +18 -0
  178. package/demo/research-demo.js +0 -266
  179. package/notebooks/quickstart.ipynb +0 -157
  180. package/rust/tmlpd.h +0 -268
  181. package/src/cache/prefixCache.ts +0 -365
  182. package/src/routing/advancedRouter.ts +0 -406
  183. package/src/utils/speculativeDecoding.ts +0 -344
  184. /package/{src → tmlpd-pi-extension/src}/cache/responseCache.ts +0 -0
  185. /package/{src → tmlpd-pi-extension/src}/cost/costTracker.ts +0 -0
  186. /package/{src → tmlpd-pi-extension/src}/memory/episodicMemory.ts +0 -0
  187. /package/{src → tmlpd-pi-extension/src}/orchestration/haloOrchestrator.ts +0 -0
  188. /package/{src → tmlpd-pi-extension/src}/orchestration/mctsWorkflow.ts +0 -0
  189. /package/{src → tmlpd-pi-extension/src}/providers/localProvider.ts +0 -0
  190. /package/{src → tmlpd-pi-extension/src}/providers/registry.ts +0 -0
  191. /package/{src → tmlpd-pi-extension/src}/tools/tmlpdTools.ts +0 -0
  192. /package/{src → tmlpd-pi-extension/src}/utils/batchProcessor.ts +0 -0
  193. /package/{src → tmlpd-pi-extension/src}/utils/compression.ts +0 -0
  194. /package/{src → tmlpd-pi-extension/src}/utils/reliability.ts +0 -0
  195. /package/{src → tmlpd-pi-extension/src}/utils/tokenUtils.ts +0 -0
@@ -0,0 +1,332 @@
1
+ "use strict";
2
+ /**
3
+ * TMLPD Advanced Routing - RouteLLM Style
4
+ *
5
+ * Learned routing based on arXiv:2404.06035 (RouteLLM)
6
+ * Balances cost-quality tradeoff with confidence-based model selection
7
+ */
8
+ Object.defineProperty(exports, "__esModule", { value: true });
9
+ exports.MODEL_PROFILES = void 0;
10
+ exports.extractQueryFeatures = extractQueryFeatures;
11
+ exports.routeQuery = routeQuery;
12
+ exports.routeBatch = routeBatch;
13
+ exports.recommendForTask = recommendForTask;
14
+ exports.updateModelProfile = updateModelProfile;
15
+ const tokenUtils_1 = require("../utils/tokenUtils");
16
+ // Pre-configured model profiles
17
+ exports.MODEL_PROFILES = {
18
+ "openai/gpt-4o": {
19
+ name: "openai/gpt-4o",
20
+ provider: "openai",
21
+ cost_per_1k_input: 2.50,
22
+ cost_per_1k_output: 10.00,
23
+ latency_ms: 2000,
24
+ quality_score: 0.95,
25
+ strengths: ["reasoning", "coding", "analysis"],
26
+ context_window: 128000
27
+ },
28
+ "openai/gpt-4o-mini": {
29
+ name: "openai/gpt-4o-mini",
30
+ provider: "openai",
31
+ cost_per_1k_input: 0.15,
32
+ cost_per_1k_output: 0.60,
33
+ latency_ms: 500,
34
+ quality_score: 0.85,
35
+ strengths: ["fast", "coding"],
36
+ context_window: 128000
37
+ },
38
+ "anthropic/claude-3.5-sonnet": {
39
+ name: "anthropic/claude-3.5-sonnet",
40
+ provider: "anthropic",
41
+ cost_per_1k_input: 3.00,
42
+ cost_per_1k_output: 15.00,
43
+ latency_ms: 2500,
44
+ quality_score: 0.96,
45
+ strengths: ["reasoning", "creative", "analysis"],
46
+ context_window: 200000
47
+ },
48
+ "anthropic/claude-3-haiku": {
49
+ name: "anthropic/claude-3-haiku",
50
+ provider: "anthropic",
51
+ cost_per_1k_input: 0.25,
52
+ cost_per_1k_output: 1.25,
53
+ latency_ms: 500,
54
+ quality_score: 0.80,
55
+ strengths: ["fast", "simple"],
56
+ context_window: 200000
57
+ },
58
+ "google/gemini-2.0-flash": {
59
+ name: "google/gemini-2.0-flash",
60
+ provider: "google",
61
+ cost_per_1k_input: 0.00, // Free
62
+ cost_per_1k_output: 0.00,
63
+ latency_ms: 800,
64
+ quality_score: 0.88,
65
+ strengths: ["fast", "multilingual"],
66
+ context_window: 1000000
67
+ },
68
+ "google/gemini-1.5-pro": {
69
+ name: "google/gemini-1.5-pro",
70
+ provider: "google",
71
+ cost_per_1k_input: 1.25,
72
+ cost_per_1k_output: 5.00,
73
+ latency_ms: 1500,
74
+ quality_score: 0.92,
75
+ strengths: ["reasoning", "long-context"],
76
+ context_window: 2000000
77
+ },
78
+ "groq/llama-3.3-70b": {
79
+ name: "groq/llama-3.3-70b",
80
+ provider: "groq",
81
+ cost_per_1k_input: 0.59,
82
+ cost_per_1k_output: 0.79,
83
+ latency_ms: 400,
84
+ quality_score: 0.82,
85
+ strengths: ["fast", "coding"],
86
+ context_window: 128000
87
+ },
88
+ "cerebras/llama-3.3-70b": {
89
+ name: "cerebras/llama-3.3-70b",
90
+ provider: "cerebras",
91
+ cost_per_1k_input: 0.60,
92
+ cost_per_1k_output: 0.60,
93
+ latency_ms: 350,
94
+ quality_score: 0.82,
95
+ strengths: ["fast", "budget"],
96
+ context_window: 128000
97
+ },
98
+ "local/llama-3.3-70b": {
99
+ name: "local/llama-3.3-70b",
100
+ provider: "ollama",
101
+ cost_per_1k_input: 0.00,
102
+ cost_per_1k_output: 0.00,
103
+ latency_ms: 100,
104
+ quality_score: 0.75,
105
+ strengths: ["privacy", "free"],
106
+ context_window: 128000
107
+ }
108
+ };
109
/**
 * Extract the features of a prompt that drive the routing decision.
 *
 * Keyword lists are matched as plain substrings of the lower-cased prompt;
 * script detection runs regexes against the prompt as given.
 * NOTE: substring matching is deliberately coarse - e.g. "=" or the "sin"
 * inside "using" is enough to set has_math.
 *
 * @param {string} prompt - Prompt text; null/undefined is treated as "".
 * @returns {{complexity: number, length: number, has_code: boolean,
 *            has_math: boolean, is_multilingual: boolean,
 *            is_creative: boolean, requires_reasoning: boolean}}
 *          `length` is the value returned by countTokens(prompt, "gpt-4o");
 *          `complexity` starts at 0.3, grows per detected feature and is
 *          capped at 1.0.
 */
function extractQueryFeatures(prompt) {
    // Tolerate a missing/non-string prompt instead of throwing on .toLowerCase()
    const text = typeof prompt === "string" ? prompt : String(prompt ?? "");
    const lower = text.toLowerCase();
    const mentionsAny = (keywords) => keywords.some(keyword => lower.includes(keyword));
    // Code patterns
    const has_code = mentionsAny([
        "function", "class ", "def ", "import ", "const ", "let ",
        "python", "javascript", "typescript", "java", "cpp", "rust",
        "```", "=>", "->", "async", "await"
    ]);
    // Math patterns (expanded for unicode and common notation).
    // The keywords are lower-case, so they must be tested against `lower`;
    // testing the raw prompt missed "Calculate", "SQRT", "Equation", ...
    const has_math = mentionsAny([
        "equation", "formula", "calculate", "sqrt", "^", "log",
        "sin", "cos", "tan", "integral", "derivative", "$", "math",
        "∫", "∂", "∑", "∏", "√", "∞", "π", "θ", "β",
        "dx", "dy", "dz", "=", "solver", "compute"
    ]);
    // Multilingual
    const lang_patterns = [
        /[\u4e00-\u9fff]/, // Chinese
        /[\u3040-\u309f\u30a0-\u30ff]/, // Japanese
        /[\uac00-\ud7af]/, // Korean
        /[а-яА-Я]/, // Russian
        /[áéíóúñ]/ // Spanish accented
    ];
    const is_multilingual = lang_patterns.some(pattern => pattern.test(text));
    // Creative writing
    const is_creative = mentionsAny([
        "write a", "story", "poem", "creative", "imagine",
        "describe", "explain in", "tell me", "narrative"
    ]);
    // Reasoning
    const requires_reasoning = mentionsAny([
        "explain", "why", "because", "therefore", "thus",
        "analyze", "think", "consider", "reason", "logic"
    ]);
    // Complexity estimation based on length and patterns
    const tokens = (0, tokenUtils_1.countTokens)(text, "gpt-4o");
    let complexity = 0.3;
    if (tokens > 1000)
        complexity += 0.2;
    if (has_code)
        complexity += 0.15;
    if (has_math)
        complexity += 0.2;
    if (requires_reasoning)
        complexity += 0.15;
    if (is_creative)
        complexity += 0.1;
    complexity = Math.min(1.0, complexity);
    return {
        complexity,
        length: tokens,
        has_code,
        has_math,
        is_multilingual,
        is_creative,
        requires_reasoning
    };
}
174
/**
 * Rate how well a model profile suits a set of query features.
 *
 * The score is 40% of the profile's quality_score, plus a fixed bonus for
 * every detected feature the model lists a matching strength for, plus a
 * speed bonus when the query is simple and the model is fast.
 *
 * @param model    Profile with quality_score, strengths and latency_ms.
 * @param features Feature object as produced by extractQueryFeatures.
 * @returns {number} Fit score (higher is better).
 */
function scoreModelFit(model, features) {
    // [feature detected?, strength tag the model must list, bonus]
    const strength_bonuses = [
        [features.has_code, "coding", 0.2],
        [features.requires_reasoning, "reasoning", 0.2],
        [features.is_creative, "creative", 0.15],
        [features.is_multilingual, "multilingual", 0.15],
        [features.has_math, "analysis", 0.15]
    ];
    let fit = model.quality_score * 0.4; // Base quality
    for (const [detected, tag, bonus] of strength_bonuses) {
        if (detected && model.strengths.includes(tag)) {
            fit += bonus;
        }
    }
    // Speed bonus for simple tasks
    const is_simple = features.complexity < 0.4;
    if (is_simple && model.latency_ms < 1000) {
        fit += 0.1;
    }
    return fit;
}
201
/**
 * Cost efficiency score (inverse of normalized cost).
 *
 * The mean of the input and output price is divided by 10 and capped at 1,
 * then inverted. The result is weighted 0.6 for queries with complexity
 * below 0.5 (cost matters most) and 0.2 otherwise (cost matters little).
 *
 * @param model    Profile with cost_per_1k_input and cost_per_1k_output.
 * @param features Feature object carrying `complexity`.
 * @returns {number} Weighted cost-efficiency score.
 */
function costEfficiency(model, features) {
    const mean_cost = (model.cost_per_1k_input + model.cost_per_1k_output) / 2;
    const cheapness = 1 - Math.min(mean_cost / 10, 1);
    const weight = features.complexity < 0.5 ? 0.6 : 0.2;
    return cheapness * weight;
}
213
/**
 * RouteLLM-style routing decision for a single prompt.
 *
 * Every candidate model is scored as a weighted blend of scoreModelFit and
 * costEfficiency (70% fit when complexity > 0.6, otherwise 30% fit). The
 * best-ranked model becomes the primary and the next two become fallbacks.
 *
 * @param {string} prompt - Prompt to route.
 * @param {string[]} [available_models] - Restrict routing to these profile
 *        names; names without a profile are ignored. Defaults to every key
 *        of MODEL_PROFILES.
 * @param {number} [budget_multiplier=1.0] - Factor applied to the returned
 *        estimated_cost.
 * @returns {{primary_model: string, fallback_models: string[],
 *            confidence: number, reasoning: string, estimated_cost: number,
 *            estimated_latency_ms: number}}
 *          `confidence` is 0.5 for a single candidate, otherwise
 *          0.5 + 2 * (ranking gap between first and second), capped at 0.95.
 * @throws {Error} When no requested model has a profile.
 */
function routeQuery(prompt, available_models, budget_multiplier = 1.0) {
    const features = extractQueryFeatures(prompt);
    const candidate_names = available_models || Object.keys(exports.MODEL_PROFILES);
    // High complexity = quality bias
    const complexity_bias = features.complexity > 0.6 ? 0.7 : 0.3;
    const candidates = candidate_names
        // Own-property check so names like "constructor" cannot resolve to
        // something inherited from Object.prototype
        .filter(name => Object.prototype.hasOwnProperty.call(exports.MODEL_PROFILES, name)
        && exports.MODEL_PROFILES[name])
        .map(name => {
        const profile = exports.MODEL_PROFILES[name];
        const quality = scoreModelFit(profile, features);
        const cost = costEfficiency(profile, features);
        return {
            name,
            profile,
            // Computed once; used for both ordering and confidence
            rank_score: quality * complexity_bias + cost * (1 - complexity_bias)
        };
    });
    if (candidates.length === 0) {
        // Previously this fell through to a TypeError on `primary.name`
        throw new Error(`routeQuery: no known model profile among [${candidate_names.join(", ")}]`);
    }
    // Sort by ranking score (quality vs cost tradeoff based on complexity)
    candidates.sort((a, b) => b.rank_score - a.rank_score);
    const primary = candidates[0];
    const secondary = candidates.slice(1, 3);
    // Confidence from the gap in the SAME score that produced the ordering,
    // so it can never be negative (the unweighted total could rank the
    // runner-up above the primary and push confidence below 0.5 or below 0).
    let confidence = 0.5;
    if (candidates.length > 1) {
        const gap = Math.max(0, primary.rank_score - candidates[1].rank_score);
        confidence = Math.min(0.95, 0.5 + gap * 2);
    }
    // Build reasoning
    const reasons = [];
    if (features.has_code)
        reasons.push("code detected");
    if (features.requires_reasoning)
        reasons.push("reasoning needed");
    if (features.complexity > 0.6)
        reasons.push("high complexity");
    if (features.is_multilingual)
        reasons.push("multilingual");
    const estimated_tokens = features.length * 1.5; // rough completion estimate
    const estimated_cost = (0, tokenUtils_1.estimateCost)(features.length, estimated_tokens, primary.name);
    return {
        primary_model: primary.name,
        fallback_models: secondary.map(c => c.name),
        confidence,
        reasoning: `Selected ${primary.profile.provider}/${primary.name.split("/")[1]} for ${reasons.join(", ") || "general query"}`,
        estimated_cost: estimated_cost * budget_multiplier,
        estimated_latency_ms: primary.profile.latency_ms
    };
}
269
/**
 * Batch routing for multiple prompts.
 *
 * Each prompt is first routed independently with routeQuery. Two optional
 * adjustments are then applied, in this order:
 *
 *  - options.same_model: every decision is forced onto the first prompt's
 *    primary model and receives a copy of its fallback list. Prompts that
 *    had picked another model are re-routed restricted to the shared model,
 *    so their cost/latency estimates describe the model actually used.
 *  - options.max_cost_per_prompt: any decision whose estimated_cost exceeds
 *    the limit is moved to the first profile with cost_per_1k_input < 0.5,
 *    and its cost/latency estimates are recomputed for that model. A limit
 *    of 0 is honoured (it was previously ignored as falsy).
 *
 * @param {string[]} prompts - Prompts to route; decisions keep this order.
 * @param {{same_model?: boolean, max_cost_per_prompt?: number}} [options]
 * @returns {Array} One routing decision per prompt.
 */
function routeBatch(prompts, options) {
    const decisions = prompts.map(p => routeQuery(p));
    if (options?.same_model && decisions.length > 0) {
        // Use first decision's model for all (for batch consistency)
        const { primary_model, fallback_models } = decisions[0];
        decisions.forEach((d, i) => {
            if (d.primary_model !== primary_model) {
                // Refresh estimates for the forced model instead of keeping
                // the numbers of the model this prompt originally picked
                Object.assign(d, routeQuery(prompts[i], [primary_model]));
            }
            // Copy so decisions do not share one mutable array
            d.fallback_models = [...fallback_models];
        });
    }
    const max_cost = options?.max_cost_per_prompt;
    if (max_cost != null) {
        // Cheaper alternative, looked up once for the whole batch
        const cheap = Object.entries(exports.MODEL_PROFILES)
            .find(([, p]) => p.cost_per_1k_input < 0.5);
        if (cheap) {
            const [cheap_name, cheap_profile] = cheap;
            decisions.forEach((d, i) => {
                if (d.estimated_cost > max_cost) {
                    const rerouted = routeQuery(prompts[i], [cheap_name]);
                    d.primary_model = cheap_name;
                    // The primary must not also appear as its own fallback
                    d.fallback_models = d.fallback_models.filter(name => name !== cheap_name);
                    d.estimated_cost = rerouted.estimated_cost;
                    d.estimated_latency_ms = rerouted.estimated_latency_ms;
                    d.reasoning = `Budget-limited routing to ${cheap_profile.provider}`;
                }
            });
        }
    }
    return decisions;
}
297
/**
 * Get model recommendations for a task description.
 *
 * Routes the task with routeQuery using the default model set and flattens
 * the decision into a preference-ordered list.
 *
 * @param {string} task - Task description, routed like a prompt.
 * @returns {string[]} Primary model name followed by the fallback names.
 */
function recommendForTask(task) {
    // routeQuery extracts the features itself; the separate
    // extractQueryFeatures call here was unused and doubled the work.
    const decision = routeQuery(task);
    // Return primary + fallbacks
    return [decision.primary_model, ...decision.fallback_models];
}
306
/**
 * Update a model profile from execution feedback (online learning).
 *
 * Applies an exponential moving average (alpha = 0.2) to the stored
 * latency_ms and quality_score of MODEL_PROFILES[model_name], mutating the
 * shared profile in place, and logs the new values. Unknown model names are
 * ignored. The stored prices are never modified.
 *
 * @param {string} model_name - Key into MODEL_PROFILES.
 * @param {number} actual_latency_ms - Observed latency; non-finite or
 *        negative values are skipped so they cannot corrupt the average.
 * @param {number} actual_cost - Accepted for interface compatibility;
 *        currently not used.
 * @param {number} quality_rating - Observed quality, clamped to 0-1;
 *        non-finite values are skipped.
 * @returns {void}
 */
function updateModelProfile(model_name, actual_latency_ms, actual_cost, quality_rating // 0-1
) {
    const profile = exports.MODEL_PROFILES[model_name];
    if (!profile)
        return;
    // Exponential moving average update
    const alpha = 0.2; // Learning rate
    // A single NaN/undefined sample would otherwise turn the stored value
    // into NaN permanently, since every later average builds on it.
    if (Number.isFinite(actual_latency_ms) && actual_latency_ms >= 0) {
        profile.latency_ms = profile.latency_ms * (1 - alpha) + actual_latency_ms * alpha;
    }
    if (Number.isFinite(quality_rating)) {
        const rating = Math.min(1, Math.max(0, quality_rating));
        profile.quality_score = profile.quality_score * (1 - alpha) + rating * alpha;
    }
    // Keep stored costs as reference (the unused cost locals were removed)
    console.log(`[RouteLLM] Updated ${model_name}: latency=${profile.latency_ms.toFixed(0)}ms, quality=${profile.quality_score.toFixed(2)}`);
}
324
+ exports.default = {
325
+ extractQueryFeatures,
326
+ routeQuery,
327
+ routeBatch,
328
+ recommendForTask,
329
+ updateModelProfile,
330
+ MODEL_PROFILES: exports.MODEL_PROFILES
331
+ };
332
+ //# sourceMappingURL=advancedRouter.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"advancedRouter.js","sourceRoot":"","sources":["../../src/routing/advancedRouter.ts"],"names":[],"mappings":";AAAA;;;;;GAKG;;;AAmIH,oDAiEC;AAmDD,gCAoEC;AAKD,gCAkCC;AAKD,4CAMC;AAKD,gDAqBC;AArYD,oDAAgE;AAgChE,gCAAgC;AACnB,QAAA,cAAc,GAAiC;IAC1D,eAAe,EAAE;QACf,IAAI,EAAE,eAAe;QACrB,QAAQ,EAAE,QAAQ;QAClB,iBAAiB,EAAE,IAAI;QACvB,kBAAkB,EAAE,KAAK;QACzB,UAAU,EAAE,IAAI;QAChB,aAAa,EAAE,IAAI;QACnB,SAAS,EAAE,CAAC,WAAW,EAAE,QAAQ,EAAE,UAAU,CAAC;QAC9C,cAAc,EAAE,MAAM;KACvB;IACD,oBAAoB,EAAE;QACpB,IAAI,EAAE,oBAAoB;QAC1B,QAAQ,EAAE,QAAQ;QAClB,iBAAiB,EAAE,IAAI;QACvB,kBAAkB,EAAE,IAAI;QACxB,UAAU,EAAE,GAAG;QACf,aAAa,EAAE,IAAI;QACnB,SAAS,EAAE,CAAC,MAAM,EAAE,QAAQ,CAAC;QAC7B,cAAc,EAAE,MAAM;KACvB;IACD,6BAA6B,EAAE;QAC7B,IAAI,EAAE,6BAA6B;QACnC,QAAQ,EAAE,WAAW;QACrB,iBAAiB,EAAE,IAAI;QACvB,kBAAkB,EAAE,KAAK;QACzB,UAAU,EAAE,IAAI;QAChB,aAAa,EAAE,IAAI;QACnB,SAAS,EAAE,CAAC,WAAW,EAAE,UAAU,EAAE,UAAU,CAAC;QAChD,cAAc,EAAE,MAAM;KACvB;IACD,0BAA0B,EAAE;QAC1B,IAAI,EAAE,0BAA0B;QAChC,QAAQ,EAAE,WAAW;QACrB,iBAAiB,EAAE,IAAI;QACvB,kBAAkB,EAAE,IAAI;QACxB,UAAU,EAAE,GAAG;QACf,aAAa,EAAE,IAAI;QACnB,SAAS,EAAE,CAAC,MAAM,EAAE,QAAQ,CAAC;QAC7B,cAAc,EAAE,MAAM;KACvB;IACD,yBAAyB,EAAE;QACzB,IAAI,EAAE,yBAAyB;QAC/B,QAAQ,EAAE,QAAQ;QAClB,iBAAiB,EAAE,IAAI,EAAG,OAAO;QACjC,kBAAkB,EAAE,IAAI;QACxB,UAAU,EAAE,GAAG;QACf,aAAa,EAAE,IAAI;QACnB,SAAS,EAAE,CAAC,MAAM,EAAE,cAAc,CAAC;QACnC,cAAc,EAAE,OAAO;KACxB;IACD,uBAAuB,EAAE;QACvB,IAAI,EAAE,uBAAuB;QAC7B,QAAQ,EAAE,QAAQ;QAClB,iBAAiB,EAAE,IAAI;QACvB,kBAAkB,EAAE,IAAI;QACxB,UAAU,EAAE,IAAI;QAChB,aAAa,EAAE,IAAI;QACnB,SAAS,EAAE,CAAC,WAAW,EAAE,cAAc,CAAC;QACxC,cAAc,EAAE,OAAO;KACxB;IACD,oBAAoB,EAAE;QACpB,IAAI,EAAE,oBAAoB;QAC1B,QAAQ,EAAE,MAAM;QAChB,iBAAiB,EAAE,IAAI;QACvB,kBAAkB,EAAE,IAAI;QACxB,UAAU,EAAE,GAAG;QACf,aAAa,EAAE,IAAI;QACnB,SAAS,EAAE,CAAC,MAAM,EAAE,QAAQ,CAAC;QAC7B,cAAc,EAAE,MAAM;KACvB;IACD,wBAAwB,EAAE;QACxB,IAAI,EAAE,wBAAwB;QAC9B,QAAQ,EAAE,UAAU;QACpB,iBAAiB,EAAE,IAAI;QACvB,kBAAkB,EAAE,IAAI;QACxB,UAAU,EAAE,GAAG;QACf,aAAa,EAAE,IAAI;QACnB,SAAS,EAAE,CAAC,MAAM,EAAE,QAAQ,CAAC;QAC7B,cAAc,E
AAE,MAAM;KACvB;IACD,qBAAqB,EAAE;QACrB,IAAI,EAAE,qBAAqB;QAC3B,QAAQ,EAAE,QAAQ;QAClB,iBAAiB,EAAE,IAAI;QACvB,kBAAkB,EAAE,IAAI;QACxB,UAAU,EAAE,GAAG;QACf,aAAa,EAAE,IAAI;QACnB,SAAS,EAAE,CAAC,SAAS,EAAE,MAAM,CAAC;QAC9B,cAAc,EAAE,MAAM;KACvB;CACF,CAAC;AAEF;;GAEG;AACH,SAAgB,oBAAoB,CAAC,MAAc;IACjD,MAAM,KAAK,GAAG,MAAM,CAAC,WAAW,EAAE,CAAC;IAEnC,gBAAgB;IAChB,MAAM,eAAe,GAAG;QACtB,UAAU,EAAE,QAAQ,EAAE,MAAM,EAAE,SAAS,EAAE,QAAQ,EAAE,MAAM;QACzD,QAAQ,EAAE,YAAY,EAAE,YAAY,EAAE,MAAM,EAAE,KAAK,EAAE,MAAM;QAC3D,KAAK,EAAE,IAAI,EAAE,IAAI,EAAE,OAAO,EAAE,OAAO;KACpC,CAAC;IACF,MAAM,QAAQ,GAAG,eAAe,CAAC,IAAI,CAAC,OAAO,CAAC,EAAE,CAAC,KAAK,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC,CAAC;IAE1E,2DAA2D;IAC3D,MAAM,eAAe,GAAG;QACtB,UAAU,EAAE,SAAS,EAAE,WAAW,EAAE,MAAM,EAAE,GAAG,EAAE,KAAK;QACtD,KAAK,EAAE,KAAK,EAAE,KAAK,EAAE,UAAU,EAAE,YAAY,EAAE,GAAG,EAAE,MAAM;QAC1D,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG;QAC3C,IAAI,EAAE,IAAI,EAAE,IAAI,EAAE,GAAG,EAAE,QAAQ,EAAE,SAAS;KAC3C,CAAC;IACF,MAAM,QAAQ,GAAG,eAAe,CAAC,IAAI,CAAC,OAAO,CAAC,EAAE,CAAC,MAAM,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC,CAAC;IAE3E,eAAe;IACf,MAAM,aAAa,GAAG;QACpB,iBAAiB,EAAG,UAAU;QAC9B,8BAA8B,EAAG,WAAW;QAC5C,iBAAiB,EAAG,SAAS;QAC7B,UAAU,EAAG,UAAU;QACvB,UAAU,CAAG,mBAAmB;KACjC,CAAC;IACF,MAAM,eAAe,GAAG,aAAa,CAAC,IAAI,CAAC,OAAO,CAAC,EAAE,CAAC,OAAO,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC,CAAC;IAE5E,mBAAmB;IACnB,MAAM,mBAAmB,GAAG;QAC1B,SAAS,EAAE,OAAO,EAAE,MAAM,EAAE,UAAU,EAAE,SAAS;QACjD,UAAU,EAAE,YAAY,EAAE,SAAS,EAAE,WAAW;KACjD,CAAC;IACF,MAAM,WAAW,GAAG,mBAAmB,CAAC,IAAI,CAAC,OAAO,CAAC,EAAE,CAAC,KAAK,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC,CAAC;IAEjF,YAAY;IACZ,MAAM,oBAAoB,GAAG;QAC3B,SAAS,EAAE,KAAK,EAAE,SAAS,EAAE,WAAW,EAAE,MAAM;QAChD,SAAS,EAAE,OAAO,EAAE,UAAU,EAAE,QAAQ,EAAE,OAAO;KAClD,CAAC;IACF,MAAM,kBAAkB,GAAG,oBAAoB,CAAC,IAAI,CAAC,OAAO,CAAC,EAAE,CAAC,KAAK,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC,CAAC;IAEzF,qDAAqD;IACrD,MAAM,MAAM,GAAG,IAAA,wBAAW,EAAC,MAAM,EAAE,QAAQ,CAAC,CAAC;IAC7C,IAAI,UAAU,GAAG,GAAG,CAAC;IAErB,IAAI,MAAM,GAAG,IAAI;QAAE,UAAU,IAAI,GAAG,CAAC;IACrC,IAAI,QAAQ;QAAE,UAA
U,IAAI,IAAI,CAAC;IACjC,IAAI,QAAQ;QAAE,UAAU,IAAI,GAAG,CAAC;IAChC,IAAI,kBAAkB;QAAE,UAAU,IAAI,IAAI,CAAC;IAC3C,IAAI,WAAW;QAAE,UAAU,IAAI,GAAG,CAAC;IAEnC,UAAU,GAAG,IAAI,CAAC,GAAG,CAAC,GAAG,EAAE,UAAU,CAAC,CAAC;IAEvC,OAAO;QACL,UAAU;QACV,MAAM,EAAE,MAAM;QACd,QAAQ;QACR,QAAQ;QACR,eAAe;QACf,WAAW;QACX,kBAAkB;KACnB,CAAC;AACJ,CAAC;AAED;;GAEG;AACH,SAAS,aAAa,CAAC,KAAmB,EAAE,QAAuB;IACjE,IAAI,KAAK,GAAG,KAAK,CAAC,aAAa,GAAG,GAAG,CAAC,CAAE,eAAe;IAEvD,qBAAqB;IACrB,IAAI,QAAQ,CAAC,QAAQ,IAAI,KAAK,CAAC,SAAS,CAAC,QAAQ,CAAC,QAAQ,CAAC,EAAE,CAAC;QAC5D,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IACD,IAAI,QAAQ,CAAC,kBAAkB,IAAI,KAAK,CAAC,SAAS,CAAC,QAAQ,CAAC,WAAW,CAAC,EAAE,CAAC;QACzE,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IACD,IAAI,QAAQ,CAAC,WAAW,IAAI,KAAK,CAAC,SAAS,CAAC,QAAQ,CAAC,UAAU,CAAC,EAAE,CAAC;QACjE,KAAK,IAAI,IAAI,CAAC;IAChB,CAAC;IACD,IAAI,QAAQ,CAAC,eAAe,IAAI,KAAK,CAAC,SAAS,CAAC,QAAQ,CAAC,cAAc,CAAC,EAAE,CAAC;QACzE,KAAK,IAAI,IAAI,CAAC;IAChB,CAAC;IACD,IAAI,QAAQ,CAAC,QAAQ,IAAI,KAAK,CAAC,SAAS,CAAC,QAAQ,CAAC,UAAU,CAAC,EAAE,CAAC;QAC9D,KAAK,IAAI,IAAI,CAAC;IAChB,CAAC;IAED,+BAA+B;IAC/B,IAAI,QAAQ,CAAC,UAAU,GAAG,GAAG,IAAI,KAAK,CAAC,UAAU,GAAG,IAAI,EAAE,CAAC;QACzD,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,OAAO,KAAK,CAAC;AACf,CAAC;AAED;;GAEG;AACH,SAAS,cAAc,CAAC,KAAmB,EAAE,QAAuB;IAClE,MAAM,QAAQ,GAAG,CAAC,KAAK,CAAC,iBAAiB,GAAG,KAAK,CAAC,kBAAkB,CAAC,GAAG,CAAC,CAAC;IAE1E,+CAA+C;IAC/C,IAAI,QAAQ,CAAC,UAAU,GAAG,GAAG,EAAE,CAAC;QAC9B,OAAO,CAAC,CAAC,GAAG,IAAI,CAAC,GAAG,CAAC,QAAQ,GAAG,EAAE,EAAE,CAAC,CAAC,CAAC,GAAG,GAAG,CAAC;IAChD,CAAC;IAED,uCAAuC;IACvC,OAAO,CAAC,CAAC,GAAG,IAAI,CAAC,GAAG,CAAC,QAAQ,GAAG,EAAE,EAAE,CAAC,CAAC,CAAC,GAAG,GAAG,CAAC;AAChD,CAAC;AAED;;GAEG;AACH,SAAgB,UAAU,CACxB,MAAc,EACd,gBAA2B,EAC3B,oBAA4B,GAAG;IAE/B,MAAM,QAAQ,GAAG,oBAAoB,CAAC,MAAM,CAAC,CAAC;IAC9C,MAAM,eAAe,GAAG,gBAAgB,IAAI,MAAM,CAAC,IAAI,CAAC,sBAAc,CAAC,CAAC;IAWxE,MAAM,UAAU,GAAkB,eAAe;SAC9C,MAAM,CAAC,IAAI,CAAC,EAAE,CAAC,sBAAc,CAAC,IAAI,CAAC,CAAC;SACpC,GAAG,CAAC,IAAI,CAAC,EAAE;QACV,MAAM,OAAO,GAAG,sBAAc,CAAC,IAAI,CAAE,CAAC;QACtC,MAAM,OAAO,GAAG,aAAa,CAAC,OAAO,EAAE,QAAQ,CAAC,C
AAC;QACjD,MAAM,IAAI,GAAG,cAAc,CAAC,OAAO,EAAE,QAAQ,CAAC,CAAC;QAC/C,OAAO;YACL,IAAI;YACJ,OAAO;YACP,aAAa,EAAE,OAAO;YACtB,UAAU,EAAE,IAAI;YAChB,WAAW,EAAE,OAAO,GAAG,IAAI;SAC5B,CAAC;IACJ,CAAC,CAAC,CAAC;IAEL,qEAAqE;IACrE,MAAM,eAAe,GAAG,QAAQ,CAAC,UAAU,GAAG,GAAG,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,GAAG,CAAC,CAAE,iCAAiC;IACjG,UAAU,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE;QACvB,MAAM,OAAO,GAAG,CAAC,CAAC,aAAa,GAAG,eAAe,GAAG,CAAC,CAAC,UAAU,GAAG,CAAC,CAAC,GAAG,eAAe,CAAC,CAAC;QACzF,MAAM,OAAO,GAAG,CAAC,CAAC,aAAa,GAAG,eAAe,GAAG,CAAC,CAAC,UAAU,GAAG,CAAC,CAAC,GAAG,eAAe,CAAC,CAAC;QACzF,OAAO,OAAO,GAAG,OAAO,CAAC;IAC3B,CAAC,CAAC,CAAC;IAEH,MAAM,OAAO,GAAG,UAAU,CAAC,CAAC,CAAC,CAAC;IAC9B,MAAM,SAAS,GAAG,UAAU,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC;IAEzC,0CAA0C;IAC1C,IAAI,UAAU,GAAG,GAAG,CAAC;IACrB,IAAI,UAAU,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QAC1B,MAAM,GAAG,GAAG,OAAO,CAAC,WAAW,GAAG,UAAU,CAAC,CAAC,CAAC,CAAC,WAAW,CAAC;QAC5D,UAAU,GAAG,IAAI,CAAC,GAAG,CAAC,IAAI,EAAE,GAAG,GAAG,GAAG,GAAG,CAAC,CAAC,CAAC;IAC7C,CAAC;IAED,kBAAkB;IAClB,MAAM,OAAO,GAAa,EAAE,CAAC;IAC7B,IAAI,QAAQ,CAAC,QAAQ;QAAE,OAAO,CAAC,IAAI,CAAC,eAAe,CAAC,CAAC;IACrD,IAAI,QAAQ,CAAC,kBAAkB;QAAE,OAAO,CAAC,IAAI,CAAC,kBAAkB,CAAC,CAAC;IAClE,IAAI,QAAQ,CAAC,UAAU,GAAG,GAAG;QAAE,OAAO,CAAC,IAAI,CAAC,iBAAiB,CAAC,CAAC;IAC/D,IAAI,QAAQ,CAAC,eAAe;QAAE,OAAO,CAAC,IAAI,CAAC,cAAc,CAAC,CAAC;IAE3D,MAAM,gBAAgB,GAAG,QAAQ,CAAC,MAAM,GAAG,GAAG,CAAC,CAAE,4BAA4B;IAC7E,MAAM,cAAc,GAAG,IAAA,yBAAY,EAAC,QAAQ,CAAC,MAAM,EAAE,gBAAgB,EAAE,OAAO,CAAC,IAAI,CAAC,CAAC;IAErF,OAAO;QACL,aAAa,EAAE,OAAO,CAAC,IAAI;QAC3B,eAAe,EAAE,SAAS,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC;QAC3C,UAAU;QACV,SAAS,EAAE,YAAY,OAAO,CAAC,OAAO,CAAC,QAAQ,IAAI,OAAO,CAAC,IAAI,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,QAAQ,OAAO,CAAC,IAAI,CAAC,IAAI,CAAC,IAAI,eAAe,EAAE;QAC5H,cAAc,EAAE,cAAc,GAAG,iBAAiB;QAClD,oBAAoB,EAAE,OAAO,CAAC,OAAO,CAAC,UAAU;KACjD,CAAC;AACJ,CAAC;AAED;;GAEG;AACH,SAAgB,UAAU,CACxB,OAAiB,EACjB,OAIC;IAED,MAAM,SAAS,GAAG,OAAO,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC,CAAC;IAElD,IAAI
,OAAO,EAAE,UAAU,IAAI,SAAS,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QAChD,6DAA6D;QAC7D,MAAM,aAAa,GAAG,SAAS,CAAC,CAAC,CAAC,CAAC,aAAa,CAAC;QACjD,SAAS,CAAC,OAAO,CAAC,CAAC,CAAC,EAAE;YACpB,CAAC,CAAC,aAAa,GAAG,aAAa,CAAC;YAChC,CAAC,CAAC,eAAe,GAAG,SAAS,CAAC,CAAC,CAAC,CAAC,eAAe,CAAC;QACnD,CAAC,CAAC,CAAC;IACL,CAAC;IAED,IAAI,OAAO,EAAE,mBAAmB,EAAE,CAAC;QACjC,SAAS,CAAC,OAAO,CAAC,CAAC,CAAC,EAAE;YACpB,IAAI,CAAC,CAAC,cAAc,GAAG,OAAO,CAAC,mBAAoB,EAAE,CAAC;gBACpD,+BAA+B;gBAC/B,MAAM,KAAK,GAAG,MAAM,CAAC,OAAO,CAAC,sBAAc,CAAC;qBACzC,IAAI,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,iBAAiB,GAAG,GAAG,CAAC,CAAC;gBAClD,IAAI,KAAK,EAAE,CAAC;oBACV,CAAC,CAAC,aAAa,GAAG,KAAK,CAAC,CAAC,CAAC,CAAC;oBAC3B,CAAC,CAAC,SAAS,GAAG,6BAA6B,KAAK,CAAC,CAAC,CAAC,CAAC,QAAQ,EAAE,CAAC;gBACjE,CAAC;YACH,CAAC;QACH,CAAC,CAAC,CAAC;IACL,CAAC;IAED,OAAO,SAAS,CAAC;AACnB,CAAC;AAED;;GAEG;AACH,SAAgB,gBAAgB,CAAC,IAAY;IAC3C,MAAM,QAAQ,GAAG,oBAAoB,CAAC,IAAI,CAAC,CAAC;IAC5C,MAAM,QAAQ,GAAG,UAAU,CAAC,IAAI,CAAC,CAAC;IAElC,6BAA6B;IAC7B,OAAO,CAAC,QAAQ,CAAC,aAAa,EAAE,GAAG,QAAQ,CAAC,eAAe,CAAC,CAAC;AAC/D,CAAC;AAED;;GAEG;AACH,SAAgB,kBAAkB,CAChC,UAAkB,EAClB,iBAAyB,EACzB,WAAmB,EACnB,cAAsB,CAAE,MAAM;;IAE9B,MAAM,OAAO,GAAG,sBAAc,CAAC,UAAU,CAAC,CAAC;IAC3C,IAAI,CAAC,OAAO;QAAE,OAAO;IAErB,oCAAoC;IACpC,MAAM,KAAK,GAAG,GAAG,CAAC,CAAE,gBAAgB;IAEpC,OAAO,CAAC,UAAU,GAAG,OAAO,CAAC,UAAU,GAAG,CAAC,CAAC,GAAG,KAAK,CAAC,GAAG,iBAAiB,GAAG,KAAK,CAAC;IAClF,OAAO,CAAC,aAAa,GAAG,OAAO,CAAC,aAAa,GAAG,CAAC,CAAC,GAAG,KAAK,CAAC,GAAG,cAAc,GAAG,KAAK,CAAC;IAErF,yBAAyB;IACzB,MAAM,kBAAkB,GAAG,WAAW,GAAG,IAAI,CAAC;IAC9C,MAAM,gBAAgB,GAAG,CAAC,OAAO,CAAC,iBAAiB,GAAG,OAAO,CAAC,kBAAkB,CAAC,GAAG,CAAC,CAAC;IACtF,6DAA6D;IAE7D,OAAO,CAAC,GAAG,CAAC,sBAAsB,UAAU,aAAa,OAAO,CAAC,UAAU,CAAC,OAAO,CAAC,CAAC,CAAC,eAAe,OAAO,CAAC,aAAa,CAAC,OAAO,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC;AAC3I,CAAC;AAED,kBAAe;IACb,oBAAoB;IACpB,UAAU;IACV,UAAU;IACV,gBAAgB;IAChB,kBAAkB;IAClB,cAAc,EAAd,sBAAc;CACf,CAAC"}
@@ -0,0 +1,101 @@
1
+ /**
2
+ * TMLPD PI Tools
3
+ *
4
+ * Main tools exposed to the PI agent via the MCP bridge.
5
+ * Features: streaming, caching, cost tracking, reliability.
6
+ */
7
+ import { CacheConfig } from "../cache/responseCache";
8
+ import { BudgetConfig, CostSummary } from "../cost/costTracker";
9
+ import { RetryConfig } from "../utils/reliability";
10
+ export interface TMLPDConfig { // Optional settings accepted by the TMLPDTools constructor and by createTMLPD(); every field is optional.
11
+ cache?: Partial<CacheConfig>; // Partial override of CacheConfig (imported from ../cache/responseCache).
12
+ budget?: BudgetConfig; // BudgetConfig imported from ../cost/costTracker; its fields are not visible in this file.
13
+ retry?: Partial<RetryConfig>; // Partial override of RetryConfig (imported from ../utils/reliability).
14
+ maxConcurrent?: number; // NOTE(review): presumably caps simultaneous requests; default value is not visible in this declaration file - confirm in source.
15
+ }
16
+ export interface ExecuteResult { // Shape resolved by TMLPDTools.execute(); also the element type of ParallelResult.responses.
17
+ success: boolean; // Required outcome flag.
18
+ content?: string; // Optional; NOTE(review): presumably the model output on success - confirm in source.
19
+ error?: string; // Optional; NOTE(review): presumably the failure message when success is false - confirm in source.
20
+ model: string; // Required model identifier.
21
+ provider: string; // Required provider identifier.
22
+ tokens?: number; // Optional; NOTE(review): whether this counts prompt, completion or total tokens is not visible here.
23
+ cost?: number; // Optional; currency/unit is not visible here.
24
+ cached?: boolean; // Optional; NOTE(review): presumably set when the answer came from the response cache - confirm.
25
+ duration_ms?: number; // Optional; NOTE(review): presumably elapsed time in milliseconds, per the field name.
26
+ attempts?: number; // Optional; NOTE(review): presumably the number of tries including retries - confirm.
27
+ }
28
+ export interface ParallelResult { // Shape resolved by TMLPDTools.executeParallel(); all fields are required.
29
+ responses: ExecuteResult[]; // Per-model results; ordering relative to the `models` argument is not visible here.
30
+ total_models: number; // NOTE(review): presumably the number of models attempted - confirm.
31
+ successful_models: number; // NOTE(review): presumably the count of responses with success === true - confirm.
32
+ total_cost: number; // NOTE(review): presumably the sum of per-response cost; unit is not visible here.
33
+ duration_ms: number; // NOTE(review): presumably elapsed time in milliseconds for the whole call, per the field name.
34
+ }
35
+ export interface StreamingConfig { // Optional third argument of TMLPDTools.execute() and TMLPDTools.executeParallel().
36
+ enabled: boolean; // Required switch; the only non-optional field.
37
+ chunk_size?: number; // Optional; NOTE(review): unit (characters vs tokens) is not visible here - confirm.
38
+ on_chunk?: (chunk: string) => void; // Optional callback that receives one string chunk and returns nothing.
39
+ }
40
+ export declare class TMLPDTools { // Declaration only; implementation lives in src/tools/tmlpdTools.ts per the accompanying source map.
41
+ private cache; // Private; type is elided in this declaration output.
42
+ private costTracker; // Private; type is elided in this declaration output.
43
+ private registry; // Private; type is elided in this declaration output.
44
+ private circuitBreakers; // Private; NOTE(review): presumably one breaker per provider (see getCircuitBreaker) - confirm.
45
+ private retryConfig; // Private; NOTE(review): presumably derived from TMLPDConfig.retry - confirm.
46
+ private maxConcurrent; // Private; NOTE(review): presumably derived from TMLPDConfig.maxConcurrent - confirm.
47
+ constructor(config?: TMLPDConfig); // `config` is optional.
48
+ /**
49
+ * Get cost summary. Returns the CostSummary type imported from ../cost/costTracker.
50
+ */
51
+ getCostSummary(): CostSummary;
52
+ /**
53
+ * Get remaining budget. `daily` and `monthly` may be null (presumably when no such limit is configured - confirm); `per_model` maps a string key to a number.
54
+ */
55
+ getRemainingBudget(): {
56
+ daily: number | null;
57
+ monthly: number | null;
58
+ per_model: Record<string, number>;
59
+ };
60
+ /**
61
+ * Get cache stats: hits, misses, size and hit_rate. The scale of hit_rate (0-1 vs percent) is not visible in this declaration.
62
+ */
63
+ getCacheStats(): {
64
+ hits: number;
65
+ misses: number;
66
+ size: number;
67
+ hit_rate: number;
68
+ };
69
+ /**
70
+ * Get provider status. Returns a string-keyed record with untyped (any) values.
71
+ */
72
+ getProviderStatus(): Record<string, any>;
73
+ /**
74
+ * Execute single prompt with optional streaming. `model` and `streaming` are optional; resolves to an ExecuteResult.
75
+ */
76
+ execute(prompt: string, model?: string, streaming?: StreamingConfig): Promise<ExecuteResult>;
77
+ /**
78
+ * Execute parallel across multiple models. `models` and `streaming` are optional; resolves to a ParallelResult.
79
+ */
80
+ executeParallel(prompt: string, models?: string[], streaming?: StreamingConfig): Promise<ParallelResult>;
81
+ /**
82
+ * Get circuit breaker for provider (private; signature is elided in this declaration output).
83
+ */
84
+ private getCircuitBreaker;
85
+ /**
86
+ * Execute HTTP request to provider (private; signature is elided in this declaration output).
87
+ */
88
+ private executeRequest;
89
+ private executeOpenAI; // Private; NOTE(review): presumably the OpenAI request path used by executeRequest - confirm in source.
90
+ private executeAnthropic; // Private; NOTE(review): presumably the Anthropic request path used by executeRequest - confirm in source.
91
+ private executeGemini; // Private; NOTE(review): presumably the Gemini request path used by executeRequest - confirm in source.
92
+ }
93
+ /**
94
+ * Create a TMLPD instance. Accepts an optional TMLPDConfig and returns a TMLPDTools.
95
+ */
96
+ export declare function createTMLPD(config?: TMLPDConfig): TMLPDTools;
97
+ /**
98
+ * Get default singleton instance. Takes no arguments and returns a TMLPDTools.
99
+ */
100
+ export declare function getDefault(): TMLPDTools;
101
+ //# sourceMappingURL=tmlpdTools.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"tmlpdTools.d.ts","sourceRoot":"","sources":["../../src/tools/tmlpdTools.ts"],"names":[],"mappings":"AAAA;;;;;GAKG;AAEH,OAAO,EAAiB,WAAW,EAAE,MAAM,wBAAwB,CAAC;AACpE,OAAO,EAAe,YAAY,EAAE,WAAW,EAAE,MAAM,qBAAqB,CAAC;AAE7E,OAAO,EAA6B,WAAW,EAAwB,MAAM,sBAAsB,CAAC;AAIpG,MAAM,WAAW,WAAW;IAC1B,KAAK,CAAC,EAAE,OAAO,CAAC,WAAW,CAAC,CAAC;IAC7B,MAAM,CAAC,EAAE,YAAY,CAAC;IACtB,KAAK,CAAC,EAAE,OAAO,CAAC,WAAW,CAAC,CAAC;IAC7B,aAAa,CAAC,EAAE,MAAM,CAAC;CACxB;AAED,MAAM,WAAW,aAAa;IAC5B,OAAO,EAAE,OAAO,CAAC;IACjB,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,KAAK,EAAE,MAAM,CAAC;IACd,QAAQ,EAAE,MAAM,CAAC;IACjB,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,IAAI,CAAC,EAAE,MAAM,CAAC;IACd,MAAM,CAAC,EAAE,OAAO,CAAC;IACjB,WAAW,CAAC,EAAE,MAAM,CAAC;IACrB,QAAQ,CAAC,EAAE,MAAM,CAAC;CACnB;AAED,MAAM,WAAW,cAAc;IAC7B,SAAS,EAAE,aAAa,EAAE,CAAC;IAC3B,YAAY,EAAE,MAAM,CAAC;IACrB,iBAAiB,EAAE,MAAM,CAAC;IAC1B,UAAU,EAAE,MAAM,CAAC;IACnB,WAAW,EAAE,MAAM,CAAC;CACrB;AAED,MAAM,WAAW,eAAe;IAC9B,OAAO,EAAE,OAAO,CAAC;IACjB,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,QAAQ,CAAC,EAAE,CAAC,KAAK,EAAE,MAAM,KAAK,IAAI,CAAC;CACpC;AAED,qBAAa,UAAU;IACrB,OAAO,CAAC,KAAK,CAAgB;IAC7B,OAAO,CAAC,WAAW,CAAc;IACjC,OAAO,CAAC,QAAQ,CAAmB;IACnC,OAAO,CAAC,eAAe,CAA0C;IACjE,OAAO,CAAC,WAAW,CAAc;IACjC,OAAO,CAAC,aAAa,CAAS;gBAElB,MAAM,GAAE,WAAgB;IAQpC;;OAEG;IACH,cAAc,IAAI,WAAW;IAI7B;;OAEG;IACH,kBAAkB,IAAI;QAAE,KAAK,EAAE,MAAM,GAAG,IAAI,CAAC;QAAC,OAAO,EAAE,MAAM,GAAG,IAAI,CAAC;QAAC,SAAS,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAA;KAAE;IAIzG;;OAEG;IACH,aAAa,IAAI;QAAE,IAAI,EAAE,MAAM,CAAC;QAAC,MAAM,EAAE,MAAM,CAAC;QAAC,IAAI,EAAE,MAAM,CAAC;QAAC,QAAQ,EAAE,MAAM,CAAA;KAAE;IAIjF;;OAEG;IACH,iBAAiB,IAAI,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC;IAIxC;;OAEG;IACG,OAAO,CACX,MAAM,EAAE,MAAM,EACd,KAAK,CAAC,EAAE,MAAM,EACd,SAAS,CAAC,EAAE,eAAe,GAC1B,OAAO,CAAC,aAAa,CAAC;IAiFzB;;OAEG;IACG,eAAe,CACnB,MAAM,EAAE,MAAM,EACd,MAAM,CAAC,EAAE,MAAM,EAAE,EACjB,SAAS,CAAC,EAAE,eAAe,GAC1B,OAAO,CAAC,cAAc,CAAC;IAiC1B;;OAEG;IACH,OAAO,CAAC,iBAAiB;IAOzB;;OAEG;YACW,cAAc;YAqBd,aAAa;YAqDb,gBAAgB;YAqDhB,aAAa;CAkD5B;AA
OD;;GAEG;AACH,wBAAgB,WAAW,CAAC,MAAM,CAAC,EAAE,WAAW,GAAG,UAAU,CAE5D;AAED;;GAEG;AACH,wBAAgB,UAAU,IAAI,UAAU,CAKvC"}