adaptive-memory-multi-model-router 2.14.46 → 2.14.47

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (598) hide show
  1. package/{docs/llms.txt → llms.txt.bak} +6 -6
  2. package/package.json +13 -84
  3. package/src/routing/advancedRouter.ts.bak +650 -0
  4. package/test.js.bak +376 -0
  5. package/.dockerignore +0 -82
  6. package/.env.example +0 -303
  7. package/.github/DISCUSSIONS_WELCOME.md +0 -27
  8. package/.github/DISCUSSION_TEMPLATE.yml +0 -5
  9. package/.github/FUNDING.yml +0 -2
  10. package/.github/ISSUE_TEMPLATE/bug_report.md +0 -94
  11. package/.github/ISSUE_TEMPLATE/config.yml +0 -17
  12. package/.github/ISSUE_TEMPLATE/feature_request.md +0 -71
  13. package/.github/PULL_REQUEST_TEMPLATE.md +0 -71
  14. package/.github/dependabot.yml +0 -9
  15. package/.github/workflows/auto-publish.yml +0 -51
  16. package/.github/workflows/ci.yml +0 -263
  17. package/.github/workflows/codeql.yml +0 -38
  18. package/.github/workflows/npm-publish.yml +0 -20
  19. package/.github/workflows/pages.yml +0 -37
  20. package/.github/workflows/stale.yml +0 -54
  21. package/.publish-tick +0 -1
  22. package/.well-known/ai-plugin.json +0 -16
  23. package/AGENT_COUNCIL_FINDINGS.md +0 -142
  24. package/ARCHITECTURE.md +0 -346
  25. package/AUDIT_REPORT.md +0 -28
  26. package/CODE_OF_CONDUCT.md +0 -128
  27. package/CONTRIBUTING.md +0 -50
  28. package/CONTRIBUTORS.md +0 -20
  29. package/Dockerfile +0 -53
  30. package/Dockerfile.proxy +0 -33
  31. package/HEALTH_REPORT.md +0 -118
  32. package/IMPROVEMENT_PLAN.md +0 -107
  33. package/LANDING.md +0 -43
  34. package/LAUNCH-PAIN-DRIVEN.md +0 -339
  35. package/LAUNCH.md +0 -337
  36. package/LAUNCH_CHECKLIST.md +0 -141
  37. package/LAUNCH_SNAPSHOT.md +0 -260
  38. package/MANIFESTO.md +0 -41
  39. package/POPULARITY_BOOSTERS.md +0 -285
  40. package/PR_STATUS_REPORT.md +0 -148
  41. package/REDESIGN.md +0 -95
  42. package/RUNKIT.md +0 -83
  43. package/SECURITY.md +0 -29
  44. package/SUBMISSIONS.md +0 -43
  45. package/_schema.html +0 -53
  46. package/ai-plugin.json +0 -16
  47. package/articles/AI_AGENT_LLM_ROUTING.md +0 -150
  48. package/articles/CHINESE_DIRECTORIES.md +0 -100
  49. package/articles/CHINESE_SUBMISSIONS_READY.md +0 -322
  50. package/articles/COMPETITOR_ALERTS.md +0 -31
  51. package/articles/COMPLETE_POSTING_DIRECTORY.md +0 -147
  52. package/articles/CONTENT_STRUCTURE.md +0 -292
  53. package/articles/DEVTO_COST_GUIDE.md +0 -473
  54. package/articles/DEVTO_FINAL.md +0 -416
  55. package/articles/DEVTO_MULTI_PROVIDER.md +0 -542
  56. package/articles/DEVTO_READY.md +0 -255
  57. package/articles/DEVTO_V2_ANNOUNCEMENT.md +0 -160
  58. package/articles/DEVTO_VIRAL_GROWTH.md +0 -280
  59. package/articles/FRESH_devto.md +0 -460
  60. package/articles/FRESH_devto_2026_05.md +0 -73
  61. package/articles/FRESH_hackernews.md +0 -14
  62. package/articles/FRESH_reddit_ml.md +0 -90
  63. package/articles/FRESH_reddit_node.md +0 -198
  64. package/articles/FRESH_reddit_sideproject.md +0 -72
  65. package/articles/FRESH_reddit_webdev.md +0 -130
  66. package/articles/FROM_ZERO_TO_10K.md +0 -107
  67. package/articles/HN_10X_BETTER.md +0 -430
  68. package/articles/HN_ACCOUNT_GUIDE.md +0 -21
  69. package/articles/HN_CHINESE_STYLE.md +0 -308
  70. package/articles/HN_FINAL.md +0 -148
  71. package/articles/HN_POSTED_VERSION.md +0 -56
  72. package/articles/HN_POST_READY.md +0 -137
  73. package/articles/HN_RESEARCH.md +0 -364
  74. package/articles/HN_SHOW_routerarena.md +0 -17
  75. package/articles/HN_TIMING_GUIDE.md +0 -52
  76. package/articles/INDIEHACKERS_POST.md +0 -52
  77. package/articles/INDIEHACKERS_READY.md +0 -120
  78. package/articles/LLM_BENCHMARK_DEEP_DIVE.md +0 -153
  79. package/articles/MASTER_POSTING_DIRECTORY.md +0 -189
  80. package/articles/NEWSLETTER_SEND_NOW.md +0 -259
  81. package/articles/NEWSLETTER_SUBMISSIONS.md +0 -112
  82. package/articles/PAIN-DRIVEN-devto-v2.md +0 -308
  83. package/articles/PAIN-DRIVEN-devto-v3.md +0 -268
  84. package/articles/PAIN-DRIVEN-devto.md +0 -242
  85. package/articles/PAIN-DRIVEN-hackernews-v2.md +0 -138
  86. package/articles/PAIN-DRIVEN-hackernews-v3.md +0 -151
  87. package/articles/PAIN-DRIVEN-hackernews.md +0 -131
  88. package/articles/PAIN-DRIVEN-reddit-v2.md +0 -301
  89. package/articles/PAIN-DRIVEN-reddit-v3.md +0 -236
  90. package/articles/PAIN-DRIVEN-reddit.md +0 -218
  91. package/articles/PAIN-DRIVEN-twitter-v2.md +0 -110
  92. package/articles/PAIN-DRIVEN-twitter-v3.md +0 -121
  93. package/articles/PAIN-DRIVEN-twitter.md +0 -120
  94. package/articles/PORTKEY_VS_A3M.md +0 -147
  95. package/articles/POSTING_KIT_2026_05.md +0 -67
  96. package/articles/PRESS_KIT_routerarena.md +0 -77
  97. package/articles/PRODUCTHUNT_LISTING.md +0 -48
  98. package/articles/PRODUCTHUNT_READY.md +0 -106
  99. package/articles/PR_PLAN_vault.md +0 -125
  100. package/articles/REDDIT_FINAL.md +0 -232
  101. package/articles/REDDIT_POST.md +0 -67
  102. package/articles/REDDIT_SUBMISSION_READY.md +0 -348
  103. package/articles/ROUTERARENA_LEADER.md +0 -45
  104. package/articles/SHOW_HN_FINAL.md +0 -29
  105. package/articles/TWEETS_10K_DOWNLOADS.md +0 -47
  106. package/articles/TWEETS_BENCHMARK_FIRST.md +0 -46
  107. package/articles/TWEETS_MCP_PLAY.md +0 -51
  108. package/articles/TWEETS_SEQUENTIAL_BROKEN.md +0 -49
  109. package/articles/TWEETS_WHY_BUILD.md +0 -54
  110. package/articles/TWEETS_routerarena_leader.md +0 -53
  111. package/articles/TWEET_STORM_READY.md +0 -165
  112. package/articles/TWITTER_FINAL.md +0 -167
  113. package/articles/WHY_10X_BETTER.md +0 -261
  114. package/articles/WHY_CHINESE_STYLE_BETTER.md +0 -323
  115. package/articles/ai-discoverability-llm-routing.md +0 -210
  116. package/articles/devto-llm-routing.md +0 -138
  117. package/articles/hackernews-show-hn.md +0 -54
  118. package/articles/hashnode-llm-cost-optimization.md +0 -125
  119. package/articles/hn_show_2026_05.md +0 -11
  120. package/articles/medium-building-llm-router.md +0 -205
  121. package/articles/reddit-ml.md +0 -76
  122. package/articles/twitter-thread-cost-savings.md +0 -50
  123. package/articles/youtube-tutorial-script.md +0 -262
  124. package/assets/a3m_3blue1brown.mp4 +0 -0
  125. package/assets/banner.svg +0 -109
  126. package/assets/chart-cost-v2.svg +0 -91
  127. package/assets/chart-cost-v3.svg +0 -143
  128. package/assets/chart-features-v2.svg +0 -132
  129. package/assets/chart-features-v3.svg +0 -211
  130. package/assets/chart-growth-v2.svg +0 -122
  131. package/assets/chart-growth-v3.svg +0 -189
  132. package/assets/cost-comparison.svg +0 -134
  133. package/assets/cost-simple.svg +0 -64
  134. package/assets/demo-hn.gif +0 -0
  135. package/assets/feature-matrix.svg +0 -136
  136. package/assets/growth-chart-animated.svg +0 -76
  137. package/assets/growth-chart.svg +0 -82
  138. package/assets/growth-simple.svg +0 -69
  139. package/assets/hero-diagram.svg +0 -81
  140. package/assets/logo-new.svg +0 -21
  141. package/assets/logo.svg +0 -68
  142. package/assets/provider-comparison.svg +0 -121
  143. package/assets/social-preview-new.svg +0 -100
  144. package/assets/social-preview.svg +0 -194
  145. package/assets/social-v2.svg +0 -130
  146. package/assets/social-v3.svg +0 -212
  147. package/benchmark-provider-results.json +0 -245
  148. package/benchmark-results.json +0 -54
  149. package/council-votes/architecture-vote.md +0 -121
  150. package/council-votes/coverage-vote.md +0 -93
  151. package/data/adaptive-benchmark.json +0 -92
  152. package/data/benchmark-results.json +0 -47
  153. package/data/labeled-benchmark.json +0 -88
  154. package/demo/3blue1brown_video.py +0 -285
  155. package/demo/3blue1brown_video_v2.py +0 -310
  156. package/demo/IMPROVED_PROMPTS.md +0 -229
  157. package/demo/VEO3_PROMPTS.md +0 -269
  158. package/demo/VIDEO_PRODUCTION_GUIDE.md +0 -333
  159. package/demo/a3m_3blue1brown.mp4 +0 -0
  160. package/demo/asciinema-demo.sh +0 -195
  161. package/demo/demo-hn.tape +0 -74
  162. package/demo/demo-script.md +0 -53
  163. package/demo/demo-script.sh +0 -62
  164. package/demo/demo.svg +0 -75
  165. package/demo/frame1_ai_data_center.png +0 -0
  166. package/demo/frame1_sunset_video.mp4 +0 -0
  167. package/demo/frame2_cost_comparison.png +0 -0
  168. package/demo/frame2_cost_comparison_fallback.png +0 -0
  169. package/demo/frame3_parallel_execution.png +0 -0
  170. package/demo/frame3_parallel_execution_fallback.png +0 -0
  171. package/demo/frame4_providers.png +0 -0
  172. package/demo/frame4_providers_fallback.png +0 -0
  173. package/demo/frame5_endcard.png +0 -0
  174. package/demo/frame5_endcard_fallback.png +0 -0
  175. package/demo/new_frame1_hook.png +0 -0
  176. package/demo/new_frame2_proof.png +0 -0
  177. package/demo/new_frame3_wow.png +0 -0
  178. package/demo/new_frame4_social.png +0 -0
  179. package/demo/new_frame5_cta.png +0 -0
  180. package/demo/package.json +0 -13
  181. package/demo/product-video-final.mp4 +0 -0
  182. package/demo/product-video-hype-v1.mp4 +0 -0
  183. package/demo/product-video-v1.mp4 +0 -0
  184. package/demo/public/index.html +0 -762
  185. package/demo/recording.cast +0 -55
  186. package/demo/server.js +0 -405
  187. package/demo-new.tape +0 -71
  188. package/demo-real.sh +0 -198
  189. package/demo-simple.tape +0 -205
  190. package/demo.html +0 -520
  191. package/demo.sh +0 -85
  192. package/demo.tape +0 -259
  193. package/dist/analytics/costAnalytics.d.ts.map +0 -1
  194. package/dist/analytics/costAnalytics.js.map +0 -1
  195. package/dist/benchmark/comprehensive.js.map +0 -1
  196. package/dist/benchmark/reproducible.d.ts.map +0 -1
  197. package/dist/benchmark/reproducible.js.map +0 -1
  198. package/dist/cache/prefixCache.d.ts.map +0 -1
  199. package/dist/cache/prefixCache.js.map +0 -1
  200. package/dist/cache/responseCache.d.ts.map +0 -1
  201. package/dist/cache/responseCache.js.map +0 -1
  202. package/dist/cache/semanticCache.d.ts.map +0 -1
  203. package/dist/cache/semanticCache.js.map +0 -1
  204. package/dist/cli/setupWizard.d.ts.map +0 -1
  205. package/dist/cli/setupWizard.js.map +0 -1
  206. package/dist/cost/budgetEnforcer.d.ts.map +0 -1
  207. package/dist/cost/budgetEnforcer.js.map +0 -1
  208. package/dist/cost/costTracker.d.ts.map +0 -1
  209. package/dist/cost/costTracker.js.map +0 -1
  210. package/dist/ensemble/multiRoundDialog.js.map +0 -1
  211. package/dist/ensemble/shapleyValue.js.map +0 -1
  212. package/dist/integrations/langchainAdapter.d.ts.map +0 -1
  213. package/dist/integrations/langchainAdapter.js.map +0 -1
  214. package/dist/integrations/oauth.d.ts.map +0 -1
  215. package/dist/integrations/oauth.js.map +0 -1
  216. package/dist/integrations/scienceAdapter.js.map +0 -1
  217. package/dist/memory/autoFetch.d.ts.map +0 -1
  218. package/dist/memory/autoFetch.js.map +0 -1
  219. package/dist/memory/episodicMemory.d.ts.map +0 -1
  220. package/dist/memory/episodicMemory.js.map +0 -1
  221. package/dist/memory/hybridMemory.js.map +0 -1
  222. package/dist/memory/memoryTree.d.ts.map +0 -1
  223. package/dist/memory/memoryTree.js.map +0 -1
  224. package/dist/memory/obsidianVault.d.ts.map +0 -1
  225. package/dist/memory/obsidianVault.js.map +0 -1
  226. package/dist/memory/reasoningBank.js.map +0 -1
  227. package/dist/observability/changeWatch.d.ts.map +0 -1
  228. package/dist/observability/changeWatch.js.map +0 -1
  229. package/dist/observability/fatigueDetector.d.ts.map +0 -1
  230. package/dist/observability/fatigueDetector.js.map +0 -1
  231. package/dist/observability/index.d.ts.map +0 -1
  232. package/dist/observability/index.js.map +0 -1
  233. package/dist/observability/metrics.d.ts.map +0 -1
  234. package/dist/observability/metrics.js.map +0 -1
  235. package/dist/observability/middleware.d.ts.map +0 -1
  236. package/dist/observability/middleware.js.map +0 -1
  237. package/dist/observability/tracer.d.ts.map +0 -1
  238. package/dist/observability/tracer.js.map +0 -1
  239. package/dist/observability/types.d.ts.map +0 -1
  240. package/dist/observability/types.js.map +0 -1
  241. package/dist/orchestration/haloOrchestrator.d.ts.map +0 -1
  242. package/dist/orchestration/haloOrchestrator.js.map +0 -1
  243. package/dist/orchestration/mctsWorkflow.d.ts.map +0 -1
  244. package/dist/orchestration/mctsWorkflow.js.map +0 -1
  245. package/dist/providers/localProvider.d.ts.map +0 -1
  246. package/dist/providers/localProvider.js.map +0 -1
  247. package/dist/providers/providerConfig.d.ts.map +0 -1
  248. package/dist/providers/providerConfig.js.map +0 -1
  249. package/dist/providers/registry.d.ts.map +0 -1
  250. package/dist/providers/registry.js.map +0 -1
  251. package/dist/routing/advancedRouter.d.ts.map +0 -1
  252. package/dist/routing/advancedRouter.js.map +0 -1
  253. package/dist/routing/crossModelValidation.d.ts.map +0 -1
  254. package/dist/routing/crossModelValidation.js.map +0 -1
  255. package/dist/routing/providerHealth.d.ts.map +0 -1
  256. package/dist/routing/providerHealth.js.map +0 -1
  257. package/dist/routing/providerRetry.d.ts.map +0 -1
  258. package/dist/routing/providerRetry.js.map +0 -1
  259. package/dist/scripts/banner.js +0 -29
  260. package/dist/security/guardrails.d.ts.map +0 -1
  261. package/dist/security/guardrails.js.map +0 -1
  262. package/dist/server/dashboard.d.ts.map +0 -1
  263. package/dist/server/dashboard.js.map +0 -1
  264. package/dist/server/modelMapper.d.ts.map +0 -1
  265. package/dist/server/modelMapper.js.map +0 -1
  266. package/dist/server/proxyServer.d.ts.map +0 -1
  267. package/dist/server/proxyServer.js.map +0 -1
  268. package/dist/skills/__tests__/skill_manager.test.d.ts +0 -2
  269. package/dist/skills/__tests__/skill_manager.test.d.ts.map +0 -1
  270. package/dist/skills/__tests__/skill_manager.test.js +0 -268
  271. package/dist/skills/__tests__/skill_manager.test.js.map +0 -1
  272. package/dist/tools/tmlpdTools.d.ts.map +0 -1
  273. package/dist/tools/tmlpdTools.js.map +0 -1
  274. package/dist/tui/dashboard.d.ts.map +0 -1
  275. package/dist/tui/dashboard.js.map +0 -1
  276. package/dist/tui/index.d.ts.map +0 -1
  277. package/dist/tui/index.js.map +0 -1
  278. package/dist/utils/batchProcessor.d.ts.map +0 -1
  279. package/dist/utils/batchProcessor.js.map +0 -1
  280. package/dist/utils/compression.d.ts.map +0 -1
  281. package/dist/utils/compression.js.map +0 -1
  282. package/dist/utils/costUtils.d.ts.map +0 -1
  283. package/dist/utils/costUtils.js.map +0 -1
  284. package/dist/utils/reliability.d.ts.map +0 -1
  285. package/dist/utils/reliability.js.map +0 -1
  286. package/dist/utils/sorting.d.ts.map +0 -1
  287. package/dist/utils/sorting.js.map +0 -1
  288. package/dist/utils/speculativeDecoding.d.ts.map +0 -1
  289. package/dist/utils/speculativeDecoding.js.map +0 -1
  290. package/dist/utils/tokenUtils.d.ts.map +0 -1
  291. package/dist/utils/tokenUtils.js.map +0 -1
  292. package/docs/.nojekyll +0 -0
  293. package/docs/ANALYSIS_PRINCIPLES.md +0 -162
  294. package/docs/API.md +0 -855
  295. package/docs/ARCHITECTURAL-IMPROVEMENTS-2025.md +0 -1391
  296. package/docs/ARCHITECTURAL-IMPROVEMENTS-REVISED-2025.md +0 -1051
  297. package/docs/BENCHMARK.md +0 -170
  298. package/docs/CHINESE_PROVIDER_RELIABILITY.md +0 -37
  299. package/docs/CITATIONS.md +0 -74
  300. package/docs/CLAIMS_AND_EVIDENCE.md +0 -58
  301. package/docs/CONFIGURATION.md +0 -476
  302. package/docs/COUNCIL_DECISION.json +0 -816
  303. package/docs/COUNCIL_SUMMARY.md +0 -319
  304. package/docs/COUNCIL_V2.2_DECISION.md +0 -416
  305. package/docs/ENGINEERING_SPEC.md +0 -55
  306. package/docs/FACTORY_RESET.md +0 -34
  307. package/docs/GEO.md +0 -66
  308. package/docs/GEO_OPTIMIZATION.md +0 -30
  309. package/docs/GEO_ROOT_CAUSE.md +0 -136
  310. package/docs/GEO_STATUS.md +0 -85
  311. package/docs/GEO_TEST_RESULTS.md +0 -176
  312. package/docs/HN_CHECKLIST.md +0 -38
  313. package/docs/HN_FOUNDER_COMMENT.md +0 -17
  314. package/docs/HN_SUBMISSION_FINAL.md +0 -180
  315. package/docs/HN_SUBMISSION_V3.md +0 -56
  316. package/docs/IMPROVEMENT_ROADMAP.md +0 -515
  317. package/docs/INTEGRATIONS.md +0 -420
  318. package/docs/LANGCHAIN_INTEGRATION.md +0 -147
  319. package/docs/LLM_COUNCIL_DECISION.md +0 -508
  320. package/docs/MIDDLEWARE_CHAIN.md +0 -35
  321. package/docs/PROMO_CHECKLIST.md +0 -200
  322. package/docs/QUICKSTART.md +0 -271
  323. package/docs/QUICK_START.md +0 -43
  324. package/docs/QUICK_START_VISIBILITY.md +0 -782
  325. package/docs/REDDIT_GAP_ANALYSIS.md +0 -299
  326. package/docs/RELEASE_CHECKLIST.md +0 -32
  327. package/docs/REPRODUCIBILITY.md +0 -63
  328. package/docs/RESEARCH_BACKED_IMPROVEMENTS.md +0 -1180
  329. package/docs/ROUTING_RUBRIC.md +0 -197
  330. package/docs/SEO_AUDIT.md +0 -186
  331. package/docs/SOCIAL_LISTENING.md +0 -219
  332. package/docs/TMLPD_QNA.md +0 -751
  333. package/docs/TMLPD_V2.1_COMPLETE.md +0 -763
  334. package/docs/TMLPD_V2.2_RESEARCH_ROADMAP.md +0 -754
  335. package/docs/UPDATE_TOPICS.md +0 -15
  336. package/docs/USE_CASES.md +0 -59
  337. package/docs/V2.2_IMPLEMENTATION_COMPLETE.md +0 -446
  338. package/docs/V2_IMPLEMENTATION_GUIDE.md +0 -388
  339. package/docs/VERCEL_AI_SDK.md +0 -209
  340. package/docs/VISIBILITY_ADOPTION_PLAN.md +0 -1005
  341. package/docs/_config.yml +0 -49
  342. package/docs/ai-plugin.json +0 -16
  343. package/docs/api.html +0 -513
  344. package/docs/architecture-diagram.md +0 -40
  345. package/docs/benchmark-chart.png +0 -0
  346. package/docs/benchmark.html +0 -387
  347. package/docs/blog/routerarena-number-one.html +0 -73
  348. package/docs/cli-cheatsheet.md +0 -339
  349. package/docs/compare.md +0 -109
  350. package/docs/comparison-litellm.md +0 -88
  351. package/docs/comparison.md +0 -108
  352. package/docs/cost-chart-ascii.md +0 -42
  353. package/docs/cost-comparison-chart.svg +0 -88
  354. package/docs/curl-examples.md +0 -247
  355. package/docs/demo-auto.html +0 -264
  356. package/docs/demo.html +0 -416
  357. package/docs/geo/GENERATIVE_ENGINE_OPTIMIZATION.md +0 -232
  358. package/docs/index.html +0 -507
  359. package/docs/launch-content/LAUNCH_EXECUTION_CHECKLIST.md +0 -421
  360. package/docs/launch-content/README.md +0 -457
  361. package/docs/launch-content/assets/cost_comparison_100_tasks.png +0 -0
  362. package/docs/launch-content/assets/cumulative_savings.png +0 -0
  363. package/docs/launch-content/assets/parallel_speedup.png +0 -0
  364. package/docs/launch-content/assets/provider_pricing_comparison.png +0 -0
  365. package/docs/launch-content/assets/task_breakdown_comparison.png +0 -0
  366. package/docs/launch-content/generate_charts.py +0 -313
  367. package/docs/launch-content/hn_show_post.md +0 -139
  368. package/docs/launch-content/partner_outreach_templates.md +0 -745
  369. package/docs/launch-content/reddit_posts.md +0 -467
  370. package/docs/launch-content/twitter_thread.txt +0 -460
  371. package/docs/npm-downloads-chart.svg +0 -43
  372. package/docs/openapi.json +0 -139
  373. package/docs/openapi.yaml +0 -1318
  374. package/docs/quick-start.html +0 -366
  375. package/docs/robots.txt +0 -52
  376. package/docs/sitemap.xml +0 -57
  377. package/docs/styles.css +0 -682
  378. package/docs/well-known/ai-plugin.json +0 -16
  379. package/docs/wellknown/ai-plugin.json +0 -16
  380. package/docs-site/assets/og-banner.svg +0 -194
  381. package/docs-site/index.html +0 -632
  382. package/eval/README.md +0 -46
  383. package/eval/baselines/main.json +0 -12
  384. package/eval/benchmark_dataset.jsonl +0 -16
  385. package/eval/check_golden_routes.js +0 -64
  386. package/eval/datasets/catalog.json +0 -33
  387. package/eval/datasets/slices/cn_provider_reliability_v1.jsonl +0 -3
  388. package/eval/datasets/slices/cost_pressure_v1.jsonl +0 -3
  389. package/eval/datasets/slices/safety_guardrails_v1.jsonl +0 -3
  390. package/eval/evals.json +0 -199
  391. package/eval/fault_injection_thresholds.json +0 -3
  392. package/eval/generate_report.js +0 -128
  393. package/eval/golden_routes.json +0 -114
  394. package/eval/lib/experiment_registry.js +0 -24
  395. package/eval/run_eval.js +0 -197
  396. package/eval/run_fault_injection.js +0 -201
  397. package/eval/run_shadow_eval.js +0 -85
  398. package/eval/thresholds.json +0 -9
  399. package/examples/QUICKSTART.md +0 -183
  400. package/examples/README.md +0 -61
  401. package/examples/a3m-sdk.js +0 -124
  402. package/examples/basic-route.js +0 -54
  403. package/examples/chat-loop.js +0 -202
  404. package/examples/classify-then-route.js +0 -102
  405. package/examples/cost-compare.js +0 -120
  406. package/examples/ensemble.js +0 -160
  407. package/examples/whatsapp-telegram-bridge-demo.js +0 -302
  408. package/examples/whatsapp-telegram-bridge.js +0 -269
  409. package/hf-space/README.md +0 -23
  410. package/hf-space/app.py +0 -240
  411. package/hf-space/requirements.txt +0 -1
  412. package/huggingface_space/README.md +0 -35
  413. package/huggingface_space/app.py +0 -126
  414. package/huggingface_space/create_space.py +0 -208
  415. package/huggingface_space/requirements.txt +0 -1
  416. package/mcp-server/README.md +0 -188
  417. package/mcp-server/package.json +0 -29
  418. package/mcp-server/src/index.ts +0 -744
  419. package/mcp-server/tsconfig.json +0 -19
  420. package/openclaw-alexa-bridge/ALL_REMAINING_FIXES_PLAN.md +0 -313
  421. package/openclaw-alexa-bridge/REMAINING_FIXES_SUMMARY.md +0 -277
  422. package/openclaw-alexa-bridge/src/alexa_handler_no_tmlpd.js +0 -1234
  423. package/openclaw-alexa-bridge/test_fixes.js +0 -77
  424. package/playground/README.md +0 -51
  425. package/playground/codesandbox.json +0 -12
  426. package/playground/index.js +0 -39
  427. package/proxy/README.md +0 -227
  428. package/proxy/package-lock.json +0 -831
  429. package/proxy/package.json +0 -17
  430. package/proxy/rate-limit.js +0 -145
  431. package/proxy/rate-limit.test.js +0 -311
  432. package/proxy/server.js +0 -970
  433. package/python/README.md +0 -102
  434. package/python/a3m/__init__.py +0 -6
  435. package/python/a3m/client.py +0 -190
  436. package/python/a3m/models.py +0 -40
  437. package/python/a3m/sync_client.py +0 -61
  438. package/python/examples.py +0 -53
  439. package/python/integrations.py +0 -330
  440. package/python/pyproject.toml +0 -23
  441. package/python/setup.py +0 -28
  442. package/python/tmlpd.py +0 -369
  443. package/qna/REDDIT_GAP_ANALYSIS.md +0 -299
  444. package/qna/TMLPD_QNA.md +0 -751
  445. package/research/FINDING_001_safety.md +0 -28
  446. package/research/FINDING_002_error_diversity.md +0 -32
  447. package/research/FINDING_003_confidence_weighted_voting.md +0 -32
  448. package/research/FINDING_004_cross_model_semantic_detection.md +0 -37
  449. package/research/FINDING_005_knowledge_gap_orthogonality.md +0 -34
  450. package/research/HALLUCINATION_RESEARCH.md +0 -27
  451. package/research/ensemble-voting.md +0 -324
  452. package/research/loss-functions.md +0 -545
  453. package/research-log.md +0 -49
  454. package/scripts/banner.js +0 -29
  455. package/scripts/benchmark-local-routerarena.ts +0 -176
  456. package/scripts/benchmark.js +0 -145
  457. package/scripts/benchmark.sh +0 -61
  458. package/scripts/compare-providers.sh +0 -230
  459. package/scripts/content-planner.js +0 -25
  460. package/scripts/create-labeled-benchmark.ts +0 -105
  461. package/scripts/cross_post.py +0 -443
  462. package/scripts/local-router-benchmark.ts +0 -154
  463. package/scripts/post-all.sh +0 -41
  464. package/scripts/publish_fcc.py +0 -106
  465. package/scripts/push-to-gitee.sh +0 -25
  466. package/scripts/routerarena_ensemble.js +0 -144
  467. package/scripts/routing-benchmark-v2.js +0 -373
  468. package/scripts/routing-benchmark-v3.js +0 -118
  469. package/scripts/routing-benchmark.js +0 -462
  470. package/scripts/run-labeled-benchmark.mjs +0 -104
  471. package/scripts/run-mmlu-benchmark.js +0 -176
  472. package/scripts/run-provider-benchmark.js +0 -244
  473. package/scripts/update-npm-badges.js +0 -158
  474. package/skill/SKILL.md +0 -238
  475. package/src/__tests__/integration/tmpld_integration.test.py +0 -540
  476. package/src/skills/__tests__/skill_manager.test.ts +0 -328
  477. package/submissions/benchmarks/ALL_PLATFORMS_SUBMISSION.md +0 -94
  478. package/submissions/benchmarks/LLMROUTERBENCH_SUBMISSION.md +0 -121
  479. package/submissions/benchmarks/MMRBENCH_SUBMISSION.md +0 -94
  480. package/submissions/benchmarks/ROUTERARENA_UPDATE.md +0 -83
  481. package/submissions/benchmarks/ROUTERBENCH_SUBMISSION.md +0 -225
  482. package/test-council/1-structure-tests.test.js +0 -353
  483. package/test-council/1-structure-tests.test.ts +0 -353
  484. package/test-council/2-edge-case-tests.test.ts +0 -361
  485. package/test-council/3-performance-tests.test.ts +0 -669
  486. package/test-council/4-integration-tests.test.ts +0 -391
  487. package/test-council/5-agent-council-eval.test.ts +0 -413
  488. package/test-council/AGENT_COUNCIL_ARCHITECTURE.md +0 -349
  489. package/test-council/TEST_COUNCIL_REPORT.md +0 -201
  490. package/test-council/agents/edge-case-agent.ts +0 -363
  491. package/test-council/agents/performance-agent.ts +0 -426
  492. package/test-council/agents/structure-agent.ts +0 -227
  493. package/test-council/council.md +0 -183
  494. package/tests/__mocks__/tokenUtils.ts +0 -8
  495. package/tests/memory/episodicMemory.test.ts +0 -227
  496. package/tests/package-lock.json +0 -1628
  497. package/tests/package.json +0 -18
  498. package/tests/routing/ensembleVoting.test.ts +0 -236
  499. package/tests/routing/providerRetry.test.ts +0 -360
  500. package/tests/routing/queryTypePresets.test.ts +0 -208
  501. package/tests/security/guardrailEngine.test.ts +0 -700
  502. package/tests/tsconfig.json +0 -21
  503. package/tests/vitest.config.ts +0 -18
  504. package/tmlpd-pi-extension/README.md +0 -66
  505. package/tmlpd-pi-extension/dist/cache/prefixCache.d.ts +0 -114
  506. package/tmlpd-pi-extension/dist/cache/prefixCache.d.ts.map +0 -1
  507. package/tmlpd-pi-extension/dist/cache/prefixCache.js +0 -285
  508. package/tmlpd-pi-extension/dist/cache/prefixCache.js.map +0 -1
  509. package/tmlpd-pi-extension/dist/cache/responseCache.d.ts +0 -58
  510. package/tmlpd-pi-extension/dist/cache/responseCache.d.ts.map +0 -1
  511. package/tmlpd-pi-extension/dist/cache/responseCache.js +0 -153
  512. package/tmlpd-pi-extension/dist/cache/responseCache.js.map +0 -1
  513. package/tmlpd-pi-extension/dist/cli.js +0 -59
  514. package/tmlpd-pi-extension/dist/cost/costTracker.d.ts +0 -95
  515. package/tmlpd-pi-extension/dist/cost/costTracker.d.ts.map +0 -1
  516. package/tmlpd-pi-extension/dist/cost/costTracker.js +0 -240
  517. package/tmlpd-pi-extension/dist/cost/costTracker.js.map +0 -1
  518. package/tmlpd-pi-extension/dist/index.d.ts +0 -723
  519. package/tmlpd-pi-extension/dist/index.d.ts.map +0 -1
  520. package/tmlpd-pi-extension/dist/index.js +0 -239
  521. package/tmlpd-pi-extension/dist/index.js.map +0 -1
  522. package/tmlpd-pi-extension/dist/memory/episodicMemory.d.ts +0 -82
  523. package/tmlpd-pi-extension/dist/memory/episodicMemory.d.ts.map +0 -1
  524. package/tmlpd-pi-extension/dist/memory/episodicMemory.js +0 -145
  525. package/tmlpd-pi-extension/dist/memory/episodicMemory.js.map +0 -1
  526. package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.d.ts +0 -102
  527. package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.d.ts.map +0 -1
  528. package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.js +0 -207
  529. package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.js.map +0 -1
  530. package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.d.ts +0 -85
  531. package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.d.ts.map +0 -1
  532. package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.js +0 -210
  533. package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.js.map +0 -1
  534. package/tmlpd-pi-extension/dist/providers/localProvider.d.ts +0 -102
  535. package/tmlpd-pi-extension/dist/providers/localProvider.d.ts.map +0 -1
  536. package/tmlpd-pi-extension/dist/providers/localProvider.js +0 -338
  537. package/tmlpd-pi-extension/dist/providers/localProvider.js.map +0 -1
  538. package/tmlpd-pi-extension/dist/providers/registry.d.ts +0 -55
  539. package/tmlpd-pi-extension/dist/providers/registry.d.ts.map +0 -1
  540. package/tmlpd-pi-extension/dist/providers/registry.js +0 -138
  541. package/tmlpd-pi-extension/dist/providers/registry.js.map +0 -1
  542. package/tmlpd-pi-extension/dist/routing/advancedRouter.d.ts +0 -68
  543. package/tmlpd-pi-extension/dist/routing/advancedRouter.d.ts.map +0 -1
  544. package/tmlpd-pi-extension/dist/routing/advancedRouter.js +0 -332
  545. package/tmlpd-pi-extension/dist/routing/advancedRouter.js.map +0 -1
  546. package/tmlpd-pi-extension/dist/tools/tmlpdTools.d.ts +0 -101
  547. package/tmlpd-pi-extension/dist/tools/tmlpdTools.d.ts.map +0 -1
  548. package/tmlpd-pi-extension/dist/tools/tmlpdTools.js +0 -368
  549. package/tmlpd-pi-extension/dist/tools/tmlpdTools.js.map +0 -1
  550. package/tmlpd-pi-extension/dist/utils/batchProcessor.d.ts +0 -96
  551. package/tmlpd-pi-extension/dist/utils/batchProcessor.d.ts.map +0 -1
  552. package/tmlpd-pi-extension/dist/utils/batchProcessor.js +0 -170
  553. package/tmlpd-pi-extension/dist/utils/batchProcessor.js.map +0 -1
  554. package/tmlpd-pi-extension/dist/utils/compression.d.ts +0 -61
  555. package/tmlpd-pi-extension/dist/utils/compression.d.ts.map +0 -1
  556. package/tmlpd-pi-extension/dist/utils/compression.js +0 -281
  557. package/tmlpd-pi-extension/dist/utils/compression.js.map +0 -1
  558. package/tmlpd-pi-extension/dist/utils/reliability.d.ts +0 -74
  559. package/tmlpd-pi-extension/dist/utils/reliability.d.ts.map +0 -1
  560. package/tmlpd-pi-extension/dist/utils/reliability.js +0 -177
  561. package/tmlpd-pi-extension/dist/utils/reliability.js.map +0 -1
  562. package/tmlpd-pi-extension/dist/utils/speculativeDecoding.d.ts +0 -117
  563. package/tmlpd-pi-extension/dist/utils/speculativeDecoding.d.ts.map +0 -1
  564. package/tmlpd-pi-extension/dist/utils/speculativeDecoding.js +0 -246
  565. package/tmlpd-pi-extension/dist/utils/speculativeDecoding.js.map +0 -1
  566. package/tmlpd-pi-extension/dist/utils/tokenUtils.d.ts +0 -50
  567. package/tmlpd-pi-extension/dist/utils/tokenUtils.d.ts.map +0 -1
  568. package/tmlpd-pi-extension/dist/utils/tokenUtils.js +0 -124
  569. package/tmlpd-pi-extension/dist/utils/tokenUtils.js.map +0 -1
  570. package/tmlpd-pi-extension/examples/QUICKSTART.md +0 -183
  571. package/tmlpd-pi-extension/package-lock.json +0 -79
  572. package/tmlpd-pi-extension/package.json +0 -172
  573. package/tmlpd-pi-extension/python/examples.py +0 -53
  574. package/tmlpd-pi-extension/python/integrations.py +0 -330
  575. package/tmlpd-pi-extension/python/setup.py +0 -28
  576. package/tmlpd-pi-extension/python/tmlpd.py +0 -369
  577. package/tmlpd-pi-extension/qna/REDDIT_GAP_ANALYSIS.md +0 -299
  578. package/tmlpd-pi-extension/qna/TMLPD_QNA.md +0 -751
  579. package/tmlpd-pi-extension/skill/SKILL.md +0 -238
  580. package/tmlpd-pi-extension/src/cache/responseCache.ts +0 -147
  581. package/tmlpd-pi-extension/src/cost/costTracker.ts +0 -302
  582. package/tmlpd-pi-extension/src/index.ts +0 -232
  583. package/tmlpd-pi-extension/src/memory/episodicMemory.ts +0 -257
  584. package/tmlpd-pi-extension/src/orchestration/haloOrchestrator.ts +0 -266
  585. package/tmlpd-pi-extension/src/orchestration/mctsWorkflow.ts +0 -262
  586. package/tmlpd-pi-extension/src/providers/localProvider.ts +0 -406
  587. package/tmlpd-pi-extension/src/providers/registry.ts +0 -164
  588. package/tmlpd-pi-extension/src/routing/ensembleVoting.ts +0 -159
  589. package/tmlpd-pi-extension/src/routing/queryTypePresets.ts +0 -136
  590. package/tmlpd-pi-extension/src/tools/tmlpdTools.ts +0 -433
  591. package/tmlpd-pi-extension/src/utils/batchProcessor.ts +0 -232
  592. package/tmlpd-pi-extension/src/utils/compression.ts +0 -325
  593. package/tmlpd-pi-extension/src/utils/reliability.ts +0 -221
  594. package/tmlpd-pi-extension/src/utils/tokenUtils.ts +0 -145
  595. package/tmlpd-pi-extension/tsconfig.json +0 -18
  596. package/tsconfig.build.json +0 -29
  597. package/tsconfig.json +0 -18
  598. /package/{docs/llms-full.txt → llms-full.txt.bak} +0 -0
@@ -1,325 +0,0 @@
1
- /**
2
- * TMLPD Context Compression Utilities
3
- *
4
- * Strategies for reducing context window usage:
5
- * - Smart truncation
6
- * - Message summarization
7
- * - ISON-style encoding (inspired by Reddit ISON format)
8
- * - Context window management
9
- */
10
-
11
- export interface Message {
12
- role: "system" | "user" | "assistant";
13
- content: string;
14
- name?: string;
15
- tool_calls?: any[];
16
- tool_call_id?: string;
17
- }
18
-
19
- export type CompressionStrategy = "smart" | "first" | "last" | "isentropy";
20
-
21
- /**
22
- * ISON (Intelligence-Sparse Object Notation)
23
- *
24
- * A compression format that reduces token count by:
25
- * - Removing redundant whitespace
26
- * - Shortening common phrases
27
- * - Using abbreviations strategically
28
- *
29
- * Example: "The quick brown fox jumps over the lazy dog"
30
- * → "quick brown fox jumps lazy dog" (removes articles, repeated words)
31
- */
32
-
33
- const ISON_REPLACEMENTS: Array<[RegExp, string]> = [
34
- // Common phrase abbreviations
35
- [/\bthe\b/g, ""],
36
- [/\ba\b/g, ""],
37
- [/\ban\b/g, ""],
38
- [/\bthat\b/g, "that"],
39
- [/\bthis\b/g, "this"],
40
- [/\bwith\b/g, "w/"],
41
- [/\bwithout\b/g, "w/o"],
42
- [/\band\b/g, "&"],
43
- [/\bor\b/g, "|"],
44
- [/\bfor\b/g, "4"],
45
- [/\bto\b/g, "2"],
46
- [/\binto\b/g, "2"],
47
- [/\bfrom\b/g, "fr"],
48
- [/\bplease\b/gi, ""],
49
- [/\bthank you\b/gi, "thx"],
50
- [/\byou are\b/gi, "u r"],
51
- [/\byou can\b/gi, "u c"],
52
- [/\bcan you\b/gi, "c?"],
53
- [/\bhow do\b/gi, "how 2"],
54
- [/\bwhat is\b/gi, "wat"],
55
- [/\bwhat are\b/gi, "wat"],
56
-
57
- // Whitespace normalization
58
- [/\s+/g, " "],
59
- [/^\s+|\s+$/g, ""],
60
-
61
- // Remove repeated characters
62
- [/(\w)\1{2,}/g, "$1$1"],
63
-
64
- // Shorten common technical terms
65
- [/\binformation\b/gi, "info"],
66
- [/\bprocessing\b/gi, "proc"],
67
- [/\bdevelopment\b/gi, "dev"],
68
- [/\bapplication\b/gi, "app"],
69
- [/\bconfiguration\b/gi, "config"],
70
- [/\brepresentation\b/gi, "repr"],
71
- [/\bunderstanding\b/gi, "unders"],
72
- [/\brecommendation\b/gi, "rec"],
73
- ];
74
-
75
- const ISON_UNREPLACEMENTS: Array<[RegExp, string]> = [
76
- [/w\//g, "with "],
77
- [/w\/o/g, "without "],
78
- [/&/g, " and "],
79
- [/\b4\b/g, " for "],
80
- [/\b2\b/g, " to "],
81
- [/\bfr\b/g, "from "],
82
- [/\bthx\b/gi, "thank you"],
83
- [/\bu r\b/gi, "you are"],
84
- [/\bu c\b/gi, "you can"],
85
- [/\bc\?\b/g, "can you"],
86
- [/how 2\b/gi, "how do"],
87
- [/\bwat\b/g, "what is"],
88
- ];
89
-
90
- export interface CompressionResult {
91
- original_tokens: number;
92
- compressed_tokens: number;
93
- ratio: number;
94
- compressed_text: string;
95
- }
96
-
97
- /**
98
- * ISON encode text for token reduction.
99
- */
100
- export function isonEncode(text: string): string {
101
- let result = text;
102
-
103
- // Apply replacements
104
- for (const [pattern, replacement] of ISON_REPLACEMENTS) {
105
- result = result.replace(pattern, replacement);
106
- }
107
-
108
- // Remove extra spaces and trim
109
- result = result.replace(/\s+/g, " ").trim();
110
-
111
- return result;
112
- }
113
-
114
- /**
115
- * Decode ISON encoded text.
116
- */
117
- export function isonDecode(text: string): string {
118
- let result = text;
119
-
120
- // Apply un-replacements
121
- for (const [pattern, replacement] of ISON_UNREPLACEMENTS) {
122
- result = result.replace(pattern, replacement);
123
- }
124
-
125
- return result;
126
- }
127
-
128
- /**
129
- * Compress text using ISON encoding.
130
- */
131
- export function compressText(text: string): CompressionResult {
132
- const original_tokens = estimateTokens(text);
133
- const compressed = isonEncode(text);
134
- const compressed_tokens = estimateTokens(compressed);
135
-
136
- return {
137
- original_tokens,
138
- compressed_tokens,
139
- ratio: compressed_tokens / original_tokens,
140
- compressed_text: compressed
141
- };
142
- }
143
-
144
- /**
145
- * Estimate tokens (fallback if no model specified).
146
- */
147
- function estimateTokens(text: string): number {
148
- const words = text.trim().split(/\s+/).filter(w => w.length > 0);
149
- return Math.ceil(words.length * 1.3);
150
- }
151
-
152
- /**
153
- * Truncate messages to fit within token budget.
154
- *
155
- * @param messages - Conversation messages
156
- * @param max_tokens - Maximum tokens allowed
157
- * @param strategy - "smart" (preserve system + recent), "first" (keep start), "last" (keep end)
158
- */
159
- export function truncateMessages(
160
- messages: Message[],
161
- max_tokens: number,
162
- strategy: CompressionStrategy = "smart"
163
- ): Message[] {
164
- if (!messages || messages.length === 0) return [];
165
-
166
- // Calculate total tokens
167
- const totalTokens = (msg: Message) => {
168
- const content = typeof msg.content === 'string' ? msg.content : JSON.stringify(msg.content);
169
- return estimateTokens(content) + 4; // +4 for role/format overhead
170
- };
171
-
172
- let currentTokens = messages.reduce((sum, m) => sum + totalTokens(m), 0);
173
-
174
- if (currentTokens <= max_tokens) {
175
- return messages; // Already fits
176
- }
177
-
178
- const result: Message[] = [];
179
-
180
- if (strategy === "first") {
181
- // Keep system (first) messages, truncate from middle
182
- let keepTokens = 0;
183
- for (const msg of messages) {
184
- const msgTokens = totalTokens(msg);
185
- if (keepTokens + msgTokens <= max_tokens) {
186
- result.push(msg);
187
- keepTokens += msgTokens;
188
- } else if (msg.role === "system" && result.length === 0) {
189
- // Always keep system message, possibly truncated
190
- const systemContent = typeof msg.content === 'string' ? msg.content : "";
191
- const truncated = truncateToTokenBudget(systemContent, max_tokens - 4);
192
- result.push({ ...msg, content: truncated });
193
- break;
194
- } else {
195
- break;
196
- }
197
- }
198
- } else if (strategy === "last") {
199
- // Keep only most recent messages
200
- for (let i = messages.length - 1; i >= 0; i--) {
201
- const msg = messages[i];
202
- const msgTokens = totalTokens(msg);
203
-
204
- if (currentTokens - msgTokens <= max_tokens) {
205
- result.unshift(msg);
206
- currentTokens -= msgTokens;
207
- } else if (msg.role === "user") {
208
- // Try to keep a truncated user message
209
- const truncated = truncateToTokenBudget(msg.content as string, max_tokens - currentTokens);
210
- if (truncated.length > 20) {
211
- result.unshift({ ...msg, content: truncated });
212
- }
213
- break;
214
- }
215
- }
216
- } else if (strategy === "smart") {
217
- // Keep system, compress middle, keep recent
218
- const systemMessages: Message[] = [];
219
- const middleMessages: Message[] = [];
220
- const recentMessages: Message[] = [];
221
-
222
- for (const msg of messages) {
223
- if (msg.role === "system") {
224
- systemMessages.push(msg);
225
- } else if (messages.indexOf(msg) >= messages.length - 3) {
226
- recentMessages.push(msg);
227
- } else {
228
- middleMessages.push(msg);
229
- }
230
- }
231
-
232
- // Start with system
233
- for (const msg of systemMessages) {
234
- const msgTokens = totalTokens(msg);
235
- if (currentTokens <= max_tokens) {
236
- result.push(msg);
237
- currentTokens -= msgTokens;
238
- } else {
239
- // Truncate system message
240
- const truncated = truncateToTokenBudget(msg.content as string, max_tokens - currentTokens - 10);
241
- result.push({ ...msg, content: truncated });
242
- currentTokens = max_tokens;
243
- break;
244
- }
245
- }
246
-
247
- // Add compressed middle
248
- if (currentTokens > max_tokens / 2 && middleMessages.length > 0) {
249
- // Compress middle messages into a summary
250
- const middleContent = middleMessages
251
- .map(m => m.content)
252
- .join("\n");
253
- const summaryTokenBudget = Math.min(
254
- max_tokens / 4,
255
- max_tokens - currentTokens
256
- );
257
- const summary = truncateToTokenBudget(
258
- `[Previous ${middleMessages.length} messages]: ${middleContent}`,
259
- summaryTokenBudget
260
- );
261
- result.push({ role: "assistant", content: summary });
262
- currentTokens -= estimateTokens(summary);
263
- }
264
-
265
- // Add recent messages if room
266
- for (const msg of recentMessages) {
267
- const msgTokens = totalTokens(msg);
268
- if (currentTokens + msgTokens <= max_tokens) {
269
- result.push(msg);
270
- currentTokens += msgTokens;
271
- }
272
- }
273
- }
274
-
275
- return result;
276
- }
277
-
278
- /**
279
- * Truncate a single string to fit within token budget.
280
- */
281
- export function truncateToTokenBudget(text: string, max_tokens: number): string {
282
- const words = text.split(/\s+/);
283
- let current = 0;
284
- const targetWords: string[] = [];
285
-
286
- for (const word of words) {
287
- const wordTokens = estimateTokens(word);
288
- if (current + wordTokens <= max_tokens) {
289
- targetWords.push(word);
290
- current += wordTokens;
291
- } else {
292
- break;
293
- }
294
- }
295
-
296
- let result = targetWords.join(" ");
297
-
298
- // If we truncated, add ellipsis
299
- if (result.length < text.length) {
300
- result += "...";
301
- }
302
-
303
- return result;
304
- }
305
-
306
- /**
307
- * Calculate compression ratio for context.
308
- */
309
- export function calculateCompressionRatio(messages: Message[], max_tokens: number): number {
310
- const totalTokens = messages.reduce((sum, m) => {
311
- const content = typeof m.content === 'string' ? m.content : JSON.stringify(m.content);
312
- return sum + estimateTokens(content) + 4;
313
- }, 0);
314
-
315
- return Math.min(1, max_tokens / totalTokens);
316
- }
317
-
318
- export default {
319
- isonEncode,
320
- isonDecode,
321
- compressText,
322
- truncateMessages,
323
- truncateToTokenBudget,
324
- calculateCompressionRatio
325
- };
@@ -1,221 +0,0 @@
1
- /**
2
- * TMLPD Reliability Engine
3
- *
4
- * Circuit breaker, retry with jitter, and enhanced cooldown logic.
5
- * Designed to handle flaky API calls gracefully.
6
- */
7
-
8
- export interface RetryConfig {
9
- max_attempts: number;
10
- base_delay_ms: number;
11
- max_delay_ms: number;
12
- jitter: number; // 0-1, percentage of delay to randomize
13
- retryable_status_codes: number[];
14
- }
15
-
16
- export interface CircuitBreakerConfig {
17
- failure_threshold: number;
18
- recovery_timeout_ms: number;
19
- half_open_max_calls: number;
20
- }
21
-
22
- export interface CircuitState {
23
- status: "closed" | "open" | "half_open";
24
- failure_count: number;
25
- last_failure_time: number | null;
26
- last_success_time: number | null;
27
- consecutive_successes: number;
28
- }
29
-
30
- export const DEFAULT_RETRY_CONFIG: RetryConfig = {
31
- max_attempts: 3,
32
- base_delay_ms: 500,
33
- max_delay_ms: 30000,
34
- jitter: 0.3,
35
- retryable_status_codes: [408, 429, 500, 502, 503, 504],
36
- };
37
-
38
- export const DEFAULT_CIRCUIT_BREAKER_CONFIG: CircuitBreakerConfig = {
39
- failure_threshold: 5,
40
- recovery_timeout_ms: 60000,
41
- half_open_max_calls: 3,
42
- };
43
-
44
- /**
45
- * Calculate delay with exponential backoff and jitter
46
- */
47
- export function calculateRetryDelay(
48
- attempt: number,
49
- config: RetryConfig = DEFAULT_RETRY_CONFIG
50
- ): number {
51
- // Exponential backoff
52
- const exponential_delay = config.base_delay_ms * Math.pow(2, attempt - 1);
53
-
54
- // Cap at max delay
55
- const capped_delay = Math.min(exponential_delay, config.max_delay_ms);
56
-
57
- // Add jitter
58
- const jitter_range = capped_delay * config.jitter;
59
- const jitter = (Math.random() * 2 - 1) * jitter_range;
60
-
61
- return Math.round(capped_delay + jitter);
62
- }
63
-
64
- /**
65
- * Check if status code is retryable
66
- */
67
- export function isRetryableStatus(statusCode: number | null, config: RetryConfig = DEFAULT_RETRY_CONFIG): boolean {
68
- if (statusCode === null) return true; // Network errors are retryable
69
- return config.retryable_status_codes.includes(statusCode);
70
- }
71
-
72
- /**
73
- * Circuit Breaker implementation
74
- */
75
- export class CircuitBreaker {
76
- private config: CircuitBreakerConfig;
77
- private state: CircuitState;
78
- private half_open_calls = 0;
79
-
80
- constructor(config: Partial<CircuitBreakerConfig> = {}) {
81
- this.config = { ...DEFAULT_CIRCUIT_BREAKER_CONFIG, ...config };
82
- this.state = {
83
- status: "closed",
84
- failure_count: 0,
85
- last_failure_time: null,
86
- last_success_time: null,
87
- consecutive_successes: 0,
88
- };
89
- }
90
-
91
- /**
92
- * Check if circuit allows requests
93
- */
94
- canExecute(): boolean {
95
- if (this.state.status === "closed") return true;
96
-
97
- if (this.state.status === "open") {
98
- // Check if recovery timeout has passed
99
- if (this.state.last_failure_time && Date.now() - this.state.last_failure_time >= this.config.recovery_timeout_ms) {
100
- this.state.status = "half_open";
101
- this.half_open_calls = 0;
102
- return true;
103
- }
104
- return false;
105
- }
106
-
107
- // half_open
108
- return this.half_open_calls < this.config.half_open_max_calls;
109
- }
110
-
111
- /**
112
- * Record a successful execution
113
- */
114
- recordSuccess(): void {
115
- this.state.last_success_time = Date.now();
116
- this.half_open_calls++;
117
-
118
- if (this.state.status === "half_open") {
119
- this.state.consecutive_successes++;
120
- if (this.state.consecutive_successes >= this.config.half_open_max_calls) {
121
- // Circuit recovered
122
- this.state.status = "closed";
123
- this.state.failure_count = 0;
124
- this.state.consecutive_successes = 0;
125
- }
126
- } else {
127
- this.state.failure_count = 0;
128
- }
129
- }
130
-
131
- /**
132
- * Record a failed execution
133
- */
134
- recordFailure(): void {
135
- this.state.last_failure_time = Date.now();
136
- this.state.failure_count++;
137
- this.state.consecutive_successes = 0;
138
-
139
- if (this.state.status === "half_open") {
140
- // Trip circuit back open
141
- this.state.status = "open";
142
- } else if (this.state.failure_count >= this.config.failure_threshold) {
143
- this.state.status = "open";
144
- }
145
- }
146
-
147
- /**
148
- * Get current circuit state
149
- */
150
- getState(): CircuitState {
151
- return { ...this.state };
152
- }
153
-
154
- /**
155
- * Force reset circuit
156
- */
157
- reset(): void {
158
- this.state = {
159
- status: "closed",
160
- failure_count: 0,
161
- last_failure_time: null,
162
- last_success_time: null,
163
- consecutive_successes: 0,
164
- };
165
- this.half_open_calls = 0;
166
- }
167
- }
168
-
169
- /**
170
- * Enhanced retry wrapper with circuit breaker integration
171
- */
172
- export async function withRetry<T>(
173
- fn: () => Promise<T>,
174
- config: Partial<RetryConfig> = {},
175
- circuitBreaker?: CircuitBreaker
176
- ): Promise<{ result: T | null; error: Error | null; attempts: number; circuit_tripped: boolean }> {
177
- const retryConfig = { ...DEFAULT_RETRY_CONFIG, ...config };
178
- let lastError: Error | null = null;
179
- let attempts = 0;
180
- let circuit_tripped = false;
181
-
182
- for (let i = 0; i < retryConfig.max_attempts; i++) {
183
- attempts++;
184
-
185
- try {
186
- // Check circuit breaker before attempt
187
- if (circuitBreaker && !circuitBreaker.canExecute()) {
188
- circuit_tripped = true;
189
- throw new Error("Circuit breaker is open");
190
- }
191
-
192
- const result = await fn();
193
-
194
- if (circuitBreaker) {
195
- circuitBreaker.recordSuccess();
196
- }
197
-
198
- return { result, error: null, attempts, circuit_tripped };
199
- } catch (error) {
200
- lastError = error instanceof Error ? error : new Error(String(error));
201
-
202
- // Check if should retry
203
- const statusCode = (error as any).statusCode || (error as any).response?.statusCode || null;
204
- if (!isRetryableStatus(statusCode, retryConfig)) {
205
- return { result: null, error: lastError, attempts, circuit_tripped };
206
- }
207
-
208
- if (circuitBreaker) {
209
- circuitBreaker.recordFailure();
210
- }
211
-
212
- // Don't wait after last attempt
213
- if (i < retryConfig.max_attempts - 1) {
214
- const delay = calculateRetryDelay(i + 1, retryConfig);
215
- await new Promise((resolve) => setTimeout(resolve, delay));
216
- }
217
- }
218
- }
219
-
220
- return { result: null, error: lastError, attempts, circuit_tripped };
221
- }
@@ -1,145 +0,0 @@
1
- /**
2
- * TMLPD Token Utilities
3
- *
4
- * Token counting, cost estimation, and context management.
5
- */
6
-
7
- export interface TokenCost {
8
- input_per_1k: number;
9
- output_per_1k: number;
10
- }
11
-
12
- // Current provider rates (2024-2025)
13
- export const MODEL_COSTS: Record<string, TokenCost> = {
14
- // OpenAI
15
- "gpt-4o": { input_per_1k: 2.50, output_per_1k: 10.00 },
16
- "gpt-4o-mini": { input_per_1k: 0.15, output_per_1k: 0.60 },
17
- "gpt-4-turbo": { input_per_1k: 10.00, output_per_1k: 30.00 },
18
- "gpt-3.5-turbo": { input_per_1k: 0.50, output_per_1k: 1.50 },
19
-
20
- // Anthropic
21
- "claude-3.5-sonnet": { input_per_1k: 3.00, output_per_1k: 15.00 },
22
- "claude-3-opus": { input_per_1k: 15.00, output_per_1k: 75.00 },
23
- "claude-3-haiku": { input_per_1k: 0.25, output_per_1k: 1.25 },
24
-
25
- // Google
26
- "gemini-2.0-flash": { input_per_1k: 0.00, output_per_1k: 0.00 }, // Free
27
- "gemini-1.5-pro": { input_per_1k: 1.25, output_per_1k: 5.00 },
28
- "gemini-1.5-flash": { input_per_1k: 0.075, output_per_1k: 0.30 },
29
-
30
- // Groq
31
- "groq/llama-3.3-70b": { input_per_1k: 0.59, output_per_1k: 0.79 },
32
- "groq/llama-3.1-8b": { input_per_1k: 0.05, output_per_1k: 0.08 },
33
-
34
- // Cerebras
35
- "cerebras/llama-3.3-70b": { input_per_1k: 0.60, output_per_1k: 0.60 },
36
-
37
- // Mistral
38
- "mistral-large": { input_per_1k: 2.00, output_per_1k: 6.00 },
39
- "mistral-small": { input_per_1k: 0.20, output_per_1k: 0.60 },
40
- };
41
-
42
- /**
43
- * Count tokens in text (approximate for English).
44
- * Based on ~1.3 tokens per word for typical English text.
45
- */
46
- export function countTokens(text: string, model: string = "gpt-4o"): number {
47
- if (!text || text.length === 0) return 0;
48
-
49
- // Use model-specific approximation if available
50
- // Otherwise use generic word-based estimate
51
- const words = text.trim().split(/\s+/).length;
52
-
53
- // Fine-tune based on model family
54
- if (model.includes("claude")) {
55
- // Anthropic models: ~1.5 tokens per word
56
- return Math.ceil(words * 1.5);
57
- } else if (model.includes("gemini")) {
58
- // Google: ~1.2 tokens per word (SentencePiece)
59
- return Math.ceil(words * 1.2);
60
- } else if (model.includes("llama")) {
61
- // Llama: ~1.4 tokens per word (BPE)
62
- return Math.ceil(words * 1.4);
63
- }
64
-
65
- // Default: ~1.3 tokens per word (GPT-4 average)
66
- return Math.ceil(words * 1.3);
67
- }
68
-
69
- /**
70
- * Estimate cost for a prompt/completion pair.
71
- */
72
- export function estimateCost(
73
- prompt_tokens: number,
74
- completion_tokens: number,
75
- model: string
76
- ): number {
77
- const costs = MODEL_COSTS[model] || MODEL_COSTS["gpt-4o"];
78
-
79
- const input_cost = (prompt_tokens / 1000) * costs.input_per_1k;
80
- const output_cost = (completion_tokens / 1000) * costs.output_per_1k;
81
-
82
- return input_cost + output_cost;
83
- }
84
-
85
- /**
86
- * Estimate cost from raw text (approximates both prompt and completion).
87
- */
88
- export function estimateCostFromText(
89
- prompt: string,
90
- completion: string,
91
- model: string
92
- ): number {
93
- const prompt_tokens = countTokens(prompt, model);
94
- // Completion typically has higher token density
95
- const completion_tokens = Math.ceil(countTokens(completion, model) * 1.2);
96
-
97
- return estimateCost(prompt_tokens, completion_tokens, model);
98
- }
99
-
100
- /**
101
- * Get cost info for a model.
102
- */
103
- export function getModelCost(model: string): TokenCost {
104
- return MODEL_COSTS[model] || MODEL_COSTS["gpt-4o"];
105
- }
106
-
107
- /**
108
- * List all supported models with their costs.
109
- */
110
- export function listModelsByCost(): Array<{ model: string; input: number; output: number }> {
111
- return Object.entries(MODEL_COSTS)
112
- .map(([model, cost]) => ({
113
- model,
114
- input: cost.input_per_1k,
115
- output: cost.output_per_1k
116
- }))
117
- .sort((a, b) => (a.input + a.output) - (b.input + b.output));
118
- }
119
-
120
- /**
121
- * Find cheapest models for a given task.
122
- */
123
- export function findCheapestModels(task: "fast" | "quality" | "balanced" | "coding", count: number = 3): string[] {
124
- const sorted = listModelsByCost();
125
-
126
- // Different profiles for different needs
127
- const profiles = {
128
- fast: sorted.filter(m => m.output < 1.0).slice(0, count).map(m => m.model),
129
- quality: sorted.filter(m => m.output > 10).slice(0, count).map(m => m.model),
130
- balanced: sorted.slice(0, count * 2).slice(count, count * 2).map(m => m.model),
131
- coding: sorted.filter(m => m.model.includes("codex") || m.model.includes("claude") || m.model.includes("llama")).slice(0, count).map(m => m.model)
132
- };
133
-
134
- return profiles[task] || profiles.balanced;
135
- }
136
-
137
- export default {
138
- countTokens,
139
- estimateCost,
140
- estimateCostFromText,
141
- getModelCost,
142
- listModelsByCost,
143
- findCheapestModels,
144
- MODEL_COSTS
145
- };
@@ -1,18 +0,0 @@
1
- {
2
- "compilerOptions": {
3
- "target": "ES2022",
4
- "module": "commonjs",
5
- "lib": ["ES2022"],
6
- "outDir": "./dist",
7
- "rootDir": "./src",
8
- "strict": true,
9
- "esModuleInterop": true,
10
- "skipLibCheck": true,
11
- "forceConsistentCasingInFileNames": true,
12
- "declaration": true,
13
- "declarationMap": true,
14
- "sourceMap": true
15
- },
16
- "include": ["src/**/*"],
17
- "exclude": ["node_modules", "dist"]
18
- }