adaptive-memory-multi-model-router 2.14.49 → 2.14.52

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (605) hide show
  1. package/.dockerignore +82 -0
  2. package/.env.example +303 -0
  3. package/.github/DISCUSSIONS_WELCOME.md +27 -0
  4. package/.github/DISCUSSION_TEMPLATE.yml +5 -0
  5. package/.github/FUNDING.yml +2 -0
  6. package/.github/ISSUE_TEMPLATE/bug_report.md +94 -0
  7. package/.github/ISSUE_TEMPLATE/config.yml +17 -0
  8. package/.github/ISSUE_TEMPLATE/feature_request.md +71 -0
  9. package/.github/PULL_REQUEST_TEMPLATE.md +71 -0
  10. package/.github/dependabot.yml +9 -0
  11. package/.github/workflows/ci.yml +263 -0
  12. package/.github/workflows/codeql.yml +38 -0
  13. package/.github/workflows/npm-publish.yml +20 -0
  14. package/.github/workflows/pages.yml +37 -0
  15. package/.github/workflows/stale.yml +54 -0
  16. package/.publish-tick +1 -0
  17. package/.well-known/ai-plugin.json +16 -0
  18. package/AGENT_COUNCIL_FINDINGS.md +142 -0
  19. package/ARCHITECTURE.md +346 -0
  20. package/AUDIT_REPORT.md +28 -0
  21. package/CODE_OF_CONDUCT.md +128 -0
  22. package/CONTRIBUTING.md +50 -0
  23. package/CONTRIBUTORS.md +20 -0
  24. package/Dockerfile +53 -0
  25. package/Dockerfile.proxy +33 -0
  26. package/HEALTH_REPORT.md +118 -0
  27. package/IMPROVEMENT_PLAN.md +107 -0
  28. package/LANDING.md +43 -0
  29. package/LAUNCH-PAIN-DRIVEN.md +339 -0
  30. package/LAUNCH.md +337 -0
  31. package/LAUNCH_CHECKLIST.md +141 -0
  32. package/LAUNCH_SNAPSHOT.md +260 -0
  33. package/MANIFESTO.md +41 -0
  34. package/POPULARITY_BOOSTERS.md +285 -0
  35. package/PR_STATUS_REPORT.md +148 -0
  36. package/README.md +25 -14
  37. package/REDESIGN.md +95 -0
  38. package/RUNKIT.md +83 -0
  39. package/SECURITY.md +29 -0
  40. package/SUBMISSIONS.md +43 -0
  41. package/_schema.html +53 -0
  42. package/ai-plugin.json +16 -0
  43. package/articles/AI_AGENT_LLM_ROUTING.md +150 -0
  44. package/articles/CHINESE_DIRECTORIES.md +100 -0
  45. package/articles/CHINESE_SUBMISSIONS_READY.md +322 -0
  46. package/articles/COMPETITOR_ALERTS.md +31 -0
  47. package/articles/COMPLETE_POSTING_DIRECTORY.md +147 -0
  48. package/articles/CONTENT_STRUCTURE.md +292 -0
  49. package/articles/DEVTO_COST_GUIDE.md +473 -0
  50. package/articles/DEVTO_FINAL.md +416 -0
  51. package/articles/DEVTO_MULTI_PROVIDER.md +542 -0
  52. package/articles/DEVTO_READY.md +255 -0
  53. package/articles/DEVTO_V2_ANNOUNCEMENT.md +160 -0
  54. package/articles/DEVTO_VIRAL_GROWTH.md +280 -0
  55. package/articles/FRESH_devto.md +460 -0
  56. package/articles/FRESH_devto_2026_05.md +73 -0
  57. package/articles/FRESH_hackernews.md +14 -0
  58. package/articles/FRESH_reddit_ml.md +90 -0
  59. package/articles/FRESH_reddit_node.md +198 -0
  60. package/articles/FRESH_reddit_sideproject.md +72 -0
  61. package/articles/FRESH_reddit_webdev.md +130 -0
  62. package/articles/FROM_ZERO_TO_10K.md +107 -0
  63. package/articles/HN_10X_BETTER.md +430 -0
  64. package/articles/HN_ACCOUNT_GUIDE.md +21 -0
  65. package/articles/HN_CHINESE_STYLE.md +308 -0
  66. package/articles/HN_FINAL.md +148 -0
  67. package/articles/HN_POSTED_VERSION.md +56 -0
  68. package/articles/HN_POST_READY.md +137 -0
  69. package/articles/HN_RESEARCH.md +364 -0
  70. package/articles/HN_SHOW_routerarena.md +17 -0
  71. package/articles/HN_TIMING_GUIDE.md +52 -0
  72. package/articles/INDIEHACKERS_POST.md +52 -0
  73. package/articles/INDIEHACKERS_READY.md +120 -0
  74. package/articles/LLM_BENCHMARK_DEEP_DIVE.md +153 -0
  75. package/articles/MASTER_POSTING_DIRECTORY.md +189 -0
  76. package/articles/NEWSLETTER_SEND_NOW.md +259 -0
  77. package/articles/NEWSLETTER_SUBMISSIONS.md +112 -0
  78. package/articles/PAIN-DRIVEN-devto-v2.md +308 -0
  79. package/articles/PAIN-DRIVEN-devto-v3.md +268 -0
  80. package/articles/PAIN-DRIVEN-devto.md +242 -0
  81. package/articles/PAIN-DRIVEN-hackernews-v2.md +138 -0
  82. package/articles/PAIN-DRIVEN-hackernews-v3.md +151 -0
  83. package/articles/PAIN-DRIVEN-hackernews.md +131 -0
  84. package/articles/PAIN-DRIVEN-reddit-v2.md +301 -0
  85. package/articles/PAIN-DRIVEN-reddit-v3.md +236 -0
  86. package/articles/PAIN-DRIVEN-reddit.md +218 -0
  87. package/articles/PAIN-DRIVEN-twitter-v2.md +110 -0
  88. package/articles/PAIN-DRIVEN-twitter-v3.md +121 -0
  89. package/articles/PAIN-DRIVEN-twitter.md +120 -0
  90. package/articles/PORTKEY_VS_A3M.md +147 -0
  91. package/articles/POSTING_KIT_2026_05.md +67 -0
  92. package/articles/PRESS_KIT_routerarena.md +77 -0
  93. package/articles/PRODUCTHUNT_LISTING.md +48 -0
  94. package/articles/PRODUCTHUNT_READY.md +106 -0
  95. package/articles/PR_PLAN_vault.md +125 -0
  96. package/articles/REDDIT_FINAL.md +232 -0
  97. package/articles/REDDIT_POST.md +67 -0
  98. package/articles/REDDIT_SUBMISSION_READY.md +348 -0
  99. package/articles/ROUTERARENA_9677.md +78 -0
  100. package/articles/ROUTERARENA_LEADER.md +45 -0
  101. package/articles/SHOW_HN_FINAL.md +29 -0
  102. package/articles/TWEETS_10K_DOWNLOADS.md +47 -0
  103. package/articles/TWEETS_BENCHMARK_FIRST.md +46 -0
  104. package/articles/TWEETS_MCP_PLAY.md +51 -0
  105. package/articles/TWEETS_SEQUENTIAL_BROKEN.md +49 -0
  106. package/articles/TWEETS_WHY_BUILD.md +54 -0
  107. package/articles/TWEETS_routerarena_leader.md +53 -0
  108. package/articles/TWEET_STORM_READY.md +165 -0
  109. package/articles/TWITTER_FINAL.md +167 -0
  110. package/articles/WHY_10X_BETTER.md +261 -0
  111. package/articles/WHY_CHINESE_STYLE_BETTER.md +323 -0
  112. package/articles/ai-discoverability-llm-routing.md +210 -0
  113. package/articles/devto-llm-routing.md +138 -0
  114. package/articles/hackernews-show-hn.md +54 -0
  115. package/articles/hashnode-llm-cost-optimization.md +125 -0
  116. package/articles/hn_show_2026_05.md +11 -0
  117. package/articles/medium-building-llm-router.md +205 -0
  118. package/articles/reddit-ml.md +76 -0
  119. package/articles/twitter-thread-cost-savings.md +50 -0
  120. package/articles/youtube-tutorial-script.md +262 -0
  121. package/assets/a3m_3blue1brown.mp4 +0 -0
  122. package/assets/banner.svg +109 -0
  123. package/assets/chart-cost-v2.svg +91 -0
  124. package/assets/chart-cost-v3.svg +143 -0
  125. package/assets/chart-features-v2.svg +132 -0
  126. package/assets/chart-features-v3.svg +211 -0
  127. package/assets/chart-growth-v2.svg +122 -0
  128. package/assets/chart-growth-v3.svg +189 -0
  129. package/assets/cost-comparison.svg +134 -0
  130. package/assets/cost-simple.svg +64 -0
  131. package/assets/demo-hn.gif +0 -0
  132. package/assets/feature-matrix.svg +136 -0
  133. package/assets/growth-chart-animated.svg +76 -0
  134. package/assets/growth-chart.svg +82 -0
  135. package/assets/growth-simple.svg +69 -0
  136. package/assets/hero-diagram.svg +81 -0
  137. package/assets/logo-new.svg +21 -0
  138. package/assets/logo.svg +68 -0
  139. package/assets/provider-comparison.svg +121 -0
  140. package/assets/social-preview-new.svg +100 -0
  141. package/assets/social-preview.svg +194 -0
  142. package/assets/social-v2.svg +130 -0
  143. package/assets/social-v3.svg +212 -0
  144. package/benchmark-provider-results.json +245 -0
  145. package/benchmark-results.json +54 -0
  146. package/council-votes/architecture-vote.md +121 -0
  147. package/council-votes/coverage-vote.md +93 -0
  148. package/data/adaptive-benchmark.json +92 -0
  149. package/data/benchmark-results.json +47 -0
  150. package/data/labeled-benchmark.json +88 -0
  151. package/demo/3blue1brown_video.py +285 -0
  152. package/demo/3blue1brown_video_v2.py +310 -0
  153. package/demo/IMPROVED_PROMPTS.md +229 -0
  154. package/demo/VEO3_PROMPTS.md +269 -0
  155. package/demo/VIDEO_PRODUCTION_GUIDE.md +333 -0
  156. package/demo/a3m_3blue1brown.mp4 +0 -0
  157. package/demo/asciinema-demo.sh +195 -0
  158. package/demo/demo-hn.tape +74 -0
  159. package/demo/demo-script.md +53 -0
  160. package/demo/demo-script.sh +62 -0
  161. package/demo/demo.svg +75 -0
  162. package/demo/frame1_ai_data_center.png +0 -0
  163. package/demo/frame1_sunset_video.mp4 +0 -0
  164. package/demo/frame2_cost_comparison.png +0 -0
  165. package/demo/frame2_cost_comparison_fallback.png +0 -0
  166. package/demo/frame3_parallel_execution.png +0 -0
  167. package/demo/frame3_parallel_execution_fallback.png +0 -0
  168. package/demo/frame4_providers.png +0 -0
  169. package/demo/frame4_providers_fallback.png +0 -0
  170. package/demo/frame5_endcard.png +0 -0
  171. package/demo/frame5_endcard_fallback.png +0 -0
  172. package/demo/new_frame1_hook.png +0 -0
  173. package/demo/new_frame2_proof.png +0 -0
  174. package/demo/new_frame3_wow.png +0 -0
  175. package/demo/new_frame4_social.png +0 -0
  176. package/demo/new_frame5_cta.png +0 -0
  177. package/demo/package.json +13 -0
  178. package/demo/product-video-final.mp4 +0 -0
  179. package/demo/product-video-hype-v1.mp4 +0 -0
  180. package/demo/product-video-v1.mp4 +0 -0
  181. package/demo/public/index.html +762 -0
  182. package/demo/recording.cast +55 -0
  183. package/demo/server.js +405 -0
  184. package/demo-new.tape +71 -0
  185. package/demo-real.sh +198 -0
  186. package/demo-simple.tape +205 -0
  187. package/demo.html +520 -0
  188. package/demo.sh +85 -0
  189. package/demo.tape +259 -0
  190. package/dist/analytics/costAnalytics.d.ts.map +1 -0
  191. package/dist/analytics/costAnalytics.js.map +1 -0
  192. package/dist/benchmark/comprehensive.js.map +1 -0
  193. package/dist/benchmark/reproducible.d.ts.map +1 -0
  194. package/dist/benchmark/reproducible.js.map +1 -0
  195. package/dist/cache/prefixCache.d.ts.map +1 -0
  196. package/dist/cache/prefixCache.js.map +1 -0
  197. package/dist/cache/responseCache.d.ts.map +1 -0
  198. package/dist/cache/responseCache.js.map +1 -0
  199. package/dist/cache/semanticCache.d.ts.map +1 -0
  200. package/dist/cache/semanticCache.js.map +1 -0
  201. package/dist/cli/setupWizard.d.ts.map +1 -0
  202. package/dist/cli/setupWizard.js.map +1 -0
  203. package/dist/cost/budgetEnforcer.d.ts.map +1 -0
  204. package/dist/cost/budgetEnforcer.js.map +1 -0
  205. package/dist/cost/costTracker.d.ts.map +1 -0
  206. package/dist/cost/costTracker.js.map +1 -0
  207. package/dist/ensemble/multiRoundDialog.js.map +1 -0
  208. package/dist/ensemble/shapleyValue.js.map +1 -0
  209. package/dist/integrations/langchainAdapter.d.ts.map +1 -0
  210. package/dist/integrations/langchainAdapter.js.map +1 -0
  211. package/dist/integrations/oauth.d.ts.map +1 -0
  212. package/dist/integrations/oauth.js.map +1 -0
  213. package/dist/integrations/scienceAdapter.js.map +1 -0
  214. package/dist/memory/autoFetch.d.ts.map +1 -0
  215. package/dist/memory/autoFetch.js.map +1 -0
  216. package/dist/memory/episodicMemory.d.ts.map +1 -0
  217. package/dist/memory/episodicMemory.js.map +1 -0
  218. package/dist/memory/hybridMemory.js.map +1 -0
  219. package/dist/memory/memoryTree.d.ts.map +1 -0
  220. package/dist/memory/memoryTree.js.map +1 -0
  221. package/dist/memory/obsidianVault.d.ts.map +1 -0
  222. package/dist/memory/obsidianVault.js.map +1 -0
  223. package/dist/memory/reasoningBank.js.map +1 -0
  224. package/dist/observability/changeWatch.d.ts.map +1 -0
  225. package/dist/observability/changeWatch.js.map +1 -0
  226. package/dist/observability/fatigueDetector.d.ts.map +1 -0
  227. package/dist/observability/fatigueDetector.js.map +1 -0
  228. package/dist/observability/index.d.ts.map +1 -0
  229. package/dist/observability/index.js.map +1 -0
  230. package/dist/observability/metrics.d.ts.map +1 -0
  231. package/dist/observability/metrics.js.map +1 -0
  232. package/dist/observability/middleware.d.ts.map +1 -0
  233. package/dist/observability/middleware.js.map +1 -0
  234. package/dist/observability/tracer.d.ts.map +1 -0
  235. package/dist/observability/tracer.js.map +1 -0
  236. package/dist/observability/types.d.ts.map +1 -0
  237. package/dist/observability/types.js.map +1 -0
  238. package/dist/orchestration/haloOrchestrator.d.ts.map +1 -0
  239. package/dist/orchestration/haloOrchestrator.js.map +1 -0
  240. package/dist/orchestration/mctsWorkflow.d.ts.map +1 -0
  241. package/dist/orchestration/mctsWorkflow.js.map +1 -0
  242. package/dist/providers/localProvider.d.ts.map +1 -0
  243. package/dist/providers/localProvider.js.map +1 -0
  244. package/dist/providers/providerConfig.d.ts.map +1 -0
  245. package/dist/providers/providerConfig.js.map +1 -0
  246. package/dist/providers/registry.d.ts.map +1 -0
  247. package/dist/providers/registry.js.map +1 -0
  248. package/dist/routing/advancedRouter.d.ts.map +1 -0
  249. package/dist/routing/advancedRouter.js +1 -1
  250. package/dist/routing/advancedRouter.js.map +1 -0
  251. package/dist/routing/crossModelValidation.d.ts.map +1 -0
  252. package/dist/routing/crossModelValidation.js.map +1 -0
  253. package/dist/routing/providerHealth.d.ts.map +1 -0
  254. package/dist/routing/providerHealth.js.map +1 -0
  255. package/dist/routing/providerRetry.d.ts.map +1 -0
  256. package/dist/routing/providerRetry.js.map +1 -0
  257. package/dist/scripts/banner.js +29 -0
  258. package/dist/security/guardrails.d.ts.map +1 -0
  259. package/dist/security/guardrails.js.map +1 -0
  260. package/dist/server/dashboard.d.ts.map +1 -0
  261. package/dist/server/dashboard.js.map +1 -0
  262. package/dist/server/modelMapper.d.ts.map +1 -0
  263. package/dist/server/modelMapper.js.map +1 -0
  264. package/dist/server/proxyServer.d.ts.map +1 -0
  265. package/dist/server/proxyServer.js.map +1 -0
  266. package/dist/skills/__tests__/skill_manager.test.d.ts +2 -0
  267. package/dist/skills/__tests__/skill_manager.test.d.ts.map +1 -0
  268. package/dist/skills/__tests__/skill_manager.test.js +268 -0
  269. package/dist/skills/__tests__/skill_manager.test.js.map +1 -0
  270. package/dist/tools/tmlpdTools.d.ts.map +1 -0
  271. package/dist/tools/tmlpdTools.js.map +1 -0
  272. package/dist/tui/dashboard.d.ts.map +1 -0
  273. package/dist/tui/dashboard.js.map +1 -0
  274. package/dist/tui/index.d.ts.map +1 -0
  275. package/dist/tui/index.js.map +1 -0
  276. package/dist/utils/batchProcessor.d.ts.map +1 -0
  277. package/dist/utils/batchProcessor.js.map +1 -0
  278. package/dist/utils/compression.d.ts.map +1 -0
  279. package/dist/utils/compression.js.map +1 -0
  280. package/dist/utils/costUtils.d.ts.map +1 -0
  281. package/dist/utils/costUtils.js.map +1 -0
  282. package/dist/utils/reliability.d.ts.map +1 -0
  283. package/dist/utils/reliability.js.map +1 -0
  284. package/dist/utils/sorting.d.ts.map +1 -0
  285. package/dist/utils/sorting.js.map +1 -0
  286. package/dist/utils/speculativeDecoding.d.ts.map +1 -0
  287. package/dist/utils/speculativeDecoding.js.map +1 -0
  288. package/dist/utils/tokenUtils.d.ts.map +1 -0
  289. package/dist/utils/tokenUtils.js.map +1 -0
  290. package/docs/.nojekyll +0 -0
  291. package/docs/ANALYSIS_PRINCIPLES.md +162 -0
  292. package/docs/API.md +855 -0
  293. package/docs/ARCHITECTURAL-IMPROVEMENTS-2025.md +1391 -0
  294. package/docs/ARCHITECTURAL-IMPROVEMENTS-REVISED-2025.md +1051 -0
  295. package/docs/BENCHMARK.md +170 -0
  296. package/docs/CHINESE_PROVIDER_RELIABILITY.md +37 -0
  297. package/docs/CITATIONS.md +74 -0
  298. package/docs/CLAIMS_AND_EVIDENCE.md +58 -0
  299. package/docs/CONFIGURATION.md +476 -0
  300. package/docs/COUNCIL_DECISION.json +816 -0
  301. package/docs/COUNCIL_SUMMARY.md +319 -0
  302. package/docs/COUNCIL_V2.2_DECISION.md +416 -0
  303. package/docs/ENGINEERING_SPEC.md +55 -0
  304. package/docs/FACTORY_RESET.md +34 -0
  305. package/docs/GEO.md +66 -0
  306. package/docs/GEO_OPTIMIZATION.md +30 -0
  307. package/docs/GEO_ROOT_CAUSE.md +136 -0
  308. package/docs/GEO_STATUS.md +85 -0
  309. package/docs/GEO_TEST_RESULTS.md +176 -0
  310. package/docs/HN_CHECKLIST.md +38 -0
  311. package/docs/HN_FOUNDER_COMMENT.md +17 -0
  312. package/docs/HN_SUBMISSION_FINAL.md +180 -0
  313. package/docs/HN_SUBMISSION_V3.md +56 -0
  314. package/docs/IMPROVEMENT_ROADMAP.md +515 -0
  315. package/docs/INTEGRATIONS.md +420 -0
  316. package/docs/LANGCHAIN_INTEGRATION.md +147 -0
  317. package/docs/LLM_COUNCIL_DECISION.md +508 -0
  318. package/docs/MIDDLEWARE_CHAIN.md +35 -0
  319. package/docs/PROMO_CHECKLIST.md +200 -0
  320. package/docs/QUICKSTART.md +271 -0
  321. package/docs/QUICK_START.md +43 -0
  322. package/docs/QUICK_START_VISIBILITY.md +782 -0
  323. package/docs/REDDIT_GAP_ANALYSIS.md +299 -0
  324. package/docs/RELEASE_CHECKLIST.md +32 -0
  325. package/docs/REPRODUCIBILITY.md +63 -0
  326. package/docs/RESEARCH_BACKED_IMPROVEMENTS.md +1180 -0
  327. package/docs/ROUTING_RUBRIC.md +197 -0
  328. package/docs/SEO_AUDIT.md +186 -0
  329. package/docs/SOCIAL_LISTENING.md +219 -0
  330. package/docs/TMLPD_QNA.md +751 -0
  331. package/docs/TMLPD_V2.1_COMPLETE.md +763 -0
  332. package/docs/TMLPD_V2.2_RESEARCH_ROADMAP.md +754 -0
  333. package/docs/UPDATE_TOPICS.md +15 -0
  334. package/docs/USE_CASES.md +59 -0
  335. package/docs/V2.2_IMPLEMENTATION_COMPLETE.md +446 -0
  336. package/docs/V2_IMPLEMENTATION_GUIDE.md +388 -0
  337. package/docs/VERCEL_AI_SDK.md +209 -0
  338. package/docs/VISIBILITY_ADOPTION_PLAN.md +1005 -0
  339. package/docs/_config.yml +49 -0
  340. package/docs/ai-plugin.json +16 -0
  341. package/docs/api.html +513 -0
  342. package/docs/architecture-diagram.md +40 -0
  343. package/docs/benchmark-chart.png +0 -0
  344. package/docs/benchmark.html +387 -0
  345. package/docs/blog/routerarena-9677.html +92 -0
  346. package/docs/blog/routerarena-number-one.html +73 -0
  347. package/docs/cli-cheatsheet.md +339 -0
  348. package/docs/compare.md +109 -0
  349. package/docs/comparison-litellm.md +88 -0
  350. package/docs/comparison.md +108 -0
  351. package/docs/cost-chart-ascii.md +42 -0
  352. package/docs/cost-comparison-chart.svg +88 -0
  353. package/docs/curl-examples.md +247 -0
  354. package/docs/demo-auto.html +264 -0
  355. package/docs/demo.html +416 -0
  356. package/docs/geo/GENERATIVE_ENGINE_OPTIMIZATION.md +232 -0
  357. package/docs/index.html +507 -0
  358. package/docs/launch-content/LAUNCH_EXECUTION_CHECKLIST.md +421 -0
  359. package/docs/launch-content/README.md +457 -0
  360. package/docs/launch-content/assets/cost_comparison_100_tasks.png +0 -0
  361. package/docs/launch-content/assets/cumulative_savings.png +0 -0
  362. package/docs/launch-content/assets/parallel_speedup.png +0 -0
  363. package/docs/launch-content/assets/provider_pricing_comparison.png +0 -0
  364. package/docs/launch-content/assets/task_breakdown_comparison.png +0 -0
  365. package/docs/launch-content/generate_charts.py +313 -0
  366. package/docs/launch-content/hn_show_post.md +139 -0
  367. package/docs/launch-content/partner_outreach_templates.md +745 -0
  368. package/docs/launch-content/reddit_posts.md +467 -0
  369. package/docs/launch-content/twitter_thread.txt +460 -0
  370. package/{llms.txt.bak → docs/llms.txt} +6 -6
  371. package/docs/npm-downloads-chart.svg +43 -0
  372. package/docs/openapi.json +139 -0
  373. package/docs/openapi.yaml +1318 -0
  374. package/docs/quick-start.html +366 -0
  375. package/docs/robots.txt +52 -0
  376. package/docs/sitemap.xml +57 -0
  377. package/docs/styles.css +682 -0
  378. package/docs/well-known/ai-plugin.json +16 -0
  379. package/docs/wellknown/ai-plugin.json +16 -0
  380. package/docs-site/assets/og-banner.svg +194 -0
  381. package/docs-site/index.html +632 -0
  382. package/eval/README.md +46 -0
  383. package/eval/baselines/main.json +12 -0
  384. package/eval/benchmark_dataset.jsonl +16 -0
  385. package/eval/check_golden_routes.js +64 -0
  386. package/eval/datasets/catalog.json +33 -0
  387. package/eval/datasets/slices/cn_provider_reliability_v1.jsonl +3 -0
  388. package/eval/datasets/slices/cost_pressure_v1.jsonl +3 -0
  389. package/eval/datasets/slices/safety_guardrails_v1.jsonl +3 -0
  390. package/eval/evals.json +199 -0
  391. package/eval/fault_injection_thresholds.json +3 -0
  392. package/eval/generate_report.js +128 -0
  393. package/eval/golden_routes.json +114 -0
  394. package/eval/lib/experiment_registry.js +24 -0
  395. package/eval/run_eval.js +197 -0
  396. package/eval/run_fault_injection.js +201 -0
  397. package/eval/run_shadow_eval.js +85 -0
  398. package/eval/thresholds.json +9 -0
  399. package/examples/QUICKSTART.md +183 -0
  400. package/examples/README.md +61 -0
  401. package/examples/a3m-sdk.js +124 -0
  402. package/examples/basic-route.js +54 -0
  403. package/examples/chat-loop.js +202 -0
  404. package/examples/classify-then-route.js +102 -0
  405. package/examples/cost-compare.js +120 -0
  406. package/examples/ensemble.js +160 -0
  407. package/examples/whatsapp-telegram-bridge-demo.js +302 -0
  408. package/examples/whatsapp-telegram-bridge.js +269 -0
  409. package/hf-space/README.md +23 -0
  410. package/hf-space/app.py +240 -0
  411. package/hf-space/requirements.txt +1 -0
  412. package/huggingface_space/README.md +35 -0
  413. package/huggingface_space/app.py +126 -0
  414. package/huggingface_space/create_space.py +208 -0
  415. package/huggingface_space/requirements.txt +1 -0
  416. package/index.html +1 -1
  417. package/mcp-server/README.md +188 -0
  418. package/mcp-server/package.json +29 -0
  419. package/mcp-server/src/index.ts +744 -0
  420. package/mcp-server/tsconfig.json +19 -0
  421. package/openclaw-alexa-bridge/ALL_REMAINING_FIXES_PLAN.md +313 -0
  422. package/openclaw-alexa-bridge/REMAINING_FIXES_SUMMARY.md +277 -0
  423. package/openclaw-alexa-bridge/src/alexa_handler_no_tmlpd.js +1234 -0
  424. package/openclaw-alexa-bridge/test_fixes.js +77 -0
  425. package/package.json +76 -272
  426. package/playground/README.md +51 -0
  427. package/playground/codesandbox.json +12 -0
  428. package/playground/index.js +39 -0
  429. package/proxy/README.md +227 -0
  430. package/proxy/package-lock.json +831 -0
  431. package/proxy/package.json +17 -0
  432. package/proxy/rate-limit.js +145 -0
  433. package/proxy/rate-limit.test.js +311 -0
  434. package/proxy/server.js +970 -0
  435. package/python/README.md +102 -0
  436. package/python/a3m/__init__.py +6 -0
  437. package/python/a3m/client.py +190 -0
  438. package/python/a3m/models.py +40 -0
  439. package/python/a3m/sync_client.py +61 -0
  440. package/python/examples.py +53 -0
  441. package/python/integrations.py +330 -0
  442. package/python/pyproject.toml +23 -0
  443. package/python/setup.py +28 -0
  444. package/python/tmlpd.py +369 -0
  445. package/qna/REDDIT_GAP_ANALYSIS.md +299 -0
  446. package/qna/TMLPD_QNA.md +751 -0
  447. package/research/FINDING_001_safety.md +28 -0
  448. package/research/FINDING_002_error_diversity.md +32 -0
  449. package/research/FINDING_003_confidence_weighted_voting.md +32 -0
  450. package/research/FINDING_004_cross_model_semantic_detection.md +37 -0
  451. package/research/FINDING_005_knowledge_gap_orthogonality.md +34 -0
  452. package/research/HALLUCINATION_RESEARCH.md +27 -0
  453. package/research/ensemble-voting.md +324 -0
  454. package/research/loss-functions.md +545 -0
  455. package/research-log.md +49 -0
  456. package/scripts/banner.js +29 -0
  457. package/scripts/benchmark-local-routerarena.ts +176 -0
  458. package/scripts/benchmark.js +145 -0
  459. package/scripts/benchmark.sh +61 -0
  460. package/scripts/compare-providers.sh +230 -0
  461. package/scripts/content-planner.js +25 -0
  462. package/scripts/create-labeled-benchmark.ts +105 -0
  463. package/scripts/cross_post.py +443 -0
  464. package/scripts/local-router-benchmark.ts +154 -0
  465. package/scripts/post-all.sh +41 -0
  466. package/scripts/publish_fcc.py +106 -0
  467. package/scripts/push-to-gitee.sh +25 -0
  468. package/scripts/routerarena_ensemble.js +144 -0
  469. package/scripts/routing-benchmark-v2.js +373 -0
  470. package/scripts/routing-benchmark-v3.js +118 -0
  471. package/scripts/routing-benchmark.js +462 -0
  472. package/scripts/run-labeled-benchmark.mjs +104 -0
  473. package/scripts/run-mmlu-benchmark.js +176 -0
  474. package/scripts/run-provider-benchmark.js +244 -0
  475. package/scripts/update-npm-badges.js +158 -0
  476. package/skill/SKILL.md +238 -0
  477. package/src/__tests__/integration/tmpld_integration.test.py +540 -0
  478. package/src/ensemble.ts +2 -0
  479. package/src/routing/advancedRouter.ts +1 -1
  480. package/src/skills/__tests__/skill_manager.test.ts +328 -0
  481. package/submissions/benchmarks/ALL_PLATFORMS_SUBMISSION.md +94 -0
  482. package/submissions/benchmarks/LLMROUTERBENCH_SUBMISSION.md +121 -0
  483. package/submissions/benchmarks/MMRBENCH_SUBMISSION.md +94 -0
  484. package/submissions/benchmarks/ROUTERARENA_UPDATE.md +83 -0
  485. package/submissions/benchmarks/ROUTERBENCH_SUBMISSION.md +225 -0
  486. package/test-council/1-structure-tests.test.js +353 -0
  487. package/test-council/1-structure-tests.test.ts +353 -0
  488. package/test-council/2-edge-case-tests.test.ts +361 -0
  489. package/test-council/3-performance-tests.test.ts +652 -0
  490. package/test-council/4-integration-tests.test.ts +391 -0
  491. package/test-council/5-agent-council-eval.test.ts +413 -0
  492. package/test-council/AGENT_COUNCIL_ARCHITECTURE.md +349 -0
  493. package/test-council/TEST_COUNCIL_REPORT.md +201 -0
  494. package/test-council/agents/edge-case-agent.ts +363 -0
  495. package/test-council/agents/performance-agent.ts +426 -0
  496. package/test-council/agents/structure-agent.ts +227 -0
  497. package/test-council/council.md +183 -0
  498. package/tests/__mocks__/tokenUtils.ts +8 -0
  499. package/tests/memory/episodicMemory.test.ts +227 -0
  500. package/tests/package-lock.json +1785 -0
  501. package/tests/package.json +19 -0
  502. package/tests/routing/ensembleVoting.test.ts +236 -0
  503. package/tests/routing/providerRetry.test.ts +360 -0
  504. package/tests/routing/queryTypePresets.test.ts +208 -0
  505. package/tests/security/guardrailEngine.test.ts +700 -0
  506. package/tests/tsconfig.json +21 -0
  507. package/tests/vitest.config.ts +18 -0
  508. package/tmlpd-pi-extension/README.md +66 -0
  509. package/tmlpd-pi-extension/dist/cache/prefixCache.d.ts +114 -0
  510. package/tmlpd-pi-extension/dist/cache/prefixCache.d.ts.map +1 -0
  511. package/tmlpd-pi-extension/dist/cache/prefixCache.js +285 -0
  512. package/tmlpd-pi-extension/dist/cache/prefixCache.js.map +1 -0
  513. package/tmlpd-pi-extension/dist/cache/responseCache.d.ts +58 -0
  514. package/tmlpd-pi-extension/dist/cache/responseCache.d.ts.map +1 -0
  515. package/tmlpd-pi-extension/dist/cache/responseCache.js +153 -0
  516. package/tmlpd-pi-extension/dist/cache/responseCache.js.map +1 -0
  517. package/tmlpd-pi-extension/dist/cli.js +59 -0
  518. package/tmlpd-pi-extension/dist/cost/costTracker.d.ts +95 -0
  519. package/tmlpd-pi-extension/dist/cost/costTracker.d.ts.map +1 -0
  520. package/tmlpd-pi-extension/dist/cost/costTracker.js +240 -0
  521. package/tmlpd-pi-extension/dist/cost/costTracker.js.map +1 -0
  522. package/tmlpd-pi-extension/dist/index.d.ts +723 -0
  523. package/tmlpd-pi-extension/dist/index.d.ts.map +1 -0
  524. package/tmlpd-pi-extension/dist/index.js +239 -0
  525. package/tmlpd-pi-extension/dist/index.js.map +1 -0
  526. package/tmlpd-pi-extension/dist/memory/episodicMemory.d.ts +82 -0
  527. package/tmlpd-pi-extension/dist/memory/episodicMemory.d.ts.map +1 -0
  528. package/tmlpd-pi-extension/dist/memory/episodicMemory.js +145 -0
  529. package/tmlpd-pi-extension/dist/memory/episodicMemory.js.map +1 -0
  530. package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.d.ts +102 -0
  531. package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.d.ts.map +1 -0
  532. package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.js +207 -0
  533. package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.js.map +1 -0
  534. package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.d.ts +85 -0
  535. package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.d.ts.map +1 -0
  536. package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.js +210 -0
  537. package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.js.map +1 -0
  538. package/tmlpd-pi-extension/dist/providers/localProvider.d.ts +102 -0
  539. package/tmlpd-pi-extension/dist/providers/localProvider.d.ts.map +1 -0
  540. package/tmlpd-pi-extension/dist/providers/localProvider.js +338 -0
  541. package/tmlpd-pi-extension/dist/providers/localProvider.js.map +1 -0
  542. package/tmlpd-pi-extension/dist/providers/registry.d.ts +55 -0
  543. package/tmlpd-pi-extension/dist/providers/registry.d.ts.map +1 -0
  544. package/tmlpd-pi-extension/dist/providers/registry.js +138 -0
  545. package/tmlpd-pi-extension/dist/providers/registry.js.map +1 -0
  546. package/tmlpd-pi-extension/dist/routing/advancedRouter.d.ts +68 -0
  547. package/tmlpd-pi-extension/dist/routing/advancedRouter.d.ts.map +1 -0
  548. package/tmlpd-pi-extension/dist/routing/advancedRouter.js +332 -0
  549. package/tmlpd-pi-extension/dist/routing/advancedRouter.js.map +1 -0
  550. package/tmlpd-pi-extension/dist/tools/tmlpdTools.d.ts +101 -0
  551. package/tmlpd-pi-extension/dist/tools/tmlpdTools.d.ts.map +1 -0
  552. package/tmlpd-pi-extension/dist/tools/tmlpdTools.js +368 -0
  553. package/tmlpd-pi-extension/dist/tools/tmlpdTools.js.map +1 -0
  554. package/tmlpd-pi-extension/dist/utils/batchProcessor.d.ts +96 -0
  555. package/tmlpd-pi-extension/dist/utils/batchProcessor.d.ts.map +1 -0
  556. package/tmlpd-pi-extension/dist/utils/batchProcessor.js +170 -0
  557. package/tmlpd-pi-extension/dist/utils/batchProcessor.js.map +1 -0
  558. package/tmlpd-pi-extension/dist/utils/compression.d.ts +61 -0
  559. package/tmlpd-pi-extension/dist/utils/compression.d.ts.map +1 -0
  560. package/tmlpd-pi-extension/dist/utils/compression.js +281 -0
  561. package/tmlpd-pi-extension/dist/utils/compression.js.map +1 -0
  562. package/tmlpd-pi-extension/dist/utils/reliability.d.ts +74 -0
  563. package/tmlpd-pi-extension/dist/utils/reliability.d.ts.map +1 -0
  564. package/tmlpd-pi-extension/dist/utils/reliability.js +177 -0
  565. package/tmlpd-pi-extension/dist/utils/reliability.js.map +1 -0
  566. package/tmlpd-pi-extension/dist/utils/speculativeDecoding.d.ts +117 -0
  567. package/tmlpd-pi-extension/dist/utils/speculativeDecoding.d.ts.map +1 -0
  568. package/tmlpd-pi-extension/dist/utils/speculativeDecoding.js +246 -0
  569. package/tmlpd-pi-extension/dist/utils/speculativeDecoding.js.map +1 -0
  570. package/tmlpd-pi-extension/dist/utils/tokenUtils.d.ts +50 -0
  571. package/tmlpd-pi-extension/dist/utils/tokenUtils.d.ts.map +1 -0
  572. package/tmlpd-pi-extension/dist/utils/tokenUtils.js +124 -0
  573. package/tmlpd-pi-extension/dist/utils/tokenUtils.js.map +1 -0
  574. package/tmlpd-pi-extension/examples/QUICKSTART.md +183 -0
  575. package/tmlpd-pi-extension/package-lock.json +79 -0
  576. package/tmlpd-pi-extension/package.json +172 -0
  577. package/tmlpd-pi-extension/python/examples.py +53 -0
  578. package/tmlpd-pi-extension/python/integrations.py +330 -0
  579. package/tmlpd-pi-extension/python/setup.py +28 -0
  580. package/tmlpd-pi-extension/python/tmlpd.py +369 -0
  581. package/tmlpd-pi-extension/qna/REDDIT_GAP_ANALYSIS.md +299 -0
  582. package/tmlpd-pi-extension/qna/TMLPD_QNA.md +751 -0
  583. package/tmlpd-pi-extension/skill/SKILL.md +238 -0
  584. package/tmlpd-pi-extension/src/cache/responseCache.ts +147 -0
  585. package/tmlpd-pi-extension/src/cost/costTracker.ts +302 -0
  586. package/tmlpd-pi-extension/src/index.ts +232 -0
  587. package/tmlpd-pi-extension/src/memory/episodicMemory.ts +257 -0
  588. package/tmlpd-pi-extension/src/orchestration/haloOrchestrator.ts +266 -0
  589. package/tmlpd-pi-extension/src/orchestration/mctsWorkflow.ts +262 -0
  590. package/tmlpd-pi-extension/src/providers/localProvider.ts +406 -0
  591. package/tmlpd-pi-extension/src/providers/registry.ts +164 -0
  592. package/tmlpd-pi-extension/src/routing/ensembleVoting.ts +159 -0
  593. package/tmlpd-pi-extension/src/routing/queryTypePresets.ts +136 -0
  594. package/tmlpd-pi-extension/src/tools/tmlpdTools.ts +433 -0
  595. package/tmlpd-pi-extension/src/utils/batchProcessor.ts +232 -0
  596. package/tmlpd-pi-extension/src/utils/compression.ts +325 -0
  597. package/tmlpd-pi-extension/src/utils/reliability.ts +221 -0
  598. package/tmlpd-pi-extension/src/utils/tokenUtils.ts +145 -0
  599. package/tmlpd-pi-extension/tsconfig.json +18 -0
  600. package/tsconfig.build.json +29 -0
  601. package/tsconfig.json +18 -0
  602. package/README.md.bak +0 -1185
  603. package/src/routing/advancedRouter.ts.bak +0 -650
  604. package/test.js.bak +0 -376
  605. package/{llms-full.txt.bak → docs/llms-full.txt} +0 -0
@@ -0,0 +1,197 @@
1
+ # A3M Router — Routing Quality Rubric
2
+
3
+ Five dimensions, each measured against real evidence from production routing data. The composite score drives the pulse metric and surfaces where routing quality degrades.
4
+
5
+ ## Formula
6
+
7
+ ```
8
+ composite_score = 0.30 × RoutingAccuracy
9
+ + 0.25 × CostEfficiency
10
+ + 0.20 × Latency
11
+ + 0.15 × ErrorHandling
12
+ + 0.10 × CacheHitRate
13
+ ```
14
+
15
+ **Weight justification:**
16
+ - **30% Accuracy** — Getting the right provider for the right query is the primary function. Everything else is secondary.
17
+ - **25% Cost Efficiency** — The core value proposition. If accuracy is perfect but costs are high, we failed at the value prop.
18
+ - **20% Latency** — Developer experience. A router that's slow gets bypassed regardless of accuracy.
19
+ - **15% Error Handling** — Reliability under provider failures. Matters most in production.
20
+ - **10% Cache Hit Rate** — Bonus optimization. Only matters at scale.
21
+
22
+ ---
23
+
24
+ ## 1. Routing Accuracy (30%)
25
+
26
+ *"Did the router send the query to the right tier?"*
27
+
28
+ ### Scoring
29
+
30
+ | Score | Criterion |
31
+ |-------|-----------|
32
+ | 90-100 | >95% within ±1 tier. RouterArena score above 70. Fewer than 1 in 20 queries misrouted by more than one tier. |
33
+ | 75-89 | 85-95% within ±1 tier. RouterArena score 60-70. Occasional over-tiering on simple queries. |
34
+ | 60-74 | 70-85% within ±1 tier. RouterArena score 50-60. Noticeable over-tiering on medium queries. |
35
+ | 45-59 | 50-70% within ±1 tier. Frequent misrouting on complex/expert queries. |
36
+ | <45 | <50% within ±1 tier. Router is essentially random. Major overhaul needed. |
37
+
38
+ ### Evidence to capture
39
+
40
+ - **RouteLLM comparison** — where RouteLLM routes vs A3M (reference benchmark)
41
+ - **Tier confusion matrix** — which query types cause the most over/under-tiering
42
+ - **RouterArena score** — the single-number benchmark (current: 70.32)
43
+ - **Golden route deviation** — percentage of queries where A3M disagrees with golden route
44
+
45
+ ### Common failure patterns
46
+
47
+ | Pattern | Fix |
48
+ |---------|-----|
49
+ | All queries go to free tier (0% to mid/premium) | Add confidence floor. If no provider has confidence > 0.5, fall back to premium |
50
+ | Code queries misrouted to creative models | Strengthen code-detection signals (``` blocks, function syntax) |
51
+ | Legal/medical routed to cheap models | Add domain detection for 5 safety-critical domains |
52
+ | Ambiguous queries bounce between tiers | Implement query-type confidence threshold |
53
+
54
+ ### Dollar Impact
55
+
56
+ ```
57
+ Wasted = (MismatchCount × AvgCostDelta)
58
+ AvgCostDelta = mean(|ActualCost - OptimalCost|) over misrouted queries
59
+ ```
60
+
61
+ ---
62
+
63
+ ## 2. Cost Efficiency (25%)
64
+
65
+ *"Did the router save money compared to all-premium routing?"*
66
+
67
+ ### Scoring
68
+
69
+ | Score | Savings vs All-Premium | CPQ (Cost Per Query) |
70
+ |-------|----------------------|---------------------|
71
+ | 90-100 | >70% savings | <$0.001/query |
72
+ | 75-89 | 50-70% savings | $0.001-$0.003/query |
73
+ | 60-74 | 30-50% savings | $0.003-$0.006/query |
74
+ | 45-59 | 15-30% savings | $0.006-$0.01/query |
75
+ | <45 | <15% savings | >$0.01/query |
76
+
77
+ ### Evidence to capture
78
+
79
+ - **Cost per query** over the measurement window
80
+ - **Savings vs all-premium** — total cost if every query went to GPT-4o
81
+ - **Free tier utilization** — % of queries handled by free/cheap providers
82
+ - **Budget cap hits** — how often budget enforcement is triggered
83
+ - **Provider cost breakdown** — cost per provider
84
+
85
+ ### Common failure patterns
86
+
87
+ | Pattern | Fix |
88
+ |---------|-----|
89
+ | Everything routes to free (0% accuracy) | Add quality floor to cost optimization |
90
+ | Budget cap tripped too often | Increase budget cap or reduce premium-tier usage |
91
+ | Premium providers selected for trivial queries | Lower confidence threshold for mid-tier |
92
+
93
+ ### Dollar Impact
94
+
95
+ ```
96
+ Savings = (TotalQueryCount × AvgPremiumCost) - ActualTotalCost
97
+ MonthlySavings = Savings × (30 / MeasurementDays)
98
+ ```
99
+
100
+ ---
101
+
102
+ ## 3. Latency (20%)
103
+
104
+ *"How fast is the router decision?"*
105
+
106
+ ### Scoring (P95 Latency)
107
+
108
+ | Score | P95 Latency | Overhead vs Direct |
109
+ |-------|------------|-------------------|
110
+ | 90-100 | <200ms | <50ms overhead |
111
+ | 75-89 | 200-500ms | 50-100ms overhead |
112
+ | 60-74 | 500-1000ms | 100-200ms overhead |
113
+ | 45-59 | 1-3s | 200-500ms overhead |
114
+ | <45 | >3s | >500ms overhead |
115
+
116
+ ### Evidence to capture
117
+
118
+ - **P50, P95, P99 latency** — distribution
119
+ - **Routing decision overhead** — time spent in routing logic vs provider response
120
+ - **Slowest providers** — top 5 by latency
121
+ - **Cache response time** — cached vs uncached query time
122
+
123
+ ---
124
+
125
+ ## 4. Error Handling (15%)
126
+
127
+ *"How well does the router handle failures?"*
128
+
129
+ ### Scoring
130
+
131
+ | Score | Criterion |
132
+ |-------|-----------|
133
+ | 90-100 | 0 unhandled failures. All provider failures caught by circuit breaker. Graceful fallback 100% of the time. |
134
+ | 75-89 | <1% unhandled failures. Circuit breaker catches most issues. Fallback succeeds >95%. |
135
+ | 60-74 | 1-3% unhandled failures. Occasional circuit breaker misses. Fallback succeeds >80%. |
136
+ | 45-59 | 3-10% unhandled failures. Circuit breaker coverage gaps. Fallback degrades. |
137
+ | <45 | >10% unhandled failures. Critical reliability issues. |
138
+
139
+ ### Evidence to capture
140
+
141
+ - **Circuit breaker trips** — how many times each provider was disabled
142
+ - **Fallback success rate** — % of attempts where fallback succeeded
143
+ - **Unhandled failures** — queries that returned no response
144
+ - **Provider health score** — current health of each provider
145
+
146
+ ### Common failure patterns
147
+
148
+ | Pattern | Fix |
149
+ |---------|-----|
150
+ | Circuit breaker never fires (wasteful retries) | Lower threshold for circuit breaker trip |
151
+ | Circuit breaker fires too often | Increase threshold, add validation before trip |
152
+ | All providers fail simultaneously | Add cold-standby provider as emergency fallback |
153
+
154
+ ---
155
+
156
+ ## 5. Cache Hit Rate (10%)
157
+
158
+ *"How often does semantic cache avoid a duplicate provider call?"*
159
+
160
+ ### Scoring
161
+
162
+ | Score | Cache Hit Rate |
163
+ |-------|---------------|
164
+ | 90-100 | >40% |
165
+ | 75-89 | 30-40% |
166
+ | 60-74 | 20-30% |
167
+ | 45-59 | 10-20% |
168
+ | <45 | <10% |
169
+
170
+ ### Evidence to capture
171
+
172
+ - **Global cache hit rate** — across all queries
173
+ - **Per-query-type cache rate** — which query types benefit most
174
+ - **Cache latency savings** — total time saved by cache hits
175
+ - **Cache cost savings** — how much money cache saved
176
+
177
+ ---
178
+
179
+ ## Composite Score Bands
180
+
181
+ | Band | Score | Meaning |
182
+ |------|-------|---------|
183
+ | 🟢 Excellent | 85-100 | Production-ready. Fine-tune edge cases. |
184
+ | 🟡 Good | 70-84 | Working well. Some optimization opportunities. |
185
+ | 🟠 Fair | 55-69 | Functional but needs attention. |
186
+ | 🔴 Poor | 40-54 | Quality issues. Investigate root cause. |
187
+ | ⚫ Critical | <40 | Router needs significant work. |
188
+
189
+ ## Usage
190
+
191
+ Calculate after every 100 queries or at least once per week:
192
+
193
+ ```bash
194
+ a3m-router metrics # Quick pulse
195
+ a3m-router metrics --full # Full rubric with all dimensions
196
+ a3m-router metrics --export # Raw JSON for analysis
197
+ ```
@@ -0,0 +1,186 @@
1
+ # SEO Audit: A3M Router (adaptive-memory-multi-model-router)
2
+
3
+ **Date:** 2026-05-18 (Updated)
4
+ **Package:** adaptive-memory-multi-model-router
5
+ **NPM URL:** https://www.npmjs.com/package/adaptive-memory-multi-model-router
6
+ **GitHub URL:** https://github.com/Das-rebel/a3m-router
7
+
8
+ ---
9
+
10
+ ## 1. Keyword Research
11
+
12
+ ### Primary Keywords (benchmark-driven, high intent)
13
+
14
+ | Keyword | Est. Monthly Volume | Competition | Intent | Priority |
15
+ |---------|---------------------|-------------|--------|----------|
16
+ | `llm router benchmark` | 1,200-2,000 | Low | Commercial | P0 |
17
+ | `llm routing accuracy` | 800-1,500 | Low | Informational | P0 |
18
+ | `routellm alternative` | 1,500-3,000 | Low-Medium | Commercial | P0 |
19
+ | `litellm alternative` | 1,500-3,000 | Low-Medium | Commercial | P0 |
20
+ | `llm cost optimization` | 800-1,500 | Low | Commercial | P0 |
21
+ | `openai proxy free` | 2,000-4,000 | Medium | Transactional | P0 |
22
+ | `llm gateway open source` | 1,000-2,000 | Low-Medium | Commercial | P0 |
23
+
24
+ ### Long-Tail Keywords (FAQ/content targets)
25
+
26
+ | Keyword | Est. Monthly Volume | Competition | Intent | Priority |
27
+ |---------|---------------------|-------------|--------|----------|
28
+ | `how to reduce openai api costs` | 1,500-3,000 | Low | Informational | P0 |
29
+ | `llm routing without gpu` | 300-600 | Very Low | Informational | P0 |
30
+ | `lightweight llm router` | 500-1,000 | Low | Commercial | P0 |
31
+ | `keyword-based llm routing` | 100-300 | Very Low | Informational | P1 |
32
+ | `drop-in openai proxy` | 300-600 | Low | Commercial | P0 |
33
+ | `free llm proxy` | 800-1,500 | Low | Transactional | P0 |
34
+ | `cheapest openai api alternative` | 500-1,000 | Low | Commercial | P0 |
35
+
36
+ ### Competitive/Comparison Keywords (HIGH VALUE)
37
+
38
+ | Keyword | Est. Monthly Volume | Competition | Priority |
39
+ |---------|---------------------|-------------|----------|
40
+ | `routellm alternative` | 1,500-3,000 | Low-Medium | P0 |
41
+ | `litellm alternative` | 1,500-3,000 | Low-Medium | P0 |
42
+ | `a3m router vs litellm` | 50-100 | Very Low | P1 |
43
+ | `a3m router vs routellm` | 50-100 | Very Low | P1 |
44
+ | `openrouter alternative` | 200-400 | Low | P1 |
45
+ | `portkey alternative` | 100-200 | Very Low | P2 |
46
+
47
+ ### Secondary Keywords
48
+
49
+ | Keyword | Est. Monthly Volume | Competition | Priority |
50
+ |---------|---------------------|-------------|----------|
51
+ | `ai gateway` | 5,000-8,000 | High | P1 |
52
+ | `model routing` | 500-1,000 | Low | P1 |
53
+ | `llm proxy` | 1,000-2,000 | Low-Medium | P1 |
54
+ | `openai compatible proxy` | 500-1,000 | Low | P1 |
55
+ | `llm load balancer` | 300-800 | Low | P1 |
56
+ | `llm provider comparison` | 1,000-2,000 | Medium | P1 |
57
+
58
+ ---
59
+
60
+ ## 2. Key Messages (use everywhere)
61
+
62
+ 1. **"82.5% routing accuracy without ML"** — Lead metric, differentiator
63
+ 2. **"Matches RouteLLM BERT within 2.5%"** — Competitive positioning
64
+ 3. **"30x more efficient than GPU-based routing"** — Efficiency story
65
+ 4. **"Only router besides RouteLLM with published benchmarks"** — Trust signal
66
+ 5. **"245% growth, 2,775 downloads in 3 days"** — Social proof
67
+
68
+ ---
69
+
70
+ ## 3. Competitive Positioning
71
+
72
+ ### RouteLLM Alternative (HIGH VALUE)
73
+
74
+ "RouteLLM alternative" is our highest-value keyword because:
75
+ - RouteLLM users are actively looking for alternatives (GPU cost, complexity)
76
+ - We have a direct benchmark comparison (within 2.5%)
77
+ - We offer features RouteLLM lacks (proxy, cache, guardrails)
78
+
79
+ **Positioning:** "A3M Router matches RouteLLM BERT within 2.5% — without GPU. Plus proxy, cache, guardrails."
80
+
81
+ ### LiteLLM Alternative (HIGH VALUE)
82
+
83
+ "LiteLLM alternative" captures users who want:
84
+ - Published routing benchmarks
85
+ - Zero-config setup
86
+ - Built-in semantic caching
87
+
88
+ **Positioning:** "A3M Router is the only LiteLLM alternative with published routing benchmarks (82.5% accuracy)."
89
+
90
+ ### Competitive Table
91
+
92
+ | Competitor | NPM Weekly Downloads | Our Edge |
93
+ |------------|---------------------|----------|
94
+ | litellm | ~80,000 | Published benchmarks, zero-config, semantic cache |
95
+ | openrouter-sdk | ~5,000 | Self-hosted, no middleman fees, published accuracy |
96
+ | portkey-ai | ~3,000 | Open-source, free, no signup, benchmarks |
97
+ | routellm | ~1,000 | No GPU needed, proxy included, 39 providers |
98
+
99
+ ---
100
+
101
+ ## 4. On-Page SEO Checklist
102
+
103
+ ### docs-site/index.html
104
+
105
+ | Element | Status | Target |
106
+ |---------|--------|--------|
107
+ | Title tag | UPDATED | "A3M Router — 82.5% Routing Accuracy Without ML \| Matches RouteLLM" |
108
+ | Meta description | UPDATED | 30x efficiency story with accuracy metric |
109
+ | Keywords meta | UPDATED | All 12 primary/long-tail keywords |
110
+ | H1 tag | UPDATED | "LLM Routing That Matches GPU Models — Without GPU" |
111
+ | Stats section | UPDATED | Leads with 82.5% accuracy, 2.5% gap, 30x efficiency |
112
+ | FAQ schema | UPDATED | 8 questions targeting AI search queries |
113
+ | OG tags | UPDATED | Benchmark-first messaging |
114
+ | Twitter cards | UPDATED | Benchmark-first messaging |
115
+
116
+ ### Content Structure (H-tag hierarchy)
117
+
118
+ ```
119
+ H1: LLM Routing That Matches GPU Models — Without GPU
120
+ H2: Intelligent LLM Routing (feature)
121
+ H2: Cost Optimization (feature)
122
+ H2: Smart Fallback & Retry (feature)
123
+ H2: Real-time Analytics (feature)
124
+ H2: Security Guardrails (feature)
125
+ H2: Semantic Cache (feature)
126
+ H2: LLM Provider Pricing Tiers (section)
127
+ H3: Free/Budget/Mid/Premium Tier
128
+ H2: Quick Start: LLM Routing in 30 Seconds
129
+ H2: Frequently Asked Questions
130
+ H3: What is LLM routing accuracy?
131
+ H3: How does keyword-based routing compare to ML routing?
132
+ H3: What is the best lightweight LLM router?
133
+ H3: How to reduce OpenAI API costs?
134
+ H3: How does A3M Router compare to RouteLLM?
135
+ H3: How does A3M Router compare to LiteLLM?
136
+ ```
137
+
138
+ ---
139
+
140
+ ## 5. Technical SEO
141
+
142
+ ### robots.txt (UPDATED)
143
+ - Allows full crawling
144
+ - Explicitly allows docs/, assets/, llms.txt, README.md
145
+ - Sitemap reference included
146
+ - Blocks /node_modules/, /dist/, /test/, /src/, /.git/
147
+
148
+ ### sitemap.xml (UPDATED)
149
+ - 11 URLs including all key pages
150
+ - New: GEO.md, SEO_AUDIT.md, CONFIGURATION.md, INTEGRATIONS.md, benchmark-results.json, llms.txt
151
+ - Priority weighting: homepage (1.0) > GitHub (0.9) = NPM (0.9) > docs (0.7-0.8)
152
+
153
+ ### llms.txt (UPDATED)
154
+ - Leads with benchmark story (82.5% accuracy)
155
+ - Includes comparison table vs RouteLLM/LiteLLM
156
+ - Structured data section for AI extraction
157
+ - All 5 key messages included
158
+
159
+ ---
160
+
161
+ ## 6. GEO (Generative Engine Optimization)
162
+
163
+ See `docs/GEO.md` for full GEO strategy. Key elements:
164
+
165
+ 1. **FAQ format** answering AI-searchable questions
166
+ 2. **Comparison tables** with verifiable data AI engines cite
167
+ 3. **Structured key-value block** for direct AI extraction
168
+ 4. **Target AI queries** mapped to A3M Router answers
169
+
170
+ ---
171
+
172
+ ## 7. Action Items
173
+
174
+ - [x] Update docs-site/index.html title, meta, H1, stats, FAQ
175
+ - [x] Update FAQ schema with benchmark-focused questions
176
+ - [x] Update OG/Twitter cards with benchmark messaging
177
+ - [x] Update llms.txt with benchmark story
178
+ - [x] Create docs/GEO.md with AI search optimization
179
+ - [x] Update docs/SEO_AUDIT.md with new keywords
180
+ - [x] Update public/sitemap.xml with all key pages
181
+ - [x] Update public/robots.txt with better crawling rules
182
+ - [x] Update package.json keywords (optimized)
183
+ - [ ] Create OG banner image with benchmark metrics
184
+ - [ ] Write comparison articles (A3M vs RouteLLM, vs LiteLLM)
185
+ - [ ] Submit sitemap to Google Search Console
186
+ - [ ] Set up Google Search Console for das-rebel.github.io
@@ -0,0 +1,219 @@
1
+ # A3M Router — Social Listening & Reply Playbook
2
+
3
+ > "Set up Google Alerts for competitors → find discussions about routing/cost → craft reply that converts"
4
+ > — Vault insight, score 29.3
5
+
6
+ ## 1. Monitoring Setup
7
+
8
+ ### Google Alerts (free)
9
+ Set up alerts for these keywords. Frequency: "As it happens."
10
+
11
+ | Alert | Keyword | Why |
12
+ |-------|---------|-----|
13
+ | **A** | `"LLM routing" OR "model routing"` | Direct mention of the space |
14
+ | **B** | `"AI gateway" OR "LLM gateway"` | Competitor category |
15
+ | **C** | `"LiteLLM" OR "portkey" OR "route LLM"` | Competitor names |
16
+ | **D** | `"switch between LLMs" OR "multi-model"` | Pain point search |
17
+ | **E** | `"LLM too expensive" OR "API costs"` | Pain point — cost |
18
+ | **F** | `"open source LLM router"` | Direct search intent |
19
+
20
+ ### F5bot (free tier)
21
+ Monitor Hacker News for:
22
+ - `llm router` `model routing` `ai gateway` `openrouter` `litellm` `route llm`
23
+
24
+ Setup: https://f5bot.com — enter keywords, get email alerts.
25
+
26
+ ### ReplyGuy (paid, ~$15/mo)
27
+ Automated reply system for Reddit, HN, X, YouTube:
28
+ - Monitors keywords across platforms
29
+ - Suggests replies that are contextual, not spammy
30
+ - Setup: https://replyguy.com
31
+
32
+ ### Morebirds (HN specific)
33
+ Monitors Hacker News for keywords and competitors:
34
+ - https://morebirds.com
35
+
36
+ ---
37
+
38
+ ## 2. Keywords to Monitor (Priority Order)
39
+
40
+ ### Tier 1: High Intent (reply immediately)
41
+ ```
42
+ "llm routing" "model routing" "ai gateway" "llm gateway" "routing llm"
43
+ "open source router" "llm router alternative" "best model router"
44
+ "switch between models" "model fallback" "intelligent routing"
45
+ ```
46
+
47
+ ### Tier 2: Pain Point (reply with empathy + solution)
48
+ ```
49
+ "llm costs too high" "gpt too expensive" "api cost too much"
50
+ "openai bill too high" "reduce llm costs" "need cheaper llm"
51
+ "paying too much for ai" "api costs killing me"
52
+ ```
53
+
54
+ ### Tier 3: Competitor (reply as comparison, not attack)
55
+ ```
56
+ "LiteLLM" "Portkey" "RouteLLM" "OpenRouter" "Helicone"
57
+ "LangSmith" "AI Gateway (Cloudflare)" "GenAI Gateway"
58
+ ```
59
+ When someone has issues with these, offer A3M as a working alternative.
60
+
61
+ ### Tier 4: Educational (reply with knowledge, mention tool naturally)
62
+ ```
63
+ "how to choose llm" "which model to use" "compare models"
64
+ "llm benchmark" "model evaluation" "provider comparison"
65
+ ```
66
+
67
+ ---
68
+
69
+ ## 3. Reply Templates
70
+
71
+ ### Template 1: Cost Pain
72
+ **Trigger:** Someone says "my OpenAI bill is too high" or "LLM API costs are crazy"
73
+
74
+ **Platform:** HN, Reddit, X
75
+
76
+ **Reply:**
77
+ ```
78
+ We were in the same boat — $800/month on GPT-4. Built A3M Router to route simple queries to cheaper models and keep hard ones on premium.
79
+
80
+ Same answers (RouterArena #1 at 70.32). Cost dropped to ~$5.
81
+
82
+ Open source, MIT. Run it yourself:
83
+ npx a3m-router route "your query"
84
+
85
+ Or verify: npx a3m-router benchmark --reproducible
86
+ ```
87
+
88
+ ### Template 2: "Which tool should I use?"
89
+ **Trigger:** Someone comparing LiteLLM, Portkey, RouteLLM
90
+
91
+ **Platform:** Reddit, HN
92
+
93
+ **Reply:**
94
+ ```
95
+ We evaluated all of them before building A3M. What we wanted:
96
+ - Open source (MIT)
97
+ - Actually routes to cheapest capable model, not just round-robin
98
+ - Works with existing OpenAI SDK
99
+ - Has a reproducible benchmark
100
+
101
+ A3M Router hits all of those. #1 on RouterArena (70.32). Costs $0.047/1K vs GPT-5 at $10/1K.
102
+
103
+ npx a3m-router route "test it out"
104
+ ```
105
+
106
+ ### Template 3: "Building an AI gateway"
107
+ **Trigger:** Someone asks how to build multi-model routing, or shows their architecture
108
+
109
+ **Platform:** HN, Reddit, DevTo
110
+
111
+ **Reply:**
112
+ ```
113
+ We built something similar. Spent months on it. Eventually open-sourced it as A3M Router.
114
+
115
+ Biggest lessons:
116
+ 1. Cost-based routing is ~200x cheaper than always-pick-premium
117
+ 2. Quality scores persist across sessions (memory)
118
+ 3. Cache + parallel execution cut latency 3x
119
+
120
+ The whole thing is MIT on GitHub. Beats GPT-5 on RouterArena.
121
+
122
+ npx a3m-router benchmark --reproducible
123
+ ```
124
+
125
+ ### Template 4: "My provider is rate-limiting / failing"
126
+ **Trigger:** Someone complaining about OpenAI/Groq/Claude rate limits or failures
127
+
128
+ **Platform:** HN, Reddit, X
129
+
130
+ **Reply:**
131
+ ```
132
+ A3M Router handles this automatically — fallback to next available provider when one fails or throttles.
133
+
134
+ 47+ providers. Automatic failover. Same response format.
135
+
136
+ Open source: npx a3m-router route "try it"
137
+ ```
138
+
139
+ ### Template 5: "Looking for alternatives"
140
+ **Trigger:** Someone asking for alternatives to a specific tool or service
141
+
142
+ **Platform:** HN, Reddit, X
143
+
144
+ **Reply:**
145
+ ```
146
+ If you're evaluating options, A3M Router is worth a look:
147
+ - MIT licensed (not source-available)
148
+ - RouterArena #1 (70.32)
149
+ - Same API as OpenAI SDK
150
+ - $0.047/1K vs $10/1K for GPT-5
151
+
152
+ npx a3m-router route "test" or npx a3m-router benchmark --reproducible
153
+ ```
154
+
155
+ ### Template 6: "Model comparison question"
156
+ **Trigger:** Someone asking which model is best for task X
157
+
158
+ **Platform:** HN, Reddit
159
+
160
+ **Reply:**
161
+ ```
162
+ A3M Router actually solves this — it routes each query to the best model based on: complexity, cost budget, latency needs, and past quality scores.
163
+
164
+ You configure your providers (47+ supported) and it picks automatically. Results are tracked in memory so it gets smarter over time.
165
+
166
+ npx a3m-router recommend "coding" # See what it would pick
167
+ npx a3m-router route "test it" # Route a real query
168
+ ```
169
+
170
+ ### Template 7: Show HN / Launches (competitor)
171
+ **Trigger:** A competitor launches on HN or Product Hunt
172
+
173
+ **Platform:** HN comments
174
+
175
+ **Reply:**
176
+ ```
177
+ Cool project! Curious how it compares on RouterArena. We got 70.32 — would love to see benchmarks head-to-head.
178
+
179
+ For anyone evaluating, A3M Router is open source (MIT) with a reproducible benchmark:
180
+ npx a3m-router benchmark --reproducible
181
+ ```
182
+
183
+ ---
184
+
185
+ ## 4. Cadence
186
+
187
+ | Frequency | Action | Time |
188
+ |-----------|--------|------|
189
+ | **Daily (5 min)** | Check Google Alerts + F5bot notifications | Morning |
190
+ | **Daily (10 min)** | Scan HN for relevant threads | 8-10am ET |
191
+ | **Every 2 days** | Check Reddit for keyword matches | Random |
192
+ | **Weekly** | Write 1 educational post on DevTo/blog | Weekend |
193
+ | **Bi-weekly** | Review tracking table, adjust templates | Sunday |
194
+
195
+ ### Golden Rules
196
+ 1. **Never pitch in top-level posts** — only reply when relevant
197
+ 2. **First sentence = empathy/understanding**, not self-promo
198
+ 3. **Always include an action they can take** (a command to run)
199
+ 4. **Never copy-paste** — adapt template to the specific conversation
200
+ 5. **No URLs in first reply** unless asked (appears spammy)
201
+
202
+ ---
203
+
204
+ ## 5. Tracking Table
205
+
206
+ | Date | Platform | URL | Template | Reply | Clicks/Installs |
207
+ |------|----------|-----|----------|-------|-----------------|
208
+ | | | | | | |
209
+ | | | | | | |
210
+
211
+ Keep a running log. Review it bi-weekly to see which templates convert best.
212
+
213
+ ---
214
+
215
+ ## 6. Success Metric
216
+
217
+ Goal: **10 replies per week → 5 conversations → 1 GitHub star or npm install**
218
+
219
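+ At this rate: ~4 GitHub stars or npm installs per month from social listening alone. Reaching 50 stars/month and 250 npm installs/month requires a much higher reply volume or conversion rate.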