adaptive-memory-multi-model-router 2.14.49 → 2.14.52
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.dockerignore +82 -0
- package/.env.example +303 -0
- package/.github/DISCUSSIONS_WELCOME.md +27 -0
- package/.github/DISCUSSION_TEMPLATE.yml +5 -0
- package/.github/FUNDING.yml +2 -0
- package/.github/ISSUE_TEMPLATE/bug_report.md +94 -0
- package/.github/ISSUE_TEMPLATE/config.yml +17 -0
- package/.github/ISSUE_TEMPLATE/feature_request.md +71 -0
- package/.github/PULL_REQUEST_TEMPLATE.md +71 -0
- package/.github/dependabot.yml +9 -0
- package/.github/workflows/ci.yml +263 -0
- package/.github/workflows/codeql.yml +38 -0
- package/.github/workflows/npm-publish.yml +20 -0
- package/.github/workflows/pages.yml +37 -0
- package/.github/workflows/stale.yml +54 -0
- package/.publish-tick +1 -0
- package/.well-known/ai-plugin.json +16 -0
- package/AGENT_COUNCIL_FINDINGS.md +142 -0
- package/ARCHITECTURE.md +346 -0
- package/AUDIT_REPORT.md +28 -0
- package/CODE_OF_CONDUCT.md +128 -0
- package/CONTRIBUTING.md +50 -0
- package/CONTRIBUTORS.md +20 -0
- package/Dockerfile +53 -0
- package/Dockerfile.proxy +33 -0
- package/HEALTH_REPORT.md +118 -0
- package/IMPROVEMENT_PLAN.md +107 -0
- package/LANDING.md +43 -0
- package/LAUNCH-PAIN-DRIVEN.md +339 -0
- package/LAUNCH.md +337 -0
- package/LAUNCH_CHECKLIST.md +141 -0
- package/LAUNCH_SNAPSHOT.md +260 -0
- package/MANIFESTO.md +41 -0
- package/POPULARITY_BOOSTERS.md +285 -0
- package/PR_STATUS_REPORT.md +148 -0
- package/README.md +25 -14
- package/REDESIGN.md +95 -0
- package/RUNKIT.md +83 -0
- package/SECURITY.md +29 -0
- package/SUBMISSIONS.md +43 -0
- package/_schema.html +53 -0
- package/ai-plugin.json +16 -0
- package/articles/AI_AGENT_LLM_ROUTING.md +150 -0
- package/articles/CHINESE_DIRECTORIES.md +100 -0
- package/articles/CHINESE_SUBMISSIONS_READY.md +322 -0
- package/articles/COMPETITOR_ALERTS.md +31 -0
- package/articles/COMPLETE_POSTING_DIRECTORY.md +147 -0
- package/articles/CONTENT_STRUCTURE.md +292 -0
- package/articles/DEVTO_COST_GUIDE.md +473 -0
- package/articles/DEVTO_FINAL.md +416 -0
- package/articles/DEVTO_MULTI_PROVIDER.md +542 -0
- package/articles/DEVTO_READY.md +255 -0
- package/articles/DEVTO_V2_ANNOUNCEMENT.md +160 -0
- package/articles/DEVTO_VIRAL_GROWTH.md +280 -0
- package/articles/FRESH_devto.md +460 -0
- package/articles/FRESH_devto_2026_05.md +73 -0
- package/articles/FRESH_hackernews.md +14 -0
- package/articles/FRESH_reddit_ml.md +90 -0
- package/articles/FRESH_reddit_node.md +198 -0
- package/articles/FRESH_reddit_sideproject.md +72 -0
- package/articles/FRESH_reddit_webdev.md +130 -0
- package/articles/FROM_ZERO_TO_10K.md +107 -0
- package/articles/HN_10X_BETTER.md +430 -0
- package/articles/HN_ACCOUNT_GUIDE.md +21 -0
- package/articles/HN_CHINESE_STYLE.md +308 -0
- package/articles/HN_FINAL.md +148 -0
- package/articles/HN_POSTED_VERSION.md +56 -0
- package/articles/HN_POST_READY.md +137 -0
- package/articles/HN_RESEARCH.md +364 -0
- package/articles/HN_SHOW_routerarena.md +17 -0
- package/articles/HN_TIMING_GUIDE.md +52 -0
- package/articles/INDIEHACKERS_POST.md +52 -0
- package/articles/INDIEHACKERS_READY.md +120 -0
- package/articles/LLM_BENCHMARK_DEEP_DIVE.md +153 -0
- package/articles/MASTER_POSTING_DIRECTORY.md +189 -0
- package/articles/NEWSLETTER_SEND_NOW.md +259 -0
- package/articles/NEWSLETTER_SUBMISSIONS.md +112 -0
- package/articles/PAIN-DRIVEN-devto-v2.md +308 -0
- package/articles/PAIN-DRIVEN-devto-v3.md +268 -0
- package/articles/PAIN-DRIVEN-devto.md +242 -0
- package/articles/PAIN-DRIVEN-hackernews-v2.md +138 -0
- package/articles/PAIN-DRIVEN-hackernews-v3.md +151 -0
- package/articles/PAIN-DRIVEN-hackernews.md +131 -0
- package/articles/PAIN-DRIVEN-reddit-v2.md +301 -0
- package/articles/PAIN-DRIVEN-reddit-v3.md +236 -0
- package/articles/PAIN-DRIVEN-reddit.md +218 -0
- package/articles/PAIN-DRIVEN-twitter-v2.md +110 -0
- package/articles/PAIN-DRIVEN-twitter-v3.md +121 -0
- package/articles/PAIN-DRIVEN-twitter.md +120 -0
- package/articles/PORTKEY_VS_A3M.md +147 -0
- package/articles/POSTING_KIT_2026_05.md +67 -0
- package/articles/PRESS_KIT_routerarena.md +77 -0
- package/articles/PRODUCTHUNT_LISTING.md +48 -0
- package/articles/PRODUCTHUNT_READY.md +106 -0
- package/articles/PR_PLAN_vault.md +125 -0
- package/articles/REDDIT_FINAL.md +232 -0
- package/articles/REDDIT_POST.md +67 -0
- package/articles/REDDIT_SUBMISSION_READY.md +348 -0
- package/articles/ROUTERARENA_9677.md +78 -0
- package/articles/ROUTERARENA_LEADER.md +45 -0
- package/articles/SHOW_HN_FINAL.md +29 -0
- package/articles/TWEETS_10K_DOWNLOADS.md +47 -0
- package/articles/TWEETS_BENCHMARK_FIRST.md +46 -0
- package/articles/TWEETS_MCP_PLAY.md +51 -0
- package/articles/TWEETS_SEQUENTIAL_BROKEN.md +49 -0
- package/articles/TWEETS_WHY_BUILD.md +54 -0
- package/articles/TWEETS_routerarena_leader.md +53 -0
- package/articles/TWEET_STORM_READY.md +165 -0
- package/articles/TWITTER_FINAL.md +167 -0
- package/articles/WHY_10X_BETTER.md +261 -0
- package/articles/WHY_CHINESE_STYLE_BETTER.md +323 -0
- package/articles/ai-discoverability-llm-routing.md +210 -0
- package/articles/devto-llm-routing.md +138 -0
- package/articles/hackernews-show-hn.md +54 -0
- package/articles/hashnode-llm-cost-optimization.md +125 -0
- package/articles/hn_show_2026_05.md +11 -0
- package/articles/medium-building-llm-router.md +205 -0
- package/articles/reddit-ml.md +76 -0
- package/articles/twitter-thread-cost-savings.md +50 -0
- package/articles/youtube-tutorial-script.md +262 -0
- package/assets/a3m_3blue1brown.mp4 +0 -0
- package/assets/banner.svg +109 -0
- package/assets/chart-cost-v2.svg +91 -0
- package/assets/chart-cost-v3.svg +143 -0
- package/assets/chart-features-v2.svg +132 -0
- package/assets/chart-features-v3.svg +211 -0
- package/assets/chart-growth-v2.svg +122 -0
- package/assets/chart-growth-v3.svg +189 -0
- package/assets/cost-comparison.svg +134 -0
- package/assets/cost-simple.svg +64 -0
- package/assets/demo-hn.gif +0 -0
- package/assets/feature-matrix.svg +136 -0
- package/assets/growth-chart-animated.svg +76 -0
- package/assets/growth-chart.svg +82 -0
- package/assets/growth-simple.svg +69 -0
- package/assets/hero-diagram.svg +81 -0
- package/assets/logo-new.svg +21 -0
- package/assets/logo.svg +68 -0
- package/assets/provider-comparison.svg +121 -0
- package/assets/social-preview-new.svg +100 -0
- package/assets/social-preview.svg +194 -0
- package/assets/social-v2.svg +130 -0
- package/assets/social-v3.svg +212 -0
- package/benchmark-provider-results.json +245 -0
- package/benchmark-results.json +54 -0
- package/council-votes/architecture-vote.md +121 -0
- package/council-votes/coverage-vote.md +93 -0
- package/data/adaptive-benchmark.json +92 -0
- package/data/benchmark-results.json +47 -0
- package/data/labeled-benchmark.json +88 -0
- package/demo/3blue1brown_video.py +285 -0
- package/demo/3blue1brown_video_v2.py +310 -0
- package/demo/IMPROVED_PROMPTS.md +229 -0
- package/demo/VEO3_PROMPTS.md +269 -0
- package/demo/VIDEO_PRODUCTION_GUIDE.md +333 -0
- package/demo/a3m_3blue1brown.mp4 +0 -0
- package/demo/asciinema-demo.sh +195 -0
- package/demo/demo-hn.tape +74 -0
- package/demo/demo-script.md +53 -0
- package/demo/demo-script.sh +62 -0
- package/demo/demo.svg +75 -0
- package/demo/frame1_ai_data_center.png +0 -0
- package/demo/frame1_sunset_video.mp4 +0 -0
- package/demo/frame2_cost_comparison.png +0 -0
- package/demo/frame2_cost_comparison_fallback.png +0 -0
- package/demo/frame3_parallel_execution.png +0 -0
- package/demo/frame3_parallel_execution_fallback.png +0 -0
- package/demo/frame4_providers.png +0 -0
- package/demo/frame4_providers_fallback.png +0 -0
- package/demo/frame5_endcard.png +0 -0
- package/demo/frame5_endcard_fallback.png +0 -0
- package/demo/new_frame1_hook.png +0 -0
- package/demo/new_frame2_proof.png +0 -0
- package/demo/new_frame3_wow.png +0 -0
- package/demo/new_frame4_social.png +0 -0
- package/demo/new_frame5_cta.png +0 -0
- package/demo/package.json +13 -0
- package/demo/product-video-final.mp4 +0 -0
- package/demo/product-video-hype-v1.mp4 +0 -0
- package/demo/product-video-v1.mp4 +0 -0
- package/demo/public/index.html +762 -0
- package/demo/recording.cast +55 -0
- package/demo/server.js +405 -0
- package/demo-new.tape +71 -0
- package/demo-real.sh +198 -0
- package/demo-simple.tape +205 -0
- package/demo.html +520 -0
- package/demo.sh +85 -0
- package/demo.tape +259 -0
- package/dist/analytics/costAnalytics.d.ts.map +1 -0
- package/dist/analytics/costAnalytics.js.map +1 -0
- package/dist/benchmark/comprehensive.js.map +1 -0
- package/dist/benchmark/reproducible.d.ts.map +1 -0
- package/dist/benchmark/reproducible.js.map +1 -0
- package/dist/cache/prefixCache.d.ts.map +1 -0
- package/dist/cache/prefixCache.js.map +1 -0
- package/dist/cache/responseCache.d.ts.map +1 -0
- package/dist/cache/responseCache.js.map +1 -0
- package/dist/cache/semanticCache.d.ts.map +1 -0
- package/dist/cache/semanticCache.js.map +1 -0
- package/dist/cli/setupWizard.d.ts.map +1 -0
- package/dist/cli/setupWizard.js.map +1 -0
- package/dist/cost/budgetEnforcer.d.ts.map +1 -0
- package/dist/cost/budgetEnforcer.js.map +1 -0
- package/dist/cost/costTracker.d.ts.map +1 -0
- package/dist/cost/costTracker.js.map +1 -0
- package/dist/ensemble/multiRoundDialog.js.map +1 -0
- package/dist/ensemble/shapleyValue.js.map +1 -0
- package/dist/integrations/langchainAdapter.d.ts.map +1 -0
- package/dist/integrations/langchainAdapter.js.map +1 -0
- package/dist/integrations/oauth.d.ts.map +1 -0
- package/dist/integrations/oauth.js.map +1 -0
- package/dist/integrations/scienceAdapter.js.map +1 -0
- package/dist/memory/autoFetch.d.ts.map +1 -0
- package/dist/memory/autoFetch.js.map +1 -0
- package/dist/memory/episodicMemory.d.ts.map +1 -0
- package/dist/memory/episodicMemory.js.map +1 -0
- package/dist/memory/hybridMemory.js.map +1 -0
- package/dist/memory/memoryTree.d.ts.map +1 -0
- package/dist/memory/memoryTree.js.map +1 -0
- package/dist/memory/obsidianVault.d.ts.map +1 -0
- package/dist/memory/obsidianVault.js.map +1 -0
- package/dist/memory/reasoningBank.js.map +1 -0
- package/dist/observability/changeWatch.d.ts.map +1 -0
- package/dist/observability/changeWatch.js.map +1 -0
- package/dist/observability/fatigueDetector.d.ts.map +1 -0
- package/dist/observability/fatigueDetector.js.map +1 -0
- package/dist/observability/index.d.ts.map +1 -0
- package/dist/observability/index.js.map +1 -0
- package/dist/observability/metrics.d.ts.map +1 -0
- package/dist/observability/metrics.js.map +1 -0
- package/dist/observability/middleware.d.ts.map +1 -0
- package/dist/observability/middleware.js.map +1 -0
- package/dist/observability/tracer.d.ts.map +1 -0
- package/dist/observability/tracer.js.map +1 -0
- package/dist/observability/types.d.ts.map +1 -0
- package/dist/observability/types.js.map +1 -0
- package/dist/orchestration/haloOrchestrator.d.ts.map +1 -0
- package/dist/orchestration/haloOrchestrator.js.map +1 -0
- package/dist/orchestration/mctsWorkflow.d.ts.map +1 -0
- package/dist/orchestration/mctsWorkflow.js.map +1 -0
- package/dist/providers/localProvider.d.ts.map +1 -0
- package/dist/providers/localProvider.js.map +1 -0
- package/dist/providers/providerConfig.d.ts.map +1 -0
- package/dist/providers/providerConfig.js.map +1 -0
- package/dist/providers/registry.d.ts.map +1 -0
- package/dist/providers/registry.js.map +1 -0
- package/dist/routing/advancedRouter.d.ts.map +1 -0
- package/dist/routing/advancedRouter.js +1 -1
- package/dist/routing/advancedRouter.js.map +1 -0
- package/dist/routing/crossModelValidation.d.ts.map +1 -0
- package/dist/routing/crossModelValidation.js.map +1 -0
- package/dist/routing/providerHealth.d.ts.map +1 -0
- package/dist/routing/providerHealth.js.map +1 -0
- package/dist/routing/providerRetry.d.ts.map +1 -0
- package/dist/routing/providerRetry.js.map +1 -0
- package/dist/scripts/banner.js +29 -0
- package/dist/security/guardrails.d.ts.map +1 -0
- package/dist/security/guardrails.js.map +1 -0
- package/dist/server/dashboard.d.ts.map +1 -0
- package/dist/server/dashboard.js.map +1 -0
- package/dist/server/modelMapper.d.ts.map +1 -0
- package/dist/server/modelMapper.js.map +1 -0
- package/dist/server/proxyServer.d.ts.map +1 -0
- package/dist/server/proxyServer.js.map +1 -0
- package/dist/skills/__tests__/skill_manager.test.d.ts +2 -0
- package/dist/skills/__tests__/skill_manager.test.d.ts.map +1 -0
- package/dist/skills/__tests__/skill_manager.test.js +268 -0
- package/dist/skills/__tests__/skill_manager.test.js.map +1 -0
- package/dist/tools/tmlpdTools.d.ts.map +1 -0
- package/dist/tools/tmlpdTools.js.map +1 -0
- package/dist/tui/dashboard.d.ts.map +1 -0
- package/dist/tui/dashboard.js.map +1 -0
- package/dist/tui/index.d.ts.map +1 -0
- package/dist/tui/index.js.map +1 -0
- package/dist/utils/batchProcessor.d.ts.map +1 -0
- package/dist/utils/batchProcessor.js.map +1 -0
- package/dist/utils/compression.d.ts.map +1 -0
- package/dist/utils/compression.js.map +1 -0
- package/dist/utils/costUtils.d.ts.map +1 -0
- package/dist/utils/costUtils.js.map +1 -0
- package/dist/utils/reliability.d.ts.map +1 -0
- package/dist/utils/reliability.js.map +1 -0
- package/dist/utils/sorting.d.ts.map +1 -0
- package/dist/utils/sorting.js.map +1 -0
- package/dist/utils/speculativeDecoding.d.ts.map +1 -0
- package/dist/utils/speculativeDecoding.js.map +1 -0
- package/dist/utils/tokenUtils.d.ts.map +1 -0
- package/dist/utils/tokenUtils.js.map +1 -0
- package/docs/.nojekyll +0 -0
- package/docs/ANALYSIS_PRINCIPLES.md +162 -0
- package/docs/API.md +855 -0
- package/docs/ARCHITECTURAL-IMPROVEMENTS-2025.md +1391 -0
- package/docs/ARCHITECTURAL-IMPROVEMENTS-REVISED-2025.md +1051 -0
- package/docs/BENCHMARK.md +170 -0
- package/docs/CHINESE_PROVIDER_RELIABILITY.md +37 -0
- package/docs/CITATIONS.md +74 -0
- package/docs/CLAIMS_AND_EVIDENCE.md +58 -0
- package/docs/CONFIGURATION.md +476 -0
- package/docs/COUNCIL_DECISION.json +816 -0
- package/docs/COUNCIL_SUMMARY.md +319 -0
- package/docs/COUNCIL_V2.2_DECISION.md +416 -0
- package/docs/ENGINEERING_SPEC.md +55 -0
- package/docs/FACTORY_RESET.md +34 -0
- package/docs/GEO.md +66 -0
- package/docs/GEO_OPTIMIZATION.md +30 -0
- package/docs/GEO_ROOT_CAUSE.md +136 -0
- package/docs/GEO_STATUS.md +85 -0
- package/docs/GEO_TEST_RESULTS.md +176 -0
- package/docs/HN_CHECKLIST.md +38 -0
- package/docs/HN_FOUNDER_COMMENT.md +17 -0
- package/docs/HN_SUBMISSION_FINAL.md +180 -0
- package/docs/HN_SUBMISSION_V3.md +56 -0
- package/docs/IMPROVEMENT_ROADMAP.md +515 -0
- package/docs/INTEGRATIONS.md +420 -0
- package/docs/LANGCHAIN_INTEGRATION.md +147 -0
- package/docs/LLM_COUNCIL_DECISION.md +508 -0
- package/docs/MIDDLEWARE_CHAIN.md +35 -0
- package/docs/PROMO_CHECKLIST.md +200 -0
- package/docs/QUICKSTART.md +271 -0
- package/docs/QUICK_START.md +43 -0
- package/docs/QUICK_START_VISIBILITY.md +782 -0
- package/docs/REDDIT_GAP_ANALYSIS.md +299 -0
- package/docs/RELEASE_CHECKLIST.md +32 -0
- package/docs/REPRODUCIBILITY.md +63 -0
- package/docs/RESEARCH_BACKED_IMPROVEMENTS.md +1180 -0
- package/docs/ROUTING_RUBRIC.md +197 -0
- package/docs/SEO_AUDIT.md +186 -0
- package/docs/SOCIAL_LISTENING.md +219 -0
- package/docs/TMLPD_QNA.md +751 -0
- package/docs/TMLPD_V2.1_COMPLETE.md +763 -0
- package/docs/TMLPD_V2.2_RESEARCH_ROADMAP.md +754 -0
- package/docs/UPDATE_TOPICS.md +15 -0
- package/docs/USE_CASES.md +59 -0
- package/docs/V2.2_IMPLEMENTATION_COMPLETE.md +446 -0
- package/docs/V2_IMPLEMENTATION_GUIDE.md +388 -0
- package/docs/VERCEL_AI_SDK.md +209 -0
- package/docs/VISIBILITY_ADOPTION_PLAN.md +1005 -0
- package/docs/_config.yml +49 -0
- package/docs/ai-plugin.json +16 -0
- package/docs/api.html +513 -0
- package/docs/architecture-diagram.md +40 -0
- package/docs/benchmark-chart.png +0 -0
- package/docs/benchmark.html +387 -0
- package/docs/blog/routerarena-9677.html +92 -0
- package/docs/blog/routerarena-number-one.html +73 -0
- package/docs/cli-cheatsheet.md +339 -0
- package/docs/compare.md +109 -0
- package/docs/comparison-litellm.md +88 -0
- package/docs/comparison.md +108 -0
- package/docs/cost-chart-ascii.md +42 -0
- package/docs/cost-comparison-chart.svg +88 -0
- package/docs/curl-examples.md +247 -0
- package/docs/demo-auto.html +264 -0
- package/docs/demo.html +416 -0
- package/docs/geo/GENERATIVE_ENGINE_OPTIMIZATION.md +232 -0
- package/docs/index.html +507 -0
- package/docs/launch-content/LAUNCH_EXECUTION_CHECKLIST.md +421 -0
- package/docs/launch-content/README.md +457 -0
- package/docs/launch-content/assets/cost_comparison_100_tasks.png +0 -0
- package/docs/launch-content/assets/cumulative_savings.png +0 -0
- package/docs/launch-content/assets/parallel_speedup.png +0 -0
- package/docs/launch-content/assets/provider_pricing_comparison.png +0 -0
- package/docs/launch-content/assets/task_breakdown_comparison.png +0 -0
- package/docs/launch-content/generate_charts.py +313 -0
- package/docs/launch-content/hn_show_post.md +139 -0
- package/docs/launch-content/partner_outreach_templates.md +745 -0
- package/docs/launch-content/reddit_posts.md +467 -0
- package/docs/launch-content/twitter_thread.txt +460 -0
- package/{llms.txt.bak → docs/llms.txt} +6 -6
- package/docs/npm-downloads-chart.svg +43 -0
- package/docs/openapi.json +139 -0
- package/docs/openapi.yaml +1318 -0
- package/docs/quick-start.html +366 -0
- package/docs/robots.txt +52 -0
- package/docs/sitemap.xml +57 -0
- package/docs/styles.css +682 -0
- package/docs/well-known/ai-plugin.json +16 -0
- package/docs/wellknown/ai-plugin.json +16 -0
- package/docs-site/assets/og-banner.svg +194 -0
- package/docs-site/index.html +632 -0
- package/eval/README.md +46 -0
- package/eval/baselines/main.json +12 -0
- package/eval/benchmark_dataset.jsonl +16 -0
- package/eval/check_golden_routes.js +64 -0
- package/eval/datasets/catalog.json +33 -0
- package/eval/datasets/slices/cn_provider_reliability_v1.jsonl +3 -0
- package/eval/datasets/slices/cost_pressure_v1.jsonl +3 -0
- package/eval/datasets/slices/safety_guardrails_v1.jsonl +3 -0
- package/eval/evals.json +199 -0
- package/eval/fault_injection_thresholds.json +3 -0
- package/eval/generate_report.js +128 -0
- package/eval/golden_routes.json +114 -0
- package/eval/lib/experiment_registry.js +24 -0
- package/eval/run_eval.js +197 -0
- package/eval/run_fault_injection.js +201 -0
- package/eval/run_shadow_eval.js +85 -0
- package/eval/thresholds.json +9 -0
- package/examples/QUICKSTART.md +183 -0
- package/examples/README.md +61 -0
- package/examples/a3m-sdk.js +124 -0
- package/examples/basic-route.js +54 -0
- package/examples/chat-loop.js +202 -0
- package/examples/classify-then-route.js +102 -0
- package/examples/cost-compare.js +120 -0
- package/examples/ensemble.js +160 -0
- package/examples/whatsapp-telegram-bridge-demo.js +302 -0
- package/examples/whatsapp-telegram-bridge.js +269 -0
- package/hf-space/README.md +23 -0
- package/hf-space/app.py +240 -0
- package/hf-space/requirements.txt +1 -0
- package/huggingface_space/README.md +35 -0
- package/huggingface_space/app.py +126 -0
- package/huggingface_space/create_space.py +208 -0
- package/huggingface_space/requirements.txt +1 -0
- package/index.html +1 -1
- package/mcp-server/README.md +188 -0
- package/mcp-server/package.json +29 -0
- package/mcp-server/src/index.ts +744 -0
- package/mcp-server/tsconfig.json +19 -0
- package/openclaw-alexa-bridge/ALL_REMAINING_FIXES_PLAN.md +313 -0
- package/openclaw-alexa-bridge/REMAINING_FIXES_SUMMARY.md +277 -0
- package/openclaw-alexa-bridge/src/alexa_handler_no_tmlpd.js +1234 -0
- package/openclaw-alexa-bridge/test_fixes.js +77 -0
- package/package.json +76 -272
- package/playground/README.md +51 -0
- package/playground/codesandbox.json +12 -0
- package/playground/index.js +39 -0
- package/proxy/README.md +227 -0
- package/proxy/package-lock.json +831 -0
- package/proxy/package.json +17 -0
- package/proxy/rate-limit.js +145 -0
- package/proxy/rate-limit.test.js +311 -0
- package/proxy/server.js +970 -0
- package/python/README.md +102 -0
- package/python/a3m/__init__.py +6 -0
- package/python/a3m/client.py +190 -0
- package/python/a3m/models.py +40 -0
- package/python/a3m/sync_client.py +61 -0
- package/python/examples.py +53 -0
- package/python/integrations.py +330 -0
- package/python/pyproject.toml +23 -0
- package/python/setup.py +28 -0
- package/python/tmlpd.py +369 -0
- package/qna/REDDIT_GAP_ANALYSIS.md +299 -0
- package/qna/TMLPD_QNA.md +751 -0
- package/research/FINDING_001_safety.md +28 -0
- package/research/FINDING_002_error_diversity.md +32 -0
- package/research/FINDING_003_confidence_weighted_voting.md +32 -0
- package/research/FINDING_004_cross_model_semantic_detection.md +37 -0
- package/research/FINDING_005_knowledge_gap_orthogonality.md +34 -0
- package/research/HALLUCINATION_RESEARCH.md +27 -0
- package/research/ensemble-voting.md +324 -0
- package/research/loss-functions.md +545 -0
- package/research-log.md +49 -0
- package/scripts/banner.js +29 -0
- package/scripts/benchmark-local-routerarena.ts +176 -0
- package/scripts/benchmark.js +145 -0
- package/scripts/benchmark.sh +61 -0
- package/scripts/compare-providers.sh +230 -0
- package/scripts/content-planner.js +25 -0
- package/scripts/create-labeled-benchmark.ts +105 -0
- package/scripts/cross_post.py +443 -0
- package/scripts/local-router-benchmark.ts +154 -0
- package/scripts/post-all.sh +41 -0
- package/scripts/publish_fcc.py +106 -0
- package/scripts/push-to-gitee.sh +25 -0
- package/scripts/routerarena_ensemble.js +144 -0
- package/scripts/routing-benchmark-v2.js +373 -0
- package/scripts/routing-benchmark-v3.js +118 -0
- package/scripts/routing-benchmark.js +462 -0
- package/scripts/run-labeled-benchmark.mjs +104 -0
- package/scripts/run-mmlu-benchmark.js +176 -0
- package/scripts/run-provider-benchmark.js +244 -0
- package/scripts/update-npm-badges.js +158 -0
- package/skill/SKILL.md +238 -0
- package/src/__tests__/integration/tmpld_integration.test.py +540 -0
- package/src/ensemble.ts +2 -0
- package/src/routing/advancedRouter.ts +1 -1
- package/src/skills/__tests__/skill_manager.test.ts +328 -0
- package/submissions/benchmarks/ALL_PLATFORMS_SUBMISSION.md +94 -0
- package/submissions/benchmarks/LLMROUTERBENCH_SUBMISSION.md +121 -0
- package/submissions/benchmarks/MMRBENCH_SUBMISSION.md +94 -0
- package/submissions/benchmarks/ROUTERARENA_UPDATE.md +83 -0
- package/submissions/benchmarks/ROUTERBENCH_SUBMISSION.md +225 -0
- package/test-council/1-structure-tests.test.js +353 -0
- package/test-council/1-structure-tests.test.ts +353 -0
- package/test-council/2-edge-case-tests.test.ts +361 -0
- package/test-council/3-performance-tests.test.ts +652 -0
- package/test-council/4-integration-tests.test.ts +391 -0
- package/test-council/5-agent-council-eval.test.ts +413 -0
- package/test-council/AGENT_COUNCIL_ARCHITECTURE.md +349 -0
- package/test-council/TEST_COUNCIL_REPORT.md +201 -0
- package/test-council/agents/edge-case-agent.ts +363 -0
- package/test-council/agents/performance-agent.ts +426 -0
- package/test-council/agents/structure-agent.ts +227 -0
- package/test-council/council.md +183 -0
- package/tests/__mocks__/tokenUtils.ts +8 -0
- package/tests/memory/episodicMemory.test.ts +227 -0
- package/tests/package-lock.json +1785 -0
- package/tests/package.json +19 -0
- package/tests/routing/ensembleVoting.test.ts +236 -0
- package/tests/routing/providerRetry.test.ts +360 -0
- package/tests/routing/queryTypePresets.test.ts +208 -0
- package/tests/security/guardrailEngine.test.ts +700 -0
- package/tests/tsconfig.json +21 -0
- package/tests/vitest.config.ts +18 -0
- package/tmlpd-pi-extension/README.md +66 -0
- package/tmlpd-pi-extension/dist/cache/prefixCache.d.ts +114 -0
- package/tmlpd-pi-extension/dist/cache/prefixCache.d.ts.map +1 -0
- package/tmlpd-pi-extension/dist/cache/prefixCache.js +285 -0
- package/tmlpd-pi-extension/dist/cache/prefixCache.js.map +1 -0
- package/tmlpd-pi-extension/dist/cache/responseCache.d.ts +58 -0
- package/tmlpd-pi-extension/dist/cache/responseCache.d.ts.map +1 -0
- package/tmlpd-pi-extension/dist/cache/responseCache.js +153 -0
- package/tmlpd-pi-extension/dist/cache/responseCache.js.map +1 -0
- package/tmlpd-pi-extension/dist/cli.js +59 -0
- package/tmlpd-pi-extension/dist/cost/costTracker.d.ts +95 -0
- package/tmlpd-pi-extension/dist/cost/costTracker.d.ts.map +1 -0
- package/tmlpd-pi-extension/dist/cost/costTracker.js +240 -0
- package/tmlpd-pi-extension/dist/cost/costTracker.js.map +1 -0
- package/tmlpd-pi-extension/dist/index.d.ts +723 -0
- package/tmlpd-pi-extension/dist/index.d.ts.map +1 -0
- package/tmlpd-pi-extension/dist/index.js +239 -0
- package/tmlpd-pi-extension/dist/index.js.map +1 -0
- package/tmlpd-pi-extension/dist/memory/episodicMemory.d.ts +82 -0
- package/tmlpd-pi-extension/dist/memory/episodicMemory.d.ts.map +1 -0
- package/tmlpd-pi-extension/dist/memory/episodicMemory.js +145 -0
- package/tmlpd-pi-extension/dist/memory/episodicMemory.js.map +1 -0
- package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.d.ts +102 -0
- package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.d.ts.map +1 -0
- package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.js +207 -0
- package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.js.map +1 -0
- package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.d.ts +85 -0
- package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.d.ts.map +1 -0
- package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.js +210 -0
- package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.js.map +1 -0
- package/tmlpd-pi-extension/dist/providers/localProvider.d.ts +102 -0
- package/tmlpd-pi-extension/dist/providers/localProvider.d.ts.map +1 -0
- package/tmlpd-pi-extension/dist/providers/localProvider.js +338 -0
- package/tmlpd-pi-extension/dist/providers/localProvider.js.map +1 -0
- package/tmlpd-pi-extension/dist/providers/registry.d.ts +55 -0
- package/tmlpd-pi-extension/dist/providers/registry.d.ts.map +1 -0
- package/tmlpd-pi-extension/dist/providers/registry.js +138 -0
- package/tmlpd-pi-extension/dist/providers/registry.js.map +1 -0
- package/tmlpd-pi-extension/dist/routing/advancedRouter.d.ts +68 -0
- package/tmlpd-pi-extension/dist/routing/advancedRouter.d.ts.map +1 -0
- package/tmlpd-pi-extension/dist/routing/advancedRouter.js +332 -0
- package/tmlpd-pi-extension/dist/routing/advancedRouter.js.map +1 -0
- package/tmlpd-pi-extension/dist/tools/tmlpdTools.d.ts +101 -0
- package/tmlpd-pi-extension/dist/tools/tmlpdTools.d.ts.map +1 -0
- package/tmlpd-pi-extension/dist/tools/tmlpdTools.js +368 -0
- package/tmlpd-pi-extension/dist/tools/tmlpdTools.js.map +1 -0
- package/tmlpd-pi-extension/dist/utils/batchProcessor.d.ts +96 -0
- package/tmlpd-pi-extension/dist/utils/batchProcessor.d.ts.map +1 -0
- package/tmlpd-pi-extension/dist/utils/batchProcessor.js +170 -0
- package/tmlpd-pi-extension/dist/utils/batchProcessor.js.map +1 -0
- package/tmlpd-pi-extension/dist/utils/compression.d.ts +61 -0
- package/tmlpd-pi-extension/dist/utils/compression.d.ts.map +1 -0
- package/tmlpd-pi-extension/dist/utils/compression.js +281 -0
- package/tmlpd-pi-extension/dist/utils/compression.js.map +1 -0
- package/tmlpd-pi-extension/dist/utils/reliability.d.ts +74 -0
- package/tmlpd-pi-extension/dist/utils/reliability.d.ts.map +1 -0
- package/tmlpd-pi-extension/dist/utils/reliability.js +177 -0
- package/tmlpd-pi-extension/dist/utils/reliability.js.map +1 -0
- package/tmlpd-pi-extension/dist/utils/speculativeDecoding.d.ts +117 -0
- package/tmlpd-pi-extension/dist/utils/speculativeDecoding.d.ts.map +1 -0
- package/tmlpd-pi-extension/dist/utils/speculativeDecoding.js +246 -0
- package/tmlpd-pi-extension/dist/utils/speculativeDecoding.js.map +1 -0
- package/tmlpd-pi-extension/dist/utils/tokenUtils.d.ts +50 -0
- package/tmlpd-pi-extension/dist/utils/tokenUtils.d.ts.map +1 -0
- package/tmlpd-pi-extension/dist/utils/tokenUtils.js +124 -0
- package/tmlpd-pi-extension/dist/utils/tokenUtils.js.map +1 -0
- package/tmlpd-pi-extension/examples/QUICKSTART.md +183 -0
- package/tmlpd-pi-extension/package-lock.json +79 -0
- package/tmlpd-pi-extension/package.json +172 -0
- package/tmlpd-pi-extension/python/examples.py +53 -0
- package/tmlpd-pi-extension/python/integrations.py +330 -0
- package/tmlpd-pi-extension/python/setup.py +28 -0
- package/tmlpd-pi-extension/python/tmlpd.py +369 -0
- package/tmlpd-pi-extension/qna/REDDIT_GAP_ANALYSIS.md +299 -0
- package/tmlpd-pi-extension/qna/TMLPD_QNA.md +751 -0
- package/tmlpd-pi-extension/skill/SKILL.md +238 -0
- package/tmlpd-pi-extension/src/cache/responseCache.ts +147 -0
- package/tmlpd-pi-extension/src/cost/costTracker.ts +302 -0
- package/tmlpd-pi-extension/src/index.ts +232 -0
- package/tmlpd-pi-extension/src/memory/episodicMemory.ts +257 -0
- package/tmlpd-pi-extension/src/orchestration/haloOrchestrator.ts +266 -0
- package/tmlpd-pi-extension/src/orchestration/mctsWorkflow.ts +262 -0
- package/tmlpd-pi-extension/src/providers/localProvider.ts +406 -0
- package/tmlpd-pi-extension/src/providers/registry.ts +164 -0
- package/tmlpd-pi-extension/src/routing/ensembleVoting.ts +159 -0
- package/tmlpd-pi-extension/src/routing/queryTypePresets.ts +136 -0
- package/tmlpd-pi-extension/src/tools/tmlpdTools.ts +433 -0
- package/tmlpd-pi-extension/src/utils/batchProcessor.ts +232 -0
- package/tmlpd-pi-extension/src/utils/compression.ts +325 -0
- package/tmlpd-pi-extension/src/utils/reliability.ts +221 -0
- package/tmlpd-pi-extension/src/utils/tokenUtils.ts +145 -0
- package/tmlpd-pi-extension/tsconfig.json +18 -0
- package/tsconfig.build.json +29 -0
- package/tsconfig.json +18 -0
- package/README.md.bak +0 -1185
- package/src/routing/advancedRouter.ts.bak +0 -650
- package/test.js.bak +0 -376
- /package/{llms-full.txt.bak → docs/llms-full.txt} +0 -0
|
@@ -0,0 +1,652 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Performance Tests - Latency, Throughput, Cost Accuracy
|
|
3
|
+
*
|
|
4
|
+
* Comprehensive benchmarks and performance regression tests.
|
|
5
|
+
* These tests verify the system meets performance requirements.
|
|
6
|
+
*
|
|
7
|
+
* @generated by performance-agent
|
|
8
|
+
*/
|
|
9
|
+
|
|
10
|
+
import { describe, it, expect, beforeEach } from 'vitest';
|
|
11
|
+
|
|
12
|
+
// Import modules
|
|
13
|
+
const {
|
|
14
|
+
routeQuery,
|
|
15
|
+
routeBatch,
|
|
16
|
+
countTokens,
|
|
17
|
+
estimateTokens,
|
|
18
|
+
MemoryTree,
|
|
19
|
+
CostTracker,
|
|
20
|
+
createA3MRouter,
|
|
21
|
+
} = require('../dist/index.js');
|
|
22
|
+
|
|
23
|
+
// Try to load tokenUtils
|
|
24
|
+
let tokenUtils: any = null;
|
|
25
|
+
try {
|
|
26
|
+
tokenUtils = require('../dist/utils/tokenUtils.js');
|
|
27
|
+
} catch (e) {
|
|
28
|
+
// Fallback to inline implementation
|
|
29
|
+
}
|
|
30
|
+
|
|
31
|
+
// ============================================================
|
|
32
|
+
// PERFORMANCE TEST UTILITIES
|
|
33
|
+
// ============================================================
|
|
34
|
+
|
|
35
|
+
/**
 * Summary statistics produced by one `runBenchmark` call.
 *
 * Every `*Ms` field is a duration in milliseconds, derived from
 * differences between `performance.now()` readings.
 */
interface BenchmarkResult {
  /** Label identifying the benchmark; printed as the heading by `printBenchmark`. */
  name: string;
  /** Number of timed iterations that were requested. */
  iterations: number;
  /** Sum of all per-iteration durations. */
  totalMs: number;
  /** Mean per-iteration duration. */
  avgMs: number;
  /** Fastest single iteration. */
  minMs: number;
  /** Slowest single iteration. */
  maxMs: number;
  /** Median (50th percentile) per-iteration duration. */
  p50Ms: number;
  /** 95th percentile per-iteration duration. */
  p95Ms: number;
  /** 99th percentile per-iteration duration. */
  p99Ms: number;
  /** Throughput extrapolated from the total measured time (iterations per second). */
  opsPerSecond: number;
}
|
|
47
|
+
|
|
48
|
+
/**
 * Times repeated synchronous calls of `fn` and summarises the latencies.
 *
 * `fn` is first called ten times untimed (warmup), then once per timed
 * iteration, with each call bracketed by `performance.now()` readings.
 *
 * @param name - Label copied into the result.
 * @param fn - Synchronous function under test; its return value is ignored.
 * @param iterations - Number of timed calls to make (default 1000).
 * @returns Aggregate statistics in milliseconds. When no timed call was made
 *   (`iterations` is zero or negative) every statistic is `0` rather than
 *   `NaN`/`undefined`, so the result is always safe to format and compare.
 */
function runBenchmark(name: string, fn: () => void, iterations: number = 1000): BenchmarkResult {
  const times: number[] = [];

  // Warmup: untimed calls made before any measurement is recorded.
  for (let i = 0; i < 10; i++) {
    fn();
  }

  // Actual benchmark: one sample per call.
  for (let i = 0; i < iterations; i++) {
    const start = performance.now();
    fn();
    times.push(performance.now() - start);
  }

  // Statistics are based on the number of samples actually collected, which
  // can differ from `iterations` when it is zero, negative or fractional.
  const sampleCount = times.length;
  if (sampleCount === 0) {
    return {
      name,
      iterations,
      totalMs: 0,
      avgMs: 0,
      minMs: 0,
      maxMs: 0,
      p50Ms: 0,
      p95Ms: 0,
      p99Ms: 0,
      opsPerSecond: 0,
    };
  }

  // Ascending numeric order so that percentiles can be read by index.
  times.sort((a, b) => a - b);

  const totalMs = times.reduce((sum, sample) => sum + sample, 0);

  // Same floor-based index as before, clamped to the last sample.
  const percentile = (fraction: number): number =>
    times[Math.min(sampleCount - 1, Math.floor(sampleCount * fraction))];

  return {
    name,
    iterations,
    totalMs,
    avgMs: totalMs / sampleCount,
    minMs: times[0],
    maxMs: times[sampleCount - 1],
    p50Ms: percentile(0.50),
    p95Ms: percentile(0.95),
    p99Ms: percentile(0.99),
    // NOTE: evaluates to Infinity when every sample rounds to 0ms.
    opsPerSecond: (sampleCount / totalMs) * 1000,
  };
}
|
|
81
|
+
|
|
82
|
+
/**
 * Writes a benchmark summary to the console: a header line with the name,
 * one line per latency figure (4 decimal places, in ms) and a final
 * throughput line (2 decimal places).
 *
 * @param result Summary to print.
 */
function printBenchmark(result: BenchmarkResult): void {
  const { name, avgMs, minMs, maxMs, p50Ms, p95Ms, p99Ms, opsPerSecond } = result;

  // Latency rows in display order; all share the same "<label>: <ms>ms" format.
  const latencyRows: Array<[string, number]> = [
    ['Avg', avgMs],
    ['Min', minMs],
    ['Max', maxMs],
    ['p50', p50Ms],
    ['p95', p95Ms],
    ['p99', p99Ms]
  ];

  console.log(`\n ${name}:`);
  for (const [label, ms] of latencyRows) {
    console.log(` ${label}: ${ms.toFixed(4)}ms`);
  }
  console.log(` Ops/sec: ${opsPerSecond.toFixed(2)}`);
}
|
|
92
|
+
|
|
93
|
+
// ============================================================
|
|
94
|
+
// TOKEN COUNTING BENCHMARKS
|
|
95
|
+
// ============================================================
|
|
96
|
+
|
|
97
|
+
describe('1. Performance - Token Counting', () => {

  /** One token-counting benchmark: what to run and the limits it must meet. */
  interface TokenBenchCase {
    /** Test title shown by the runner. */
    title: string;
    /** Label passed to runBenchmark / printed in the report. */
    label: string;
    /** Input text handed to the function under test. */
    text: string;
    /** Upper bound (exclusive) for the average time per call, in ms. */
    maxAvgMs: number;
    /** Optional lower bound (exclusive) for calls per second. */
    minOpsPerSecond?: number;
  }

  /**
   * Registers one `it` per case. Each test benchmarks `tokenize(text)` with
   * the default iteration count, prints the result and checks the limits.
   */
  const defineTokenBenchmarks = (tokenize: (text: string) => unknown, cases: TokenBenchCase[]): void => {
    for (const { title, label, text, maxAvgMs, minOpsPerSecond } of cases) {
      it(title, () => {
        const result = runBenchmark(label, () => {
          tokenize(text);
        });
        printBenchmark(result);

        expect(result.avgMs).toBeLessThan(maxAvgMs);
        if (minOpsPerSecond !== undefined) {
          expect(result.opsPerSecond).toBeGreaterThan(minOpsPerSecond);
        }
      });
    }
  };

  describe('countTokens performance', () => {
    const codeSample = [
      'function helloWorld() {',
      'console.log("Hello, World!");',
      'return 42;',
      '}',
      'const x = [1, 2, 3, 4, 5];',
      'const obj = { a: 1, b: 2 };'
    ].join('\n');

    defineTokenBenchmarks(countTokens, [
      {
        title: 'benchmarks short text (~10 chars)',
        label: 'countTokens (short)',
        text: 'Hello world',
        maxAvgMs: 1, // Should be very fast
        minOpsPerSecond: 1000
      },
      {
        title: 'benchmarks medium text (~100 chars)',
        label: 'countTokens (medium)',
        text: 'This is a moderately long sentence that contains a decent amount of text for benchmarking.',
        maxAvgMs: 2,
        minOpsPerSecond: 500
      },
      {
        title: 'benchmarks long text (~2000 chars)',
        label: 'countTokens (long)',
        text: 'The quick brown fox jumps over the lazy dog. '.repeat(50),
        maxAvgMs: 10,
        minOpsPerSecond: 100
      },
      {
        title: 'benchmarks code text',
        label: 'countTokens (code)',
        text: codeSample,
        maxAvgMs: 5
      },
      {
        title: 'benchmarks unicode text',
        label: 'countTokens (unicode)',
        text: 'こんにちは世界!これはテストです。日本語のテキストを処理しています。',
        maxAvgMs: 5
      }
    ]);
  });

  describe('estimateTokens performance', () => {
    defineTokenBenchmarks(estimateTokens, [
      {
        title: 'benchmarks short text',
        label: 'estimateTokens (short)',
        text: 'Hello world',
        maxAvgMs: 1
      },
      {
        title: 'benchmarks long text',
        label: 'estimateTokens (long)',
        text: 'word '.repeat(1000),
        maxAvgMs: 10
      }
    ]);
  });

  describe('Token estimation accuracy', () => {
    it('countTokens is consistent for same input', () => {
      const text = 'The quick brown fox jumps over the lazy dog';
      const [first, second, third] = [countTokens(text), countTokens(text), countTokens(text)];

      expect(first).toBe(second);
      expect(second).toBe(third);
    });

    it('longer text has more tokens', () => {
      const short = 'Hi';
      const medium = 'Hello world, this is a test';
      const long = 'Hello world, this is a test. The quick brown fox jumps over the lazy dog. ' +
        'This is a longer text that should have more tokens than the medium one.';

      const tokensShort = countTokens(short);
      const tokensMedium = countTokens(medium);
      const tokensLong = countTokens(long);

      expect(tokensLong).toBeGreaterThan(tokensMedium);
      expect(tokensMedium).toBeGreaterThan(tokensShort);
    });

    // Title states what is actually asserted: no ordering between code and
    // prose is checked (code may tokenize to more or fewer tokens), only that
    // both inputs produce a positive count.
    it('code and plain text both produce positive token counts', () => {
      const plainText = 'This is a sentence about functions and code';
      const codeText = 'function test() { return 42; } const x = 1;';

      expect(countTokens(plainText)).toBeGreaterThan(0);
      expect(countTokens(codeText)).toBeGreaterThan(0);
    });
  });
});
|
|
215
|
+
|
|
216
|
+
// ============================================================
|
|
217
|
+
// ROUTING PERFORMANCE BENCHMARKS
|
|
218
|
+
// ============================================================
|
|
219
|
+
|
|
220
|
+
describe('2. Performance - Routing', () => {

  describe('routeQuery performance', () => {
    it('benchmarks simple query', () => {
      const stats = runBenchmark('routeQuery (simple)', () => {
        routeQuery('Hello, how are you?');
      });
      printBenchmark(stats);

      // Should be fast
      expect(stats.avgMs).toBeLessThan(50);
      expect(stats.opsPerSecond).toBeGreaterThan(20);
    });

    it('benchmarks complex query', () => {
      const complexQuery =
        'Write a Python function to sort an array using quicksort algorithm with proper error handling';
      const stats = runBenchmark('routeQuery (complex)', () => {
        routeQuery(complexQuery);
      });
      printBenchmark(stats);

      expect(stats.avgMs).toBeLessThan(100);
    });

    it('benchmarks very long query', () => {
      const longQuery = 'Analyze the following code and suggest improvements: '.repeat(20);
      const stats = runBenchmark('routeQuery (long)', () => {
        routeQuery(longQuery);
      });
      printBenchmark(stats);

      expect(stats.avgMs).toBeLessThan(200);
    });

    it('benchmarks repeated queries (cache effectiveness)', () => {
      const query = 'What is 2+2?';

      // Prime with one call so the measured calls are all repeats of a
      // previously seen query (faster only if routeQuery caches).
      routeQuery(query);

      const stats = runBenchmark('routeQuery (repeated)', () => {
        routeQuery(query);
      });
      printBenchmark(stats);

      expect(stats.avgMs).toBeLessThan(50);
    });
  });

  describe('routeBatch performance', () => {
    it('benchmarks batch of 10', () => {
      const queries = new Array(10).fill('Hello world');
      const stats = runBenchmark('routeBatch (10 items)', () => {
        routeBatch(queries);
      }, 100);
      printBenchmark(stats);

      expect(stats.avgMs).toBeLessThan(500);
    });

    it('benchmarks batch of 100', () => {
      const queries = new Array(100).fill('Test query');
      const stats = runBenchmark('routeBatch (100 items)', () => {
        routeBatch(queries);
      }, 50);
      printBenchmark(stats);

      expect(stats.avgMs).toBeLessThan(5000);
    });

    it('benchmarks batch scaling', () => {
      const smallBatch = new Array(10).fill('test');
      const largeBatch = new Array(100).fill('test');

      const smallStats = runBenchmark('routeBatch (10)', () => routeBatch(smallBatch), 50);
      const largeStats = runBenchmark('routeBatch (100)', () => routeBatch(largeBatch), 50);

      printBenchmark(smallStats);
      printBenchmark(largeStats);

      // A 10x larger batch may take at most 20x the 10-item average,
      // i.e. no worse than twice linear scaling.
      const scalingCeilingMs = smallStats.avgMs * 20;
      expect(largeStats.avgMs).toBeLessThan(scalingCeilingMs);
    });
  });
});
|
|
304
|
+
|
|
305
|
+
// ============================================================
|
|
306
|
+
// MEMORY OPERATION BENCHMARKS
|
|
307
|
+
// ============================================================
|
|
308
|
+
|
|
309
|
+
describe('3. Performance - Memory Operations', () => {

  /**
   * Creates a MemoryTree and fills it with `count` entries.
   *
   * MemoryTree.add is async, so every add is awaited before the tree is
   * returned; otherwise the benchmarks below could start against a tree that
   * is still being populated.
   *
   * @param maxSize   Value passed as the MemoryTree `maxSize` option.
   * @param count     Number of entries to add.
   * @param makeEntry Produces the text of the i-th entry.
   */
  const seedMemory = async (maxSize: number, count: number, makeEntry: (i: number) => string) => {
    const memory = new MemoryTree({ maxSize });
    for (let i = 0; i < count; i++) {
      await memory.add(makeEntry(i), { tags: ['test'] });
    }
    return memory;
  };

  describe('MemoryTree.add performance', () => {
    it('benchmarks single add', async () => {
      // runBenchmark is synchronous, so this times construction plus the
      // synchronous part of add() only. The returned promises are collected
      // and awaited afterwards so that a rejected add fails this test instead
      // of surfacing as an unhandled rejection.
      const pendingAdds: Promise<unknown>[] = [];

      const result = runBenchmark('MemoryTree.add (1 entry)', () => {
        const memory = new MemoryTree({ maxSize: 1000 });
        pendingAdds.push(Promise.resolve(memory.add('test entry', { tags: ['test'] })));
      }, 1000);
      await Promise.all(pendingAdds);
      printBenchmark(result);

      expect(result.avgMs).toBeLessThan(10);
    });

    // TODO: Rewrite to use proper async API - current MemoryTree.add is async
    it.skip('benchmarks repeated adds to same instance', () => {
      // MemoryTree.add is async and takes (data: string), not (data, {tags})
      // This test needs to be rewritten to use proper async benchmarking
    });

    // TODO: Rewrite to use proper async API - current MemoryTree.add is async
    it.skip('benchmarks add with metadata', () => {
      // MemoryTree.add is async and takes (data: string), not an object with metadata
      // This test needs to be rewritten to use proper async benchmarking
    });
  });

  // NOTE(review): search() and getStats() are benchmarked as synchronous
  // calls, as in the rest of this file - confirm they do not return promises.
  describe('MemoryTree.search performance', () => {
    it('benchmarks search with few entries', async () => {
      const memory = await seedMemory(1000, 10, (i) => `test entry ${i}`);

      const result = runBenchmark('MemoryTree.search (10 entries)', () => {
        memory.search('test');
      }, 1000);
      printBenchmark(result);

      expect(result.avgMs).toBeLessThan(10);
    });

    it('benchmarks search with many entries', async () => {
      const memory = await seedMemory(10000, 1000, (i) => `test entry ${i} with some content`);

      const result = runBenchmark('MemoryTree.search (1000 entries)', () => {
        memory.search('test');
      }, 100);
      printBenchmark(result);

      expect(result.avgMs).toBeLessThan(50);
    });

    it('benchmarks search with no matches', async () => {
      const memory = await seedMemory(1000, 100, (i) => `unique entry ${i}`);

      const result = runBenchmark('MemoryTree.search (no match)', () => {
        memory.search('nonexistent query string');
      }, 100);
      printBenchmark(result);

      expect(result.avgMs).toBeLessThan(20);
    });
  });

  describe('MemoryTree.getStats performance', () => {
    it('benchmarks getStats', async () => {
      const memory = await seedMemory(1000, 100, (i) => `test entry ${i}`);

      const result = runBenchmark('MemoryTree.getStats', () => {
        memory.getStats();
      }, 100);
      printBenchmark(result);

      expect(result.avgMs).toBeLessThan(10);
    });
  });
});
|
|
395
|
+
|
|
396
|
+
// ============================================================
|
|
397
|
+
// COST TRACKING BENCHMARKS
|
|
398
|
+
// ============================================================
|
|
399
|
+
|
|
400
|
+
describe('4. Performance - Cost Tracking', () => {

  describe('CostTracker performance', () => {
    it('benchmarks record', () => {
      const tracker = new CostTracker();
      const recordOnce = (): void => {
        tracker.record('openai', 'gpt-4o', 100, 50);
      };

      const stats = runBenchmark('CostTracker.record', recordOnce, 1000);
      printBenchmark(stats);

      expect(stats.avgMs).toBeLessThan(1);
    });

    it('benchmarks getSummary', () => {
      const tracker = new CostTracker();

      // Pre-populate with 100 identical records so the summary has data to aggregate.
      let recorded = 0;
      while (recorded < 100) {
        tracker.record('openai', 'gpt-4o', 100, 50);
        recorded += 1;
      }

      const summarise = (): void => {
        tracker.getSummary();
      };
      const stats = runBenchmark('CostTracker.getSummary', summarise, 100);
      printBenchmark(stats);

      expect(stats.avgMs).toBeLessThan(5);
    });
  });
});
|
|
431
|
+
|
|
432
|
+
// ============================================================
|
|
433
|
+
// FACTORY PERFORMANCE
|
|
434
|
+
// ============================================================
|
|
435
|
+
|
|
436
|
+
describe('5. Performance - Router Factory', () => {

  describe('createA3MRouter performance', () => {
    it('benchmarks router creation', () => {
      // A fresh router is built from an empty config on every measured call.
      const buildRouter = (): void => {
        createA3MRouter({});
      };

      const stats = runBenchmark('createA3MRouter', buildRouter, 100);
      printBenchmark(stats);

      expect(stats.avgMs).toBeLessThan(50);
    });

    it('benchmarks router.route', () => {
      // One shared router; only the route() call is inside the measured callback.
      const router = createA3MRouter({});
      const routeOnce = (): void => {
        router.route('test query');
      };

      const stats = runBenchmark('router.route', routeOnce, 100);
      printBenchmark(stats);

      expect(stats.avgMs).toBeLessThan(50);
    });

    it('benchmarks router.routeBatch', () => {
      const router = createA3MRouter({});
      // The 10-item batch array is rebuilt inside every measured call.
      const routeTen = (): void => {
        router.routeBatch(Array(10).fill('test'));
      };

      const stats = runBenchmark('router.routeBatch (10 items)', routeTen, 100);
      printBenchmark(stats);

      expect(stats.avgMs).toBeLessThan(500);
    });
  });
});
|
|
471
|
+
|
|
472
|
+
// ============================================================
|
|
473
|
+
// THROUGHPUT TESTS
|
|
474
|
+
// ============================================================
|
|
475
|
+
|
|
476
|
+
describe('6. Performance - Throughput', () => {

  /**
   * Routes `count` copies of the same query in a single routeBatch call and
   * returns the achieved queries per second.
   *
   * Uses performance.now() rather than Date.now(): with a 1 ms clock a fast
   * batch measures 0 ms elapsed, which turns the rate into Infinity and makes
   * the throughput assertion pass vacuously.
   *
   * NOTE(review): if routeBatch returns a promise, only its synchronous part
   * is timed here - confirm against the implementation.
   */
  const measureBatchQps = (count: number): number => {
    const queries = Array(count).fill('test query');

    const startedAt = performance.now();
    routeBatch(queries);
    const elapsedMs = performance.now() - startedAt;

    return (count / elapsedMs) * 1000;
  };

  it('sustains 50+ queries per second', () => {
    const qps = measureBatchQps(50);
    console.log(`\n Throughput: ${qps.toFixed(2)} queries/sec`);

    expect(qps).toBeGreaterThan(50);
  });

  it('sustains 100+ queries per second', () => {
    const qps = measureBatchQps(100);
    console.log(`\n Throughput: ${qps.toFixed(2)} queries/sec`);

    expect(qps).toBeGreaterThan(100);
  });

  it('handles burst traffic', () => {
    const startedAt = performance.now();

    // Simulate burst of 200 queries
    for (let i = 0; i < 200; i++) {
      routeQuery('burst test');
    }

    const elapsedMs = performance.now() - startedAt;
    console.log(`\n Burst of 200 queries: ${elapsedMs.toFixed(2)}ms`);

    // Should handle burst within 10s
    expect(elapsedMs).toBeLessThan(10000);
  });
});
|
|
516
|
+
|
|
517
|
+
// ============================================================
|
|
518
|
+
// LATENCY DISTRIBUTION TESTS
|
|
519
|
+
// ============================================================
|
|
520
|
+
|
|
521
|
+
describe('7. Performance - Latency Distribution', () => {

  it('routeQuery p95 latency is acceptable', () => {
    const times: number[] = [];

    // Warmup (unmeasured)
    for (let i = 0; i < 10; i++) {
      routeQuery('test');
    }

    // Measure 100 individual calls
    for (let i = 0; i < 100; i++) {
      const start = performance.now();
      routeQuery('test query for latency measurement');
      times.push(performance.now() - start);
    }

    // Ascending sort so percentiles can be read by index.
    times.sort((a, b) => a - b);
    const p95 = times[Math.floor(times.length * 0.95)];
    const p99 = times[Math.floor(times.length * 0.99)];

    console.log(`\n routeQuery latency:`);
    console.log(` p95: ${p95.toFixed(2)}ms`);
    console.log(` p99: ${p99.toFixed(2)}ms`);

    expect(p95).toBeLessThan(200);
    expect(p99).toBeLessThan(500);
  });

  it('MemoryTree operations have low latency', async () => {
    const memory = new MemoryTree({ maxSize: 1000 });
    // MemoryTree.add is async: wait for the entry to be stored so the
    // searches below are measured against a populated tree.
    await memory.add('test entry', { tags: ['test'] });

    const times: number[] = [];

    // NOTE(review): search() is timed as a synchronous call - confirm it
    // does not return a promise.
    for (let i = 0; i < 100; i++) {
      const start = performance.now();
      memory.search('test');
      times.push(performance.now() - start);
    }

    times.sort((a, b) => a - b);
    const p95 = times[Math.floor(times.length * 0.95)];

    console.log(`\n MemoryTree.search p95: ${p95.toFixed(2)}ms`);

    expect(p95).toBeLessThan(50);
  });
});
|
|
570
|
+
|
|
571
|
+
// ============================================================
|
|
572
|
+
// MEMORY USAGE TESTS
|
|
573
|
+
// ============================================================
|
|
574
|
+
|
|
575
|
+
describe('8. Performance - Memory Usage', () => {

  it('MemoryTree does not leak memory on repeated operations', async () => {
    const memory = new MemoryTree({ maxSize: 1000 });

    // 1000 sequential adds; each one is awaited before the next starts.
    for (const index of Array(1000).keys()) {
      await memory.add(`entry ${index}`);
    }

    // The tree must report at least one stored chunk afterwards.
    const finalStats = memory.getStats();
    expect(finalStats.totalChunks).toBeGreaterThan(0);
  });

  it('CostTracker does not leak memory', () => {
    const tracker = new CostTracker();

    let remaining = 1000;
    while (remaining > 0) {
      tracker.record('test', 'test-model', 100, 50);
      remaining -= 1;
    }

    // Every recorded request must be counted in the summary.
    const summary = tracker.getSummary();
    expect(summary.request_count).toBe(1000);
  });
});
|
|
602
|
+
|
|
603
|
+
// ============================================================
|
|
604
|
+
// REGRESSION GATES
|
|
605
|
+
// ============================================================
|
|
606
|
+
|
|
607
|
+
describe('9. Performance - Regression Gates', () => {

  // These tests fail if performance degrades beyond threshold

  it('countTokens must complete in < 1ms avg', () => {
    const result = runBenchmark('REGRESSION: countTokens', () => {
      countTokens('test string for regression check');
    }, 1000);

    console.log(`\n Regression check - countTokens: ${result.avgMs.toFixed(4)}ms avg`);
    expect(result.avgMs).toBeLessThan(1);
  });

  it('routeQuery must complete in < 100ms avg', () => {
    const result = runBenchmark('REGRESSION: routeQuery', () => {
      routeQuery('test query for regression check');
    }, 100);

    console.log(`\n Regression check - routeQuery: ${result.avgMs.toFixed(4)}ms avg`);
    expect(result.avgMs).toBeLessThan(100);
  });

  it('MemoryTree.add must complete in < 10ms avg', async () => {
    // MemoryTree.add is async and runBenchmark is synchronous, so this gate
    // covers construction plus the synchronous part of add(). The promises
    // are awaited afterwards so a rejected add fails the gate instead of
    // becoming an unhandled rejection.
    const pendingAdds: Promise<unknown>[] = [];

    const result = runBenchmark('REGRESSION: MemoryTree.add', () => {
      const memory = new MemoryTree({ maxSize: 1000 });
      pendingAdds.push(Promise.resolve(memory.add('regression test', { tags: ['test'] })));
    }, 100);
    await Promise.all(pendingAdds);

    console.log(`\n Regression check - MemoryTree.add: ${result.avgMs.toFixed(4)}ms avg`);
    expect(result.avgMs).toBeLessThan(10);
  });

  it('MemoryTree.search must complete in < 20ms avg', async () => {
    const memory = new MemoryTree({ maxSize: 1000 });
    // Await every async add so the search is measured against all 100 entries.
    for (let i = 0; i < 100; i++) {
      await memory.add(`test entry ${i}`, { tags: ['test'] });
    }

    // NOTE(review): search() is timed as a synchronous call - confirm it
    // does not return a promise.
    const result = runBenchmark('REGRESSION: MemoryTree.search', () => {
      memory.search('test');
    }, 100);

    console.log(`\n Regression check - MemoryTree.search: ${result.avgMs.toFixed(4)}ms avg`);
    expect(result.avgMs).toBeLessThan(20);
  });
});
|