adaptive-memory-multi-model-router 2.14.45 → 2.14.47
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/index.d.ts +4 -0
- package/dist/index.js +8 -2
- package/dist/memory/hybridMemory.d.ts +71 -0
- package/dist/memory/hybridMemory.js +124 -0
- package/dist/memory/reasoningBank.d.ts +88 -0
- package/dist/memory/reasoningBank.js +303 -0
- package/{docs/llms.txt → llms.txt.bak} +6 -6
- package/package.json +13 -84
- package/src/index.ts +8 -0
- package/src/memory/hybridMemory.ts +155 -0
- package/src/memory/reasoningBank.ts +335 -0
- package/src/routing/advancedRouter.ts.bak +650 -0
- package/test.js.bak +376 -0
- package/.dockerignore +0 -82
- package/.env.example +0 -303
- package/.github/DISCUSSIONS_WELCOME.md +0 -27
- package/.github/DISCUSSION_TEMPLATE.yml +0 -5
- package/.github/FUNDING.yml +0 -2
- package/.github/ISSUE_TEMPLATE/bug_report.md +0 -94
- package/.github/ISSUE_TEMPLATE/config.yml +0 -17
- package/.github/ISSUE_TEMPLATE/feature_request.md +0 -71
- package/.github/PULL_REQUEST_TEMPLATE.md +0 -71
- package/.github/dependabot.yml +0 -9
- package/.github/workflows/auto-publish.yml +0 -51
- package/.github/workflows/ci.yml +0 -263
- package/.github/workflows/codeql.yml +0 -38
- package/.github/workflows/npm-publish.yml +0 -20
- package/.github/workflows/pages.yml +0 -37
- package/.github/workflows/stale.yml +0 -54
- package/.publish-tick +0 -1
- package/.well-known/ai-plugin.json +0 -16
- package/AGENT_COUNCIL_FINDINGS.md +0 -142
- package/ARCHITECTURE.md +0 -346
- package/AUDIT_REPORT.md +0 -28
- package/CODE_OF_CONDUCT.md +0 -128
- package/CONTRIBUTING.md +0 -50
- package/CONTRIBUTORS.md +0 -20
- package/Dockerfile +0 -53
- package/Dockerfile.proxy +0 -33
- package/HEALTH_REPORT.md +0 -118
- package/IMPROVEMENT_PLAN.md +0 -107
- package/LANDING.md +0 -43
- package/LAUNCH-PAIN-DRIVEN.md +0 -339
- package/LAUNCH.md +0 -337
- package/LAUNCH_CHECKLIST.md +0 -141
- package/LAUNCH_SNAPSHOT.md +0 -260
- package/MANIFESTO.md +0 -41
- package/POPULARITY_BOOSTERS.md +0 -285
- package/PR_STATUS_REPORT.md +0 -148
- package/REDESIGN.md +0 -95
- package/RUNKIT.md +0 -83
- package/SECURITY.md +0 -29
- package/SUBMISSIONS.md +0 -43
- package/_schema.html +0 -53
- package/ai-plugin.json +0 -16
- package/articles/AI_AGENT_LLM_ROUTING.md +0 -150
- package/articles/CHINESE_DIRECTORIES.md +0 -100
- package/articles/CHINESE_SUBMISSIONS_READY.md +0 -322
- package/articles/COMPETITOR_ALERTS.md +0 -31
- package/articles/COMPLETE_POSTING_DIRECTORY.md +0 -147
- package/articles/CONTENT_STRUCTURE.md +0 -292
- package/articles/DEVTO_COST_GUIDE.md +0 -473
- package/articles/DEVTO_FINAL.md +0 -416
- package/articles/DEVTO_MULTI_PROVIDER.md +0 -542
- package/articles/DEVTO_READY.md +0 -255
- package/articles/DEVTO_V2_ANNOUNCEMENT.md +0 -160
- package/articles/DEVTO_VIRAL_GROWTH.md +0 -280
- package/articles/FRESH_devto.md +0 -460
- package/articles/FRESH_devto_2026_05.md +0 -73
- package/articles/FRESH_hackernews.md +0 -14
- package/articles/FRESH_reddit_ml.md +0 -90
- package/articles/FRESH_reddit_node.md +0 -198
- package/articles/FRESH_reddit_sideproject.md +0 -72
- package/articles/FRESH_reddit_webdev.md +0 -130
- package/articles/FROM_ZERO_TO_10K.md +0 -107
- package/articles/HN_10X_BETTER.md +0 -430
- package/articles/HN_ACCOUNT_GUIDE.md +0 -21
- package/articles/HN_CHINESE_STYLE.md +0 -308
- package/articles/HN_FINAL.md +0 -148
- package/articles/HN_POSTED_VERSION.md +0 -56
- package/articles/HN_POST_READY.md +0 -137
- package/articles/HN_RESEARCH.md +0 -364
- package/articles/HN_SHOW_routerarena.md +0 -17
- package/articles/HN_TIMING_GUIDE.md +0 -52
- package/articles/INDIEHACKERS_POST.md +0 -52
- package/articles/INDIEHACKERS_READY.md +0 -120
- package/articles/LLM_BENCHMARK_DEEP_DIVE.md +0 -153
- package/articles/MASTER_POSTING_DIRECTORY.md +0 -189
- package/articles/NEWSLETTER_SEND_NOW.md +0 -259
- package/articles/NEWSLETTER_SUBMISSIONS.md +0 -112
- package/articles/PAIN-DRIVEN-devto-v2.md +0 -308
- package/articles/PAIN-DRIVEN-devto-v3.md +0 -268
- package/articles/PAIN-DRIVEN-devto.md +0 -242
- package/articles/PAIN-DRIVEN-hackernews-v2.md +0 -138
- package/articles/PAIN-DRIVEN-hackernews-v3.md +0 -151
- package/articles/PAIN-DRIVEN-hackernews.md +0 -131
- package/articles/PAIN-DRIVEN-reddit-v2.md +0 -301
- package/articles/PAIN-DRIVEN-reddit-v3.md +0 -236
- package/articles/PAIN-DRIVEN-reddit.md +0 -218
- package/articles/PAIN-DRIVEN-twitter-v2.md +0 -110
- package/articles/PAIN-DRIVEN-twitter-v3.md +0 -121
- package/articles/PAIN-DRIVEN-twitter.md +0 -120
- package/articles/PORTKEY_VS_A3M.md +0 -147
- package/articles/POSTING_KIT_2026_05.md +0 -67
- package/articles/PRESS_KIT_routerarena.md +0 -77
- package/articles/PRODUCTHUNT_LISTING.md +0 -48
- package/articles/PRODUCTHUNT_READY.md +0 -106
- package/articles/PR_PLAN_vault.md +0 -125
- package/articles/REDDIT_FINAL.md +0 -232
- package/articles/REDDIT_POST.md +0 -67
- package/articles/REDDIT_SUBMISSION_READY.md +0 -348
- package/articles/ROUTERARENA_LEADER.md +0 -45
- package/articles/SHOW_HN_FINAL.md +0 -29
- package/articles/TWEETS_10K_DOWNLOADS.md +0 -47
- package/articles/TWEETS_BENCHMARK_FIRST.md +0 -46
- package/articles/TWEETS_MCP_PLAY.md +0 -51
- package/articles/TWEETS_SEQUENTIAL_BROKEN.md +0 -49
- package/articles/TWEETS_WHY_BUILD.md +0 -54
- package/articles/TWEETS_routerarena_leader.md +0 -53
- package/articles/TWEET_STORM_READY.md +0 -165
- package/articles/TWITTER_FINAL.md +0 -167
- package/articles/WHY_10X_BETTER.md +0 -261
- package/articles/WHY_CHINESE_STYLE_BETTER.md +0 -323
- package/articles/ai-discoverability-llm-routing.md +0 -210
- package/articles/devto-llm-routing.md +0 -138
- package/articles/hackernews-show-hn.md +0 -54
- package/articles/hashnode-llm-cost-optimization.md +0 -125
- package/articles/hn_show_2026_05.md +0 -11
- package/articles/medium-building-llm-router.md +0 -205
- package/articles/reddit-ml.md +0 -76
- package/articles/twitter-thread-cost-savings.md +0 -50
- package/articles/youtube-tutorial-script.md +0 -262
- package/assets/a3m_3blue1brown.mp4 +0 -0
- package/assets/banner.svg +0 -109
- package/assets/chart-cost-v2.svg +0 -91
- package/assets/chart-cost-v3.svg +0 -143
- package/assets/chart-features-v2.svg +0 -132
- package/assets/chart-features-v3.svg +0 -211
- package/assets/chart-growth-v2.svg +0 -122
- package/assets/chart-growth-v3.svg +0 -189
- package/assets/cost-comparison.svg +0 -134
- package/assets/cost-simple.svg +0 -64
- package/assets/demo-hn.gif +0 -0
- package/assets/feature-matrix.svg +0 -136
- package/assets/growth-chart-animated.svg +0 -76
- package/assets/growth-chart.svg +0 -82
- package/assets/growth-simple.svg +0 -69
- package/assets/hero-diagram.svg +0 -81
- package/assets/logo-new.svg +0 -21
- package/assets/logo.svg +0 -68
- package/assets/provider-comparison.svg +0 -121
- package/assets/social-preview-new.svg +0 -100
- package/assets/social-preview.svg +0 -194
- package/assets/social-v2.svg +0 -130
- package/assets/social-v3.svg +0 -212
- package/benchmark-provider-results.json +0 -245
- package/benchmark-results.json +0 -54
- package/council-votes/architecture-vote.md +0 -121
- package/council-votes/coverage-vote.md +0 -93
- package/data/adaptive-benchmark.json +0 -92
- package/data/benchmark-results.json +0 -47
- package/data/labeled-benchmark.json +0 -88
- package/demo/3blue1brown_video.py +0 -285
- package/demo/3blue1brown_video_v2.py +0 -310
- package/demo/IMPROVED_PROMPTS.md +0 -229
- package/demo/VEO3_PROMPTS.md +0 -269
- package/demo/VIDEO_PRODUCTION_GUIDE.md +0 -333
- package/demo/a3m_3blue1brown.mp4 +0 -0
- package/demo/asciinema-demo.sh +0 -195
- package/demo/demo-hn.tape +0 -74
- package/demo/demo-script.md +0 -53
- package/demo/demo-script.sh +0 -62
- package/demo/demo.svg +0 -75
- package/demo/frame1_ai_data_center.png +0 -0
- package/demo/frame1_sunset_video.mp4 +0 -0
- package/demo/frame2_cost_comparison.png +0 -0
- package/demo/frame2_cost_comparison_fallback.png +0 -0
- package/demo/frame3_parallel_execution.png +0 -0
- package/demo/frame3_parallel_execution_fallback.png +0 -0
- package/demo/frame4_providers.png +0 -0
- package/demo/frame4_providers_fallback.png +0 -0
- package/demo/frame5_endcard.png +0 -0
- package/demo/frame5_endcard_fallback.png +0 -0
- package/demo/new_frame1_hook.png +0 -0
- package/demo/new_frame2_proof.png +0 -0
- package/demo/new_frame3_wow.png +0 -0
- package/demo/new_frame4_social.png +0 -0
- package/demo/new_frame5_cta.png +0 -0
- package/demo/package.json +0 -13
- package/demo/product-video-final.mp4 +0 -0
- package/demo/product-video-hype-v1.mp4 +0 -0
- package/demo/product-video-v1.mp4 +0 -0
- package/demo/public/index.html +0 -762
- package/demo/recording.cast +0 -55
- package/demo/server.js +0 -405
- package/demo-new.tape +0 -71
- package/demo-real.sh +0 -198
- package/demo-simple.tape +0 -205
- package/demo.html +0 -520
- package/demo.sh +0 -85
- package/demo.tape +0 -259
- package/dist/analytics/costAnalytics.d.ts.map +0 -1
- package/dist/analytics/costAnalytics.js.map +0 -1
- package/dist/benchmark/comprehensive.js.map +0 -1
- package/dist/benchmark/reproducible.d.ts.map +0 -1
- package/dist/benchmark/reproducible.js.map +0 -1
- package/dist/cache/prefixCache.d.ts.map +0 -1
- package/dist/cache/prefixCache.js.map +0 -1
- package/dist/cache/responseCache.d.ts.map +0 -1
- package/dist/cache/responseCache.js.map +0 -1
- package/dist/cache/semanticCache.d.ts.map +0 -1
- package/dist/cache/semanticCache.js.map +0 -1
- package/dist/cli/setupWizard.d.ts.map +0 -1
- package/dist/cli/setupWizard.js.map +0 -1
- package/dist/cost/budgetEnforcer.d.ts.map +0 -1
- package/dist/cost/budgetEnforcer.js.map +0 -1
- package/dist/cost/costTracker.d.ts.map +0 -1
- package/dist/cost/costTracker.js.map +0 -1
- package/dist/ensemble/multiRoundDialog.js.map +0 -1
- package/dist/ensemble/shapleyValue.js.map +0 -1
- package/dist/integrations/langchainAdapter.d.ts.map +0 -1
- package/dist/integrations/langchainAdapter.js.map +0 -1
- package/dist/integrations/oauth.d.ts.map +0 -1
- package/dist/integrations/oauth.js.map +0 -1
- package/dist/integrations/scienceAdapter.js.map +0 -1
- package/dist/memory/autoFetch.d.ts.map +0 -1
- package/dist/memory/autoFetch.js.map +0 -1
- package/dist/memory/episodicMemory.d.ts.map +0 -1
- package/dist/memory/episodicMemory.js.map +0 -1
- package/dist/memory/memoryTree.d.ts.map +0 -1
- package/dist/memory/memoryTree.js.map +0 -1
- package/dist/memory/obsidianVault.d.ts.map +0 -1
- package/dist/memory/obsidianVault.js.map +0 -1
- package/dist/observability/changeWatch.d.ts.map +0 -1
- package/dist/observability/changeWatch.js.map +0 -1
- package/dist/observability/fatigueDetector.d.ts.map +0 -1
- package/dist/observability/fatigueDetector.js.map +0 -1
- package/dist/observability/index.d.ts.map +0 -1
- package/dist/observability/index.js.map +0 -1
- package/dist/observability/metrics.d.ts.map +0 -1
- package/dist/observability/metrics.js.map +0 -1
- package/dist/observability/middleware.d.ts.map +0 -1
- package/dist/observability/middleware.js.map +0 -1
- package/dist/observability/tracer.d.ts.map +0 -1
- package/dist/observability/tracer.js.map +0 -1
- package/dist/observability/types.d.ts.map +0 -1
- package/dist/observability/types.js.map +0 -1
- package/dist/orchestration/haloOrchestrator.d.ts.map +0 -1
- package/dist/orchestration/haloOrchestrator.js.map +0 -1
- package/dist/orchestration/mctsWorkflow.d.ts.map +0 -1
- package/dist/orchestration/mctsWorkflow.js.map +0 -1
- package/dist/providers/localProvider.d.ts.map +0 -1
- package/dist/providers/localProvider.js.map +0 -1
- package/dist/providers/providerConfig.d.ts.map +0 -1
- package/dist/providers/providerConfig.js.map +0 -1
- package/dist/providers/registry.d.ts.map +0 -1
- package/dist/providers/registry.js.map +0 -1
- package/dist/routing/advancedRouter.d.ts.map +0 -1
- package/dist/routing/advancedRouter.js.map +0 -1
- package/dist/routing/crossModelValidation.d.ts.map +0 -1
- package/dist/routing/crossModelValidation.js.map +0 -1
- package/dist/routing/providerHealth.d.ts.map +0 -1
- package/dist/routing/providerHealth.js.map +0 -1
- package/dist/routing/providerRetry.d.ts.map +0 -1
- package/dist/routing/providerRetry.js.map +0 -1
- package/dist/scripts/banner.js +0 -29
- package/dist/security/guardrails.d.ts.map +0 -1
- package/dist/security/guardrails.js.map +0 -1
- package/dist/server/dashboard.d.ts.map +0 -1
- package/dist/server/dashboard.js.map +0 -1
- package/dist/server/modelMapper.d.ts.map +0 -1
- package/dist/server/modelMapper.js.map +0 -1
- package/dist/server/proxyServer.d.ts.map +0 -1
- package/dist/server/proxyServer.js.map +0 -1
- package/dist/skills/__tests__/skill_manager.test.d.ts +0 -2
- package/dist/skills/__tests__/skill_manager.test.d.ts.map +0 -1
- package/dist/skills/__tests__/skill_manager.test.js +0 -268
- package/dist/skills/__tests__/skill_manager.test.js.map +0 -1
- package/dist/tools/tmlpdTools.d.ts.map +0 -1
- package/dist/tools/tmlpdTools.js.map +0 -1
- package/dist/tui/dashboard.d.ts.map +0 -1
- package/dist/tui/dashboard.js.map +0 -1
- package/dist/tui/index.d.ts.map +0 -1
- package/dist/tui/index.js.map +0 -1
- package/dist/utils/batchProcessor.d.ts.map +0 -1
- package/dist/utils/batchProcessor.js.map +0 -1
- package/dist/utils/compression.d.ts.map +0 -1
- package/dist/utils/compression.js.map +0 -1
- package/dist/utils/costUtils.d.ts.map +0 -1
- package/dist/utils/costUtils.js.map +0 -1
- package/dist/utils/reliability.d.ts.map +0 -1
- package/dist/utils/reliability.js.map +0 -1
- package/dist/utils/sorting.d.ts.map +0 -1
- package/dist/utils/sorting.js.map +0 -1
- package/dist/utils/speculativeDecoding.d.ts.map +0 -1
- package/dist/utils/speculativeDecoding.js.map +0 -1
- package/dist/utils/tokenUtils.d.ts.map +0 -1
- package/dist/utils/tokenUtils.js.map +0 -1
- package/docs/.nojekyll +0 -0
- package/docs/ANALYSIS_PRINCIPLES.md +0 -162
- package/docs/API.md +0 -855
- package/docs/ARCHITECTURAL-IMPROVEMENTS-2025.md +0 -1391
- package/docs/ARCHITECTURAL-IMPROVEMENTS-REVISED-2025.md +0 -1051
- package/docs/BENCHMARK.md +0 -170
- package/docs/CHINESE_PROVIDER_RELIABILITY.md +0 -37
- package/docs/CITATIONS.md +0 -74
- package/docs/CLAIMS_AND_EVIDENCE.md +0 -58
- package/docs/CONFIGURATION.md +0 -476
- package/docs/COUNCIL_DECISION.json +0 -816
- package/docs/COUNCIL_SUMMARY.md +0 -319
- package/docs/COUNCIL_V2.2_DECISION.md +0 -416
- package/docs/ENGINEERING_SPEC.md +0 -55
- package/docs/FACTORY_RESET.md +0 -34
- package/docs/GEO.md +0 -66
- package/docs/GEO_OPTIMIZATION.md +0 -30
- package/docs/GEO_ROOT_CAUSE.md +0 -136
- package/docs/GEO_STATUS.md +0 -85
- package/docs/GEO_TEST_RESULTS.md +0 -176
- package/docs/HN_CHECKLIST.md +0 -38
- package/docs/HN_FOUNDER_COMMENT.md +0 -17
- package/docs/HN_SUBMISSION_FINAL.md +0 -180
- package/docs/HN_SUBMISSION_V3.md +0 -56
- package/docs/IMPROVEMENT_ROADMAP.md +0 -515
- package/docs/INTEGRATIONS.md +0 -420
- package/docs/LANGCHAIN_INTEGRATION.md +0 -147
- package/docs/LLM_COUNCIL_DECISION.md +0 -508
- package/docs/MIDDLEWARE_CHAIN.md +0 -35
- package/docs/PROMO_CHECKLIST.md +0 -200
- package/docs/QUICKSTART.md +0 -271
- package/docs/QUICK_START.md +0 -43
- package/docs/QUICK_START_VISIBILITY.md +0 -782
- package/docs/REDDIT_GAP_ANALYSIS.md +0 -299
- package/docs/RELEASE_CHECKLIST.md +0 -32
- package/docs/REPRODUCIBILITY.md +0 -63
- package/docs/RESEARCH_BACKED_IMPROVEMENTS.md +0 -1180
- package/docs/ROUTING_RUBRIC.md +0 -197
- package/docs/SEO_AUDIT.md +0 -186
- package/docs/SOCIAL_LISTENING.md +0 -219
- package/docs/TMLPD_QNA.md +0 -751
- package/docs/TMLPD_V2.1_COMPLETE.md +0 -763
- package/docs/TMLPD_V2.2_RESEARCH_ROADMAP.md +0 -754
- package/docs/UPDATE_TOPICS.md +0 -15
- package/docs/USE_CASES.md +0 -59
- package/docs/V2.2_IMPLEMENTATION_COMPLETE.md +0 -446
- package/docs/V2_IMPLEMENTATION_GUIDE.md +0 -388
- package/docs/VERCEL_AI_SDK.md +0 -209
- package/docs/VISIBILITY_ADOPTION_PLAN.md +0 -1005
- package/docs/_config.yml +0 -49
- package/docs/ai-plugin.json +0 -16
- package/docs/api.html +0 -513
- package/docs/architecture-diagram.md +0 -40
- package/docs/benchmark-chart.png +0 -0
- package/docs/benchmark.html +0 -387
- package/docs/blog/routerarena-number-one.html +0 -73
- package/docs/cli-cheatsheet.md +0 -339
- package/docs/compare.md +0 -109
- package/docs/comparison-litellm.md +0 -88
- package/docs/comparison.md +0 -108
- package/docs/cost-chart-ascii.md +0 -42
- package/docs/cost-comparison-chart.svg +0 -88
- package/docs/curl-examples.md +0 -247
- package/docs/demo-auto.html +0 -264
- package/docs/demo.html +0 -416
- package/docs/geo/GENERATIVE_ENGINE_OPTIMIZATION.md +0 -232
- package/docs/index.html +0 -507
- package/docs/launch-content/LAUNCH_EXECUTION_CHECKLIST.md +0 -421
- package/docs/launch-content/README.md +0 -457
- package/docs/launch-content/assets/cost_comparison_100_tasks.png +0 -0
- package/docs/launch-content/assets/cumulative_savings.png +0 -0
- package/docs/launch-content/assets/parallel_speedup.png +0 -0
- package/docs/launch-content/assets/provider_pricing_comparison.png +0 -0
- package/docs/launch-content/assets/task_breakdown_comparison.png +0 -0
- package/docs/launch-content/generate_charts.py +0 -313
- package/docs/launch-content/hn_show_post.md +0 -139
- package/docs/launch-content/partner_outreach_templates.md +0 -745
- package/docs/launch-content/reddit_posts.md +0 -467
- package/docs/launch-content/twitter_thread.txt +0 -460
- package/docs/npm-downloads-chart.svg +0 -43
- package/docs/openapi.json +0 -139
- package/docs/openapi.yaml +0 -1318
- package/docs/quick-start.html +0 -366
- package/docs/robots.txt +0 -52
- package/docs/sitemap.xml +0 -57
- package/docs/styles.css +0 -682
- package/docs/well-known/ai-plugin.json +0 -16
- package/docs/wellknown/ai-plugin.json +0 -16
- package/docs-site/assets/og-banner.svg +0 -194
- package/docs-site/index.html +0 -632
- package/eval/README.md +0 -46
- package/eval/baselines/main.json +0 -12
- package/eval/benchmark_dataset.jsonl +0 -16
- package/eval/check_golden_routes.js +0 -64
- package/eval/datasets/catalog.json +0 -33
- package/eval/datasets/slices/cn_provider_reliability_v1.jsonl +0 -3
- package/eval/datasets/slices/cost_pressure_v1.jsonl +0 -3
- package/eval/datasets/slices/safety_guardrails_v1.jsonl +0 -3
- package/eval/evals.json +0 -199
- package/eval/fault_injection_thresholds.json +0 -3
- package/eval/generate_report.js +0 -128
- package/eval/golden_routes.json +0 -114
- package/eval/lib/experiment_registry.js +0 -24
- package/eval/run_eval.js +0 -197
- package/eval/run_fault_injection.js +0 -201
- package/eval/run_shadow_eval.js +0 -85
- package/eval/thresholds.json +0 -9
- package/examples/QUICKSTART.md +0 -183
- package/examples/README.md +0 -61
- package/examples/a3m-sdk.js +0 -124
- package/examples/basic-route.js +0 -54
- package/examples/chat-loop.js +0 -202
- package/examples/classify-then-route.js +0 -102
- package/examples/cost-compare.js +0 -120
- package/examples/ensemble.js +0 -160
- package/examples/whatsapp-telegram-bridge-demo.js +0 -302
- package/examples/whatsapp-telegram-bridge.js +0 -269
- package/hf-space/README.md +0 -23
- package/hf-space/app.py +0 -240
- package/hf-space/requirements.txt +0 -1
- package/huggingface_space/README.md +0 -35
- package/huggingface_space/app.py +0 -126
- package/huggingface_space/create_space.py +0 -208
- package/huggingface_space/requirements.txt +0 -1
- package/mcp-server/README.md +0 -188
- package/mcp-server/package.json +0 -29
- package/mcp-server/src/index.ts +0 -744
- package/mcp-server/tsconfig.json +0 -19
- package/openclaw-alexa-bridge/ALL_REMAINING_FIXES_PLAN.md +0 -313
- package/openclaw-alexa-bridge/REMAINING_FIXES_SUMMARY.md +0 -277
- package/openclaw-alexa-bridge/src/alexa_handler_no_tmlpd.js +0 -1234
- package/openclaw-alexa-bridge/test_fixes.js +0 -77
- package/playground/README.md +0 -51
- package/playground/codesandbox.json +0 -12
- package/playground/index.js +0 -39
- package/proxy/README.md +0 -227
- package/proxy/package-lock.json +0 -831
- package/proxy/package.json +0 -17
- package/proxy/rate-limit.js +0 -145
- package/proxy/rate-limit.test.js +0 -311
- package/proxy/server.js +0 -970
- package/python/README.md +0 -102
- package/python/a3m/__init__.py +0 -6
- package/python/a3m/client.py +0 -190
- package/python/a3m/models.py +0 -40
- package/python/a3m/sync_client.py +0 -61
- package/python/examples.py +0 -53
- package/python/integrations.py +0 -330
- package/python/pyproject.toml +0 -23
- package/python/setup.py +0 -28
- package/python/tmlpd.py +0 -369
- package/qna/REDDIT_GAP_ANALYSIS.md +0 -299
- package/qna/TMLPD_QNA.md +0 -751
- package/research/FINDING_001_safety.md +0 -28
- package/research/FINDING_002_error_diversity.md +0 -32
- package/research/FINDING_003_confidence_weighted_voting.md +0 -32
- package/research/FINDING_004_cross_model_semantic_detection.md +0 -37
- package/research/FINDING_005_knowledge_gap_orthogonality.md +0 -34
- package/research/HALLUCINATION_RESEARCH.md +0 -27
- package/research/ensemble-voting.md +0 -324
- package/research/loss-functions.md +0 -545
- package/research-log.md +0 -49
- package/scripts/banner.js +0 -29
- package/scripts/benchmark-local-routerarena.ts +0 -176
- package/scripts/benchmark.js +0 -145
- package/scripts/benchmark.sh +0 -61
- package/scripts/compare-providers.sh +0 -230
- package/scripts/content-planner.js +0 -25
- package/scripts/create-labeled-benchmark.ts +0 -105
- package/scripts/cross_post.py +0 -443
- package/scripts/local-router-benchmark.ts +0 -154
- package/scripts/post-all.sh +0 -41
- package/scripts/publish_fcc.py +0 -106
- package/scripts/push-to-gitee.sh +0 -25
- package/scripts/routerarena_ensemble.js +0 -144
- package/scripts/routing-benchmark-v2.js +0 -373
- package/scripts/routing-benchmark-v3.js +0 -118
- package/scripts/routing-benchmark.js +0 -462
- package/scripts/run-labeled-benchmark.mjs +0 -104
- package/scripts/run-mmlu-benchmark.js +0 -176
- package/scripts/run-provider-benchmark.js +0 -244
- package/scripts/update-npm-badges.js +0 -158
- package/skill/SKILL.md +0 -238
- package/src/__tests__/integration/tmpld_integration.test.py +0 -540
- package/src/skills/__tests__/skill_manager.test.ts +0 -328
- package/submissions/benchmarks/ALL_PLATFORMS_SUBMISSION.md +0 -94
- package/submissions/benchmarks/LLMROUTERBENCH_SUBMISSION.md +0 -121
- package/submissions/benchmarks/MMRBENCH_SUBMISSION.md +0 -94
- package/submissions/benchmarks/ROUTERARENA_UPDATE.md +0 -83
- package/submissions/benchmarks/ROUTERBENCH_SUBMISSION.md +0 -225
- package/test-council/1-structure-tests.test.js +0 -353
- package/test-council/1-structure-tests.test.ts +0 -353
- package/test-council/2-edge-case-tests.test.ts +0 -361
- package/test-council/3-performance-tests.test.ts +0 -669
- package/test-council/4-integration-tests.test.ts +0 -391
- package/test-council/5-agent-council-eval.test.ts +0 -413
- package/test-council/AGENT_COUNCIL_ARCHITECTURE.md +0 -349
- package/test-council/TEST_COUNCIL_REPORT.md +0 -201
- package/test-council/agents/edge-case-agent.ts +0 -363
- package/test-council/agents/performance-agent.ts +0 -426
- package/test-council/agents/structure-agent.ts +0 -227
- package/test-council/council.md +0 -183
- package/tests/__mocks__/tokenUtils.ts +0 -8
- package/tests/memory/episodicMemory.test.ts +0 -227
- package/tests/package-lock.json +0 -1628
- package/tests/package.json +0 -18
- package/tests/routing/ensembleVoting.test.ts +0 -236
- package/tests/routing/providerRetry.test.ts +0 -360
- package/tests/routing/queryTypePresets.test.ts +0 -208
- package/tests/security/guardrailEngine.test.ts +0 -700
- package/tests/tsconfig.json +0 -21
- package/tests/vitest.config.ts +0 -18
- package/tmlpd-pi-extension/README.md +0 -66
- package/tmlpd-pi-extension/dist/cache/prefixCache.d.ts +0 -114
- package/tmlpd-pi-extension/dist/cache/prefixCache.d.ts.map +0 -1
- package/tmlpd-pi-extension/dist/cache/prefixCache.js +0 -285
- package/tmlpd-pi-extension/dist/cache/prefixCache.js.map +0 -1
- package/tmlpd-pi-extension/dist/cache/responseCache.d.ts +0 -58
- package/tmlpd-pi-extension/dist/cache/responseCache.d.ts.map +0 -1
- package/tmlpd-pi-extension/dist/cache/responseCache.js +0 -153
- package/tmlpd-pi-extension/dist/cache/responseCache.js.map +0 -1
- package/tmlpd-pi-extension/dist/cli.js +0 -59
- package/tmlpd-pi-extension/dist/cost/costTracker.d.ts +0 -95
- package/tmlpd-pi-extension/dist/cost/costTracker.d.ts.map +0 -1
- package/tmlpd-pi-extension/dist/cost/costTracker.js +0 -240
- package/tmlpd-pi-extension/dist/cost/costTracker.js.map +0 -1
- package/tmlpd-pi-extension/dist/index.d.ts +0 -723
- package/tmlpd-pi-extension/dist/index.d.ts.map +0 -1
- package/tmlpd-pi-extension/dist/index.js +0 -239
- package/tmlpd-pi-extension/dist/index.js.map +0 -1
- package/tmlpd-pi-extension/dist/memory/episodicMemory.d.ts +0 -82
- package/tmlpd-pi-extension/dist/memory/episodicMemory.d.ts.map +0 -1
- package/tmlpd-pi-extension/dist/memory/episodicMemory.js +0 -145
- package/tmlpd-pi-extension/dist/memory/episodicMemory.js.map +0 -1
- package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.d.ts +0 -102
- package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.d.ts.map +0 -1
- package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.js +0 -207
- package/tmlpd-pi-extension/dist/orchestration/haloOrchestrator.js.map +0 -1
- package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.d.ts +0 -85
- package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.d.ts.map +0 -1
- package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.js +0 -210
- package/tmlpd-pi-extension/dist/orchestration/mctsWorkflow.js.map +0 -1
- package/tmlpd-pi-extension/dist/providers/localProvider.d.ts +0 -102
- package/tmlpd-pi-extension/dist/providers/localProvider.d.ts.map +0 -1
- package/tmlpd-pi-extension/dist/providers/localProvider.js +0 -338
- package/tmlpd-pi-extension/dist/providers/localProvider.js.map +0 -1
- package/tmlpd-pi-extension/dist/providers/registry.d.ts +0 -55
- package/tmlpd-pi-extension/dist/providers/registry.d.ts.map +0 -1
- package/tmlpd-pi-extension/dist/providers/registry.js +0 -138
- package/tmlpd-pi-extension/dist/providers/registry.js.map +0 -1
- package/tmlpd-pi-extension/dist/routing/advancedRouter.d.ts +0 -68
- package/tmlpd-pi-extension/dist/routing/advancedRouter.d.ts.map +0 -1
- package/tmlpd-pi-extension/dist/routing/advancedRouter.js +0 -332
- package/tmlpd-pi-extension/dist/routing/advancedRouter.js.map +0 -1
- package/tmlpd-pi-extension/dist/tools/tmlpdTools.d.ts +0 -101
- package/tmlpd-pi-extension/dist/tools/tmlpdTools.d.ts.map +0 -1
- package/tmlpd-pi-extension/dist/tools/tmlpdTools.js +0 -368
- package/tmlpd-pi-extension/dist/tools/tmlpdTools.js.map +0 -1
- package/tmlpd-pi-extension/dist/utils/batchProcessor.d.ts +0 -96
- package/tmlpd-pi-extension/dist/utils/batchProcessor.d.ts.map +0 -1
- package/tmlpd-pi-extension/dist/utils/batchProcessor.js +0 -170
- package/tmlpd-pi-extension/dist/utils/batchProcessor.js.map +0 -1
- package/tmlpd-pi-extension/dist/utils/compression.d.ts +0 -61
- package/tmlpd-pi-extension/dist/utils/compression.d.ts.map +0 -1
- package/tmlpd-pi-extension/dist/utils/compression.js +0 -281
- package/tmlpd-pi-extension/dist/utils/compression.js.map +0 -1
- package/tmlpd-pi-extension/dist/utils/reliability.d.ts +0 -74
- package/tmlpd-pi-extension/dist/utils/reliability.d.ts.map +0 -1
- package/tmlpd-pi-extension/dist/utils/reliability.js +0 -177
- package/tmlpd-pi-extension/dist/utils/reliability.js.map +0 -1
- package/tmlpd-pi-extension/dist/utils/speculativeDecoding.d.ts +0 -117
- package/tmlpd-pi-extension/dist/utils/speculativeDecoding.d.ts.map +0 -1
- package/tmlpd-pi-extension/dist/utils/speculativeDecoding.js +0 -246
- package/tmlpd-pi-extension/dist/utils/speculativeDecoding.js.map +0 -1
- package/tmlpd-pi-extension/dist/utils/tokenUtils.d.ts +0 -50
- package/tmlpd-pi-extension/dist/utils/tokenUtils.d.ts.map +0 -1
- package/tmlpd-pi-extension/dist/utils/tokenUtils.js +0 -124
- package/tmlpd-pi-extension/dist/utils/tokenUtils.js.map +0 -1
- package/tmlpd-pi-extension/examples/QUICKSTART.md +0 -183
- package/tmlpd-pi-extension/package-lock.json +0 -79
- package/tmlpd-pi-extension/package.json +0 -172
- package/tmlpd-pi-extension/python/examples.py +0 -53
- package/tmlpd-pi-extension/python/integrations.py +0 -330
- package/tmlpd-pi-extension/python/setup.py +0 -28
- package/tmlpd-pi-extension/python/tmlpd.py +0 -369
- package/tmlpd-pi-extension/qna/REDDIT_GAP_ANALYSIS.md +0 -299
- package/tmlpd-pi-extension/qna/TMLPD_QNA.md +0 -751
- package/tmlpd-pi-extension/skill/SKILL.md +0 -238
- package/tmlpd-pi-extension/src/cache/responseCache.ts +0 -147
- package/tmlpd-pi-extension/src/cost/costTracker.ts +0 -302
- package/tmlpd-pi-extension/src/index.ts +0 -232
- package/tmlpd-pi-extension/src/memory/episodicMemory.ts +0 -257
- package/tmlpd-pi-extension/src/orchestration/haloOrchestrator.ts +0 -266
- package/tmlpd-pi-extension/src/orchestration/mctsWorkflow.ts +0 -262
- package/tmlpd-pi-extension/src/providers/localProvider.ts +0 -406
- package/tmlpd-pi-extension/src/providers/registry.ts +0 -164
- package/tmlpd-pi-extension/src/routing/ensembleVoting.ts +0 -159
- package/tmlpd-pi-extension/src/routing/queryTypePresets.ts +0 -136
- package/tmlpd-pi-extension/src/tools/tmlpdTools.ts +0 -433
- package/tmlpd-pi-extension/src/utils/batchProcessor.ts +0 -232
- package/tmlpd-pi-extension/src/utils/compression.ts +0 -325
- package/tmlpd-pi-extension/src/utils/reliability.ts +0 -221
- package/tmlpd-pi-extension/src/utils/tokenUtils.ts +0 -145
- package/tmlpd-pi-extension/tsconfig.json +0 -18
- package/tsconfig.build.json +0 -29
- package/tsconfig.json +0 -18
- /package/{docs/llms-full.txt → llms-full.txt.bak} +0 -0
package/docs/demo.html
DELETED
|
@@ -1,416 +0,0 @@
|
|
|
1
|
-
<!DOCTYPE html>
|
|
2
|
-
<html lang="en">
|
|
3
|
-
<head>
|
|
4
|
-
<meta charset="UTF-8">
|
|
5
|
-
<meta name="viewport" content="width=device-width, initial-scale=1.0">
|
|
6
|
-
<title>A3M Router - One prompt in. The right model out.</title>
|
|
7
|
-
<style>
|
|
8
|
-
* { margin: 0; padding: 0; box-sizing: border-box; }
|
|
9
|
-
|
|
10
|
-
body {
|
|
11
|
-
background: #0d1117;
|
|
12
|
-
color: #e6edf3;
|
|
13
|
-
font-family: 'JetBrains Mono', 'Fira Code', 'SF Mono', Monaco, monospace;
|
|
14
|
-
min-height: 100vh;
|
|
15
|
-
display: flex;
|
|
16
|
-
flex-direction: column;
|
|
17
|
-
align-items: center;
|
|
18
|
-
justify-content: center;
|
|
19
|
-
padding: 20px;
|
|
20
|
-
}
|
|
21
|
-
|
|
22
|
-
.container { max-width: 900px; width: 100%; }
|
|
23
|
-
|
|
24
|
-
.header { text-align: center; margin-bottom: 32px; }
|
|
25
|
-
h1 { font-size: 2.2rem; color: #58a6ff; margin-bottom: 8px; }
|
|
26
|
-
.tagline { font-size: 1.2rem; color: #a371f7; margin-bottom: 16px; }
|
|
27
|
-
.subtitle { color: #8b949e; font-size: 0.95rem; }
|
|
28
|
-
|
|
29
|
-
.scene {
|
|
30
|
-
background: #161b22;
|
|
31
|
-
border: 1px solid #30363d;
|
|
32
|
-
border-radius: 12px;
|
|
33
|
-
padding: 24px;
|
|
34
|
-
margin: 16px 0;
|
|
35
|
-
display: none;
|
|
36
|
-
animation: fadeIn 0.5s ease;
|
|
37
|
-
}
|
|
38
|
-
.scene.active { display: block; }
|
|
39
|
-
|
|
40
|
-
@keyframes fadeIn {
|
|
41
|
-
from { opacity: 0; transform: translateY(20px); }
|
|
42
|
-
to { opacity: 1; transform: translateY(0); }
|
|
43
|
-
}
|
|
44
|
-
|
|
45
|
-
.line { margin: 6px 0; line-height: 1.6; }
|
|
46
|
-
.comment { color: #8b949e; }
|
|
47
|
-
.keyword { color: #ff7b72; }
|
|
48
|
-
.string { color: #a5d6ff; }
|
|
49
|
-
|
|
50
|
-
.box {
|
|
51
|
-
background: #21262d;
|
|
52
|
-
border-radius: 8px;
|
|
53
|
-
padding: 16px;
|
|
54
|
-
margin: 12px 0;
|
|
55
|
-
}
|
|
56
|
-
.box.success { border-left: 3px solid #3fb950; }
|
|
57
|
-
.box.info { border-left: 3px solid #58a6ff; }
|
|
58
|
-
.box.warning { border-left: 3px solid #d29922; }
|
|
59
|
-
.box.error { border-left: 3px solid #f85149; }
|
|
60
|
-
|
|
61
|
-
.success-text { color: #3fb950; }
|
|
62
|
-
.info-text { color: #58a6ff; }
|
|
63
|
-
.warning-text { color: #d29922; }
|
|
64
|
-
.muted { color: #8b949e; }
|
|
65
|
-
.money { color: #3fb950; font-size: 1.4rem; font-weight: bold; }
|
|
66
|
-
|
|
67
|
-
.providers {
|
|
68
|
-
display: flex;
|
|
69
|
-
flex-wrap: wrap;
|
|
70
|
-
gap: 8px;
|
|
71
|
-
margin: 12px 0;
|
|
72
|
-
}
|
|
73
|
-
.provider {
|
|
74
|
-
background: #30363d;
|
|
75
|
-
padding: 4px 10px;
|
|
76
|
-
border-radius: 4px;
|
|
77
|
-
font-size: 0.8rem;
|
|
78
|
-
color: #8b949e;
|
|
79
|
-
}
|
|
80
|
-
.provider.highlight { background: #238636; color: white; }
|
|
81
|
-
|
|
82
|
-
.comparison {
|
|
83
|
-
display: flex;
|
|
84
|
-
gap: 20px;
|
|
85
|
-
margin: 16px 0;
|
|
86
|
-
}
|
|
87
|
-
.col {
|
|
88
|
-
flex: 1;
|
|
89
|
-
padding: 16px;
|
|
90
|
-
border-radius: 8px;
|
|
91
|
-
text-align: center;
|
|
92
|
-
}
|
|
93
|
-
.col.bad { background: rgba(248,81,73,0.1); border: 1px solid rgba(248,81,73,0.3); }
|
|
94
|
-
.col.good { background: rgba(63,185,80,0.1); border: 1px solid rgba(63,185,80,0.3); }
|
|
95
|
-
.col .label { font-size: 0.85rem; color: #8b949e; margin-bottom: 8px; }
|
|
96
|
-
.col .amount { font-size: 2rem; font-weight: bold; }
|
|
97
|
-
.col.bad .amount { color: #f85149; }
|
|
98
|
-
.col.good .amount { color: #3fb950; }
|
|
99
|
-
.col .sub { font-size: 0.8rem; color: #8b949e; margin-top: 4px; }
|
|
100
|
-
|
|
101
|
-
.ascii {
|
|
102
|
-
background: #0d1117;
|
|
103
|
-
padding: 12px;
|
|
104
|
-
border-radius: 6px;
|
|
105
|
-
font-size: 0.8rem;
|
|
106
|
-
white-space: pre;
|
|
107
|
-
overflow-x: auto;
|
|
108
|
-
}
|
|
109
|
-
|
|
110
|
-
.install-box {
|
|
111
|
-
background: #161b22;
|
|
112
|
-
border: 2px solid #58a6ff;
|
|
113
|
-
border-radius: 12px;
|
|
114
|
-
padding: 24px;
|
|
115
|
-
text-align: center;
|
|
116
|
-
}
|
|
117
|
-
.install-cmd {
|
|
118
|
-
background: #0d1117;
|
|
119
|
-
padding: 12px 24px;
|
|
120
|
-
border-radius: 6px;
|
|
121
|
-
font-size: 1.1rem;
|
|
122
|
-
color: #3fb950;
|
|
123
|
-
margin: 12px 0;
|
|
124
|
-
font-family: monospace;
|
|
125
|
-
}
|
|
126
|
-
|
|
127
|
-
.features {
|
|
128
|
-
display: grid;
|
|
129
|
-
grid-template-columns: repeat(2, 1fr);
|
|
130
|
-
gap: 12px;
|
|
131
|
-
margin: 16px 0;
|
|
132
|
-
}
|
|
133
|
-
.feature {
|
|
134
|
-
background: #21262d;
|
|
135
|
-
padding: 12px;
|
|
136
|
-
border-radius: 6px;
|
|
137
|
-
font-size: 0.85rem;
|
|
138
|
-
}
|
|
139
|
-
.feature-name { color: #58a6ff; font-weight: bold; margin-bottom: 4px; }
|
|
140
|
-
|
|
141
|
-
.stat-row {
|
|
142
|
-
display: flex;
|
|
143
|
-
justify-content: center;
|
|
144
|
-
gap: 32px;
|
|
145
|
-
margin: 16px 0;
|
|
146
|
-
}
|
|
147
|
-
.stat { text-align: center; }
|
|
148
|
-
.stat-value { font-size: 1.5rem; font-weight: bold; color: #58a6ff; }
|
|
149
|
-
.stat-label { font-size: 0.8rem; color: #8b949e; }
|
|
150
|
-
|
|
151
|
-
.progress { display: flex; gap: 8px; justify-content: center; margin: 20px 0; }
|
|
152
|
-
.dot { width: 10px; height: 10px; background: #30363d; border-radius: 50%; }
|
|
153
|
-
.dot.done { background: #58a6ff; }
|
|
154
|
-
|
|
155
|
-
.footer {
|
|
156
|
-
margin-top: 24px;
|
|
157
|
-
color: #8b949e;
|
|
158
|
-
text-align: center;
|
|
159
|
-
font-size: 0.85rem;
|
|
160
|
-
}
|
|
161
|
-
</style>
|
|
162
|
-
</head>
|
|
163
|
-
<body>
|
|
164
|
-
<div class="container">
|
|
165
|
-
<!-- SCENE 1: One line change -->
|
|
166
|
-
<div class="scene active" id="s1">
|
|
167
|
-
<div class="header">
|
|
168
|
-
<h1>🔀 A3M Router</h1>
|
|
169
|
-
<p class="tagline">One prompt in. The right model out.</p>
|
|
170
|
-
<p class="subtitle">47+ providers. Budget enforcement. Semantic cache. Intelligent failover.</p>
|
|
171
|
-
</div>
|
|
172
|
-
|
|
173
|
-
<div class="box error">
|
|
174
|
-
<div class="line comment"># Your app today — every request goes to GPT-4o</div>
|
|
175
|
-
<div class="line keyword">const</span> response = <span class="keyword">await</span> openai.chat.completions.create({</div>
|
|
176
|
-
<div class="line"> model: <span class="string">"gpt-4o"</span>,</div>
|
|
177
|
-
<div class="line"> messages: [{ role: <span class="string">"user"</span>, content: <span class="string">"Explain quantum entanglement"</span> }]</div>
|
|
178
|
-
<div class="line">});</div>
|
|
179
|
-
</div>
|
|
180
|
-
|
|
181
|
-
<div class="box error">
|
|
182
|
-
<div class="line" style="color: #f85149;">❌ $0.003 per request — no fallback if OpenAI goes down</div>
|
|
183
|
-
</div>
|
|
184
|
-
|
|
185
|
-
<div class="box info">
|
|
186
|
-
<div class="line comment"># One line change — A3M routes to the cheapest capable model</div>
|
|
187
|
-
<div class="line keyword">const</span> response = <span class="keyword">await</span> fetch(<span class="string">"http://localhost:8787/v1/chat/completions"</span>, {</div>
|
|
188
|
-
<div class="line"> body: JSON.stringify({</div>
|
|
189
|
-
<div class="line"> model: <span class="string">"auto"</span>, <span class="comment">// ← A3M picks the best model</span></div>
|
|
190
|
-
<div class="line"> messages: [{ role: <span class="string">"user"</span>, content: <span class="string">"Explain quantum entanglement"</span> }]</div>
|
|
191
|
-
<div class="line"> })</div>
|
|
192
|
-
<div class="line">});</div>
|
|
193
|
-
</div>
|
|
194
|
-
|
|
195
|
-
<div class="box success">
|
|
196
|
-
<div class="line success-text">✅ Routed to: Groq (FREE)</div>
|
|
197
|
-
<div class="line muted"> $0.00 per request — automatic fallback chain if Groq fails</div>
|
|
198
|
-
</div>
|
|
199
|
-
</div>
|
|
200
|
-
|
|
201
|
-
<!-- SCENE 2: Providers -->
|
|
202
|
-
<div class="scene" id="s2">
|
|
203
|
-
<h2 style="color: #58a6ff; margin-bottom: 16px;">🌏 47+ Providers</h2>
|
|
204
|
-
|
|
205
|
-
<div class="box info">
|
|
206
|
-
<div class="line info-text">Chinese Providers (special handling)</div>
|
|
207
|
-
<div class="providers">
|
|
208
|
-
<span class="provider highlight">Groq (FREE)</span>
|
|
209
|
-
<span class="provider">DeepSeek</span>
|
|
210
|
-
<span class="provider">Kimi</span>
|
|
211
|
-
<span class="provider">Qwen</span>
|
|
212
|
-
<span class="provider">Zhipu</span>
|
|
213
|
-
<span class="provider">Yi</span>
|
|
214
|
-
<span class="provider">Stepfun</span>
|
|
215
|
-
<span class="provider">Moonshot</span>
|
|
216
|
-
<span class="provider">01.AI</span>
|
|
217
|
-
<span class="provider">Tencent</span>
|
|
218
|
-
<span class="provider">Baidu</span>
|
|
219
|
-
<span class="provider">Alibaba</span>
|
|
220
|
-
</div>
|
|
221
|
-
</div>
|
|
222
|
-
|
|
223
|
-
<div class="box info">
|
|
224
|
-
<div class="line info-text">Global Providers</div>
|
|
225
|
-
<div class="providers">
|
|
226
|
-
<span class="provider">OpenAI</span>
|
|
227
|
-
<span class="provider">Anthropic</span>
|
|
228
|
-
<span class="provider">Google</span>
|
|
229
|
-
<span class="provider">Mistral</span>
|
|
230
|
-
<span class="provider">Cohere</span>
|
|
231
|
-
<span class="provider">Groq</span>
|
|
232
|
-
<span class="provider">Perplexity</span>
|
|
233
|
-
<span class="provider">AWS Bedrock</span>
|
|
234
|
-
<span class="provider">Azure</span>
|
|
235
|
-
<span class="provider">Replicate</span>
|
|
236
|
-
<span class="provider">HuggingFace</span>
|
|
237
|
-
</div>
|
|
238
|
-
</div>
|
|
239
|
-
|
|
240
|
-
<div class="box success">
|
|
241
|
-
<div class="line success-text">✅ A3M routes to the cheapest healthy provider</div>
|
|
242
|
-
<div class="line muted"> Health checks + circuit breakers + intelligent fallback</div>
|
|
243
|
-
</div>
|
|
244
|
-
</div>
|
|
245
|
-
|
|
246
|
-
<!-- SCENE 3: Cost Savings -->
|
|
247
|
-
<div class="scene" id="s3">
|
|
248
|
-
<h2 style="color: #3fb950; margin-bottom: 16px;">💰 Save 62% on API Costs</h2>
|
|
249
|
-
|
|
250
|
-
<div class="comparison">
|
|
251
|
-
<div class="col bad">
|
|
252
|
-
<div class="label">WITHOUT A3M</div>
|
|
253
|
-
<div class="amount">$0.003</div>
|
|
254
|
-
<div class="sub">per request (GPT-4o)</div>
|
|
255
|
-
<div class="sub" style="margin-top: 8px;">$3.41 per 1K requests</div>
|
|
256
|
-
</div>
|
|
257
|
-
<div class="col good">
|
|
258
|
-
<div class="label">WITH A3M</div>
|
|
259
|
-
<div class="amount">$0.00</div>
|
|
260
|
-
<div class="sub">47% → Groq (free)</div>
|
|
261
|
-
<div class="sub">30% → DeepSeek ($0.14/M)</div>
|
|
262
|
-
<div class="sub">23% → GPT-4o-mini ($0.15/M)</div>
|
|
263
|
-
<div class="sub" style="margin-top: 8px;">$1.24 per 1K requests</div>
|
|
264
|
-
</div>
|
|
265
|
-
</div>
|
|
266
|
-
|
|
267
|
-
<div class="stat-row">
|
|
268
|
-
<div class="stat">
|
|
269
|
-
<div class="stat-value">62%</div>
|
|
270
|
-
<div class="stat-label">Cost Savings</div>
|
|
271
|
-
</div>
|
|
272
|
-
<div class="stat">
|
|
273
|
-
<div class="stat-value">70.32</div>
|
|
274
|
-
<div class="stat-label">Routing Accuracy</div>
|
|
275
|
-
</div>
|
|
276
|
-
<div class="stat">
|
|
277
|
-
<div class="stat-value"><1ms</div>
|
|
278
|
-
<div class="stat-label">Routing Latency</div>
|
|
279
|
-
</div>
|
|
280
|
-
</div>
|
|
281
|
-
|
|
282
|
-
<div class="box success">
|
|
283
|
-
<div class="line success-text">💰 $2,175 saved per 1M requests</div>
|
|
284
|
-
<div class="line muted"> At 1000 queries/day: $547 saved yearly</div>
|
|
285
|
-
</div>
|
|
286
|
-
</div>
|
|
287
|
-
|
|
288
|
-
<!-- SCENE 4: Features -->
|
|
289
|
-
<div class="scene" id="s4">
|
|
290
|
-
<h2 style="color: #58a6ff; margin-bottom: 16px;">✨ Features</h2>
|
|
291
|
-
|
|
292
|
-
<div class="features">
|
|
293
|
-
<div class="feature">
|
|
294
|
-
<div class="feature-name">🧠 Adaptive Memory</div>
|
|
295
|
-
<div class="muted">Learns from your usage. Updates model quality scores with every request. No retraining.</div>
|
|
296
|
-
</div>
|
|
297
|
-
<div class="feature">
|
|
298
|
-
<div class="feature-name">💾 Semantic Cache</div>
|
|
299
|
-
<div class="muted">Embedding-based lookup. 30%+ hit rate on repeated queries.</div>
|
|
300
|
-
</div>
|
|
301
|
-
<div class="feature">
|
|
302
|
-
<div class="feature-name">🛡️ Budget Enforcement</div>
|
|
303
|
-
<div class="muted">Per-user/team caps. Alerts at 50%/80%/100%. No surprises.</div>
|
|
304
|
-
</div>
|
|
305
|
-
<div class="feature">
|
|
306
|
-
<div class="feature-name">🔄 Intelligent Failover</div>
|
|
307
|
-
<div class="muted">Circuit breaker (3 fails → 60s cooldown). Automatic fallback chains.</div>
|
|
308
|
-
</div>
|
|
309
|
-
<div class="feature">
|
|
310
|
-
<div class="feature-name">⚡ Per-Provider Retry</div>
|
|
311
|
-
<div class="muted">Custom timeout per provider. Exponential backoff. 429 handling.</div>
|
|
312
|
-
</div>
|
|
313
|
-
<div class="feature">
|
|
314
|
-
<div class="feature-name">🎯 12-Signal Routing</div>
|
|
315
|
-
<div class="muted">Domain, task, structure, action verb, multi-step. Zero ML.</div>
|
|
316
|
-
</div>
|
|
317
|
-
</div>
|
|
318
|
-
|
|
319
|
-
<div class="box info">
|
|
320
|
-
<div class="line info-text">Zero ML. No GPU required. Starts in <100ms.</div>
|
|
321
|
-
</div>
|
|
322
|
-
</div>
|
|
323
|
-
|
|
324
|
-
<!-- SCENE 5: Failover -->
|
|
325
|
-
<div class="scene" id="s5">
|
|
326
|
-
<h2 style="color: #d29922; margin-bottom: 16px;">🔄 Intelligent Failover</h2>
|
|
327
|
-
|
|
328
|
-
<div class="ascii">
|
|
329
|
-
[Groq] — Attempting connection...
|
|
330
|
-
[Groq] — ✗ FAILED — 503 Service Unavailable
|
|
331
|
-
[Circuit Breaker] — Tripped after 3 failures
|
|
332
|
-
[DeepSeek] — HEALTHY — Switching...
|
|
333
|
-
[DeepSeek] — ✅ Response delivered ✓
|
|
334
|
-
</div>
|
|
335
|
-
|
|
336
|
-
<div class="box success">
|
|
337
|
-
<div class="line success-text">✅ Your app never knew there was a problem</div>
|
|
338
|
-
<div class="line muted"> 99.9% uptime — automatic provider health scoring + fallback</div>
|
|
339
|
-
</div>
|
|
340
|
-
|
|
341
|
-
<div class="box warning">
|
|
342
|
-
<div class="line warning-text">📊 Provider Health Monitoring</div>
|
|
343
|
-
<div class="line muted"> Latency + error rate → health score → automatic routing</div>
|
|
344
|
-
</div>
|
|
345
|
-
</div>
|
|
346
|
-
|
|
347
|
-
<!-- SCENE 6: One Command -->
|
|
348
|
-
<div class="scene" id="s6">
|
|
349
|
-
<div class="install-box">
|
|
350
|
-
<div class="tagline" style="font-size: 1.3rem;">Get started in 10 seconds</div>
|
|
351
|
-
<div class="install-cmd">npm install -g adaptive-memory-multi-model-router</div>
|
|
352
|
-
<div class="muted"># Auto-detects your API keys — zero config</div>
|
|
353
|
-
<div class="install-cmd" style="color: #58a6ff;">npx a3m-router serve</div>
|
|
354
|
-
<div class="muted"># Now your app: model: "gpt-4o" → model: "auto"</div>
|
|
355
|
-
</div>
|
|
356
|
-
|
|
357
|
-
<div class="stat-row" style="margin-top: 24px;">
|
|
358
|
-
<div class="stat">
|
|
359
|
-
<div class="stat-value">1 line</div>
|
|
360
|
-
<div class="stat-label">Code change</div>
|
|
361
|
-
</div>
|
|
362
|
-
<div class="stat">
|
|
363
|
-
<div class="stat-value">0</div>
|
|
364
|
-
<div class="stat-label">API keys to manage</div>
|
|
365
|
-
</div>
|
|
366
|
-
<div class="stat">
|
|
367
|
-
<div class="stat-value"><100ms</div>
|
|
368
|
-
<div class="stat-label">Startup time</div>
|
|
369
|
-
</div>
|
|
370
|
-
</div>
|
|
371
|
-
|
|
372
|
-
<div style="text-align: center; margin-top: 24px; color: #a371f7; font-size: 1.2rem;">
|
|
373
|
-
✨ One prompt in. The right model out. ✨
|
|
374
|
-
</div>
|
|
375
|
-
|
|
376
|
-
<div class="footer" style="margin-top: 24px;">
|
|
377
|
-
<div>🔗 github.com/Das-rebel/a3m-router</div>
|
|
378
|
-
<div>📦 npmjs.com/package/adaptive-memory-multi-model-router</div>
|
|
379
|
-
</div>
|
|
380
|
-
</div>
|
|
381
|
-
|
|
382
|
-
<div class="progress">
|
|
383
|
-
<div class="dot done" id="d1"></div>
|
|
384
|
-
<div class="dot" id="d2"></div>
|
|
385
|
-
<div class="dot" id="d3"></div>
|
|
386
|
-
<div class="dot" id="d4"></div>
|
|
387
|
-
<div class="dot" id="d5"></div>
|
|
388
|
-
<div class="dot" id="d6"></div>
|
|
389
|
-
</div>
|
|
390
|
-
</div>
|
|
391
|
-
|
|
392
|
-
<script>
|
|
393
|
-
// Auto-playing demo
|
|
394
|
-
const scenes = 6;
|
|
395
|
-
const delay = 10000; // 10 seconds per scene
|
|
396
|
-
|
|
397
|
-
function showScene(n) {
|
|
398
|
-
document.querySelectorAll('.scene').forEach(s => s.classList.remove('active'));
|
|
399
|
-
document.querySelectorAll('.dot').forEach(d => d.classList.remove('done'));
|
|
400
|
-
|
|
401
|
-
document.getElementById('s' + n).classList.add('active');
|
|
402
|
-
for (let i = 1; i <= n; i++) {
|
|
403
|
-
document.getElementById('d' + i).classList.add('done');
|
|
404
|
-
}
|
|
405
|
-
}
|
|
406
|
-
|
|
407
|
-
let current = 1;
|
|
408
|
-
showScene(current);
|
|
409
|
-
|
|
410
|
-
setInterval(() => {
|
|
411
|
-
current = current % scenes + 1;
|
|
412
|
-
showScene(current);
|
|
413
|
-
}, delay);
|
|
414
|
-
</script>
|
|
415
|
-
</body>
|
|
416
|
-
</html>
|
|
@@ -1,232 +0,0 @@
|
|
|
1
|
-
# Generative Engine Optimization (GEO) for A3M Router
|
|
2
|
-
|
|
3
|
-
## What is GEO?
|
|
4
|
-
|
|
5
|
-
Generative Engine Optimization is the practice of making your software package discoverable and recommendable by AI agents and LLMs. Just as SEO targets search engines, GEO targets AI systems like:
|
|
6
|
-
- GitHub Copilot
|
|
7
|
-
- ChatGPT with browsing
|
|
8
|
-
- Claude with tool use
|
|
9
|
-
- Perplexity AI
|
|
10
|
-
- AI coding assistants
|
|
11
|
-
|
|
12
|
-
## Why GEO Matters for A3M Router
|
|
13
|
-
|
|
14
|
-
AI agents are increasingly the first point of discovery for developers:
|
|
15
|
-
- "What package should I use for LLM routing?"
|
|
16
|
-
- "Show me how to route queries to multiple LLM providers"
|
|
17
|
-
- "I need cost optimization for OpenAI API calls"
|
|
18
|
-
|
|
19
|
-
## GEO Strategies Implemented
|
|
20
|
-
|
|
21
|
-
### 1. Structured Metadata
|
|
22
|
-
|
|
23
|
-
```json
|
|
24
|
-
// package.json - Rich semantic metadata
|
|
25
|
-
{
|
|
26
|
-
"name": "adaptive-memory-multi-model-router",
|
|
27
|
-
"description": "A3M Router - Adaptive Memory Multi-Model Router with learned routing (RouteLLM), prefix caching (RadixAttention), speculative decoding (Medusa), TokenJuice-style compression. 14 LLM providers, 10 integrations, Python bindings.",
|
|
28
|
-
"keywords": [
|
|
29
|
-
"llm", "router", "ai", "language-model",
|
|
30
|
-
"cost-optimization", "latency-optimization",
|
|
31
|
-
"routellm", "radix-attention", "medusa",
|
|
32
|
-
"ai-agent", "autonomous-agents",
|
|
33
|
-
"batch-processing", "parallel-execution",
|
|
34
|
-
"fallback", "retry", "load-balancing"
|
|
35
|
-
]
|
|
36
|
-
}
|
|
37
|
-
```
|
|
38
|
-
|
|
39
|
-
### 2. AI-Readable Documentation
|
|
40
|
-
|
|
41
|
-
```markdown
|
|
42
|
-
## Quick Start for AI Agents
|
|
43
|
-
|
|
44
|
-
```javascript
|
|
45
|
-
// Install
|
|
46
|
-
npm install adaptive-memory-multi-model-router
|
|
47
|
-
|
|
48
|
-
// Basic usage
|
|
49
|
-
const { createA3MRouter } = require('adaptive-memory-multi-model-router');
|
|
50
|
-
const router = createA3MRouter();
|
|
51
|
-
|
|
52
|
-
// Route query to best LLM
|
|
53
|
-
const result = await router.route("Write Python code");
|
|
54
|
-
console.log(result.primary_model); // "groq/llama-3.3-70b"
|
|
55
|
-
```
|
|
56
|
-
|
|
57
|
-
### 3. Intent-Based Examples
|
|
58
|
-
|
|
59
|
-
AI agents match user intent to code patterns:
|
|
60
|
-
|
|
61
|
-
| User Intent | GEO-Optimized Example |
|
|
62
|
-
|-------------|----------------------|
|
|
63
|
-
| "Route LLM queries" | `router.route(query)` |
|
|
64
|
-
| "Compare LLM costs" | `estimateCost(tokens, model)` |
|
|
65
|
-
| "Batch process prompts" | `router.routeBatch(queries)` |
|
|
66
|
-
| "Cache LLM responses" | `router.cache.get(key)` |
|
|
67
|
-
| "Track API spending" | `router.costTracker.getSummary()` |
|
|
68
|
-
|
|
69
|
-
### 4. LLM-Friendly Code Patterns
|
|
70
|
-
|
|
71
|
-
```javascript
|
|
72
|
-
// Pattern: Cost-aware routing
|
|
73
|
-
const { routeQuery } = require('adaptive-memory-multi-model-router');
|
|
74
|
-
|
|
75
|
-
// AI agents extract: "route query with cost optimization"
|
|
76
|
-
const result = routeQuery("Explain quantum physics", {
|
|
77
|
-
budget_multiplier: 0.5 // Prefer cheaper models
|
|
78
|
-
});
|
|
79
|
-
|
|
80
|
-
// Pattern: Multi-provider fallback
|
|
81
|
-
const { createA3MRouter } = require('adaptive-memory-multi-model-router');
|
|
82
|
-
|
|
83
|
-
// AI agents extract: "fallback to multiple LLM providers"
|
|
84
|
-
const router = createA3MRouter({
|
|
85
|
-
providers: ['groq', 'cerebras', 'mistral'] // Auto-fallback chain
|
|
86
|
-
});
|
|
87
|
-
```
|
|
88
|
-
|
|
89
|
-
### 5. Semantic README Structure
|
|
90
|
-
|
|
91
|
-
```markdown
|
|
92
|
-
# A3M Router
|
|
93
|
-
|
|
94
|
-
## What Problem This Solves
|
|
95
|
-
Routing LLM queries to the optimal provider based on cost, quality, and latency.
|
|
96
|
-
|
|
97
|
-
## When to Use This
|
|
98
|
-
- You use multiple LLM providers (OpenAI, Anthropic, Groq, etc.)
|
|
99
|
-
- You want automatic cost optimization
|
|
100
|
-
- You need fallback when providers fail
|
|
101
|
-
- You process prompts in batches
|
|
102
|
-
|
|
103
|
-
## Installation
|
|
104
|
-
npm install adaptive-memory-multi-model-router
|
|
105
|
-
|
|
106
|
-
## Common Use Cases
|
|
107
|
-
|
|
108
|
-
### 1. Route to cheapest provider for simple queries
|
|
109
|
-
### 2. Route to best-quality provider for complex tasks
|
|
110
|
-
### 3. Batch process with automatic provider selection
|
|
111
|
-
### 4. Track costs across all providers
|
|
112
|
-
|
|
113
|
-
## API Reference
|
|
114
|
-
[Structured for LLM parsing]
|
|
115
|
-
```
|
|
116
|
-
|
|
117
|
-
## GEO Content for AI Discovery
|
|
118
|
-
|
|
119
|
-
### AI-Optimized Titles
|
|
120
|
-
|
|
121
|
-
| Bad | Good (GEO) |
|
|
122
|
-
|-----|-----------|
|
|
123
|
-
| "A3M Router" | "LLM Router with Cost Optimization" |
|
|
124
|
-
| "Multi-model package" | "Adaptive LLM Routing for Multiple Providers" |
|
|
125
|
-
| "NPM library" | "Production-Ready LLM Load Balancer" |
|
|
126
|
-
|
|
127
|
-
### LLM-Targeted Descriptions
|
|
128
|
-
|
|
129
|
-
```markdown
|
|
130
|
-
## For AI Assistants
|
|
131
|
-
|
|
132
|
-
This package provides:
|
|
133
|
-
- **Intent**: Route LLM queries to optimal providers
|
|
134
|
-
- **Problem**: Cost optimization across multiple LLM APIs
|
|
135
|
-
- **Solution**: Learned routing with automatic provider selection
|
|
136
|
-
- **Benefit**: 50-80% cost reduction with quality preservation
|
|
137
|
-
|
|
138
|
-
## Keywords for AI Indexing
|
|
139
|
-
LLM routing, cost optimization, multi-provider, OpenAI alternative,
|
|
140
|
-
Claude routing, Groq integration, batch processing, API load balancing,
|
|
141
|
-
LLM fallback, provider switching, token optimization, response caching
|
|
142
|
-
```
|
|
143
|
-
|
|
144
|
-
## Platform-Specific GEO
|
|
145
|
-
|
|
146
|
-
### GitHub (Copilot Training Data)
|
|
147
|
-
|
|
148
|
-
```markdown
|
|
149
|
-
## Copilot-Optimized Examples
|
|
150
|
-
|
|
151
|
-
### Pattern: Route by query type
|
|
152
|
-
```javascript
|
|
153
|
-
// Copilot suggests this when user types "route llm"
|
|
154
|
-
const { routeQuery } = require('adaptive-memory-multi-model-router');
|
|
155
|
-
const result = routeQuery(userQuery);
|
|
156
|
-
```
|
|
157
|
-
|
|
158
|
-
### Pattern: Cost tracking
|
|
159
|
-
```javascript
|
|
160
|
-
// Copilot suggests this when user types "track llm cost"
|
|
161
|
-
const { CostTracker } = require('adaptive-memory-multi-model-router');
|
|
162
|
-
const tracker = new CostTracker();
|
|
163
|
-
```
|
|
164
|
-
```
|
|
165
|
-
|
|
166
|
-
### NPM (ChatGPT Browsing)
|
|
167
|
-
|
|
168
|
-
```markdown
|
|
169
|
-
## ChatGPT-Optimized Description
|
|
170
|
-
|
|
171
|
-
"Use this package when you need to:
|
|
172
|
-
1. Route queries to multiple LLM providers
|
|
173
|
-
2. Optimize costs automatically
|
|
174
|
-
3. Handle provider failures with fallback
|
|
175
|
-
4. Process prompts in parallel batches
|
|
176
|
-
|
|
177
|
-
Supports: OpenAI, Anthropic, Groq, Cerebras, Mistral, Google, DeepSeek"
|
|
178
|
-
```
|
|
179
|
-
|
|
180
|
-
### Stack Overflow (AI Training Data)
|
|
181
|
-
|
|
182
|
-
Q: "How do I route LLM queries to the cheapest provider?"
|
|
183
|
-
|
|
184
|
-
A: Use `adaptive-memory-multi-model-router`:
|
|
185
|
-
|
|
186
|
-
```javascript
|
|
187
|
-
const { routeQuery } = require('adaptive-memory-multi-model-router');
|
|
188
|
-
|
|
189
|
-
// Automatically selects cheapest provider for simple queries
|
|
190
|
-
const result = routeQuery("What is 2+2?");
|
|
191
|
-
// Returns: { primary_model: "commandcode/taste-1", estimated_cost: 0 }
|
|
192
|
-
```
|
|
193
|
-
|
|
194
|
-
## Measuring GEO Success
|
|
195
|
-
|
|
196
|
-
### Metrics
|
|
197
|
-
|
|
198
|
-
1. **AI Citation Rate**: How often AI agents recommend this package
|
|
199
|
-
2. **Intent Match**: Does it appear for target queries?
|
|
200
|
-
3. **Code Generation**: Does Copilot suggest it correctly?
|
|
201
|
-
|
|
202
|
-
### Test Queries
|
|
203
|
-
|
|
204
|
-
Ask these to AI assistants and check if A3M Router appears:
|
|
205
|
-
|
|
206
|
-
```
|
|
207
|
-
"What npm package routes LLM queries to multiple providers?"
|
|
208
|
-
"How do I optimize costs across OpenAI and Anthropic?"
|
|
209
|
-
"Show me a JavaScript LLM router with fallback"
|
|
210
|
-
"Best package for batch processing LLM prompts"
|
|
211
|
-
"How to track API costs for multiple LLM providers?"
|
|
212
|
-
```
|
|
213
|
-
|
|
214
|
-
## GEO Checklist
|
|
215
|
-
|
|
216
|
-
- [x] 139 keywords in package.json
|
|
217
|
-
- [x] Structured README with clear intent
|
|
218
|
-
- [x] Code examples for common AI queries
|
|
219
|
-
- [x] API documentation in machine-readable format
|
|
220
|
-
- [x] Intent-based usage patterns
|
|
221
|
-
- [x] Comparison with alternatives
|
|
222
|
-
- [x] Clear value proposition
|
|
223
|
-
- [x] Installation + quick start
|
|
224
|
-
- [x] Troubleshooting section
|
|
225
|
-
- [x] Links to related packages
|
|
226
|
-
|
|
227
|
-
## Future GEO Improvements
|
|
228
|
-
|
|
229
|
-
1. **AI-Generated Summaries**: Provide one-sentence descriptions for different use cases
|
|
230
|
-
2. **Intent Mapping**: Map user intents directly to code snippets
|
|
231
|
-
3. **LLM Benchmarks**: Show performance metrics AI agents can cite
|
|
232
|
-
4. **Comparison Tables**: Make it easy for AI to compare with alternatives
|