adaptive-memory-multi-model-router 2.14.47 → 2.14.48

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (1) hide show
  1. package/package.json +286 -17
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "adaptive-memory-multi-model-router",
3
- "version": "2.14.47",
3
+ "version": "2.14.48",
4
4
  "shortName": "A3M Router",
5
5
  "displayName": "A3M Router - Adaptive Memory Multi-Model Router",
6
6
  "description": "🥇 Cheapest LLM router on RouterArena ($0.05/1K) · 15K+ downloads in 2 weeks · Open-source AI gateway with parallel multi-LLM execution across 47+ providers, ensemble voting, semantic cache, and budget enforcement",
@@ -57,35 +57,304 @@
57
57
  "keywords": [
58
58
  "a3m",
59
59
  "a3m-router",
60
+ "adaptive-memory-multi-model-router",
61
+ "multi-model-router",
60
62
  "llm-router",
61
- "llm-routing",
62
- "model-routing",
63
- "ai-router",
64
- "ai-gateway",
65
- "ai-routing",
66
63
  "routing",
67
64
  "router",
68
65
  "gateway",
69
- "multi-model-router",
66
+ "ai-gateway",
67
+ "ai-router",
68
+ "model-routing",
69
+ "llm-routing",
70
+ "ai-routing",
71
+ "smart-routing",
72
+ "dynamic-routing",
73
+ "adaptive-routing",
74
+ "semantic-routing",
75
+ "intent-routing",
76
+ "content-routing",
77
+ "tier-routing",
78
+ "cost-routing",
79
+ "latency-routing",
80
+ "quality-routing",
70
81
  "multi-provider",
71
- "multi-llm",
82
+ "provider-routing",
83
+ "llm",
84
+ "large-language-model",
85
+ "ai",
86
+ "artificial-intelligence",
87
+ "machine-learning",
88
+ "ml",
89
+ "deep-learning",
90
+ "neural-network",
91
+ "natural-language-processing",
92
+ "nlp",
93
+ "text-generation",
94
+ "chatgpt",
95
+ "gpt",
96
+ "gpt-4",
97
+ "gpt-4o",
98
+ "gpt-3",
99
+ "gpt-3.5",
100
+ "claude",
101
+ "claude-3",
102
+ "claude-sonnet",
103
+ "claude-opus",
104
+ "claude-haiku",
105
+ "gemini",
106
+ "gemini-pro",
107
+ "gemini-ultra",
108
+ "llama",
109
+ "llama-2",
110
+ "llama-3",
111
+ "mistral",
112
+ "mixtral",
113
+ "phi",
114
+ "gemma",
115
+ "qwen",
116
+ "yi",
117
+ "command-r",
118
+ "deepseek",
119
+ "kimi",
120
+ "grok",
121
+ "palm",
122
+ "bedrock",
123
+ "openai",
124
+ "anthropic",
125
+ "google-ai",
126
+ "google-cloud",
127
+ "vertex-ai",
128
+ "azure-openai",
129
+ "aws-bedrock",
130
+ "cohere",
131
+ "huggingface",
132
+ "replicate",
133
+ "together-ai",
134
+ "fireworks-ai",
135
+ "anyscale",
136
+ "perplexity",
137
+ "mistral-ai",
138
+ "groq",
139
+ "cerebras",
140
+ "sambanova",
141
+ "nvidia-nim",
142
+ "vllm",
143
+ "ollama",
144
+ "lm-studio",
145
+ "jan",
146
+ "text-generation-webui",
147
+ "koboldcpp",
148
+ "openrouter",
149
+ "litellm",
150
+ "portkey",
151
+ "helicone",
152
+ "langfuse",
72
153
  "cost-optimization",
73
154
  "cost-reduction",
74
- "smart-routing",
155
+ "cost-savings",
156
+ "cost-tracking",
157
+ "cost-analytics",
158
+ "budget-management",
159
+ "budget-alerts",
160
+ "token-optimization",
161
+ "token-saving",
162
+ "llm-cost",
163
+ "api-cost-reduction",
164
+ "cheap-llm",
165
+ "low-cost-llm",
166
+ "free-llm",
167
+ "cost-effective",
168
+ "price-comparison",
169
+ "rate-limiting",
170
+ "quota-management",
171
+ "usage-tracking",
172
+ "billing",
75
173
  "caching",
76
174
  "semantic-cache",
175
+ "response-cache",
176
+ "prompt-cache",
177
+ "context-cache",
178
+ "embedding-cache",
179
+ "vector-cache",
180
+ "redis-cache",
181
+ "in-memory-cache",
182
+ "distributed-cache",
183
+ "cache-invalidation",
184
+ "cache-strategy",
185
+ "llm-cache",
186
+ "ai-cache",
187
+ "request-dedup",
77
188
  "fallback",
78
189
  "failover",
190
+ "smart-fallback",
191
+ "smart-failover",
192
+ "circuit-breaker",
193
+ "retry",
194
+ "retry-logic",
195
+ "exponential-backoff",
196
+ "health-check",
197
+ "provider-health",
198
+ "uptime",
199
+ "high-availability",
200
+ "resilience",
201
+ "fault-tolerance",
202
+ "error-handling",
203
+ "graceful-degradation",
204
+ "load-balancing",
205
+ "load-balancer",
206
+ "throttling",
207
+ "parallel-execution",
208
+ "concurrent-requests",
209
+ "batch-processing",
79
210
  "streaming",
80
- "openai",
81
- "anthropic",
82
- "gemini",
83
- "claude",
84
- "deepseek",
85
- "groq",
86
- "openrouter",
211
+ "streaming-llm",
212
+ "server-sent-events",
213
+ "sse",
214
+ "low-latency",
215
+ "high-throughput",
216
+ "performance-optimization",
217
+ "connection-pooling",
218
+ "keep-alive",
219
+ "http2",
220
+ "grpc",
221
+ "edge-computing",
222
+ "edge-deployment",
223
+ "monitoring",
224
+ "metrics",
225
+ "observability",
226
+ "tracing",
227
+ "opentelemetry",
228
+ "prometheus",
229
+ "grafana",
230
+ "logging",
231
+ "structured-logging",
232
+ "debug",
233
+ "telemetry",
234
+ "analytics",
235
+ "dashboard",
236
+ "security",
237
+ "api-key-management",
238
+ "key-rotation",
239
+ "vault",
240
+ "secret-management",
241
+ "encryption",
242
+ "tls",
243
+ "ssl",
244
+ "authentication",
245
+ "authorization",
246
+ "rbac",
247
+ "audit-log",
248
+ "compliance",
249
+ "pii-detection",
250
+ "content-filtering",
251
+ "guardrails",
252
+ "ai-guardrails",
253
+ "safety",
87
254
  "langchain",
88
- "open-source"
255
+ "llamaindex",
256
+ "vercel-ai",
257
+ "vercel-ai-sdk",
258
+ "nextjs",
259
+ "next.js",
260
+ "react",
261
+ "vue",
262
+ "angular",
263
+ "svelte",
264
+ "express",
265
+ "fastify",
266
+ "koa",
267
+ "hono",
268
+ "nestjs",
269
+ "typescript",
270
+ "javascript",
271
+ "node.js",
272
+ "nodejs",
273
+ "deno",
274
+ "bun",
275
+ "python",
276
+ "fastapi",
277
+ "flask",
278
+ "django",
279
+ "docker",
280
+ "kubernetes",
281
+ "k8s",
282
+ "serverless",
283
+ "lambda",
284
+ "cloud-functions",
285
+ "vercel",
286
+ "netlify",
287
+ "railway",
288
+ "render",
289
+ "fly.io",
290
+ "aws",
291
+ "gcp",
292
+ "azure",
293
+ "digitalocean",
294
+ "heroku",
295
+ "self-hosted",
296
+ "on-premise",
297
+ "hybrid-cloud",
298
+ "chatbot",
299
+ "virtual-assistant",
300
+ "ai-agent",
301
+ "autonomous-agents",
302
+ "multi-agent",
303
+ "rag",
304
+ "retrieval-augmented-generation",
305
+ "question-answering",
306
+ "summarization",
307
+ "translation",
308
+ "code-generation",
309
+ "text-extraction",
310
+ "sentiment-analysis",
311
+ "classification",
312
+ "content-generation",
313
+ "copywriting",
314
+ "data-analysis",
315
+ "research",
316
+ "tutoring",
317
+ "customer-support",
318
+ "automation",
319
+ "rest-api",
320
+ "graphql",
321
+ "websocket",
322
+ "json",
323
+ "openapi",
324
+ "swagger",
325
+ "streaming-api",
326
+ "http",
327
+ "https",
328
+ "oauth",
329
+ "jwt",
330
+ "api-key",
331
+ "sdk",
332
+ "api-client",
333
+ "cli",
334
+ "command-line",
335
+ "terminal",
336
+ "tui",
337
+ "configuration",
338
+ "yaml",
339
+ "json-config",
340
+ "environment-variables",
341
+ "typescript-types",
342
+ "type-safety",
343
+ "intellisense",
344
+ "autocomplete",
345
+ "documentation",
346
+ "examples",
347
+ "quickstart",
348
+ "boilerplate",
349
+ "starter-template",
350
+ "scaffold",
351
+ "testing",
352
+ "unit-test",
353
+ "integration-test",
354
+ "mock",
355
+ "stub",
356
+ "benchmark",
357
+ "performance-test"
89
358
  ],
90
359
  "author": "Das-rebel <subho@example.com>",
91
360
  "license": "MIT",