@gajae-code/ai 0.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +2644 -0
- package/README.md +1181 -0
- package/dist/types/api-registry.d.ts +30 -0
- package/dist/types/auth-broker/client.d.ts +66 -0
- package/dist/types/auth-broker/index.d.ts +5 -0
- package/dist/types/auth-broker/refresher.d.ts +25 -0
- package/dist/types/auth-broker/remote-store.d.ts +96 -0
- package/dist/types/auth-broker/server.d.ts +32 -0
- package/dist/types/auth-broker/types.d.ts +105 -0
- package/dist/types/auth-broker/wire-schemas.d.ts +412 -0
- package/dist/types/auth-gateway/http.d.ts +39 -0
- package/dist/types/auth-gateway/index.d.ts +3 -0
- package/dist/types/auth-gateway/server.d.ts +17 -0
- package/dist/types/auth-gateway/types.d.ts +115 -0
- package/dist/types/auth-storage.d.ts +641 -0
- package/dist/types/cli.d.ts +2 -0
- package/dist/types/index.d.ts +49 -0
- package/dist/types/model-cache.d.ts +17 -0
- package/dist/types/model-manager.d.ts +62 -0
- package/dist/types/model-thinking.d.ts +71 -0
- package/dist/types/models.d.ts +12 -0
- package/dist/types/provider-details.d.ts +24 -0
- package/dist/types/provider-models/bundled-references.d.ts +4 -0
- package/dist/types/provider-models/descriptors.d.ts +48 -0
- package/dist/types/provider-models/google.d.ts +20 -0
- package/dist/types/provider-models/index.d.ts +5 -0
- package/dist/types/provider-models/ollama.d.ts +7 -0
- package/dist/types/provider-models/openai-compat.d.ts +237 -0
- package/dist/types/provider-models/special.d.ts +16 -0
- package/dist/types/providers/amazon-bedrock.d.ts +36 -0
- package/dist/types/providers/anthropic-messages-server-schema.d.ts +450 -0
- package/dist/types/providers/anthropic-messages-server.d.ts +17 -0
- package/dist/types/providers/anthropic.d.ts +188 -0
- package/dist/types/providers/aws-credentials.d.ts +43 -0
- package/dist/types/providers/aws-eventstream.d.ts +38 -0
- package/dist/types/providers/aws-sigv4.d.ts +55 -0
- package/dist/types/providers/azure-openai-responses.d.ts +15 -0
- package/dist/types/providers/cursor/gen/agent_pb.d.ts +13022 -0
- package/dist/types/providers/cursor.d.ts +42 -0
- package/dist/types/providers/error-message.d.ts +27 -0
- package/dist/types/providers/github-copilot-headers.d.ts +40 -0
- package/dist/types/providers/gitlab-duo.d.ts +27 -0
- package/dist/types/providers/google-auth.d.ts +24 -0
- package/dist/types/providers/google-gemini-cli.d.ts +72 -0
- package/dist/types/providers/google-gemini-headers.d.ts +18 -0
- package/dist/types/providers/google-shared.d.ts +163 -0
- package/dist/types/providers/google-types.d.ts +138 -0
- package/dist/types/providers/google-vertex.d.ts +7 -0
- package/dist/types/providers/google.d.ts +4 -0
- package/dist/types/providers/grammar.d.ts +1 -0
- package/dist/types/providers/kimi.d.ts +27 -0
- package/dist/types/providers/mock.d.ts +175 -0
- package/dist/types/providers/ollama.d.ts +6 -0
- package/dist/types/providers/openai-anthropic-shim.d.ts +31 -0
- package/dist/types/providers/openai-chat-server-schema.d.ts +814 -0
- package/dist/types/providers/openai-chat-server.d.ts +16 -0
- package/dist/types/providers/openai-codex/constants.d.ts +26 -0
- package/dist/types/providers/openai-codex/request-transformer.d.ts +49 -0
- package/dist/types/providers/openai-codex/response-handler.d.ts +17 -0
- package/dist/types/providers/openai-codex-responses.d.ts +67 -0
- package/dist/types/providers/openai-completions-compat.d.ts +25 -0
- package/dist/types/providers/openai-completions.d.ts +33 -0
- package/dist/types/providers/openai-responses-server-schema.d.ts +392 -0
- package/dist/types/providers/openai-responses-server.d.ts +17 -0
- package/dist/types/providers/openai-responses-shared.d.ts +89 -0
- package/dist/types/providers/openai-responses.d.ts +32 -0
- package/dist/types/providers/pi-native-client.d.ts +13 -0
- package/dist/types/providers/pi-native-server.d.ts +68 -0
- package/dist/types/providers/register-builtins.d.ts +31 -0
- package/dist/types/providers/synthetic.d.ts +26 -0
- package/dist/types/providers/transform-messages.d.ts +12 -0
- package/dist/types/providers/vision-guard.d.ts +8 -0
- package/dist/types/rate-limit-utils.d.ts +19 -0
- package/dist/types/stream.d.ts +24 -0
- package/dist/types/types.d.ts +746 -0
- package/dist/types/usage/claude.d.ts +3 -0
- package/dist/types/usage/gemini.d.ts +2 -0
- package/dist/types/usage/github-copilot.d.ts +7 -0
- package/dist/types/usage/google-antigravity.d.ts +2 -0
- package/dist/types/usage/kimi.d.ts +2 -0
- package/dist/types/usage/minimax-code.d.ts +2 -0
- package/dist/types/usage/openai-codex.d.ts +3 -0
- package/dist/types/usage/shared.d.ts +1 -0
- package/dist/types/usage/zai.d.ts +2 -0
- package/dist/types/usage.d.ts +258 -0
- package/dist/types/utils/abort.d.ts +19 -0
- package/dist/types/utils/anthropic-auth.d.ts +31 -0
- package/dist/types/utils/discovery/antigravity.d.ts +61 -0
- package/dist/types/utils/discovery/codex.d.ts +38 -0
- package/dist/types/utils/discovery/cursor.d.ts +23 -0
- package/dist/types/utils/discovery/gemini.d.ts +25 -0
- package/dist/types/utils/discovery/index.d.ts +4 -0
- package/dist/types/utils/discovery/openai-compatible.d.ts +72 -0
- package/dist/types/utils/event-stream.d.ts +28 -0
- package/dist/types/utils/fireworks-model-id.d.ts +10 -0
- package/dist/types/utils/foundry.d.ts +1 -0
- package/dist/types/utils/h2-fetch.d.ts +22 -0
- package/dist/types/utils/http-inspector.d.ts +31 -0
- package/dist/types/utils/idle-iterator.d.ts +67 -0
- package/dist/types/utils/json-parse.d.ts +10 -0
- package/dist/types/utils/oauth/alibaba-coding-plan.d.ts +18 -0
- package/dist/types/utils/oauth/anthropic.d.ts +22 -0
- package/dist/types/utils/oauth/api-key-login.d.ts +35 -0
- package/dist/types/utils/oauth/api-key-validation.d.ts +27 -0
- package/dist/types/utils/oauth/callback-server.d.ts +57 -0
- package/dist/types/utils/oauth/cerebras.d.ts +1 -0
- package/dist/types/utils/oauth/cloudflare-ai-gateway.d.ts +18 -0
- package/dist/types/utils/oauth/cursor.d.ts +15 -0
- package/dist/types/utils/oauth/deepseek.d.ts +10 -0
- package/dist/types/utils/oauth/firepass.d.ts +1 -0
- package/dist/types/utils/oauth/fireworks.d.ts +1 -0
- package/dist/types/utils/oauth/github-copilot.d.ts +38 -0
- package/dist/types/utils/oauth/gitlab-duo.d.ts +3 -0
- package/dist/types/utils/oauth/google-antigravity.d.ts +11 -0
- package/dist/types/utils/oauth/google-gemini-cli.d.ts +10 -0
- package/dist/types/utils/oauth/google-oauth-shared.d.ts +28 -0
- package/dist/types/utils/oauth/huggingface.d.ts +19 -0
- package/dist/types/utils/oauth/index.d.ts +38 -0
- package/dist/types/utils/oauth/kagi.d.ts +17 -0
- package/dist/types/utils/oauth/kilo.d.ts +5 -0
- package/dist/types/utils/oauth/kimi.d.ts +21 -0
- package/dist/types/utils/oauth/litellm.d.ts +18 -0
- package/dist/types/utils/oauth/lm-studio.d.ts +17 -0
- package/dist/types/utils/oauth/minimax-code.d.ts +28 -0
- package/dist/types/utils/oauth/moonshot.d.ts +1 -0
- package/dist/types/utils/oauth/nanogpt.d.ts +1 -0
- package/dist/types/utils/oauth/nvidia.d.ts +18 -0
- package/dist/types/utils/oauth/ollama-cloud.d.ts +2 -0
- package/dist/types/utils/oauth/ollama.d.ts +18 -0
- package/dist/types/utils/oauth/openai-codex.d.ts +21 -0
- package/dist/types/utils/oauth/opencode.d.ts +18 -0
- package/dist/types/utils/oauth/parallel.d.ts +17 -0
- package/dist/types/utils/oauth/perplexity.d.ts +9 -0
- package/dist/types/utils/oauth/pkce.d.ts +8 -0
- package/dist/types/utils/oauth/qianfan.d.ts +17 -0
- package/dist/types/utils/oauth/qwen-portal.d.ts +19 -0
- package/dist/types/utils/oauth/synthetic.d.ts +1 -0
- package/dist/types/utils/oauth/tavily.d.ts +17 -0
- package/dist/types/utils/oauth/together.d.ts +1 -0
- package/dist/types/utils/oauth/types.d.ts +44 -0
- package/dist/types/utils/oauth/venice.d.ts +18 -0
- package/dist/types/utils/oauth/vercel-ai-gateway.d.ts +18 -0
- package/dist/types/utils/oauth/vllm.d.ts +16 -0
- package/dist/types/utils/oauth/xiaomi.d.ts +19 -0
- package/dist/types/utils/oauth/zai.d.ts +18 -0
- package/dist/types/utils/oauth/zenmux.d.ts +1 -0
- package/dist/types/utils/overflow.d.ts +54 -0
- package/dist/types/utils/parse-bind.d.ts +23 -0
- package/dist/types/utils/provider-response.d.ts +3 -0
- package/dist/types/utils/retry-after.d.ts +3 -0
- package/dist/types/utils/retry.d.ts +26 -0
- package/dist/types/utils/schema/adapt.d.ts +24 -0
- package/dist/types/utils/schema/compatibility.d.ts +30 -0
- package/dist/types/utils/schema/dereference.d.ts +11 -0
- package/dist/types/utils/schema/draft.d.ts +10 -0
- package/dist/types/utils/schema/equality.d.ts +4 -0
- package/dist/types/utils/schema/fields.d.ts +49 -0
- package/dist/types/utils/schema/index.d.ts +13 -0
- package/dist/types/utils/schema/json-schema-validator.d.ts +12 -0
- package/dist/types/utils/schema/meta-validator.d.ts +2 -0
- package/dist/types/utils/schema/normalize.d.ts +93 -0
- package/dist/types/utils/schema/spill.d.ts +8 -0
- package/dist/types/utils/schema/stamps.d.ts +25 -0
- package/dist/types/utils/schema/types.d.ts +4 -0
- package/dist/types/utils/schema/wire.d.ts +54 -0
- package/dist/types/utils/schema/zod-decontaminate.d.ts +31 -0
- package/dist/types/utils/sse-debug.d.ts +10 -0
- package/dist/types/utils/tool-call-healing.d.ts +71 -0
- package/dist/types/utils/tool-choice.d.ts +50 -0
- package/dist/types/utils/validation.d.ts +17 -0
- package/dist/types/utils.d.ts +28 -0
- package/package.json +146 -0
- package/src/api-registry.ts +96 -0
- package/src/auth-broker/client.ts +358 -0
- package/src/auth-broker/index.ts +5 -0
- package/src/auth-broker/refresher.ts +127 -0
- package/src/auth-broker/remote-store.ts +623 -0
- package/src/auth-broker/server.ts +644 -0
- package/src/auth-broker/types.ts +127 -0
- package/src/auth-broker/wire-schemas.ts +200 -0
- package/src/auth-gateway/http.ts +194 -0
- package/src/auth-gateway/index.ts +3 -0
- package/src/auth-gateway/server.ts +717 -0
- package/src/auth-gateway/types.ts +134 -0
- package/src/auth-storage.ts +4104 -0
- package/src/cli.ts +262 -0
- package/src/index.ts +54 -0
- package/src/model-cache.ts +129 -0
- package/src/model-manager.ts +450 -0
- package/src/model-thinking.ts +691 -0
- package/src/models.json +73853 -0
- package/src/models.json.d.ts +9 -0
- package/src/models.ts +56 -0
- package/src/prompts/turn-aborted-guidance.md +4 -0
- package/src/provider-details.ts +90 -0
- package/src/provider-models/bundled-references.ts +38 -0
- package/src/provider-models/descriptors.ts +308 -0
- package/src/provider-models/google.ts +91 -0
- package/src/provider-models/index.ts +5 -0
- package/src/provider-models/ollama.ts +153 -0
- package/src/provider-models/openai-compat.ts +2275 -0
- package/src/provider-models/special.ts +67 -0
- package/src/providers/amazon-bedrock.ts +849 -0
- package/src/providers/anthropic-messages-server-schema.ts +229 -0
- package/src/providers/anthropic-messages-server.ts +677 -0
- package/src/providers/anthropic.ts +2696 -0
- package/src/providers/aws-credentials.ts +501 -0
- package/src/providers/aws-eventstream.ts +185 -0
- package/src/providers/aws-sigv4.ts +218 -0
- package/src/providers/azure-openai-responses.ts +337 -0
- package/src/providers/cursor/gen/agent_pb.ts +15274 -0
- package/src/providers/cursor/proto/agent.proto +3526 -0
- package/src/providers/cursor/proto/buf.gen.yaml +6 -0
- package/src/providers/cursor/proto/buf.yaml +17 -0
- package/src/providers/cursor.ts +2561 -0
- package/src/providers/error-message.ts +21 -0
- package/src/providers/github-copilot-headers.ts +140 -0
- package/src/providers/gitlab-duo.ts +372 -0
- package/src/providers/google-auth.ts +252 -0
- package/src/providers/google-gemini-cli.ts +795 -0
- package/src/providers/google-gemini-headers.ts +41 -0
- package/src/providers/google-shared.ts +902 -0
- package/src/providers/google-types.ts +167 -0
- package/src/providers/google-vertex.ts +88 -0
- package/src/providers/google.ts +41 -0
- package/src/providers/grammar.ts +70 -0
- package/src/providers/kimi.ts +52 -0
- package/src/providers/mock.ts +500 -0
- package/src/providers/ollama.ts +544 -0
- package/src/providers/openai-anthropic-shim.ts +138 -0
- package/src/providers/openai-chat-server-schema.ts +243 -0
- package/src/providers/openai-chat-server.ts +628 -0
- package/src/providers/openai-codex/constants.ts +43 -0
- package/src/providers/openai-codex/request-transformer.ts +161 -0
- package/src/providers/openai-codex/response-handler.ts +81 -0
- package/src/providers/openai-codex-responses.ts +2598 -0
- package/src/providers/openai-completions-compat.ts +279 -0
- package/src/providers/openai-completions.ts +1853 -0
- package/src/providers/openai-responses-server-schema.ts +290 -0
- package/src/providers/openai-responses-server.ts +1183 -0
- package/src/providers/openai-responses-shared.ts +800 -0
- package/src/providers/openai-responses.ts +621 -0
- package/src/providers/pi-native-client.ts +228 -0
- package/src/providers/pi-native-server.ts +210 -0
- package/src/providers/register-builtins.ts +412 -0
- package/src/providers/synthetic.ts +50 -0
- package/src/providers/transform-messages.ts +309 -0
- package/src/providers/vision-guard.ts +31 -0
- package/src/rate-limit-utils.ts +84 -0
- package/src/stream.ts +895 -0
- package/src/types.ts +884 -0
- package/src/usage/claude.ts +431 -0
- package/src/usage/gemini.ts +250 -0
- package/src/usage/github-copilot.ts +421 -0
- package/src/usage/google-antigravity.ts +201 -0
- package/src/usage/kimi.ts +271 -0
- package/src/usage/minimax-code.ts +31 -0
- package/src/usage/openai-codex.ts +503 -0
- package/src/usage/shared.ts +10 -0
- package/src/usage/zai.ts +247 -0
- package/src/usage.ts +183 -0
- package/src/utils/abort.ts +51 -0
- package/src/utils/anthropic-auth.ts +87 -0
- package/src/utils/discovery/antigravity.ts +261 -0
- package/src/utils/discovery/codex.ts +371 -0
- package/src/utils/discovery/cursor.ts +306 -0
- package/src/utils/discovery/gemini.ts +248 -0
- package/src/utils/discovery/index.ts +4 -0
- package/src/utils/discovery/openai-compatible.ts +224 -0
- package/src/utils/event-stream.ts +142 -0
- package/src/utils/fireworks-model-id.ts +30 -0
- package/src/utils/foundry.ts +8 -0
- package/src/utils/h2-fetch.ts +60 -0
- package/src/utils/http-inspector.ts +176 -0
- package/src/utils/idle-iterator.ts +250 -0
- package/src/utils/json-parse.ts +148 -0
- package/src/utils/oauth/alibaba-coding-plan.ts +59 -0
- package/src/utils/oauth/anthropic.ts +200 -0
- package/src/utils/oauth/api-key-login.ts +87 -0
- package/src/utils/oauth/api-key-validation.ts +92 -0
- package/src/utils/oauth/callback-server.ts +276 -0
- package/src/utils/oauth/cerebras.ts +16 -0
- package/src/utils/oauth/cloudflare-ai-gateway.ts +48 -0
- package/src/utils/oauth/cursor.ts +157 -0
- package/src/utils/oauth/deepseek.ts +53 -0
- package/src/utils/oauth/firepass.ts +24 -0
- package/src/utils/oauth/fireworks.ts +15 -0
- package/src/utils/oauth/github-copilot.ts +362 -0
- package/src/utils/oauth/gitlab-duo.ts +123 -0
- package/src/utils/oauth/google-antigravity.ts +200 -0
- package/src/utils/oauth/google-gemini-cli.ts +256 -0
- package/src/utils/oauth/google-oauth-shared.ts +110 -0
- package/src/utils/oauth/huggingface.ts +62 -0
- package/src/utils/oauth/index.ts +444 -0
- package/src/utils/oauth/kagi.ts +47 -0
- package/src/utils/oauth/kilo.ts +87 -0
- package/src/utils/oauth/kimi.ts +254 -0
- package/src/utils/oauth/litellm.ts +47 -0
- package/src/utils/oauth/lm-studio.ts +38 -0
- package/src/utils/oauth/minimax-code.ts +78 -0
- package/src/utils/oauth/moonshot.ts +16 -0
- package/src/utils/oauth/nanogpt.ts +15 -0
- package/src/utils/oauth/nvidia.ts +70 -0
- package/src/utils/oauth/oauth.html +199 -0
- package/src/utils/oauth/ollama-cloud.ts +28 -0
- package/src/utils/oauth/ollama.ts +47 -0
- package/src/utils/oauth/openai-codex.ts +299 -0
- package/src/utils/oauth/opencode.ts +49 -0
- package/src/utils/oauth/parallel.ts +46 -0
- package/src/utils/oauth/perplexity.ts +206 -0
- package/src/utils/oauth/pkce.ts +18 -0
- package/src/utils/oauth/qianfan.ts +58 -0
- package/src/utils/oauth/qwen-portal.ts +60 -0
- package/src/utils/oauth/synthetic.ts +16 -0
- package/src/utils/oauth/tavily.ts +46 -0
- package/src/utils/oauth/together.ts +16 -0
- package/src/utils/oauth/types.ts +94 -0
- package/src/utils/oauth/venice.ts +59 -0
- package/src/utils/oauth/vercel-ai-gateway.ts +47 -0
- package/src/utils/oauth/vllm.ts +40 -0
- package/src/utils/oauth/xiaomi.ts +137 -0
- package/src/utils/oauth/zai.ts +60 -0
- package/src/utils/oauth/zenmux.ts +15 -0
- package/src/utils/overflow.ts +137 -0
- package/src/utils/parse-bind.ts +54 -0
- package/src/utils/provider-response.ts +30 -0
- package/src/utils/retry-after.ts +110 -0
- package/src/utils/retry.ts +54 -0
- package/src/utils/schema/CONSTRAINTS.md +164 -0
- package/src/utils/schema/adapt.ts +36 -0
- package/src/utils/schema/compatibility.ts +435 -0
- package/src/utils/schema/dereference.ts +98 -0
- package/src/utils/schema/draft.ts +341 -0
- package/src/utils/schema/equality.ts +97 -0
- package/src/utils/schema/fields.ts +190 -0
- package/src/utils/schema/index.ts +13 -0
- package/src/utils/schema/json-schema-validator.ts +577 -0
- package/src/utils/schema/meta-validator.ts +167 -0
- package/src/utils/schema/normalize.ts +1588 -0
- package/src/utils/schema/spill.ts +43 -0
- package/src/utils/schema/stamps.ts +97 -0
- package/src/utils/schema/types.ts +11 -0
- package/src/utils/schema/wire.ts +213 -0
- package/src/utils/schema/zod-decontaminate.ts +331 -0
- package/src/utils/sse-debug.ts +289 -0
- package/src/utils/tool-call-healing.ts +271 -0
- package/src/utils/tool-choice.ts +99 -0
- package/src/utils/validation.ts +1019 -0
- package/src/utils.ts +166 -0
|
@@ -0,0 +1,450 @@
|
|
|
1
|
+
import { readModelCache, writeModelCache } from "./model-cache";
|
|
2
|
+
import { enrichModelThinking } from "./model-thinking";
|
|
3
|
+
import { type GeneratedProvider, getBundledModels } from "./models";
|
|
4
|
+
import type { Api, Model, Provider } from "./types";
|
|
5
|
+
import { isRecord } from "./utils";
|
|
6
|
+
|
|
7
|
+
const DEFAULT_CACHE_TTL_MS = 2 * 60 * 60 * 1000;
|
|
8
|
+
const NON_AUTHORITATIVE_RETRY_MS = 5 * 60 * 1000;
|
|
9
|
+
|
|
10
|
+
/**
|
|
11
|
+
* Controls when dynamic endpoint models should be fetched.
|
|
12
|
+
*/
|
|
13
|
+
export type ModelRefreshStrategy = "online" | "offline" | "online-if-uncached";
|
|
14
|
+
|
|
15
|
+
/**
|
|
16
|
+
* Hook for loading and mapping models.dev fallback data into canonical model objects.
|
|
17
|
+
*/
|
|
18
|
+
export interface ModelsDevFallback<TApi extends Api = Api, TPayload = unknown> {
|
|
19
|
+
/** Fetches raw fallback payload (for example from models.dev). */
|
|
20
|
+
fetch(): Promise<TPayload>;
|
|
21
|
+
/** Maps payload into provider models. */
|
|
22
|
+
map(payload: TPayload, providerId: Provider): readonly Model<TApi>[];
|
|
23
|
+
}
|
|
24
|
+
|
|
25
|
+
/**
|
|
26
|
+
* Configuration for provider model resolution.
|
|
27
|
+
*/
|
|
28
|
+
export interface ModelManagerOptions<TApi extends Api = Api, TModelsDevPayload = unknown> {
|
|
29
|
+
/** Provider id used for static lookup and cache namespacing. */
|
|
30
|
+
providerId: Provider;
|
|
31
|
+
/** Optional static list override. When omitted, bundled models.json is used. */
|
|
32
|
+
staticModels?: readonly Model<TApi>[];
|
|
33
|
+
/** Optional override for the cache database path. Default: <agent-dir>/models.db. */
|
|
34
|
+
cacheDbPath?: string;
|
|
35
|
+
/** Maximum cache age in milliseconds before considered stale. Default: 24h. */
|
|
36
|
+
cacheTtlMs?: number;
|
|
37
|
+
/** Optional dynamic endpoint fetcher. */
|
|
38
|
+
fetchDynamicModels?: () => Promise<readonly Model<TApi>[] | null>;
|
|
39
|
+
/** Optional models.dev fallback hook. */
|
|
40
|
+
modelsDev?: ModelsDevFallback<TApi, TModelsDevPayload>;
|
|
41
|
+
/** Clock override for deterministic tests. */
|
|
42
|
+
now?: () => number;
|
|
43
|
+
}
|
|
44
|
+
|
|
45
|
+
/**
|
|
46
|
+
* Resolution result.
|
|
47
|
+
*
|
|
48
|
+
* `stale` is false when the resolved catalog is authoritative for the selected provider:
|
|
49
|
+
* - dynamic endpoint data was fetched in this call,
|
|
50
|
+
* - a still-fresh authoritative cache was reused in `online-if-uncached` mode, or
|
|
51
|
+
* - the provider has no dynamic fetcher configured.
|
|
52
|
+
*/
|
|
53
|
+
export interface ModelResolutionResult<TApi extends Api = Api> {
|
|
54
|
+
models: Model<TApi>[];
|
|
55
|
+
stale: boolean;
|
|
56
|
+
}
|
|
57
|
+
|
|
58
|
+
/**
|
|
59
|
+
* Stateful facade over provider model resolution.
|
|
60
|
+
*/
|
|
61
|
+
export interface ModelManager<TApi extends Api = Api> {
|
|
62
|
+
refresh(strategy?: ModelRefreshStrategy): Promise<ModelResolutionResult<TApi>>;
|
|
63
|
+
}
|
|
64
|
+
|
|
65
|
+
/**
|
|
66
|
+
* Creates a reusable provider model manager.
|
|
67
|
+
*/
|
|
68
|
+
export function createModelManager<TApi extends Api = Api, TModelsDevPayload = unknown>(
|
|
69
|
+
options: ModelManagerOptions<TApi, TModelsDevPayload>,
|
|
70
|
+
): ModelManager<TApi> {
|
|
71
|
+
return {
|
|
72
|
+
refresh(strategy: ModelRefreshStrategy = "online-if-uncached") {
|
|
73
|
+
return resolveProviderModels(options, strategy);
|
|
74
|
+
},
|
|
75
|
+
};
|
|
76
|
+
}
|
|
77
|
+
|
|
78
|
+
/**
|
|
79
|
+
* Cheap fast path for trusted model sources (bundled literals, our own cache rows).
|
|
80
|
+
* Skips per-field validation; only guards against catastrophically corrupt rows.
|
|
81
|
+
*/
|
|
82
|
+
function passModelList<TApi extends Api>(value: unknown): Model<TApi>[] {
|
|
83
|
+
if (!Array.isArray(value)) {
|
|
84
|
+
return [];
|
|
85
|
+
}
|
|
86
|
+
const out: Model<TApi>[] = [];
|
|
87
|
+
for (const item of value) {
|
|
88
|
+
if (item === null || typeof item !== "object" || typeof (item as { id: unknown }).id !== "string") {
|
|
89
|
+
continue;
|
|
90
|
+
}
|
|
91
|
+
out.push(enrichModelThinking(item as Model<TApi>));
|
|
92
|
+
}
|
|
93
|
+
return out;
|
|
94
|
+
}
|
|
95
|
+
|
|
96
|
+
/**
|
|
97
|
+
* Resolves provider models with source precedence:
|
|
98
|
+
* static -> models.dev -> cache -> dynamic.
|
|
99
|
+
*
|
|
100
|
+
* Later sources override earlier ones by model id.
|
|
101
|
+
*/
|
|
102
|
+
export async function resolveProviderModels<TApi extends Api = Api, TModelsDevPayload = unknown>(
|
|
103
|
+
options: ModelManagerOptions<TApi, TModelsDevPayload>,
|
|
104
|
+
strategy: ModelRefreshStrategy = "online-if-uncached",
|
|
105
|
+
): Promise<ModelResolutionResult<TApi>> {
|
|
106
|
+
const now = options.now ?? Date.now;
|
|
107
|
+
const ttlMs = options.cacheTtlMs ?? DEFAULT_CACHE_TTL_MS;
|
|
108
|
+
const dbPath = options.cacheDbPath;
|
|
109
|
+
const staticModels = passModelList<TApi>(
|
|
110
|
+
options.staticModels ?? getBundledModels(options.providerId as GeneratedProvider),
|
|
111
|
+
);
|
|
112
|
+
const cache = readModelCache<TApi>(options.providerId, ttlMs, now, dbPath);
|
|
113
|
+
const dynamicFetcher = options.fetchDynamicModels;
|
|
114
|
+
const hasDynamicFetcher = typeof dynamicFetcher === "function";
|
|
115
|
+
const hasAuthoritativeCache = (cache?.authoritative ?? false) || !hasDynamicFetcher;
|
|
116
|
+
const cacheAgeMs = cache ? now() - cache.updatedAt : Number.POSITIVE_INFINITY;
|
|
117
|
+
const shouldFetchFromNetwork = shouldFetchRemoteSources(
|
|
118
|
+
strategy,
|
|
119
|
+
cache?.fresh ?? false,
|
|
120
|
+
hasAuthoritativeCache,
|
|
121
|
+
cacheAgeMs,
|
|
122
|
+
);
|
|
123
|
+
const staticFingerprint = fingerprintStatic(staticModels);
|
|
124
|
+
|
|
125
|
+
// Cold-start fast path: when a fresh, authoritative cache exists, the network
|
|
126
|
+
// fetch is skipped, AND the static catalog slice is byte-identical to what
|
|
127
|
+
// was merged in last time, the cache row IS the authoritative merge result.
|
|
128
|
+
// Re-running `mergeDynamicModels(static, cache)` would just rebuild the same
|
|
129
|
+
// objects (~800ms in the steady-state cold-start profile for `gjc -p hi`).
|
|
130
|
+
if (
|
|
131
|
+
!shouldFetchFromNetwork &&
|
|
132
|
+
cache?.fresh &&
|
|
133
|
+
hasAuthoritativeCache &&
|
|
134
|
+
cache.staticFingerprint === staticFingerprint &&
|
|
135
|
+
cache.staticFingerprint.length > 0
|
|
136
|
+
) {
|
|
137
|
+
return { models: passModelList<TApi>(cache.models), stale: false };
|
|
138
|
+
}
|
|
139
|
+
|
|
140
|
+
const [fetchedModelsDevModels, fetchedDynamicModels] = shouldFetchFromNetwork
|
|
141
|
+
? await Promise.all([fetchModelsDev(options), dynamicFetcher ? fetchDynamicModels(dynamicFetcher) : null])
|
|
142
|
+
: [null, null];
|
|
143
|
+
const modelsDevModels = normalizeModelList<TApi>(fetchedModelsDevModels ?? []);
|
|
144
|
+
const shouldUseFreshCacheAsAuthoritative =
|
|
145
|
+
strategy === "online-if-uncached" && (cache?.fresh ?? false) && hasAuthoritativeCache;
|
|
146
|
+
const dynamicFetchSucceeded = fetchedDynamicModels !== null;
|
|
147
|
+
const cacheModels = dynamicFetchSucceeded ? [] : normalizeModelList<TApi>(cache?.models ?? []);
|
|
148
|
+
const dynamicModels = fetchedDynamicModels ?? [];
|
|
149
|
+
const mergedWithCache = mergeDynamicModels(mergeModelSources(staticModels, modelsDevModels), cacheModels);
|
|
150
|
+
const models = mergeDynamicModels(mergedWithCache, dynamicModels);
|
|
151
|
+
const dynamicAuthoritative = !hasDynamicFetcher || dynamicFetchSucceeded || shouldUseFreshCacheAsAuthoritative;
|
|
152
|
+
if (shouldFetchFromNetwork) {
|
|
153
|
+
if (dynamicFetchSucceeded) {
|
|
154
|
+
const snapshotModels = mergeDynamicModels(mergeModelSources(staticModels, modelsDevModels), dynamicModels);
|
|
155
|
+
writeModelCache(options.providerId, now(), snapshotModels, true, staticFingerprint, dbPath);
|
|
156
|
+
} else {
|
|
157
|
+
// Dynamic fetch failed — update cache with a non-authoritative snapshot so
|
|
158
|
+
// stale state remains visible while retry backoff still applies.
|
|
159
|
+
const latestCache = readModelCache<TApi>(options.providerId, ttlMs, now, dbPath);
|
|
160
|
+
writeModelCache(
|
|
161
|
+
options.providerId,
|
|
162
|
+
now(),
|
|
163
|
+
mergeDynamicModels(
|
|
164
|
+
mergeModelSources(staticModels, modelsDevModels),
|
|
165
|
+
normalizeModelList<TApi>(latestCache?.models ?? cache?.models ?? []),
|
|
166
|
+
),
|
|
167
|
+
false,
|
|
168
|
+
staticFingerprint,
|
|
169
|
+
dbPath,
|
|
170
|
+
);
|
|
171
|
+
}
|
|
172
|
+
}
|
|
173
|
+
return {
|
|
174
|
+
models,
|
|
175
|
+
stale: !dynamicAuthoritative,
|
|
176
|
+
};
|
|
177
|
+
}
|
|
178
|
+
|
|
179
|
+
async function fetchModelsDev<TApi extends Api, TModelsDevPayload>(
|
|
180
|
+
options: ModelManagerOptions<TApi, TModelsDevPayload>,
|
|
181
|
+
): Promise<Model<TApi>[] | null> {
|
|
182
|
+
if (!options.modelsDev) {
|
|
183
|
+
return null;
|
|
184
|
+
}
|
|
185
|
+
|
|
186
|
+
try {
|
|
187
|
+
const payload = await options.modelsDev.fetch();
|
|
188
|
+
return normalizeModelList<TApi>(options.modelsDev.map(payload, options.providerId));
|
|
189
|
+
} catch {
|
|
190
|
+
return null;
|
|
191
|
+
}
|
|
192
|
+
}
|
|
193
|
+
|
|
194
|
+
async function fetchDynamicModels<TApi extends Api>(
|
|
195
|
+
fetcher: () => Promise<readonly Model<TApi>[] | null>,
|
|
196
|
+
): Promise<Model<TApi>[] | null> {
|
|
197
|
+
try {
|
|
198
|
+
const models = await fetcher();
|
|
199
|
+
if (models === null) {
|
|
200
|
+
return null;
|
|
201
|
+
}
|
|
202
|
+
return normalizeModelList<TApi>(models);
|
|
203
|
+
} catch {
|
|
204
|
+
return null;
|
|
205
|
+
}
|
|
206
|
+
}
|
|
207
|
+
|
|
208
|
+
function shouldFetchRemoteSources(
|
|
209
|
+
strategy: ModelRefreshStrategy,
|
|
210
|
+
hasFreshCache: boolean,
|
|
211
|
+
hasAuthoritativeCache: boolean,
|
|
212
|
+
cacheAgeMs: number,
|
|
213
|
+
): boolean {
|
|
214
|
+
if (strategy === "offline") {
|
|
215
|
+
return false;
|
|
216
|
+
}
|
|
217
|
+
if (strategy === "online") {
|
|
218
|
+
return true;
|
|
219
|
+
}
|
|
220
|
+
// online-if-uncached: skip fetch if cache is fresh.
|
|
221
|
+
// For non-authoritative caches (dynamic fetch previously failed),
|
|
222
|
+
// use a shorter retry interval instead of retrying every startup.
|
|
223
|
+
if (!hasFreshCache) {
|
|
224
|
+
return true;
|
|
225
|
+
}
|
|
226
|
+
if (!hasAuthoritativeCache) {
|
|
227
|
+
return cacheAgeMs >= NON_AUTHORITATIVE_RETRY_MS;
|
|
228
|
+
}
|
|
229
|
+
return false;
|
|
230
|
+
}
|
|
231
|
+
|
|
232
|
+
function mergeModelSources<TApi extends Api>(...sources: readonly (readonly Model<TApi>[])[]): Model<TApi>[] {
|
|
233
|
+
// Strip out empty/missing sources up front. The hot path is `(static, [])`
|
|
234
|
+
// (modelsDev disabled / failed) — a single non-empty source means we can
|
|
235
|
+
// skip the Map churn entirely and just hand back the array.
|
|
236
|
+
const nonEmpty = sources.filter(source => source.length > 0);
|
|
237
|
+
if (nonEmpty.length === 0) return [];
|
|
238
|
+
if (nonEmpty.length === 1) return [...nonEmpty[0]];
|
|
239
|
+
const merged = new Map<string, Model<TApi>>();
|
|
240
|
+
for (const source of nonEmpty) {
|
|
241
|
+
for (const model of source) {
|
|
242
|
+
if (!model?.id) continue;
|
|
243
|
+
merged.set(model.id, model);
|
|
244
|
+
}
|
|
245
|
+
}
|
|
246
|
+
return Array.from(merged.values());
|
|
247
|
+
}
|
|
248
|
+
|
|
249
|
+
function mergeDynamicModels<TApi extends Api>(
|
|
250
|
+
baseModels: readonly Model<TApi>[],
|
|
251
|
+
dynamicModels: readonly Model<TApi>[],
|
|
252
|
+
): Model<TApi>[] {
|
|
253
|
+
// Empty-side fast paths: `mergeDynamicModels(base, [])` is the common shape
|
|
254
|
+
// after we've already merged the first pair, and `(...)` with no base
|
|
255
|
+
// happens for providers without static catalogs.
|
|
256
|
+
if (dynamicModels.length === 0) return baseModels.length === 0 ? [] : [...baseModels];
|
|
257
|
+
if (baseModels.length === 0) return [...dynamicModels];
|
|
258
|
+
const merged = new Map<string, Model<TApi>>(baseModels.map(model => [model.id, model]));
|
|
259
|
+
for (const dynamicModel of dynamicModels) {
|
|
260
|
+
if (!dynamicModel?.id) {
|
|
261
|
+
continue;
|
|
262
|
+
}
|
|
263
|
+
const existingModel = merged.get(dynamicModel.id);
|
|
264
|
+
if (!existingModel) {
|
|
265
|
+
merged.set(dynamicModel.id, dynamicModel);
|
|
266
|
+
continue;
|
|
267
|
+
}
|
|
268
|
+
merged.set(dynamicModel.id, mergeDynamicModel(existingModel, dynamicModel));
|
|
269
|
+
}
|
|
270
|
+
return Array.from(merged.values());
|
|
271
|
+
}
|
|
272
|
+
|
|
273
|
+
/**
|
|
274
|
+
* Stable, low-collision fingerprint of a static catalog slice. Cached by
|
|
275
|
+
* reference so repeat calls in the same process (e.g. multiple cold-start
|
|
276
|
+
* arms calling `resolveProviderModels` with the same `staticModels` array)
|
|
277
|
+
* skip the JSON+hash work after the first call.
|
|
278
|
+
*/
|
|
279
|
+
const kStaticFingerprint = Symbol("model-manager.staticFingerprint");
|
|
280
|
+
type ModelArrayWithFingerprint = readonly Model<Api>[] & { [kStaticFingerprint]?: string };
|
|
281
|
+
function fingerprintStatic<TApi extends Api>(models: readonly Model<TApi>[]): string {
|
|
282
|
+
if (models.length === 0) return "empty";
|
|
283
|
+
const tagged = models as ModelArrayWithFingerprint;
|
|
284
|
+
const cached = tagged[kStaticFingerprint];
|
|
285
|
+
if (cached !== undefined) return cached;
|
|
286
|
+
// `Bun.hash` returns a `bigint`; base36 keeps the string short for the
|
|
287
|
+
// SQLite column without sacrificing distinguishability.
|
|
288
|
+
const fingerprint = Bun.hash(JSON.stringify(models)).toString(36);
|
|
289
|
+
tagged[kStaticFingerprint] = fingerprint;
|
|
290
|
+
return fingerprint;
|
|
291
|
+
}
|
|
292
|
+
|
|
293
|
+
function mergeDynamicModel<TApi extends Api>(existingModel: Model<TApi>, dynamicModel: Model<TApi>): Model<TApi> {
|
|
294
|
+
const supportsImage = existingModel.input.includes("image") || dynamicModel.input.includes("image");
|
|
295
|
+
return enrichModelThinking({
|
|
296
|
+
...existingModel,
|
|
297
|
+
...dynamicModel,
|
|
298
|
+
name: preferDiscoveryName(dynamicModel.name, existingModel.name, dynamicModel.id),
|
|
299
|
+
reasoning: existingModel.reasoning || dynamicModel.reasoning,
|
|
300
|
+
input: supportsImage ? ["text", "image"] : ["text"],
|
|
301
|
+
cost: {
|
|
302
|
+
input: preferDiscoveryCost(dynamicModel.cost.input, existingModel.cost.input),
|
|
303
|
+
output: preferDiscoveryCost(dynamicModel.cost.output, existingModel.cost.output),
|
|
304
|
+
cacheRead: preferDiscoveryCost(dynamicModel.cost.cacheRead, existingModel.cost.cacheRead),
|
|
305
|
+
cacheWrite: preferDiscoveryCost(dynamicModel.cost.cacheWrite, existingModel.cost.cacheWrite),
|
|
306
|
+
},
|
|
307
|
+
contextWindow: preferDiscoveryLimit(dynamicModel.contextWindow, existingModel.contextWindow),
|
|
308
|
+
maxTokens: preferDiscoveryLimit(dynamicModel.maxTokens, existingModel.maxTokens),
|
|
309
|
+
headers: dynamicModel.headers ? { ...existingModel.headers, ...dynamicModel.headers } : existingModel.headers,
|
|
310
|
+
compat: dynamicModel.compat ?? existingModel.compat,
|
|
311
|
+
contextPromotionTarget: dynamicModel.contextPromotionTarget ?? existingModel.contextPromotionTarget,
|
|
312
|
+
});
|
|
313
|
+
}
|
|
314
|
+
|
|
315
|
+
function preferDiscoveryCost(discoveryCost: number, fallbackCost: number): number {
|
|
316
|
+
if (Number.isFinite(discoveryCost) && discoveryCost > 0) {
|
|
317
|
+
return discoveryCost;
|
|
318
|
+
}
|
|
319
|
+
return fallbackCost;
|
|
320
|
+
}
|
|
321
|
+
|
|
322
|
+
function preferDiscoveryName(discoveryName: string, fallbackName: string, modelId: string): string {
|
|
323
|
+
const normalizedDiscoveryName = discoveryName.trim();
|
|
324
|
+
if (normalizedDiscoveryName.length === 0) {
|
|
325
|
+
return fallbackName;
|
|
326
|
+
}
|
|
327
|
+
if (normalizedDiscoveryName === modelId && fallbackName !== modelId) {
|
|
328
|
+
return fallbackName;
|
|
329
|
+
}
|
|
330
|
+
return normalizedDiscoveryName;
|
|
331
|
+
}
|
|
332
|
+
|
|
333
|
+
function preferDiscoveryLimit(discoveryLimit: number, fallbackLimit: number): number {
|
|
334
|
+
if (!Number.isFinite(discoveryLimit) || discoveryLimit <= 0) {
|
|
335
|
+
return fallbackLimit;
|
|
336
|
+
}
|
|
337
|
+
if (discoveryLimit === 4096 && fallbackLimit > discoveryLimit) {
|
|
338
|
+
return fallbackLimit;
|
|
339
|
+
}
|
|
340
|
+
return discoveryLimit;
|
|
341
|
+
}
|
|
342
|
+
|
|
343
|
+
function normalizeModelList<TApi extends Api>(value: unknown): Model<TApi>[] {
|
|
344
|
+
if (!Array.isArray(value)) {
|
|
345
|
+
return [];
|
|
346
|
+
}
|
|
347
|
+
const models: Model<TApi>[] = [];
|
|
348
|
+
for (const item of value) {
|
|
349
|
+
if (isModelLike(item)) {
|
|
350
|
+
models.push(enrichModelThinking(item as Model<TApi>));
|
|
351
|
+
}
|
|
352
|
+
}
|
|
353
|
+
return models;
|
|
354
|
+
}
|
|
355
|
+
|
|
356
|
+
function isModelLike(value: unknown): value is Model<Api> {
|
|
357
|
+
if (!isRecord(value)) {
|
|
358
|
+
return false;
|
|
359
|
+
}
|
|
360
|
+
const v = value as {
|
|
361
|
+
id?: unknown;
|
|
362
|
+
name?: unknown;
|
|
363
|
+
api?: unknown;
|
|
364
|
+
provider?: unknown;
|
|
365
|
+
baseUrl?: unknown;
|
|
366
|
+
reasoning?: unknown;
|
|
367
|
+
input?: unknown;
|
|
368
|
+
cost?: unknown;
|
|
369
|
+
contextWindow?: unknown;
|
|
370
|
+
maxTokens?: unknown;
|
|
371
|
+
};
|
|
372
|
+
if (typeof v.id !== "string" || v.id.length === 0) {
|
|
373
|
+
return false;
|
|
374
|
+
}
|
|
375
|
+
if (typeof v.name !== "string" || v.name.length === 0) {
|
|
376
|
+
return false;
|
|
377
|
+
}
|
|
378
|
+
if (typeof v.api !== "string" || v.api.length === 0) {
|
|
379
|
+
return false;
|
|
380
|
+
}
|
|
381
|
+
if (typeof v.provider !== "string" || v.provider.length === 0) {
|
|
382
|
+
return false;
|
|
383
|
+
}
|
|
384
|
+
if (typeof v.baseUrl !== "string" || v.baseUrl.length === 0) {
|
|
385
|
+
return false;
|
|
386
|
+
}
|
|
387
|
+
if (typeof v.reasoning !== "boolean") {
|
|
388
|
+
return false;
|
|
389
|
+
}
|
|
390
|
+
if (!isModelInputArray(v.input)) {
|
|
391
|
+
return false;
|
|
392
|
+
}
|
|
393
|
+
if (!isModelCost(v.cost)) {
|
|
394
|
+
return false;
|
|
395
|
+
}
|
|
396
|
+
// Finite positive: NaN > 0 is false, +Infinity < Infinity is false.
|
|
397
|
+
const cw = v.contextWindow;
|
|
398
|
+
if (typeof cw !== "number" || !(cw > 0 && cw < Infinity)) {
|
|
399
|
+
return false;
|
|
400
|
+
}
|
|
401
|
+
const mt = v.maxTokens;
|
|
402
|
+
if (typeof mt !== "number" || !(mt > 0 && mt < Infinity)) {
|
|
403
|
+
return false;
|
|
404
|
+
}
|
|
405
|
+
return true;
|
|
406
|
+
}
|
|
407
|
+
|
|
408
|
+
function isModelInputArray(value: unknown): value is ("text" | "image")[] {
|
|
409
|
+
if (!Array.isArray(value) || value.length === 0) {
|
|
410
|
+
return false;
|
|
411
|
+
}
|
|
412
|
+
for (let i = 0; i < value.length; i++) {
|
|
413
|
+
const item = value[i];
|
|
414
|
+
if (item !== "text" && item !== "image") {
|
|
415
|
+
return false;
|
|
416
|
+
}
|
|
417
|
+
}
|
|
418
|
+
return true;
|
|
419
|
+
}
|
|
420
|
+
|
|
421
|
+
function isModelCost(value: unknown): value is Model<Api>["cost"] {
|
|
422
|
+
if (!isRecord(value)) {
|
|
423
|
+
return false;
|
|
424
|
+
}
|
|
425
|
+
const c = value as {
|
|
426
|
+
input?: unknown;
|
|
427
|
+
output?: unknown;
|
|
428
|
+
cacheRead?: unknown;
|
|
429
|
+
cacheWrite?: unknown;
|
|
430
|
+
};
|
|
431
|
+
// Finite (NaN-safe): -Infinity < x < Infinity rejects NaN and both infinities.
|
|
432
|
+
// Preserves original behavior: 0 and negatives remain valid.
|
|
433
|
+
const ci = c.input;
|
|
434
|
+
if (typeof ci !== "number" || !(ci > -Infinity && ci < Infinity)) {
|
|
435
|
+
return false;
|
|
436
|
+
}
|
|
437
|
+
const co = c.output;
|
|
438
|
+
if (typeof co !== "number" || !(co > -Infinity && co < Infinity)) {
|
|
439
|
+
return false;
|
|
440
|
+
}
|
|
441
|
+
const cr = c.cacheRead;
|
|
442
|
+
if (typeof cr !== "number" || !(cr > -Infinity && cr < Infinity)) {
|
|
443
|
+
return false;
|
|
444
|
+
}
|
|
445
|
+
const cw = c.cacheWrite;
|
|
446
|
+
if (typeof cw !== "number" || !(cw > -Infinity && cw < Infinity)) {
|
|
447
|
+
return false;
|
|
448
|
+
}
|
|
449
|
+
return true;
|
|
450
|
+
}
|