@gajae-code/ai 0.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +2644 -0
- package/README.md +1181 -0
- package/dist/types/api-registry.d.ts +30 -0
- package/dist/types/auth-broker/client.d.ts +66 -0
- package/dist/types/auth-broker/index.d.ts +5 -0
- package/dist/types/auth-broker/refresher.d.ts +25 -0
- package/dist/types/auth-broker/remote-store.d.ts +96 -0
- package/dist/types/auth-broker/server.d.ts +32 -0
- package/dist/types/auth-broker/types.d.ts +105 -0
- package/dist/types/auth-broker/wire-schemas.d.ts +412 -0
- package/dist/types/auth-gateway/http.d.ts +39 -0
- package/dist/types/auth-gateway/index.d.ts +3 -0
- package/dist/types/auth-gateway/server.d.ts +17 -0
- package/dist/types/auth-gateway/types.d.ts +115 -0
- package/dist/types/auth-storage.d.ts +641 -0
- package/dist/types/cli.d.ts +2 -0
- package/dist/types/index.d.ts +49 -0
- package/dist/types/model-cache.d.ts +17 -0
- package/dist/types/model-manager.d.ts +62 -0
- package/dist/types/model-thinking.d.ts +71 -0
- package/dist/types/models.d.ts +12 -0
- package/dist/types/provider-details.d.ts +24 -0
- package/dist/types/provider-models/bundled-references.d.ts +4 -0
- package/dist/types/provider-models/descriptors.d.ts +48 -0
- package/dist/types/provider-models/google.d.ts +20 -0
- package/dist/types/provider-models/index.d.ts +5 -0
- package/dist/types/provider-models/ollama.d.ts +7 -0
- package/dist/types/provider-models/openai-compat.d.ts +237 -0
- package/dist/types/provider-models/special.d.ts +16 -0
- package/dist/types/providers/amazon-bedrock.d.ts +36 -0
- package/dist/types/providers/anthropic-messages-server-schema.d.ts +450 -0
- package/dist/types/providers/anthropic-messages-server.d.ts +17 -0
- package/dist/types/providers/anthropic.d.ts +188 -0
- package/dist/types/providers/aws-credentials.d.ts +43 -0
- package/dist/types/providers/aws-eventstream.d.ts +38 -0
- package/dist/types/providers/aws-sigv4.d.ts +55 -0
- package/dist/types/providers/azure-openai-responses.d.ts +15 -0
- package/dist/types/providers/cursor/gen/agent_pb.d.ts +13022 -0
- package/dist/types/providers/cursor.d.ts +42 -0
- package/dist/types/providers/error-message.d.ts +27 -0
- package/dist/types/providers/github-copilot-headers.d.ts +40 -0
- package/dist/types/providers/gitlab-duo.d.ts +27 -0
- package/dist/types/providers/google-auth.d.ts +24 -0
- package/dist/types/providers/google-gemini-cli.d.ts +72 -0
- package/dist/types/providers/google-gemini-headers.d.ts +18 -0
- package/dist/types/providers/google-shared.d.ts +163 -0
- package/dist/types/providers/google-types.d.ts +138 -0
- package/dist/types/providers/google-vertex.d.ts +7 -0
- package/dist/types/providers/google.d.ts +4 -0
- package/dist/types/providers/grammar.d.ts +1 -0
- package/dist/types/providers/kimi.d.ts +27 -0
- package/dist/types/providers/mock.d.ts +175 -0
- package/dist/types/providers/ollama.d.ts +6 -0
- package/dist/types/providers/openai-anthropic-shim.d.ts +31 -0
- package/dist/types/providers/openai-chat-server-schema.d.ts +814 -0
- package/dist/types/providers/openai-chat-server.d.ts +16 -0
- package/dist/types/providers/openai-codex/constants.d.ts +26 -0
- package/dist/types/providers/openai-codex/request-transformer.d.ts +49 -0
- package/dist/types/providers/openai-codex/response-handler.d.ts +17 -0
- package/dist/types/providers/openai-codex-responses.d.ts +67 -0
- package/dist/types/providers/openai-completions-compat.d.ts +25 -0
- package/dist/types/providers/openai-completions.d.ts +33 -0
- package/dist/types/providers/openai-responses-server-schema.d.ts +392 -0
- package/dist/types/providers/openai-responses-server.d.ts +17 -0
- package/dist/types/providers/openai-responses-shared.d.ts +89 -0
- package/dist/types/providers/openai-responses.d.ts +32 -0
- package/dist/types/providers/pi-native-client.d.ts +13 -0
- package/dist/types/providers/pi-native-server.d.ts +68 -0
- package/dist/types/providers/register-builtins.d.ts +31 -0
- package/dist/types/providers/synthetic.d.ts +26 -0
- package/dist/types/providers/transform-messages.d.ts +12 -0
- package/dist/types/providers/vision-guard.d.ts +8 -0
- package/dist/types/rate-limit-utils.d.ts +19 -0
- package/dist/types/stream.d.ts +24 -0
- package/dist/types/types.d.ts +746 -0
- package/dist/types/usage/claude.d.ts +3 -0
- package/dist/types/usage/gemini.d.ts +2 -0
- package/dist/types/usage/github-copilot.d.ts +7 -0
- package/dist/types/usage/google-antigravity.d.ts +2 -0
- package/dist/types/usage/kimi.d.ts +2 -0
- package/dist/types/usage/minimax-code.d.ts +2 -0
- package/dist/types/usage/openai-codex.d.ts +3 -0
- package/dist/types/usage/shared.d.ts +1 -0
- package/dist/types/usage/zai.d.ts +2 -0
- package/dist/types/usage.d.ts +258 -0
- package/dist/types/utils/abort.d.ts +19 -0
- package/dist/types/utils/anthropic-auth.d.ts +31 -0
- package/dist/types/utils/discovery/antigravity.d.ts +61 -0
- package/dist/types/utils/discovery/codex.d.ts +38 -0
- package/dist/types/utils/discovery/cursor.d.ts +23 -0
- package/dist/types/utils/discovery/gemini.d.ts +25 -0
- package/dist/types/utils/discovery/index.d.ts +4 -0
- package/dist/types/utils/discovery/openai-compatible.d.ts +72 -0
- package/dist/types/utils/event-stream.d.ts +28 -0
- package/dist/types/utils/fireworks-model-id.d.ts +10 -0
- package/dist/types/utils/foundry.d.ts +1 -0
- package/dist/types/utils/h2-fetch.d.ts +22 -0
- package/dist/types/utils/http-inspector.d.ts +31 -0
- package/dist/types/utils/idle-iterator.d.ts +67 -0
- package/dist/types/utils/json-parse.d.ts +10 -0
- package/dist/types/utils/oauth/alibaba-coding-plan.d.ts +18 -0
- package/dist/types/utils/oauth/anthropic.d.ts +22 -0
- package/dist/types/utils/oauth/api-key-login.d.ts +35 -0
- package/dist/types/utils/oauth/api-key-validation.d.ts +27 -0
- package/dist/types/utils/oauth/callback-server.d.ts +57 -0
- package/dist/types/utils/oauth/cerebras.d.ts +1 -0
- package/dist/types/utils/oauth/cloudflare-ai-gateway.d.ts +18 -0
- package/dist/types/utils/oauth/cursor.d.ts +15 -0
- package/dist/types/utils/oauth/deepseek.d.ts +10 -0
- package/dist/types/utils/oauth/firepass.d.ts +1 -0
- package/dist/types/utils/oauth/fireworks.d.ts +1 -0
- package/dist/types/utils/oauth/github-copilot.d.ts +38 -0
- package/dist/types/utils/oauth/gitlab-duo.d.ts +3 -0
- package/dist/types/utils/oauth/google-antigravity.d.ts +11 -0
- package/dist/types/utils/oauth/google-gemini-cli.d.ts +10 -0
- package/dist/types/utils/oauth/google-oauth-shared.d.ts +28 -0
- package/dist/types/utils/oauth/huggingface.d.ts +19 -0
- package/dist/types/utils/oauth/index.d.ts +38 -0
- package/dist/types/utils/oauth/kagi.d.ts +17 -0
- package/dist/types/utils/oauth/kilo.d.ts +5 -0
- package/dist/types/utils/oauth/kimi.d.ts +21 -0
- package/dist/types/utils/oauth/litellm.d.ts +18 -0
- package/dist/types/utils/oauth/lm-studio.d.ts +17 -0
- package/dist/types/utils/oauth/minimax-code.d.ts +28 -0
- package/dist/types/utils/oauth/moonshot.d.ts +1 -0
- package/dist/types/utils/oauth/nanogpt.d.ts +1 -0
- package/dist/types/utils/oauth/nvidia.d.ts +18 -0
- package/dist/types/utils/oauth/ollama-cloud.d.ts +2 -0
- package/dist/types/utils/oauth/ollama.d.ts +18 -0
- package/dist/types/utils/oauth/openai-codex.d.ts +21 -0
- package/dist/types/utils/oauth/opencode.d.ts +18 -0
- package/dist/types/utils/oauth/parallel.d.ts +17 -0
- package/dist/types/utils/oauth/perplexity.d.ts +9 -0
- package/dist/types/utils/oauth/pkce.d.ts +8 -0
- package/dist/types/utils/oauth/qianfan.d.ts +17 -0
- package/dist/types/utils/oauth/qwen-portal.d.ts +19 -0
- package/dist/types/utils/oauth/synthetic.d.ts +1 -0
- package/dist/types/utils/oauth/tavily.d.ts +17 -0
- package/dist/types/utils/oauth/together.d.ts +1 -0
- package/dist/types/utils/oauth/types.d.ts +44 -0
- package/dist/types/utils/oauth/venice.d.ts +18 -0
- package/dist/types/utils/oauth/vercel-ai-gateway.d.ts +18 -0
- package/dist/types/utils/oauth/vllm.d.ts +16 -0
- package/dist/types/utils/oauth/xiaomi.d.ts +19 -0
- package/dist/types/utils/oauth/zai.d.ts +18 -0
- package/dist/types/utils/oauth/zenmux.d.ts +1 -0
- package/dist/types/utils/overflow.d.ts +54 -0
- package/dist/types/utils/parse-bind.d.ts +23 -0
- package/dist/types/utils/provider-response.d.ts +3 -0
- package/dist/types/utils/retry-after.d.ts +3 -0
- package/dist/types/utils/retry.d.ts +26 -0
- package/dist/types/utils/schema/adapt.d.ts +24 -0
- package/dist/types/utils/schema/compatibility.d.ts +30 -0
- package/dist/types/utils/schema/dereference.d.ts +11 -0
- package/dist/types/utils/schema/draft.d.ts +10 -0
- package/dist/types/utils/schema/equality.d.ts +4 -0
- package/dist/types/utils/schema/fields.d.ts +49 -0
- package/dist/types/utils/schema/index.d.ts +13 -0
- package/dist/types/utils/schema/json-schema-validator.d.ts +12 -0
- package/dist/types/utils/schema/meta-validator.d.ts +2 -0
- package/dist/types/utils/schema/normalize.d.ts +93 -0
- package/dist/types/utils/schema/spill.d.ts +8 -0
- package/dist/types/utils/schema/stamps.d.ts +25 -0
- package/dist/types/utils/schema/types.d.ts +4 -0
- package/dist/types/utils/schema/wire.d.ts +54 -0
- package/dist/types/utils/schema/zod-decontaminate.d.ts +31 -0
- package/dist/types/utils/sse-debug.d.ts +10 -0
- package/dist/types/utils/tool-call-healing.d.ts +71 -0
- package/dist/types/utils/tool-choice.d.ts +50 -0
- package/dist/types/utils/validation.d.ts +17 -0
- package/dist/types/utils.d.ts +28 -0
- package/package.json +146 -0
- package/src/api-registry.ts +96 -0
- package/src/auth-broker/client.ts +358 -0
- package/src/auth-broker/index.ts +5 -0
- package/src/auth-broker/refresher.ts +127 -0
- package/src/auth-broker/remote-store.ts +623 -0
- package/src/auth-broker/server.ts +644 -0
- package/src/auth-broker/types.ts +127 -0
- package/src/auth-broker/wire-schemas.ts +200 -0
- package/src/auth-gateway/http.ts +194 -0
- package/src/auth-gateway/index.ts +3 -0
- package/src/auth-gateway/server.ts +717 -0
- package/src/auth-gateway/types.ts +134 -0
- package/src/auth-storage.ts +4104 -0
- package/src/cli.ts +262 -0
- package/src/index.ts +54 -0
- package/src/model-cache.ts +129 -0
- package/src/model-manager.ts +450 -0
- package/src/model-thinking.ts +691 -0
- package/src/models.json +73853 -0
- package/src/models.json.d.ts +9 -0
- package/src/models.ts +56 -0
- package/src/prompts/turn-aborted-guidance.md +4 -0
- package/src/provider-details.ts +90 -0
- package/src/provider-models/bundled-references.ts +38 -0
- package/src/provider-models/descriptors.ts +308 -0
- package/src/provider-models/google.ts +91 -0
- package/src/provider-models/index.ts +5 -0
- package/src/provider-models/ollama.ts +153 -0
- package/src/provider-models/openai-compat.ts +2275 -0
- package/src/provider-models/special.ts +67 -0
- package/src/providers/amazon-bedrock.ts +849 -0
- package/src/providers/anthropic-messages-server-schema.ts +229 -0
- package/src/providers/anthropic-messages-server.ts +677 -0
- package/src/providers/anthropic.ts +2696 -0
- package/src/providers/aws-credentials.ts +501 -0
- package/src/providers/aws-eventstream.ts +185 -0
- package/src/providers/aws-sigv4.ts +218 -0
- package/src/providers/azure-openai-responses.ts +337 -0
- package/src/providers/cursor/gen/agent_pb.ts +15274 -0
- package/src/providers/cursor/proto/agent.proto +3526 -0
- package/src/providers/cursor/proto/buf.gen.yaml +6 -0
- package/src/providers/cursor/proto/buf.yaml +17 -0
- package/src/providers/cursor.ts +2561 -0
- package/src/providers/error-message.ts +21 -0
- package/src/providers/github-copilot-headers.ts +140 -0
- package/src/providers/gitlab-duo.ts +372 -0
- package/src/providers/google-auth.ts +252 -0
- package/src/providers/google-gemini-cli.ts +795 -0
- package/src/providers/google-gemini-headers.ts +41 -0
- package/src/providers/google-shared.ts +902 -0
- package/src/providers/google-types.ts +167 -0
- package/src/providers/google-vertex.ts +88 -0
- package/src/providers/google.ts +41 -0
- package/src/providers/grammar.ts +70 -0
- package/src/providers/kimi.ts +52 -0
- package/src/providers/mock.ts +500 -0
- package/src/providers/ollama.ts +544 -0
- package/src/providers/openai-anthropic-shim.ts +138 -0
- package/src/providers/openai-chat-server-schema.ts +243 -0
- package/src/providers/openai-chat-server.ts +628 -0
- package/src/providers/openai-codex/constants.ts +43 -0
- package/src/providers/openai-codex/request-transformer.ts +161 -0
- package/src/providers/openai-codex/response-handler.ts +81 -0
- package/src/providers/openai-codex-responses.ts +2598 -0
- package/src/providers/openai-completions-compat.ts +279 -0
- package/src/providers/openai-completions.ts +1853 -0
- package/src/providers/openai-responses-server-schema.ts +290 -0
- package/src/providers/openai-responses-server.ts +1183 -0
- package/src/providers/openai-responses-shared.ts +800 -0
- package/src/providers/openai-responses.ts +621 -0
- package/src/providers/pi-native-client.ts +228 -0
- package/src/providers/pi-native-server.ts +210 -0
- package/src/providers/register-builtins.ts +412 -0
- package/src/providers/synthetic.ts +50 -0
- package/src/providers/transform-messages.ts +309 -0
- package/src/providers/vision-guard.ts +31 -0
- package/src/rate-limit-utils.ts +84 -0
- package/src/stream.ts +895 -0
- package/src/types.ts +884 -0
- package/src/usage/claude.ts +431 -0
- package/src/usage/gemini.ts +250 -0
- package/src/usage/github-copilot.ts +421 -0
- package/src/usage/google-antigravity.ts +201 -0
- package/src/usage/kimi.ts +271 -0
- package/src/usage/minimax-code.ts +31 -0
- package/src/usage/openai-codex.ts +503 -0
- package/src/usage/shared.ts +10 -0
- package/src/usage/zai.ts +247 -0
- package/src/usage.ts +183 -0
- package/src/utils/abort.ts +51 -0
- package/src/utils/anthropic-auth.ts +87 -0
- package/src/utils/discovery/antigravity.ts +261 -0
- package/src/utils/discovery/codex.ts +371 -0
- package/src/utils/discovery/cursor.ts +306 -0
- package/src/utils/discovery/gemini.ts +248 -0
- package/src/utils/discovery/index.ts +4 -0
- package/src/utils/discovery/openai-compatible.ts +224 -0
- package/src/utils/event-stream.ts +142 -0
- package/src/utils/fireworks-model-id.ts +30 -0
- package/src/utils/foundry.ts +8 -0
- package/src/utils/h2-fetch.ts +60 -0
- package/src/utils/http-inspector.ts +176 -0
- package/src/utils/idle-iterator.ts +250 -0
- package/src/utils/json-parse.ts +148 -0
- package/src/utils/oauth/alibaba-coding-plan.ts +59 -0
- package/src/utils/oauth/anthropic.ts +200 -0
- package/src/utils/oauth/api-key-login.ts +87 -0
- package/src/utils/oauth/api-key-validation.ts +92 -0
- package/src/utils/oauth/callback-server.ts +276 -0
- package/src/utils/oauth/cerebras.ts +16 -0
- package/src/utils/oauth/cloudflare-ai-gateway.ts +48 -0
- package/src/utils/oauth/cursor.ts +157 -0
- package/src/utils/oauth/deepseek.ts +53 -0
- package/src/utils/oauth/firepass.ts +24 -0
- package/src/utils/oauth/fireworks.ts +15 -0
- package/src/utils/oauth/github-copilot.ts +362 -0
- package/src/utils/oauth/gitlab-duo.ts +123 -0
- package/src/utils/oauth/google-antigravity.ts +200 -0
- package/src/utils/oauth/google-gemini-cli.ts +256 -0
- package/src/utils/oauth/google-oauth-shared.ts +110 -0
- package/src/utils/oauth/huggingface.ts +62 -0
- package/src/utils/oauth/index.ts +444 -0
- package/src/utils/oauth/kagi.ts +47 -0
- package/src/utils/oauth/kilo.ts +87 -0
- package/src/utils/oauth/kimi.ts +254 -0
- package/src/utils/oauth/litellm.ts +47 -0
- package/src/utils/oauth/lm-studio.ts +38 -0
- package/src/utils/oauth/minimax-code.ts +78 -0
- package/src/utils/oauth/moonshot.ts +16 -0
- package/src/utils/oauth/nanogpt.ts +15 -0
- package/src/utils/oauth/nvidia.ts +70 -0
- package/src/utils/oauth/oauth.html +199 -0
- package/src/utils/oauth/ollama-cloud.ts +28 -0
- package/src/utils/oauth/ollama.ts +47 -0
- package/src/utils/oauth/openai-codex.ts +299 -0
- package/src/utils/oauth/opencode.ts +49 -0
- package/src/utils/oauth/parallel.ts +46 -0
- package/src/utils/oauth/perplexity.ts +206 -0
- package/src/utils/oauth/pkce.ts +18 -0
- package/src/utils/oauth/qianfan.ts +58 -0
- package/src/utils/oauth/qwen-portal.ts +60 -0
- package/src/utils/oauth/synthetic.ts +16 -0
- package/src/utils/oauth/tavily.ts +46 -0
- package/src/utils/oauth/together.ts +16 -0
- package/src/utils/oauth/types.ts +94 -0
- package/src/utils/oauth/venice.ts +59 -0
- package/src/utils/oauth/vercel-ai-gateway.ts +47 -0
- package/src/utils/oauth/vllm.ts +40 -0
- package/src/utils/oauth/xiaomi.ts +137 -0
- package/src/utils/oauth/zai.ts +60 -0
- package/src/utils/oauth/zenmux.ts +15 -0
- package/src/utils/overflow.ts +137 -0
- package/src/utils/parse-bind.ts +54 -0
- package/src/utils/provider-response.ts +30 -0
- package/src/utils/retry-after.ts +110 -0
- package/src/utils/retry.ts +54 -0
- package/src/utils/schema/CONSTRAINTS.md +164 -0
- package/src/utils/schema/adapt.ts +36 -0
- package/src/utils/schema/compatibility.ts +435 -0
- package/src/utils/schema/dereference.ts +98 -0
- package/src/utils/schema/draft.ts +341 -0
- package/src/utils/schema/equality.ts +97 -0
- package/src/utils/schema/fields.ts +190 -0
- package/src/utils/schema/index.ts +13 -0
- package/src/utils/schema/json-schema-validator.ts +577 -0
- package/src/utils/schema/meta-validator.ts +167 -0
- package/src/utils/schema/normalize.ts +1588 -0
- package/src/utils/schema/spill.ts +43 -0
- package/src/utils/schema/stamps.ts +97 -0
- package/src/utils/schema/types.ts +11 -0
- package/src/utils/schema/wire.ts +213 -0
- package/src/utils/schema/zod-decontaminate.ts +331 -0
- package/src/utils/sse-debug.ts +289 -0
- package/src/utils/tool-call-healing.ts +271 -0
- package/src/utils/tool-choice.ts +99 -0
- package/src/utils/validation.ts +1019 -0
- package/src/utils.ts +166 -0
|
@@ -0,0 +1,228 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Client half of the pi-native auth-gateway protocol.
|
|
3
|
+
*
|
|
4
|
+
* Dispatches a {@link streamSimple}-shaped request to an `gjc auth-gateway`
|
|
5
|
+
* via `POST /v1/pi/stream`, reads the SSE event stream back, and pushes the
|
|
6
|
+
* parsed events into a local {@link AssistantMessageEventStream} — the same
|
|
7
|
+
* stream type every other provider client produces. Callers downstream of
|
|
8
|
+
* `streamSimple` cannot tell whether the events came from a real provider
|
|
9
|
+
* SDK or from a gateway hop; they consume `AssistantMessageEvent`s either
|
|
10
|
+
* way.
|
|
11
|
+
*
|
|
12
|
+
* Activated when a {@link Model} has `transport: "pi-native"` set; the
|
|
13
|
+
* dispatch hook lives in `streamSimple()` (see `../stream.ts`). Used by
|
|
14
|
+
* containerized gjc deployments (robogjc slots, the swarm extension) that
|
|
15
|
+
* route every LLM call through a credential-holding sidecar so the slot
|
|
16
|
+
* itself stays credential-free.
|
|
17
|
+
*/
|
|
18
|
+
import { readSseJson } from "@gajae-code/utils";
|
|
19
|
+
import type {
|
|
20
|
+
Api,
|
|
21
|
+
AssistantMessage,
|
|
22
|
+
AssistantMessageEvent,
|
|
23
|
+
AssistantMessageEventStream as AssistantMessageEventStreamType,
|
|
24
|
+
Context,
|
|
25
|
+
Model,
|
|
26
|
+
SimpleStreamOptions,
|
|
27
|
+
} from "../types";
|
|
28
|
+
import { AssistantMessageEventStream } from "../utils/event-stream";
|
|
29
|
+
|
|
30
|
+
/**
|
|
31
|
+
* Fields that must not cross the wire — either non-serializable (functions,
|
|
32
|
+
* `AbortSignal`, the provider-session `Map`) or server-controlled
|
|
33
|
+
* (`apiKey`, which the gateway injects from its own credential store; the
|
|
34
|
+
* client's `apiKey` is the gateway *bearer*, sent in the `Authorization`
|
|
35
|
+
* header rather than the request body).
|
|
36
|
+
*/
|
|
37
|
+
const NON_WIRE_KEYS = new Set<keyof SimpleStreamOptions>([
|
|
38
|
+
"signal",
|
|
39
|
+
"apiKey",
|
|
40
|
+
"fetch",
|
|
41
|
+
"onPayload",
|
|
42
|
+
"onResponse",
|
|
43
|
+
"onSseEvent",
|
|
44
|
+
"execHandlers",
|
|
45
|
+
"cursorExecHandlers",
|
|
46
|
+
"cursorOnToolResult",
|
|
47
|
+
"providerSessionState",
|
|
48
|
+
]);
|
|
49
|
+
|
|
50
|
+
function buildWireOptions(options: SimpleStreamOptions | undefined): Record<string, unknown> {
|
|
51
|
+
if (!options) return {};
|
|
52
|
+
const wire: Record<string, unknown> = {};
|
|
53
|
+
for (const [k, v] of Object.entries(options)) {
|
|
54
|
+
if (v === undefined) continue;
|
|
55
|
+
if (NON_WIRE_KEYS.has(k as keyof SimpleStreamOptions)) continue;
|
|
56
|
+
wire[k] = v;
|
|
57
|
+
}
|
|
58
|
+
return wire;
|
|
59
|
+
}
|
|
60
|
+
|
|
61
|
+
async function decodeGatewayError(response: Response): Promise<Error> {
|
|
62
|
+
const status = response.status;
|
|
63
|
+
let body: unknown;
|
|
64
|
+
try {
|
|
65
|
+
body = await response.json();
|
|
66
|
+
} catch {
|
|
67
|
+
body = await response.text().catch(() => "");
|
|
68
|
+
}
|
|
69
|
+
if (typeof body === "object" && body !== null && "error" in body) {
|
|
70
|
+
const err = (body as { error: unknown }).error;
|
|
71
|
+
if (typeof err === "object" && err !== null) {
|
|
72
|
+
const message = (err as { message?: unknown }).message;
|
|
73
|
+
const type = (err as { type?: unknown }).type;
|
|
74
|
+
const out = new Error(typeof message === "string" ? message : `auth-gateway ${status}`);
|
|
75
|
+
(out as { status?: number; type?: string }).status = status;
|
|
76
|
+
if (typeof type === "string") (out as { type?: string }).type = type;
|
|
77
|
+
return out;
|
|
78
|
+
}
|
|
79
|
+
}
|
|
80
|
+
const text = typeof body === "string" ? body : JSON.stringify(body);
|
|
81
|
+
const err = new Error(`auth-gateway ${status}: ${text || response.statusText}`);
|
|
82
|
+
(err as { status?: number }).status = status;
|
|
83
|
+
return err;
|
|
84
|
+
}
|
|
85
|
+
|
|
86
|
+
/**
|
|
87
|
+
* Resolve the `/v1/pi/stream` endpoint URL from the model's `baseUrl`.
|
|
88
|
+
* Trims a trailing slash so concatenation can't double-slash; throws when
|
|
89
|
+
* the baseUrl is missing (transport=pi-native without a gateway target is
|
|
90
|
+
* a configuration error, not a runtime recoverable one).
|
|
91
|
+
*/
|
|
92
|
+
function resolveStreamUrl(model: Model<Api>): string {
|
|
93
|
+
if (!model.baseUrl) {
|
|
94
|
+
throw new Error(
|
|
95
|
+
`pi-native transport requires \`baseUrl\` on model ${model.id} (set it on the provider config in models.yml)`,
|
|
96
|
+
);
|
|
97
|
+
}
|
|
98
|
+
return `${model.baseUrl.replace(/\/+$/, "")}/v1/pi/stream`;
|
|
99
|
+
}
|
|
100
|
+
|
|
101
|
+
function buildHeaders(model: Model<Api>, apiKey: string | undefined): Record<string, string> {
|
|
102
|
+
const headers: Record<string, string> = {
|
|
103
|
+
"Content-Type": "application/json",
|
|
104
|
+
Accept: "text/event-stream",
|
|
105
|
+
...(model.headers ?? {}),
|
|
106
|
+
};
|
|
107
|
+
if (apiKey && !headers.Authorization) {
|
|
108
|
+
headers.Authorization = `Bearer ${apiKey}`;
|
|
109
|
+
}
|
|
110
|
+
return headers;
|
|
111
|
+
}
|
|
112
|
+
|
|
113
|
+
/**
|
|
114
|
+
* Stream a turn through an `gjc auth-gateway` over the pi-native protocol.
|
|
115
|
+
*
|
|
116
|
+
* The returned {@link AssistantMessageEventStream} receives each parsed
|
|
117
|
+
* `AssistantMessageEvent` verbatim from the gateway; the terminal `done` /
|
|
118
|
+
* `error` event resolves `.result()` automatically via the base class's
|
|
119
|
+
* completion check. Non-streaming consumers just call `.result()` and pay
|
|
120
|
+
* for SSE framing they don't use — that overhead is dominated by provider
|
|
121
|
+
* latency, so we always stream rather than maintaining a parallel
|
|
122
|
+
* non-streaming path.
|
|
123
|
+
*/
|
|
124
|
+
export function streamPiNative<TApi extends Api>(
|
|
125
|
+
model: Model<TApi>,
|
|
126
|
+
context: Context,
|
|
127
|
+
options?: SimpleStreamOptions,
|
|
128
|
+
): AssistantMessageEventStreamType {
|
|
129
|
+
const stream = new AssistantMessageEventStream();
|
|
130
|
+
|
|
131
|
+
void (async () => {
|
|
132
|
+
const signal = options?.signal;
|
|
133
|
+
// Abort propagation: cancel the response body when the caller's signal
|
|
134
|
+
// fires. Mirror `streamProxy`'s shape — explicit listener + finally
|
|
135
|
+
// cleanup — so we don't leak listeners on the long-running case.
|
|
136
|
+
let response: Response | null = null;
|
|
137
|
+
const onAbort = (): void => {
|
|
138
|
+
const body = response?.body;
|
|
139
|
+
if (body) body.cancel("Request aborted by caller").catch(() => {});
|
|
140
|
+
};
|
|
141
|
+
if (signal) {
|
|
142
|
+
if (signal.aborted) {
|
|
143
|
+
stream.fail(signal.reason instanceof Error ? signal.reason : new Error(String(signal.reason ?? "aborted")));
|
|
144
|
+
return;
|
|
145
|
+
}
|
|
146
|
+
signal.addEventListener("abort", onAbort, { once: true });
|
|
147
|
+
}
|
|
148
|
+
|
|
149
|
+
try {
|
|
150
|
+
const url = resolveStreamUrl(model as Model<Api>);
|
|
151
|
+
const fetchImpl = options?.fetch ?? globalThis.fetch;
|
|
152
|
+
const headers = buildHeaders(model as Model<Api>, options?.apiKey);
|
|
153
|
+
const body = JSON.stringify({
|
|
154
|
+
modelId: model.id,
|
|
155
|
+
context,
|
|
156
|
+
options: buildWireOptions(options),
|
|
157
|
+
stream: true,
|
|
158
|
+
});
|
|
159
|
+
|
|
160
|
+
response = await fetchImpl(url, { method: "POST", headers, body, signal });
|
|
161
|
+
if (!response.ok) {
|
|
162
|
+
stream.fail(await decodeGatewayError(response));
|
|
163
|
+
return;
|
|
164
|
+
}
|
|
165
|
+
if (!response.body) {
|
|
166
|
+
stream.fail(new Error("auth-gateway returned empty body"));
|
|
167
|
+
return;
|
|
168
|
+
}
|
|
169
|
+
|
|
170
|
+
let sawTerminal = false;
|
|
171
|
+
for await (const event of readSseJson<AssistantMessageEvent>(
|
|
172
|
+
response.body as ReadableStream<Uint8Array>,
|
|
173
|
+
signal,
|
|
174
|
+
)) {
|
|
175
|
+
if (event.type === "done" || event.type === "error") sawTerminal = true;
|
|
176
|
+
stream.push(event);
|
|
177
|
+
// `stream.push` resolves `.result()` on `done`/`error`; subsequent
|
|
178
|
+
// pushes are silently dropped by the base class. We still iterate
|
|
179
|
+
// to drain any trailing bytes from the wire so the underlying TCP
|
|
180
|
+
// stream closes cleanly.
|
|
181
|
+
}
|
|
182
|
+
|
|
183
|
+
if (!sawTerminal) {
|
|
184
|
+
// SSE closed before a terminal event reached us — synthesize one
|
|
185
|
+
// so awaiters of `.result()` resolve instead of hanging forever.
|
|
186
|
+
// Matches the gateway's own defensive fallback in
|
|
187
|
+
// `pi-native-server.encodeStream`.
|
|
188
|
+
const aborted = signal?.aborted === true;
|
|
189
|
+
const partial = makeSyntheticAssistant(model as Model<Api>);
|
|
190
|
+
if (aborted) {
|
|
191
|
+
partial.stopReason = "aborted";
|
|
192
|
+
partial.errorMessage = "stream closed without terminal event";
|
|
193
|
+
stream.push({ type: "error", reason: "aborted", error: partial });
|
|
194
|
+
} else {
|
|
195
|
+
partial.stopReason = "stop";
|
|
196
|
+
stream.push({ type: "done", reason: "stop", message: partial });
|
|
197
|
+
}
|
|
198
|
+
}
|
|
199
|
+
stream.end();
|
|
200
|
+
} catch (err) {
|
|
201
|
+
stream.fail(err);
|
|
202
|
+
} finally {
|
|
203
|
+
if (signal) signal.removeEventListener("abort", onAbort);
|
|
204
|
+
}
|
|
205
|
+
})();
|
|
206
|
+
|
|
207
|
+
return stream;
|
|
208
|
+
}
|
|
209
|
+
|
|
210
|
+
function makeSyntheticAssistant(model: Model<Api>): AssistantMessage {
|
|
211
|
+
return {
|
|
212
|
+
role: "assistant",
|
|
213
|
+
content: [],
|
|
214
|
+
api: model.api,
|
|
215
|
+
provider: model.provider,
|
|
216
|
+
model: model.id,
|
|
217
|
+
usage: {
|
|
218
|
+
input: 0,
|
|
219
|
+
output: 0,
|
|
220
|
+
cacheRead: 0,
|
|
221
|
+
cacheWrite: 0,
|
|
222
|
+
totalTokens: 0,
|
|
223
|
+
cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0, total: 0 },
|
|
224
|
+
},
|
|
225
|
+
stopReason: "stop",
|
|
226
|
+
timestamp: Date.now(),
|
|
227
|
+
};
|
|
228
|
+
}
|
|
@@ -0,0 +1,210 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Pi-native wire format for the auth-gateway.
|
|
3
|
+
*
|
|
4
|
+
* Where the OpenAI / Anthropic / Responses route modules translate foreign
|
|
5
|
+
* wire shapes through pi-ai's canonical {@link Context}, this module accepts
|
|
6
|
+
* the canonical shape *directly* — for clients that already speak pi-ai
|
|
7
|
+
* (containerized gjc, the swarm extension, robogjc's sidecar auth-gateway).
|
|
8
|
+
* Skipping the wire-format → Context → wire-format round-trip cuts
|
|
9
|
+
* per-request CPU but, more importantly, avoids the quantization that those
|
|
10
|
+
* translations impose on first-class pi-ai fields (service tier, cache
|
|
11
|
+
* markers, thinking budgets, tool-choice variants, …).
|
|
12
|
+
*
|
|
13
|
+
* The streaming wire is {@link AssistantMessageEvent} serialized verbatim and
|
|
14
|
+
* SSE-framed. Same type pi-ai already produces internally; the client feeds
|
|
15
|
+
* each parsed event straight into `AssistantMessageEventStream.push()` with
|
|
16
|
+
* no translation. Including `partial: AssistantMessage` on every delta is
|
|
17
|
+
* O(N²) in turn length on the wire — acceptable for the loopback / sidecar
|
|
18
|
+
* topology this transport is designed for; provider latency dominates the
|
|
19
|
+
* actual cost.
|
|
20
|
+
*
|
|
21
|
+
* Endpoint contract:
|
|
22
|
+
* POST /v1/pi/stream
|
|
23
|
+
* body: { modelId, context, options?, stream? } // `stream` defaults to true
|
|
24
|
+
* 200 SSE: stream of `AssistantMessageEvent` (terminated by `data: [DONE]`)
|
|
25
|
+
* 200 JSON (stream=false): { message: AssistantMessage }
|
|
26
|
+
* 4xx/5xx: { error: { type, message } }
|
|
27
|
+
*/
|
|
28
|
+
import type { AssistantMessageEventStream, Context, SimpleStreamOptions } from "../types";
|
|
29
|
+
|
|
30
|
+
export interface PiNativeParsedRequest {
|
|
31
|
+
modelId: string;
|
|
32
|
+
context: Context;
|
|
33
|
+
options: SimpleStreamOptions;
|
|
34
|
+
stream: boolean;
|
|
35
|
+
}
|
|
36
|
+
/**
|
|
37
|
+
* Subset of {@link SimpleStreamOptions} accepted from the wire. Function-valued
|
|
38
|
+
* fields (`fetch`, `onPayload`, `onResponse`, `onSseEvent`, exec handlers, the
|
|
39
|
+
* provider-session map) and gateway-owned controls (`apiKey`, `signal`) are
|
|
40
|
+
* intentionally absent — those are server-side concerns. Anything outside this
|
|
41
|
+
* allow-list is dropped silently rather than 400ing, so clients can forward
|
|
42
|
+
* `SimpleStreamOptions` from older / newer gjc builds without per-version
|
|
43
|
+
* conditionals.
|
|
44
|
+
*/
|
|
45
|
+
const ALLOWED_OPTION_KEYS: ReadonlySet<keyof SimpleStreamOptions> = new Set([
|
|
46
|
+
"temperature",
|
|
47
|
+
"topP",
|
|
48
|
+
"topK",
|
|
49
|
+
"minP",
|
|
50
|
+
"presencePenalty",
|
|
51
|
+
"frequencyPenalty",
|
|
52
|
+
"repetitionPenalty",
|
|
53
|
+
"stopSequences",
|
|
54
|
+
"maxTokens",
|
|
55
|
+
"cacheRetention",
|
|
56
|
+
"headers",
|
|
57
|
+
"initiatorOverride",
|
|
58
|
+
"maxRetryDelayMs",
|
|
59
|
+
"metadata",
|
|
60
|
+
"sessionId",
|
|
61
|
+
"streamFirstEventTimeoutMs",
|
|
62
|
+
"streamIdleTimeoutMs",
|
|
63
|
+
"reasoning",
|
|
64
|
+
"disableReasoning",
|
|
65
|
+
"hideThinkingSummary",
|
|
66
|
+
"thinkingBudgets",
|
|
67
|
+
"toolChoice",
|
|
68
|
+
"serviceTier",
|
|
69
|
+
"kimiApiFormat",
|
|
70
|
+
"syntheticApiFormat",
|
|
71
|
+
"preferWebsockets",
|
|
72
|
+
] as const satisfies readonly (keyof SimpleStreamOptions)[]);
|
|
73
|
+
|
|
74
|
+
// ---------------------------------------------------------------------------
|
|
75
|
+
// parseRequest
|
|
76
|
+
// ---------------------------------------------------------------------------
|
|
77
|
+
|
|
78
|
+
/**
|
|
79
|
+
* Parse a pi-native request body. Validation is intentionally minimal — only
|
|
80
|
+
* the shape the gateway itself reads is checked (`modelId`, `context.messages`
|
|
81
|
+
* array, options is an object). Everything downstream is the canonical pi-ai
|
|
82
|
+
* type surface; mis-shaped values surface as a `502 upstream_error` from
|
|
83
|
+
* `streamSimple` rather than being re-validated here.
|
|
84
|
+
*
|
|
85
|
+
* Accepts both `{ modelId: string }` and `{ model: { id: string } }` so the
|
|
86
|
+
* existing `streamProxy` client (which sends the full Model object) can target
|
|
87
|
+
* the gateway with only a URL swap.
|
|
88
|
+
*/
|
|
89
|
+
export function parseRequest(body: unknown, _headers?: Headers): PiNativeParsedRequest {
|
|
90
|
+
if (typeof body !== "object" || body === null || Array.isArray(body)) {
|
|
91
|
+
throw new Error("Request body must be a JSON object");
|
|
92
|
+
}
|
|
93
|
+
const obj = body as Record<string, unknown>;
|
|
94
|
+
|
|
95
|
+
let modelId: string | undefined;
|
|
96
|
+
if (typeof obj.modelId === "string" && obj.modelId.length > 0) {
|
|
97
|
+
modelId = obj.modelId;
|
|
98
|
+
} else if (typeof obj.model === "string" && obj.model.length > 0) {
|
|
99
|
+
modelId = obj.model;
|
|
100
|
+
} else if (typeof obj.model === "object" && obj.model !== null) {
|
|
101
|
+
const m = obj.model as Record<string, unknown>;
|
|
102
|
+
if (typeof m.id === "string" && m.id.length > 0) modelId = m.id;
|
|
103
|
+
}
|
|
104
|
+
if (!modelId) throw new Error("Missing `modelId` (or `model.id`) field");
|
|
105
|
+
|
|
106
|
+
const context = obj.context;
|
|
107
|
+
if (typeof context !== "object" || context === null || Array.isArray(context)) {
|
|
108
|
+
throw new Error("Missing `context` object");
|
|
109
|
+
}
|
|
110
|
+
const ctxObj = context as Record<string, unknown>;
|
|
111
|
+
if (!Array.isArray(ctxObj.messages)) {
|
|
112
|
+
throw new Error("`context.messages` must be an array");
|
|
113
|
+
}
|
|
114
|
+
if (ctxObj.systemPrompt !== undefined && !Array.isArray(ctxObj.systemPrompt)) {
|
|
115
|
+
throw new Error("`context.systemPrompt` must be an array of strings when present");
|
|
116
|
+
}
|
|
117
|
+
if (ctxObj.tools !== undefined && !Array.isArray(ctxObj.tools)) {
|
|
118
|
+
throw new Error("`context.tools` must be an array when present");
|
|
119
|
+
}
|
|
120
|
+
|
|
121
|
+
const options: SimpleStreamOptions = {};
|
|
122
|
+
const rawOpts = obj.options;
|
|
123
|
+
if (typeof rawOpts === "object" && rawOpts !== null && !Array.isArray(rawOpts)) {
|
|
124
|
+
const optsBag = options as Record<string, unknown>;
|
|
125
|
+
for (const [k, v] of Object.entries(rawOpts)) {
|
|
126
|
+
if (v === undefined || v === null) continue;
|
|
127
|
+
if (!ALLOWED_OPTION_KEYS.has(k as keyof SimpleStreamOptions)) continue;
|
|
128
|
+
optsBag[k] = v;
|
|
129
|
+
}
|
|
130
|
+
}
|
|
131
|
+
|
|
132
|
+
// `stream` defaults to true — pi-native clients overwhelmingly stream, and
|
|
133
|
+
// matching `streamProxy`'s implicit-stream behavior avoids a one-flag papercut.
|
|
134
|
+
const stream = typeof obj.stream === "boolean" ? obj.stream : true;
|
|
135
|
+
|
|
136
|
+
return {
|
|
137
|
+
modelId,
|
|
138
|
+
context: context as Context,
|
|
139
|
+
options,
|
|
140
|
+
stream,
|
|
141
|
+
};
|
|
142
|
+
}
|
|
143
|
+
// ---------------------------------------------------------------------------
|
|
144
|
+
// encodeStream (SSE)
|
|
145
|
+
// ---------------------------------------------------------------------------
|
|
146
|
+
|
|
147
|
+
const SSE_ENCODER = new TextEncoder();
|
|
148
|
+
const SSE_DONE = SSE_ENCODER.encode("data: [DONE]\n\n");
|
|
149
|
+
|
|
150
|
+
/**
|
|
151
|
+
* Ship every {@link AssistantMessageEvent} verbatim, SSE-framed.
|
|
152
|
+
*
|
|
153
|
+
* No per-event re-shaping: the pi-native client is pi-ai itself, so the
|
|
154
|
+
* canonical event type IS the wire type. Including the rolling
|
|
155
|
+
* `partial: AssistantMessage` on every delta is quadratic in turn length
|
|
156
|
+
* on the wire, but for the loopback / sidecar topology this transport
|
|
157
|
+
* targets (containerized gjc → host gateway, robogjc slot → gjc-auth-gateway
|
|
158
|
+
* sidecar) the bandwidth cost is negligible compared to provider latency —
|
|
159
|
+
* and the client gets to feed the events straight into its existing
|
|
160
|
+
* `AssistantMessageEventStream.push()` plumbing with zero translation.
|
|
161
|
+
*/
|
|
162
|
+
export function encodeStream(events: AssistantMessageEventStream): ReadableStream<Uint8Array> {
|
|
163
|
+
return new ReadableStream<Uint8Array>({
|
|
164
|
+
async start(controller) {
|
|
165
|
+
try {
|
|
166
|
+
for await (const event of events) {
|
|
167
|
+
controller.enqueue(SSE_ENCODER.encode(`data: ${JSON.stringify(event)}\n\n`));
|
|
168
|
+
if (event.type === "done" || event.type === "error") break;
|
|
169
|
+
}
|
|
170
|
+
controller.enqueue(SSE_DONE);
|
|
171
|
+
controller.close();
|
|
172
|
+
} catch (err) {
|
|
173
|
+
// Best-effort error envelope so the client iterator resolves
|
|
174
|
+
// instead of hanging on the dropped connection. Shape matches the
|
|
175
|
+
// canonical `error` event minus the unrecoverable `error:
|
|
176
|
+
// AssistantMessage` payload (we don't have a usable one here).
|
|
177
|
+
const message = err instanceof Error ? err.message : String(err);
|
|
178
|
+
controller.enqueue(
|
|
179
|
+
SSE_ENCODER.encode(
|
|
180
|
+
`data: ${JSON.stringify({ type: "error", reason: "error", errorMessage: message })}\n\n`,
|
|
181
|
+
),
|
|
182
|
+
);
|
|
183
|
+
controller.enqueue(SSE_DONE);
|
|
184
|
+
controller.close();
|
|
185
|
+
}
|
|
186
|
+
},
|
|
187
|
+
});
|
|
188
|
+
}
|
|
189
|
+
|
|
190
|
+
// ---------------------------------------------------------------------------
|
|
191
|
+
// formatError
|
|
192
|
+
// ---------------------------------------------------------------------------
|
|
193
|
+
|
|
194
|
+
/**
|
|
195
|
+
* Pi-native error envelope:
|
|
196
|
+
* `{ error: { type, message } }`
|
|
197
|
+
*
|
|
198
|
+
* Mirrors OpenAI's outer shape (which clients/SDKs already parse) without the
|
|
199
|
+
* provider-specific status taxonomy — pi-native callers consume `type`
|
|
200
|
+
* directly.
|
|
201
|
+
*/
|
|
202
|
+
export function formatError(status: number, type: string, message: string): Response {
|
|
203
|
+
return new Response(JSON.stringify({ error: { type, message } }), {
|
|
204
|
+
status,
|
|
205
|
+
headers: {
|
|
206
|
+
"Content-Type": "application/json; charset=utf-8",
|
|
207
|
+
"Cache-Control": "no-store",
|
|
208
|
+
},
|
|
209
|
+
});
|
|
210
|
+
}
|