@gajae-code/ai 0.1.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (349) hide show
  1. package/CHANGELOG.md +2644 -0
  2. package/README.md +1181 -0
  3. package/dist/types/api-registry.d.ts +30 -0
  4. package/dist/types/auth-broker/client.d.ts +66 -0
  5. package/dist/types/auth-broker/index.d.ts +5 -0
  6. package/dist/types/auth-broker/refresher.d.ts +25 -0
  7. package/dist/types/auth-broker/remote-store.d.ts +96 -0
  8. package/dist/types/auth-broker/server.d.ts +32 -0
  9. package/dist/types/auth-broker/types.d.ts +105 -0
  10. package/dist/types/auth-broker/wire-schemas.d.ts +412 -0
  11. package/dist/types/auth-gateway/http.d.ts +39 -0
  12. package/dist/types/auth-gateway/index.d.ts +3 -0
  13. package/dist/types/auth-gateway/server.d.ts +17 -0
  14. package/dist/types/auth-gateway/types.d.ts +115 -0
  15. package/dist/types/auth-storage.d.ts +641 -0
  16. package/dist/types/cli.d.ts +2 -0
  17. package/dist/types/index.d.ts +49 -0
  18. package/dist/types/model-cache.d.ts +17 -0
  19. package/dist/types/model-manager.d.ts +62 -0
  20. package/dist/types/model-thinking.d.ts +71 -0
  21. package/dist/types/models.d.ts +12 -0
  22. package/dist/types/provider-details.d.ts +24 -0
  23. package/dist/types/provider-models/bundled-references.d.ts +4 -0
  24. package/dist/types/provider-models/descriptors.d.ts +48 -0
  25. package/dist/types/provider-models/google.d.ts +20 -0
  26. package/dist/types/provider-models/index.d.ts +5 -0
  27. package/dist/types/provider-models/ollama.d.ts +7 -0
  28. package/dist/types/provider-models/openai-compat.d.ts +237 -0
  29. package/dist/types/provider-models/special.d.ts +16 -0
  30. package/dist/types/providers/amazon-bedrock.d.ts +36 -0
  31. package/dist/types/providers/anthropic-messages-server-schema.d.ts +450 -0
  32. package/dist/types/providers/anthropic-messages-server.d.ts +17 -0
  33. package/dist/types/providers/anthropic.d.ts +188 -0
  34. package/dist/types/providers/aws-credentials.d.ts +43 -0
  35. package/dist/types/providers/aws-eventstream.d.ts +38 -0
  36. package/dist/types/providers/aws-sigv4.d.ts +55 -0
  37. package/dist/types/providers/azure-openai-responses.d.ts +15 -0
  38. package/dist/types/providers/cursor/gen/agent_pb.d.ts +13022 -0
  39. package/dist/types/providers/cursor.d.ts +42 -0
  40. package/dist/types/providers/error-message.d.ts +27 -0
  41. package/dist/types/providers/github-copilot-headers.d.ts +40 -0
  42. package/dist/types/providers/gitlab-duo.d.ts +27 -0
  43. package/dist/types/providers/google-auth.d.ts +24 -0
  44. package/dist/types/providers/google-gemini-cli.d.ts +72 -0
  45. package/dist/types/providers/google-gemini-headers.d.ts +18 -0
  46. package/dist/types/providers/google-shared.d.ts +163 -0
  47. package/dist/types/providers/google-types.d.ts +138 -0
  48. package/dist/types/providers/google-vertex.d.ts +7 -0
  49. package/dist/types/providers/google.d.ts +4 -0
  50. package/dist/types/providers/grammar.d.ts +1 -0
  51. package/dist/types/providers/kimi.d.ts +27 -0
  52. package/dist/types/providers/mock.d.ts +175 -0
  53. package/dist/types/providers/ollama.d.ts +6 -0
  54. package/dist/types/providers/openai-anthropic-shim.d.ts +31 -0
  55. package/dist/types/providers/openai-chat-server-schema.d.ts +814 -0
  56. package/dist/types/providers/openai-chat-server.d.ts +16 -0
  57. package/dist/types/providers/openai-codex/constants.d.ts +26 -0
  58. package/dist/types/providers/openai-codex/request-transformer.d.ts +49 -0
  59. package/dist/types/providers/openai-codex/response-handler.d.ts +17 -0
  60. package/dist/types/providers/openai-codex-responses.d.ts +67 -0
  61. package/dist/types/providers/openai-completions-compat.d.ts +25 -0
  62. package/dist/types/providers/openai-completions.d.ts +33 -0
  63. package/dist/types/providers/openai-responses-server-schema.d.ts +392 -0
  64. package/dist/types/providers/openai-responses-server.d.ts +17 -0
  65. package/dist/types/providers/openai-responses-shared.d.ts +89 -0
  66. package/dist/types/providers/openai-responses.d.ts +32 -0
  67. package/dist/types/providers/pi-native-client.d.ts +13 -0
  68. package/dist/types/providers/pi-native-server.d.ts +68 -0
  69. package/dist/types/providers/register-builtins.d.ts +31 -0
  70. package/dist/types/providers/synthetic.d.ts +26 -0
  71. package/dist/types/providers/transform-messages.d.ts +12 -0
  72. package/dist/types/providers/vision-guard.d.ts +8 -0
  73. package/dist/types/rate-limit-utils.d.ts +19 -0
  74. package/dist/types/stream.d.ts +24 -0
  75. package/dist/types/types.d.ts +746 -0
  76. package/dist/types/usage/claude.d.ts +3 -0
  77. package/dist/types/usage/gemini.d.ts +2 -0
  78. package/dist/types/usage/github-copilot.d.ts +7 -0
  79. package/dist/types/usage/google-antigravity.d.ts +2 -0
  80. package/dist/types/usage/kimi.d.ts +2 -0
  81. package/dist/types/usage/minimax-code.d.ts +2 -0
  82. package/dist/types/usage/openai-codex.d.ts +3 -0
  83. package/dist/types/usage/shared.d.ts +1 -0
  84. package/dist/types/usage/zai.d.ts +2 -0
  85. package/dist/types/usage.d.ts +258 -0
  86. package/dist/types/utils/abort.d.ts +19 -0
  87. package/dist/types/utils/anthropic-auth.d.ts +31 -0
  88. package/dist/types/utils/discovery/antigravity.d.ts +61 -0
  89. package/dist/types/utils/discovery/codex.d.ts +38 -0
  90. package/dist/types/utils/discovery/cursor.d.ts +23 -0
  91. package/dist/types/utils/discovery/gemini.d.ts +25 -0
  92. package/dist/types/utils/discovery/index.d.ts +4 -0
  93. package/dist/types/utils/discovery/openai-compatible.d.ts +72 -0
  94. package/dist/types/utils/event-stream.d.ts +28 -0
  95. package/dist/types/utils/fireworks-model-id.d.ts +10 -0
  96. package/dist/types/utils/foundry.d.ts +1 -0
  97. package/dist/types/utils/h2-fetch.d.ts +22 -0
  98. package/dist/types/utils/http-inspector.d.ts +31 -0
  99. package/dist/types/utils/idle-iterator.d.ts +67 -0
  100. package/dist/types/utils/json-parse.d.ts +10 -0
  101. package/dist/types/utils/oauth/alibaba-coding-plan.d.ts +18 -0
  102. package/dist/types/utils/oauth/anthropic.d.ts +22 -0
  103. package/dist/types/utils/oauth/api-key-login.d.ts +35 -0
  104. package/dist/types/utils/oauth/api-key-validation.d.ts +27 -0
  105. package/dist/types/utils/oauth/callback-server.d.ts +57 -0
  106. package/dist/types/utils/oauth/cerebras.d.ts +1 -0
  107. package/dist/types/utils/oauth/cloudflare-ai-gateway.d.ts +18 -0
  108. package/dist/types/utils/oauth/cursor.d.ts +15 -0
  109. package/dist/types/utils/oauth/deepseek.d.ts +10 -0
  110. package/dist/types/utils/oauth/firepass.d.ts +1 -0
  111. package/dist/types/utils/oauth/fireworks.d.ts +1 -0
  112. package/dist/types/utils/oauth/github-copilot.d.ts +38 -0
  113. package/dist/types/utils/oauth/gitlab-duo.d.ts +3 -0
  114. package/dist/types/utils/oauth/google-antigravity.d.ts +11 -0
  115. package/dist/types/utils/oauth/google-gemini-cli.d.ts +10 -0
  116. package/dist/types/utils/oauth/google-oauth-shared.d.ts +28 -0
  117. package/dist/types/utils/oauth/huggingface.d.ts +19 -0
  118. package/dist/types/utils/oauth/index.d.ts +38 -0
  119. package/dist/types/utils/oauth/kagi.d.ts +17 -0
  120. package/dist/types/utils/oauth/kilo.d.ts +5 -0
  121. package/dist/types/utils/oauth/kimi.d.ts +21 -0
  122. package/dist/types/utils/oauth/litellm.d.ts +18 -0
  123. package/dist/types/utils/oauth/lm-studio.d.ts +17 -0
  124. package/dist/types/utils/oauth/minimax-code.d.ts +28 -0
  125. package/dist/types/utils/oauth/moonshot.d.ts +1 -0
  126. package/dist/types/utils/oauth/nanogpt.d.ts +1 -0
  127. package/dist/types/utils/oauth/nvidia.d.ts +18 -0
  128. package/dist/types/utils/oauth/ollama-cloud.d.ts +2 -0
  129. package/dist/types/utils/oauth/ollama.d.ts +18 -0
  130. package/dist/types/utils/oauth/openai-codex.d.ts +21 -0
  131. package/dist/types/utils/oauth/opencode.d.ts +18 -0
  132. package/dist/types/utils/oauth/parallel.d.ts +17 -0
  133. package/dist/types/utils/oauth/perplexity.d.ts +9 -0
  134. package/dist/types/utils/oauth/pkce.d.ts +8 -0
  135. package/dist/types/utils/oauth/qianfan.d.ts +17 -0
  136. package/dist/types/utils/oauth/qwen-portal.d.ts +19 -0
  137. package/dist/types/utils/oauth/synthetic.d.ts +1 -0
  138. package/dist/types/utils/oauth/tavily.d.ts +17 -0
  139. package/dist/types/utils/oauth/together.d.ts +1 -0
  140. package/dist/types/utils/oauth/types.d.ts +44 -0
  141. package/dist/types/utils/oauth/venice.d.ts +18 -0
  142. package/dist/types/utils/oauth/vercel-ai-gateway.d.ts +18 -0
  143. package/dist/types/utils/oauth/vllm.d.ts +16 -0
  144. package/dist/types/utils/oauth/xiaomi.d.ts +19 -0
  145. package/dist/types/utils/oauth/zai.d.ts +18 -0
  146. package/dist/types/utils/oauth/zenmux.d.ts +1 -0
  147. package/dist/types/utils/overflow.d.ts +54 -0
  148. package/dist/types/utils/parse-bind.d.ts +23 -0
  149. package/dist/types/utils/provider-response.d.ts +3 -0
  150. package/dist/types/utils/retry-after.d.ts +3 -0
  151. package/dist/types/utils/retry.d.ts +26 -0
  152. package/dist/types/utils/schema/adapt.d.ts +24 -0
  153. package/dist/types/utils/schema/compatibility.d.ts +30 -0
  154. package/dist/types/utils/schema/dereference.d.ts +11 -0
  155. package/dist/types/utils/schema/draft.d.ts +10 -0
  156. package/dist/types/utils/schema/equality.d.ts +4 -0
  157. package/dist/types/utils/schema/fields.d.ts +49 -0
  158. package/dist/types/utils/schema/index.d.ts +13 -0
  159. package/dist/types/utils/schema/json-schema-validator.d.ts +12 -0
  160. package/dist/types/utils/schema/meta-validator.d.ts +2 -0
  161. package/dist/types/utils/schema/normalize.d.ts +93 -0
  162. package/dist/types/utils/schema/spill.d.ts +8 -0
  163. package/dist/types/utils/schema/stamps.d.ts +25 -0
  164. package/dist/types/utils/schema/types.d.ts +4 -0
  165. package/dist/types/utils/schema/wire.d.ts +54 -0
  166. package/dist/types/utils/schema/zod-decontaminate.d.ts +31 -0
  167. package/dist/types/utils/sse-debug.d.ts +10 -0
  168. package/dist/types/utils/tool-call-healing.d.ts +71 -0
  169. package/dist/types/utils/tool-choice.d.ts +50 -0
  170. package/dist/types/utils/validation.d.ts +17 -0
  171. package/dist/types/utils.d.ts +28 -0
  172. package/package.json +146 -0
  173. package/src/api-registry.ts +96 -0
  174. package/src/auth-broker/client.ts +358 -0
  175. package/src/auth-broker/index.ts +5 -0
  176. package/src/auth-broker/refresher.ts +127 -0
  177. package/src/auth-broker/remote-store.ts +623 -0
  178. package/src/auth-broker/server.ts +644 -0
  179. package/src/auth-broker/types.ts +127 -0
  180. package/src/auth-broker/wire-schemas.ts +200 -0
  181. package/src/auth-gateway/http.ts +194 -0
  182. package/src/auth-gateway/index.ts +3 -0
  183. package/src/auth-gateway/server.ts +717 -0
  184. package/src/auth-gateway/types.ts +134 -0
  185. package/src/auth-storage.ts +4104 -0
  186. package/src/cli.ts +262 -0
  187. package/src/index.ts +54 -0
  188. package/src/model-cache.ts +129 -0
  189. package/src/model-manager.ts +450 -0
  190. package/src/model-thinking.ts +691 -0
  191. package/src/models.json +73853 -0
  192. package/src/models.json.d.ts +9 -0
  193. package/src/models.ts +56 -0
  194. package/src/prompts/turn-aborted-guidance.md +4 -0
  195. package/src/provider-details.ts +90 -0
  196. package/src/provider-models/bundled-references.ts +38 -0
  197. package/src/provider-models/descriptors.ts +308 -0
  198. package/src/provider-models/google.ts +91 -0
  199. package/src/provider-models/index.ts +5 -0
  200. package/src/provider-models/ollama.ts +153 -0
  201. package/src/provider-models/openai-compat.ts +2275 -0
  202. package/src/provider-models/special.ts +67 -0
  203. package/src/providers/amazon-bedrock.ts +849 -0
  204. package/src/providers/anthropic-messages-server-schema.ts +229 -0
  205. package/src/providers/anthropic-messages-server.ts +677 -0
  206. package/src/providers/anthropic.ts +2696 -0
  207. package/src/providers/aws-credentials.ts +501 -0
  208. package/src/providers/aws-eventstream.ts +185 -0
  209. package/src/providers/aws-sigv4.ts +218 -0
  210. package/src/providers/azure-openai-responses.ts +337 -0
  211. package/src/providers/cursor/gen/agent_pb.ts +15274 -0
  212. package/src/providers/cursor/proto/agent.proto +3526 -0
  213. package/src/providers/cursor/proto/buf.gen.yaml +6 -0
  214. package/src/providers/cursor/proto/buf.yaml +17 -0
  215. package/src/providers/cursor.ts +2561 -0
  216. package/src/providers/error-message.ts +21 -0
  217. package/src/providers/github-copilot-headers.ts +140 -0
  218. package/src/providers/gitlab-duo.ts +372 -0
  219. package/src/providers/google-auth.ts +252 -0
  220. package/src/providers/google-gemini-cli.ts +795 -0
  221. package/src/providers/google-gemini-headers.ts +41 -0
  222. package/src/providers/google-shared.ts +902 -0
  223. package/src/providers/google-types.ts +167 -0
  224. package/src/providers/google-vertex.ts +88 -0
  225. package/src/providers/google.ts +41 -0
  226. package/src/providers/grammar.ts +70 -0
  227. package/src/providers/kimi.ts +52 -0
  228. package/src/providers/mock.ts +500 -0
  229. package/src/providers/ollama.ts +544 -0
  230. package/src/providers/openai-anthropic-shim.ts +138 -0
  231. package/src/providers/openai-chat-server-schema.ts +243 -0
  232. package/src/providers/openai-chat-server.ts +628 -0
  233. package/src/providers/openai-codex/constants.ts +43 -0
  234. package/src/providers/openai-codex/request-transformer.ts +161 -0
  235. package/src/providers/openai-codex/response-handler.ts +81 -0
  236. package/src/providers/openai-codex-responses.ts +2598 -0
  237. package/src/providers/openai-completions-compat.ts +279 -0
  238. package/src/providers/openai-completions.ts +1853 -0
  239. package/src/providers/openai-responses-server-schema.ts +290 -0
  240. package/src/providers/openai-responses-server.ts +1183 -0
  241. package/src/providers/openai-responses-shared.ts +800 -0
  242. package/src/providers/openai-responses.ts +621 -0
  243. package/src/providers/pi-native-client.ts +228 -0
  244. package/src/providers/pi-native-server.ts +210 -0
  245. package/src/providers/register-builtins.ts +412 -0
  246. package/src/providers/synthetic.ts +50 -0
  247. package/src/providers/transform-messages.ts +309 -0
  248. package/src/providers/vision-guard.ts +31 -0
  249. package/src/rate-limit-utils.ts +84 -0
  250. package/src/stream.ts +895 -0
  251. package/src/types.ts +884 -0
  252. package/src/usage/claude.ts +431 -0
  253. package/src/usage/gemini.ts +250 -0
  254. package/src/usage/github-copilot.ts +421 -0
  255. package/src/usage/google-antigravity.ts +201 -0
  256. package/src/usage/kimi.ts +271 -0
  257. package/src/usage/minimax-code.ts +31 -0
  258. package/src/usage/openai-codex.ts +503 -0
  259. package/src/usage/shared.ts +10 -0
  260. package/src/usage/zai.ts +247 -0
  261. package/src/usage.ts +183 -0
  262. package/src/utils/abort.ts +51 -0
  263. package/src/utils/anthropic-auth.ts +87 -0
  264. package/src/utils/discovery/antigravity.ts +261 -0
  265. package/src/utils/discovery/codex.ts +371 -0
  266. package/src/utils/discovery/cursor.ts +306 -0
  267. package/src/utils/discovery/gemini.ts +248 -0
  268. package/src/utils/discovery/index.ts +4 -0
  269. package/src/utils/discovery/openai-compatible.ts +224 -0
  270. package/src/utils/event-stream.ts +142 -0
  271. package/src/utils/fireworks-model-id.ts +30 -0
  272. package/src/utils/foundry.ts +8 -0
  273. package/src/utils/h2-fetch.ts +60 -0
  274. package/src/utils/http-inspector.ts +176 -0
  275. package/src/utils/idle-iterator.ts +250 -0
  276. package/src/utils/json-parse.ts +148 -0
  277. package/src/utils/oauth/alibaba-coding-plan.ts +59 -0
  278. package/src/utils/oauth/anthropic.ts +200 -0
  279. package/src/utils/oauth/api-key-login.ts +87 -0
  280. package/src/utils/oauth/api-key-validation.ts +92 -0
  281. package/src/utils/oauth/callback-server.ts +276 -0
  282. package/src/utils/oauth/cerebras.ts +16 -0
  283. package/src/utils/oauth/cloudflare-ai-gateway.ts +48 -0
  284. package/src/utils/oauth/cursor.ts +157 -0
  285. package/src/utils/oauth/deepseek.ts +53 -0
  286. package/src/utils/oauth/firepass.ts +24 -0
  287. package/src/utils/oauth/fireworks.ts +15 -0
  288. package/src/utils/oauth/github-copilot.ts +362 -0
  289. package/src/utils/oauth/gitlab-duo.ts +123 -0
  290. package/src/utils/oauth/google-antigravity.ts +200 -0
  291. package/src/utils/oauth/google-gemini-cli.ts +256 -0
  292. package/src/utils/oauth/google-oauth-shared.ts +110 -0
  293. package/src/utils/oauth/huggingface.ts +62 -0
  294. package/src/utils/oauth/index.ts +444 -0
  295. package/src/utils/oauth/kagi.ts +47 -0
  296. package/src/utils/oauth/kilo.ts +87 -0
  297. package/src/utils/oauth/kimi.ts +254 -0
  298. package/src/utils/oauth/litellm.ts +47 -0
  299. package/src/utils/oauth/lm-studio.ts +38 -0
  300. package/src/utils/oauth/minimax-code.ts +78 -0
  301. package/src/utils/oauth/moonshot.ts +16 -0
  302. package/src/utils/oauth/nanogpt.ts +15 -0
  303. package/src/utils/oauth/nvidia.ts +70 -0
  304. package/src/utils/oauth/oauth.html +199 -0
  305. package/src/utils/oauth/ollama-cloud.ts +28 -0
  306. package/src/utils/oauth/ollama.ts +47 -0
  307. package/src/utils/oauth/openai-codex.ts +299 -0
  308. package/src/utils/oauth/opencode.ts +49 -0
  309. package/src/utils/oauth/parallel.ts +46 -0
  310. package/src/utils/oauth/perplexity.ts +206 -0
  311. package/src/utils/oauth/pkce.ts +18 -0
  312. package/src/utils/oauth/qianfan.ts +58 -0
  313. package/src/utils/oauth/qwen-portal.ts +60 -0
  314. package/src/utils/oauth/synthetic.ts +16 -0
  315. package/src/utils/oauth/tavily.ts +46 -0
  316. package/src/utils/oauth/together.ts +16 -0
  317. package/src/utils/oauth/types.ts +94 -0
  318. package/src/utils/oauth/venice.ts +59 -0
  319. package/src/utils/oauth/vercel-ai-gateway.ts +47 -0
  320. package/src/utils/oauth/vllm.ts +40 -0
  321. package/src/utils/oauth/xiaomi.ts +137 -0
  322. package/src/utils/oauth/zai.ts +60 -0
  323. package/src/utils/oauth/zenmux.ts +15 -0
  324. package/src/utils/overflow.ts +137 -0
  325. package/src/utils/parse-bind.ts +54 -0
  326. package/src/utils/provider-response.ts +30 -0
  327. package/src/utils/retry-after.ts +110 -0
  328. package/src/utils/retry.ts +54 -0
  329. package/src/utils/schema/CONSTRAINTS.md +164 -0
  330. package/src/utils/schema/adapt.ts +36 -0
  331. package/src/utils/schema/compatibility.ts +435 -0
  332. package/src/utils/schema/dereference.ts +98 -0
  333. package/src/utils/schema/draft.ts +341 -0
  334. package/src/utils/schema/equality.ts +97 -0
  335. package/src/utils/schema/fields.ts +190 -0
  336. package/src/utils/schema/index.ts +13 -0
  337. package/src/utils/schema/json-schema-validator.ts +577 -0
  338. package/src/utils/schema/meta-validator.ts +167 -0
  339. package/src/utils/schema/normalize.ts +1588 -0
  340. package/src/utils/schema/spill.ts +43 -0
  341. package/src/utils/schema/stamps.ts +97 -0
  342. package/src/utils/schema/types.ts +11 -0
  343. package/src/utils/schema/wire.ts +213 -0
  344. package/src/utils/schema/zod-decontaminate.ts +331 -0
  345. package/src/utils/sse-debug.ts +289 -0
  346. package/src/utils/tool-call-healing.ts +271 -0
  347. package/src/utils/tool-choice.ts +99 -0
  348. package/src/utils/validation.ts +1019 -0
  349. package/src/utils.ts +166 -0
@@ -0,0 +1,228 @@
1
+ /**
2
+ * Client half of the pi-native auth-gateway protocol.
3
+ *
4
+ * Dispatches a {@link streamSimple}-shaped request to an `gjc auth-gateway`
5
+ * via `POST /v1/pi/stream`, reads the SSE event stream back, and pushes the
6
+ * parsed events into a local {@link AssistantMessageEventStream} — the same
7
+ * stream type every other provider client produces. Callers downstream of
8
+ * `streamSimple` cannot tell whether the events came from a real provider
9
+ * SDK or from a gateway hop; they consume `AssistantMessageEvent`s either
10
+ * way.
11
+ *
12
+ * Activated when a {@link Model} has `transport: "pi-native"` set; the
13
+ * dispatch hook lives in `streamSimple()` (see `../stream.ts`). Used by
14
+ * containerized gjc deployments (robogjc slots, the swarm extension) that
15
+ * route every LLM call through a credential-holding sidecar so the slot
16
+ * itself stays credential-free.
17
+ */
18
+ import { readSseJson } from "@gajae-code/utils";
19
+ import type {
20
+ Api,
21
+ AssistantMessage,
22
+ AssistantMessageEvent,
23
+ AssistantMessageEventStream as AssistantMessageEventStreamType,
24
+ Context,
25
+ Model,
26
+ SimpleStreamOptions,
27
+ } from "../types";
28
+ import { AssistantMessageEventStream } from "../utils/event-stream";
29
+
30
+ /**
31
+ * Fields that must not cross the wire — either non-serializable (functions,
32
+ * `AbortSignal`, the provider-session `Map`) or server-controlled
33
+ * (`apiKey`, which the gateway injects from its own credential store; the
34
+ * client's `apiKey` is the gateway *bearer*, sent in the `Authorization`
35
+ * header rather than the request body).
36
+ */
37
+ const NON_WIRE_KEYS = new Set<keyof SimpleStreamOptions>([
38
+ "signal",
39
+ "apiKey",
40
+ "fetch",
41
+ "onPayload",
42
+ "onResponse",
43
+ "onSseEvent",
44
+ "execHandlers",
45
+ "cursorExecHandlers",
46
+ "cursorOnToolResult",
47
+ "providerSessionState",
48
+ ]);
49
+
50
+ function buildWireOptions(options: SimpleStreamOptions | undefined): Record<string, unknown> {
51
+ if (!options) return {};
52
+ const wire: Record<string, unknown> = {};
53
+ for (const [k, v] of Object.entries(options)) {
54
+ if (v === undefined) continue;
55
+ if (NON_WIRE_KEYS.has(k as keyof SimpleStreamOptions)) continue;
56
+ wire[k] = v;
57
+ }
58
+ return wire;
59
+ }
60
+
61
+ async function decodeGatewayError(response: Response): Promise<Error> {
62
+ const status = response.status;
63
+ let body: unknown;
64
+ try {
65
+ body = await response.json();
66
+ } catch {
67
+ body = await response.text().catch(() => "");
68
+ }
69
+ if (typeof body === "object" && body !== null && "error" in body) {
70
+ const err = (body as { error: unknown }).error;
71
+ if (typeof err === "object" && err !== null) {
72
+ const message = (err as { message?: unknown }).message;
73
+ const type = (err as { type?: unknown }).type;
74
+ const out = new Error(typeof message === "string" ? message : `auth-gateway ${status}`);
75
+ (out as { status?: number; type?: string }).status = status;
76
+ if (typeof type === "string") (out as { type?: string }).type = type;
77
+ return out;
78
+ }
79
+ }
80
+ const text = typeof body === "string" ? body : JSON.stringify(body);
81
+ const err = new Error(`auth-gateway ${status}: ${text || response.statusText}`);
82
+ (err as { status?: number }).status = status;
83
+ return err;
84
+ }
85
+
86
+ /**
87
+ * Resolve the `/v1/pi/stream` endpoint URL from the model's `baseUrl`.
88
+ * Trims a trailing slash so concatenation can't double-slash; throws when
89
+ * the baseUrl is missing (transport=pi-native without a gateway target is
90
+ * a configuration error, not a runtime recoverable one).
91
+ */
92
+ function resolveStreamUrl(model: Model<Api>): string {
93
+ if (!model.baseUrl) {
94
+ throw new Error(
95
+ `pi-native transport requires \`baseUrl\` on model ${model.id} (set it on the provider config in models.yml)`,
96
+ );
97
+ }
98
+ return `${model.baseUrl.replace(/\/+$/, "")}/v1/pi/stream`;
99
+ }
100
+
101
+ function buildHeaders(model: Model<Api>, apiKey: string | undefined): Record<string, string> {
102
+ const headers: Record<string, string> = {
103
+ "Content-Type": "application/json",
104
+ Accept: "text/event-stream",
105
+ ...(model.headers ?? {}),
106
+ };
107
+ if (apiKey && !headers.Authorization) {
108
+ headers.Authorization = `Bearer ${apiKey}`;
109
+ }
110
+ return headers;
111
+ }
112
+
113
+ /**
114
+ * Stream a turn through an `gjc auth-gateway` over the pi-native protocol.
115
+ *
116
+ * The returned {@link AssistantMessageEventStream} receives each parsed
117
+ * `AssistantMessageEvent` verbatim from the gateway; the terminal `done` /
118
+ * `error` event resolves `.result()` automatically via the base class's
119
+ * completion check. Non-streaming consumers just call `.result()` and pay
120
+ * for SSE framing they don't use — that overhead is dominated by provider
121
+ * latency, so we always stream rather than maintaining a parallel
122
+ * non-streaming path.
123
+ */
124
+ export function streamPiNative<TApi extends Api>(
125
+ model: Model<TApi>,
126
+ context: Context,
127
+ options?: SimpleStreamOptions,
128
+ ): AssistantMessageEventStreamType {
129
+ const stream = new AssistantMessageEventStream();
130
+
131
+ void (async () => {
132
+ const signal = options?.signal;
133
+ // Abort propagation: cancel the response body when the caller's signal
134
+ // fires. Mirror `streamProxy`'s shape — explicit listener + finally
135
+ // cleanup — so we don't leak listeners on the long-running case.
136
+ let response: Response | null = null;
137
+ const onAbort = (): void => {
138
+ const body = response?.body;
139
+ if (body) body.cancel("Request aborted by caller").catch(() => {});
140
+ };
141
+ if (signal) {
142
+ if (signal.aborted) {
143
+ stream.fail(signal.reason instanceof Error ? signal.reason : new Error(String(signal.reason ?? "aborted")));
144
+ return;
145
+ }
146
+ signal.addEventListener("abort", onAbort, { once: true });
147
+ }
148
+
149
+ try {
150
+ const url = resolveStreamUrl(model as Model<Api>);
151
+ const fetchImpl = options?.fetch ?? globalThis.fetch;
152
+ const headers = buildHeaders(model as Model<Api>, options?.apiKey);
153
+ const body = JSON.stringify({
154
+ modelId: model.id,
155
+ context,
156
+ options: buildWireOptions(options),
157
+ stream: true,
158
+ });
159
+
160
+ response = await fetchImpl(url, { method: "POST", headers, body, signal });
161
+ if (!response.ok) {
162
+ stream.fail(await decodeGatewayError(response));
163
+ return;
164
+ }
165
+ if (!response.body) {
166
+ stream.fail(new Error("auth-gateway returned empty body"));
167
+ return;
168
+ }
169
+
170
+ let sawTerminal = false;
171
+ for await (const event of readSseJson<AssistantMessageEvent>(
172
+ response.body as ReadableStream<Uint8Array>,
173
+ signal,
174
+ )) {
175
+ if (event.type === "done" || event.type === "error") sawTerminal = true;
176
+ stream.push(event);
177
+ // `stream.push` resolves `.result()` on `done`/`error`; subsequent
178
+ // pushes are silently dropped by the base class. We still iterate
179
+ // to drain any trailing bytes from the wire so the underlying TCP
180
+ // stream closes cleanly.
181
+ }
182
+
183
+ if (!sawTerminal) {
184
+ // SSE closed before a terminal event reached us — synthesize one
185
+ // so awaiters of `.result()` resolve instead of hanging forever.
186
+ // Matches the gateway's own defensive fallback in
187
+ // `pi-native-server.encodeStream`.
188
+ const aborted = signal?.aborted === true;
189
+ const partial = makeSyntheticAssistant(model as Model<Api>);
190
+ if (aborted) {
191
+ partial.stopReason = "aborted";
192
+ partial.errorMessage = "stream closed without terminal event";
193
+ stream.push({ type: "error", reason: "aborted", error: partial });
194
+ } else {
195
+ partial.stopReason = "stop";
196
+ stream.push({ type: "done", reason: "stop", message: partial });
197
+ }
198
+ }
199
+ stream.end();
200
+ } catch (err) {
201
+ stream.fail(err);
202
+ } finally {
203
+ if (signal) signal.removeEventListener("abort", onAbort);
204
+ }
205
+ })();
206
+
207
+ return stream;
208
+ }
209
+
210
+ function makeSyntheticAssistant(model: Model<Api>): AssistantMessage {
211
+ return {
212
+ role: "assistant",
213
+ content: [],
214
+ api: model.api,
215
+ provider: model.provider,
216
+ model: model.id,
217
+ usage: {
218
+ input: 0,
219
+ output: 0,
220
+ cacheRead: 0,
221
+ cacheWrite: 0,
222
+ totalTokens: 0,
223
+ cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0, total: 0 },
224
+ },
225
+ stopReason: "stop",
226
+ timestamp: Date.now(),
227
+ };
228
+ }
@@ -0,0 +1,210 @@
1
+ /**
2
+ * Pi-native wire format for the auth-gateway.
3
+ *
4
+ * Where the OpenAI / Anthropic / Responses route modules translate foreign
5
+ * wire shapes through pi-ai's canonical {@link Context}, this module accepts
6
+ * the canonical shape *directly* — for clients that already speak pi-ai
7
+ * (containerized gjc, the swarm extension, robogjc's sidecar auth-gateway).
8
+ * Skipping the wire-format → Context → wire-format round-trip cuts
9
+ * per-request CPU but, more importantly, avoids the quantization that those
10
+ * translations impose on first-class pi-ai fields (service tier, cache
11
+ * markers, thinking budgets, tool-choice variants, …).
12
+ *
13
+ * The streaming wire is {@link AssistantMessageEvent} serialized verbatim and
14
+ * SSE-framed. Same type pi-ai already produces internally; the client feeds
15
+ * each parsed event straight into `AssistantMessageEventStream.push()` with
16
+ * no translation. Including `partial: AssistantMessage` on every delta is
17
+ * O(N²) in turn length on the wire — acceptable for the loopback / sidecar
18
+ * topology this transport is designed for; provider latency dominates the
19
+ * actual cost.
20
+ *
21
+ * Endpoint contract:
22
+ * POST /v1/pi/stream
23
+ * body: { modelId, context, options?, stream? } // `stream` defaults to true
24
+ * 200 SSE: stream of `AssistantMessageEvent` (terminated by `data: [DONE]`)
25
+ * 200 JSON (stream=false): { message: AssistantMessage }
26
+ * 4xx/5xx: { error: { type, message } }
27
+ */
28
+ import type { AssistantMessageEventStream, Context, SimpleStreamOptions } from "../types";
29
+
30
+ export interface PiNativeParsedRequest {
31
+ modelId: string;
32
+ context: Context;
33
+ options: SimpleStreamOptions;
34
+ stream: boolean;
35
+ }
36
+ /**
37
+ * Subset of {@link SimpleStreamOptions} accepted from the wire. Function-valued
38
+ * fields (`fetch`, `onPayload`, `onResponse`, `onSseEvent`, exec handlers, the
39
+ * provider-session map) and gateway-owned controls (`apiKey`, `signal`) are
40
+ * intentionally absent — those are server-side concerns. Anything outside this
41
+ * allow-list is dropped silently rather than 400ing, so clients can forward
42
+ * `SimpleStreamOptions` from older / newer gjc builds without per-version
43
+ * conditionals.
44
+ */
45
+ const ALLOWED_OPTION_KEYS: ReadonlySet<keyof SimpleStreamOptions> = new Set([
46
+ "temperature",
47
+ "topP",
48
+ "topK",
49
+ "minP",
50
+ "presencePenalty",
51
+ "frequencyPenalty",
52
+ "repetitionPenalty",
53
+ "stopSequences",
54
+ "maxTokens",
55
+ "cacheRetention",
56
+ "headers",
57
+ "initiatorOverride",
58
+ "maxRetryDelayMs",
59
+ "metadata",
60
+ "sessionId",
61
+ "streamFirstEventTimeoutMs",
62
+ "streamIdleTimeoutMs",
63
+ "reasoning",
64
+ "disableReasoning",
65
+ "hideThinkingSummary",
66
+ "thinkingBudgets",
67
+ "toolChoice",
68
+ "serviceTier",
69
+ "kimiApiFormat",
70
+ "syntheticApiFormat",
71
+ "preferWebsockets",
72
+ ] as const satisfies readonly (keyof SimpleStreamOptions)[]);
73
+
74
+ // ---------------------------------------------------------------------------
75
+ // parseRequest
76
+ // ---------------------------------------------------------------------------
77
+
78
+ /**
79
+ * Parse a pi-native request body. Validation is intentionally minimal — only
80
+ * the shape the gateway itself reads is checked (`modelId`, `context.messages`
81
+ * array, options is an object). Everything downstream is the canonical pi-ai
82
+ * type surface; mis-shaped values surface as a `502 upstream_error` from
83
+ * `streamSimple` rather than being re-validated here.
84
+ *
85
+ * Accepts both `{ modelId: string }` and `{ model: { id: string } }` so the
86
+ * existing `streamProxy` client (which sends the full Model object) can target
87
+ * the gateway with only a URL swap.
88
+ */
89
+ export function parseRequest(body: unknown, _headers?: Headers): PiNativeParsedRequest {
90
+ if (typeof body !== "object" || body === null || Array.isArray(body)) {
91
+ throw new Error("Request body must be a JSON object");
92
+ }
93
+ const obj = body as Record<string, unknown>;
94
+
95
+ let modelId: string | undefined;
96
+ if (typeof obj.modelId === "string" && obj.modelId.length > 0) {
97
+ modelId = obj.modelId;
98
+ } else if (typeof obj.model === "string" && obj.model.length > 0) {
99
+ modelId = obj.model;
100
+ } else if (typeof obj.model === "object" && obj.model !== null) {
101
+ const m = obj.model as Record<string, unknown>;
102
+ if (typeof m.id === "string" && m.id.length > 0) modelId = m.id;
103
+ }
104
+ if (!modelId) throw new Error("Missing `modelId` (or `model.id`) field");
105
+
106
+ const context = obj.context;
107
+ if (typeof context !== "object" || context === null || Array.isArray(context)) {
108
+ throw new Error("Missing `context` object");
109
+ }
110
+ const ctxObj = context as Record<string, unknown>;
111
+ if (!Array.isArray(ctxObj.messages)) {
112
+ throw new Error("`context.messages` must be an array");
113
+ }
114
+ if (ctxObj.systemPrompt !== undefined && !Array.isArray(ctxObj.systemPrompt)) {
115
+ throw new Error("`context.systemPrompt` must be an array of strings when present");
116
+ }
117
+ if (ctxObj.tools !== undefined && !Array.isArray(ctxObj.tools)) {
118
+ throw new Error("`context.tools` must be an array when present");
119
+ }
120
+
121
+ const options: SimpleStreamOptions = {};
122
+ const rawOpts = obj.options;
123
+ if (typeof rawOpts === "object" && rawOpts !== null && !Array.isArray(rawOpts)) {
124
+ const optsBag = options as Record<string, unknown>;
125
+ for (const [k, v] of Object.entries(rawOpts)) {
126
+ if (v === undefined || v === null) continue;
127
+ if (!ALLOWED_OPTION_KEYS.has(k as keyof SimpleStreamOptions)) continue;
128
+ optsBag[k] = v;
129
+ }
130
+ }
131
+
132
+ // `stream` defaults to true — pi-native clients overwhelmingly stream, and
133
+ // matching `streamProxy`'s implicit-stream behavior avoids a one-flag papercut.
134
+ const stream = typeof obj.stream === "boolean" ? obj.stream : true;
135
+
136
+ return {
137
+ modelId,
138
+ context: context as Context,
139
+ options,
140
+ stream,
141
+ };
142
+ }
143
+ // ---------------------------------------------------------------------------
144
+ // encodeStream (SSE)
145
+ // ---------------------------------------------------------------------------
146
+
147
+ const SSE_ENCODER = new TextEncoder();
148
+ const SSE_DONE = SSE_ENCODER.encode("data: [DONE]\n\n");
149
+
150
+ /**
151
+ * Ship every {@link AssistantMessageEvent} verbatim, SSE-framed.
152
+ *
153
+ * No per-event re-shaping: the pi-native client is pi-ai itself, so the
154
+ * canonical event type IS the wire type. Including the rolling
155
+ * `partial: AssistantMessage` on every delta is quadratic in turn length
156
+ * on the wire, but for the loopback / sidecar topology this transport
157
+ * targets (containerized gjc → host gateway, robogjc slot → gjc-auth-gateway
158
+ * sidecar) the bandwidth cost is negligible compared to provider latency —
159
+ * and the client gets to feed the events straight into its existing
160
+ * `AssistantMessageEventStream.push()` plumbing with zero translation.
161
+ */
162
+ export function encodeStream(events: AssistantMessageEventStream): ReadableStream<Uint8Array> {
163
+ return new ReadableStream<Uint8Array>({
164
+ async start(controller) {
165
+ try {
166
+ for await (const event of events) {
167
+ controller.enqueue(SSE_ENCODER.encode(`data: ${JSON.stringify(event)}\n\n`));
168
+ if (event.type === "done" || event.type === "error") break;
169
+ }
170
+ controller.enqueue(SSE_DONE);
171
+ controller.close();
172
+ } catch (err) {
173
+ // Best-effort error envelope so the client iterator resolves
174
+ // instead of hanging on the dropped connection. Shape matches the
175
+ // canonical `error` event minus the unrecoverable `error:
176
+ // AssistantMessage` payload (we don't have a usable one here).
177
+ const message = err instanceof Error ? err.message : String(err);
178
+ controller.enqueue(
179
+ SSE_ENCODER.encode(
180
+ `data: ${JSON.stringify({ type: "error", reason: "error", errorMessage: message })}\n\n`,
181
+ ),
182
+ );
183
+ controller.enqueue(SSE_DONE);
184
+ controller.close();
185
+ }
186
+ },
187
+ });
188
+ }
189
+
190
+ // ---------------------------------------------------------------------------
191
+ // formatError
192
+ // ---------------------------------------------------------------------------
193
+
194
+ /**
195
+ * Pi-native error envelope:
196
+ * `{ error: { type, message } }`
197
+ *
198
+ * Mirrors OpenAI's outer shape (which clients/SDKs already parse) without the
199
+ * provider-specific status taxonomy — pi-native callers consume `type`
200
+ * directly.
201
+ */
202
+ export function formatError(status: number, type: string, message: string): Response {
203
+ return new Response(JSON.stringify({ error: { type, message } }), {
204
+ status,
205
+ headers: {
206
+ "Content-Type": "application/json; charset=utf-8",
207
+ "Cache-Control": "no-store",
208
+ },
209
+ });
210
+ }