@aryee337/aery-ai 0.1.148 → 0.2.10

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (592) hide show
  1. package/CHANGELOG.md +2914 -0
  2. package/README.md +614 -813
  3. package/dist/types/api-registry.d.ts +30 -0
  4. package/dist/types/auth-broker/client.d.ts +66 -0
  5. package/dist/types/auth-broker/index.d.ts +5 -0
  6. package/dist/types/auth-broker/refresher.d.ts +25 -0
  7. package/dist/types/auth-broker/remote-store.d.ts +96 -0
  8. package/dist/types/auth-broker/server.d.ts +32 -0
  9. package/dist/types/auth-broker/types.d.ts +105 -0
  10. package/dist/types/auth-broker/wire-schemas.d.ts +412 -0
  11. package/dist/types/auth-gateway/http.d.ts +39 -0
  12. package/dist/types/auth-gateway/index.d.ts +3 -0
  13. package/dist/types/auth-gateway/server.d.ts +36 -0
  14. package/dist/types/auth-gateway/types.d.ts +117 -0
  15. package/dist/types/auth-storage.d.ts +739 -0
  16. package/dist/types/index.d.ts +49 -0
  17. package/dist/types/model-cache.d.ts +17 -0
  18. package/dist/types/model-manager.d.ts +64 -0
  19. package/dist/types/model-thinking.d.ts +100 -0
  20. package/dist/types/models.d.ts +12 -0
  21. package/dist/types/provider-details.d.ts +24 -0
  22. package/dist/types/provider-models/bundled-references.d.ts +4 -0
  23. package/dist/types/provider-models/descriptors.d.ts +50 -0
  24. package/dist/types/provider-models/google.d.ts +24 -0
  25. package/dist/types/provider-models/index.d.ts +5 -0
  26. package/dist/types/provider-models/ollama.d.ts +7 -0
  27. package/dist/types/provider-models/openai-compat.d.ts +296 -0
  28. package/dist/types/provider-models/special.d.ts +16 -0
  29. package/dist/types/providers/aery-native-client.d.ts +13 -0
  30. package/dist/types/providers/aery-native-server.d.ts +68 -0
  31. package/dist/types/providers/amazon-bedrock.d.ts +38 -0
  32. package/dist/types/providers/anthropic-client.d.ts +99 -0
  33. package/dist/types/providers/anthropic-messages-server-schema.d.ts +465 -0
  34. package/dist/types/providers/anthropic-messages-server.d.ts +17 -0
  35. package/dist/types/providers/anthropic-wire.d.ts +262 -0
  36. package/dist/types/providers/anthropic.d.ts +206 -0
  37. package/dist/types/providers/aws-credentials.d.ts +43 -0
  38. package/dist/types/providers/aws-eventstream.d.ts +38 -0
  39. package/dist/types/providers/aws-sigv4.d.ts +55 -0
  40. package/dist/types/providers/azure-openai-responses.d.ts +15 -0
  41. package/dist/types/providers/cursor/gen/agent_pb.d.ts +13022 -0
  42. package/dist/types/providers/cursor.d.ts +43 -0
  43. package/dist/types/providers/error-message.d.ts +27 -0
  44. package/dist/types/providers/github-copilot-headers.d.ts +40 -0
  45. package/dist/types/providers/gitlab-duo.d.ts +27 -0
  46. package/dist/types/providers/google-auth.d.ts +24 -0
  47. package/dist/types/providers/google-gemini-cli.d.ts +81 -0
  48. package/dist/types/providers/google-gemini-headers.d.ts +18 -0
  49. package/dist/types/providers/google-shared.d.ts +171 -0
  50. package/dist/types/providers/google-types.d.ts +138 -0
  51. package/dist/types/providers/google-vertex.d.ts +7 -0
  52. package/dist/types/providers/google.d.ts +4 -0
  53. package/dist/types/providers/grammar.d.ts +1 -0
  54. package/dist/types/providers/kimi.d.ts +27 -0
  55. package/dist/types/providers/mock.d.ts +173 -0
  56. package/dist/types/providers/ollama.d.ts +6 -0
  57. package/dist/types/providers/openai-anthropic-shim.d.ts +31 -0
  58. package/dist/types/providers/openai-chat-server-schema.d.ts +817 -0
  59. package/dist/types/providers/openai-chat-server.d.ts +16 -0
  60. package/dist/types/providers/openai-codex/constants.d.ts +26 -0
  61. package/dist/types/providers/openai-codex/request-transformer.d.ts +49 -0
  62. package/dist/types/providers/openai-codex/response-handler.d.ts +17 -0
  63. package/dist/types/providers/openai-codex-responses.d.ts +67 -0
  64. package/dist/types/providers/openai-completions-compat.d.ts +25 -0
  65. package/dist/types/providers/openai-completions.d.ts +54 -0
  66. package/dist/types/providers/openai-responses-server-schema.d.ts +392 -0
  67. package/dist/types/providers/openai-responses-server.d.ts +17 -0
  68. package/dist/types/providers/openai-responses-shared.d.ts +100 -0
  69. package/dist/types/providers/openai-responses.d.ts +66 -0
  70. package/dist/types/providers/register-builtins.d.ts +31 -0
  71. package/dist/types/providers/synthetic.d.ts +26 -0
  72. package/dist/{providers → types/providers}/transform-messages.d.ts +6 -2
  73. package/dist/types/providers/vision-guard.d.ts +8 -0
  74. package/dist/types/providers/xai-responses.d.ts +23 -0
  75. package/dist/types/rate-limit-utils.d.ts +19 -0
  76. package/dist/types/stream.d.ts +28 -0
  77. package/dist/types/types.d.ts +801 -0
  78. package/dist/types/usage/claude.d.ts +4 -0
  79. package/dist/types/usage/gemini.d.ts +2 -0
  80. package/dist/types/usage/github-copilot.d.ts +7 -0
  81. package/dist/types/usage/google-antigravity.d.ts +2 -0
  82. package/dist/types/usage/kimi.d.ts +2 -0
  83. package/dist/types/usage/minimax-code.d.ts +2 -0
  84. package/dist/types/usage/openai-codex.d.ts +3 -0
  85. package/dist/types/usage/shared.d.ts +1 -0
  86. package/dist/types/usage/zai.d.ts +2 -0
  87. package/dist/types/usage.d.ts +260 -0
  88. package/dist/types/utils/abort.d.ts +19 -0
  89. package/dist/types/utils/abortable-iterator.d.ts +4 -0
  90. package/dist/types/utils/anthropic-auth.d.ts +35 -0
  91. package/dist/types/utils/discovery/antigravity.d.ts +61 -0
  92. package/dist/types/utils/discovery/codex.d.ts +38 -0
  93. package/dist/types/utils/discovery/cursor.d.ts +23 -0
  94. package/dist/types/utils/discovery/gemini.d.ts +25 -0
  95. package/dist/types/utils/discovery/index.d.ts +4 -0
  96. package/dist/types/utils/discovery/openai-compatible.d.ts +72 -0
  97. package/dist/types/utils/event-stream.d.ts +28 -0
  98. package/dist/types/utils/fireworks-model-id.d.ts +10 -0
  99. package/dist/types/utils/foundry.d.ts +1 -0
  100. package/dist/types/utils/http-inspector.d.ts +31 -0
  101. package/dist/types/utils/idle-iterator.d.ts +78 -0
  102. package/dist/types/utils/json-parse.d.ts +37 -0
  103. package/dist/types/utils/oauth/__tests__/xai-oauth.test.d.ts +1 -0
  104. package/dist/types/utils/oauth/alibaba-coding-plan.d.ts +18 -0
  105. package/dist/types/utils/oauth/anthropic.d.ts +22 -0
  106. package/dist/types/utils/oauth/api-key-login.d.ts +35 -0
  107. package/dist/types/utils/oauth/api-key-validation.d.ts +27 -0
  108. package/dist/types/utils/oauth/callback-server.d.ts +57 -0
  109. package/dist/types/utils/oauth/cerebras.d.ts +1 -0
  110. package/dist/types/utils/oauth/cloudflare-ai-gateway.d.ts +18 -0
  111. package/dist/types/utils/oauth/cursor.d.ts +15 -0
  112. package/dist/types/utils/oauth/deepseek.d.ts +10 -0
  113. package/dist/types/utils/oauth/firepass.d.ts +1 -0
  114. package/dist/types/utils/oauth/fireworks.d.ts +1 -0
  115. package/dist/types/utils/oauth/github-copilot.d.ts +38 -0
  116. package/dist/types/utils/oauth/gitlab-duo.d.ts +3 -0
  117. package/dist/types/utils/oauth/google-antigravity.d.ts +11 -0
  118. package/dist/types/utils/oauth/google-gemini-cli.d.ts +10 -0
  119. package/dist/types/utils/oauth/google-oauth-shared.d.ts +28 -0
  120. package/dist/types/utils/oauth/huggingface.d.ts +19 -0
  121. package/dist/types/utils/oauth/index.d.ts +38 -0
  122. package/dist/types/utils/oauth/kagi.d.ts +17 -0
  123. package/dist/types/utils/oauth/kilo.d.ts +5 -0
  124. package/dist/types/utils/oauth/kimi.d.ts +21 -0
  125. package/dist/types/utils/oauth/litellm.d.ts +18 -0
  126. package/dist/types/utils/oauth/lm-studio.d.ts +17 -0
  127. package/dist/types/utils/oauth/minimax-code.d.ts +28 -0
  128. package/dist/types/utils/oauth/moonshot.d.ts +1 -0
  129. package/dist/types/utils/oauth/nanogpt.d.ts +1 -0
  130. package/dist/types/utils/oauth/nvidia.d.ts +18 -0
  131. package/dist/types/utils/oauth/ollama-cloud.d.ts +2 -0
  132. package/dist/types/utils/oauth/ollama.d.ts +18 -0
  133. package/dist/types/utils/oauth/openai-codex.d.ts +21 -0
  134. package/dist/types/utils/oauth/opencode.d.ts +18 -0
  135. package/dist/types/utils/oauth/openrouter.d.ts +1 -0
  136. package/dist/types/utils/oauth/parallel.d.ts +17 -0
  137. package/dist/types/utils/oauth/perplexity.d.ts +9 -0
  138. package/dist/{utils → types/utils}/oauth/pkce.d.ts +0 -5
  139. package/dist/types/utils/oauth/qianfan.d.ts +17 -0
  140. package/dist/types/utils/oauth/qwen-portal.d.ts +19 -0
  141. package/dist/types/utils/oauth/synthetic.d.ts +1 -0
  142. package/dist/types/utils/oauth/tavily.d.ts +17 -0
  143. package/dist/types/utils/oauth/together.d.ts +1 -0
  144. package/dist/types/utils/oauth/types.d.ts +44 -0
  145. package/dist/types/utils/oauth/venice.d.ts +18 -0
  146. package/dist/types/utils/oauth/vercel-ai-gateway.d.ts +18 -0
  147. package/dist/types/utils/oauth/vllm.d.ts +16 -0
  148. package/dist/types/utils/oauth/wafer.d.ts +2 -0
  149. package/dist/types/utils/oauth/xai-oauth.d.ts +60 -0
  150. package/dist/types/utils/oauth/xiaomi.d.ts +19 -0
  151. package/dist/types/utils/oauth/zai.d.ts +18 -0
  152. package/dist/types/utils/oauth/zenmux.d.ts +1 -0
  153. package/dist/types/utils/oauth/zhipu.d.ts +18 -0
  154. package/dist/{utils → types/utils}/overflow.d.ts +9 -11
  155. package/dist/types/utils/parse-bind.d.ts +23 -0
  156. package/dist/types/utils/provider-response.d.ts +3 -0
  157. package/dist/types/utils/request-debug.d.ts +29 -0
  158. package/dist/types/utils/retry-after.d.ts +3 -0
  159. package/dist/types/utils/retry.d.ts +26 -0
  160. package/dist/types/utils/schema/adapt.d.ts +24 -0
  161. package/dist/types/utils/schema/compatibility.d.ts +30 -0
  162. package/dist/types/utils/schema/dereference.d.ts +11 -0
  163. package/dist/types/utils/schema/draft.d.ts +10 -0
  164. package/dist/types/utils/schema/equality.d.ts +4 -0
  165. package/dist/types/utils/schema/fields.d.ts +49 -0
  166. package/dist/types/utils/schema/index.d.ts +13 -0
  167. package/dist/types/utils/schema/json-schema-validator.d.ts +12 -0
  168. package/dist/types/utils/schema/meta-validator.d.ts +2 -0
  169. package/dist/types/utils/schema/normalize.d.ts +93 -0
  170. package/dist/types/utils/schema/spill.d.ts +8 -0
  171. package/dist/types/utils/schema/stamps.d.ts +25 -0
  172. package/dist/types/utils/schema/types.d.ts +4 -0
  173. package/dist/types/utils/schema/wire.d.ts +53 -0
  174. package/dist/types/utils/schema/zod-decontaminate.d.ts +31 -0
  175. package/dist/types/utils/sdk-stream-timeout.d.ts +33 -0
  176. package/dist/types/utils/sse-debug.d.ts +10 -0
  177. package/dist/types/utils/stream-markup-healing.d.ts +80 -0
  178. package/dist/types/utils/tool-choice.d.ts +50 -0
  179. package/dist/types/utils/validation.d.ts +17 -0
  180. package/dist/types/utils.d.ts +28 -0
  181. package/package.json +139 -105
  182. package/src/api-registry.ts +96 -0
  183. package/src/auth-broker/client.ts +358 -0
  184. package/src/auth-broker/index.ts +5 -0
  185. package/src/auth-broker/refresher.ts +117 -0
  186. package/src/auth-broker/remote-store.ts +623 -0
  187. package/src/auth-broker/server.ts +644 -0
  188. package/src/auth-broker/types.ts +127 -0
  189. package/src/auth-broker/wire-schemas.ts +200 -0
  190. package/src/auth-gateway/http.ts +194 -0
  191. package/src/auth-gateway/index.ts +3 -0
  192. package/src/auth-gateway/server.ts +818 -0
  193. package/src/auth-gateway/types.ts +143 -0
  194. package/src/auth-storage.ts +4422 -0
  195. package/src/index.ts +54 -0
  196. package/src/model-cache.ts +129 -0
  197. package/src/model-manager.ts +469 -0
  198. package/src/model-thinking.ts +782 -0
  199. package/src/models.json +83530 -0
  200. package/src/models.json.d.ts +9 -0
  201. package/src/models.ts +56 -0
  202. package/src/prompts/turn-aborted-guidance.md +4 -0
  203. package/src/provider-details.ts +90 -0
  204. package/src/provider-models/bundled-references.ts +38 -0
  205. package/src/provider-models/descriptors.ts +355 -0
  206. package/src/provider-models/google.ts +88 -0
  207. package/src/provider-models/index.ts +5 -0
  208. package/src/provider-models/ollama.ts +153 -0
  209. package/src/provider-models/openai-compat.ts +2817 -0
  210. package/src/provider-models/special.ts +67 -0
  211. package/src/providers/aery-native-client.ts +228 -0
  212. package/src/providers/aery-native-server.ts +212 -0
  213. package/src/providers/amazon-bedrock.ts +873 -0
  214. package/src/providers/anthropic-client.ts +318 -0
  215. package/src/providers/anthropic-messages-server-schema.ts +243 -0
  216. package/src/providers/anthropic-messages-server.ts +683 -0
  217. package/src/providers/anthropic-wire.ts +268 -0
  218. package/src/providers/anthropic.ts +3094 -0
  219. package/src/providers/aws-credentials.ts +501 -0
  220. package/src/providers/aws-eventstream.ts +185 -0
  221. package/src/providers/aws-sigv4.ts +218 -0
  222. package/src/providers/azure-openai-responses.ts +361 -0
  223. package/src/providers/cursor/gen/agent_pb.ts +15274 -0
  224. package/src/providers/cursor/proto/agent.proto +3526 -0
  225. package/src/providers/cursor/proto/buf.gen.yaml +6 -0
  226. package/src/providers/cursor/proto/buf.yaml +17 -0
  227. package/src/providers/cursor.ts +2621 -0
  228. package/src/providers/error-message.ts +21 -0
  229. package/src/providers/github-copilot-headers.ts +140 -0
  230. package/src/providers/gitlab-duo.ts +372 -0
  231. package/src/providers/google-auth.ts +252 -0
  232. package/src/providers/google-gemini-cli.ts +809 -0
  233. package/src/providers/google-gemini-headers.ts +41 -0
  234. package/src/providers/google-shared.ts +917 -0
  235. package/src/providers/google-types.ts +167 -0
  236. package/src/providers/google-vertex.ts +91 -0
  237. package/src/providers/google.ts +41 -0
  238. package/src/providers/grammar.ts +70 -0
  239. package/src/providers/kimi.ts +52 -0
  240. package/src/providers/mock.ts +496 -0
  241. package/src/providers/ollama.ts +644 -0
  242. package/src/providers/openai-anthropic-shim.ts +138 -0
  243. package/src/providers/openai-chat-server-schema.ts +252 -0
  244. package/src/providers/openai-chat-server.ts +647 -0
  245. package/src/providers/openai-codex/constants.ts +43 -0
  246. package/src/providers/openai-codex/request-transformer.ts +161 -0
  247. package/src/providers/openai-codex/response-handler.ts +81 -0
  248. package/src/providers/openai-codex-responses.ts +3018 -0
  249. package/src/providers/openai-completions-compat.ts +300 -0
  250. package/src/providers/openai-completions.ts +1979 -0
  251. package/src/providers/openai-responses-server-schema.ts +290 -0
  252. package/src/providers/openai-responses-server.ts +1183 -0
  253. package/src/providers/openai-responses-shared.ts +873 -0
  254. package/src/providers/openai-responses.ts +679 -0
  255. package/src/providers/register-builtins.ts +436 -0
  256. package/src/providers/synthetic.ts +50 -0
  257. package/src/providers/transform-messages.ts +382 -0
  258. package/src/providers/vision-guard.ts +31 -0
  259. package/src/providers/xai-responses.ts +82 -0
  260. package/src/rate-limit-utils.ts +84 -0
  261. package/src/stream.ts +1065 -0
  262. package/src/types.ts +944 -0
  263. package/src/usage/claude.ts +482 -0
  264. package/src/usage/gemini.ts +250 -0
  265. package/src/usage/github-copilot.ts +421 -0
  266. package/src/usage/google-antigravity.ts +201 -0
  267. package/src/usage/kimi.ts +271 -0
  268. package/src/usage/minimax-code.ts +31 -0
  269. package/src/usage/openai-codex.ts +503 -0
  270. package/src/usage/shared.ts +10 -0
  271. package/src/usage/zai.ts +247 -0
  272. package/src/usage.ts +185 -0
  273. package/src/utils/abort.ts +51 -0
  274. package/src/utils/abortable-iterator.ts +69 -0
  275. package/src/utils/anthropic-auth.ts +93 -0
  276. package/src/utils/discovery/antigravity.ts +261 -0
  277. package/src/utils/discovery/codex.ts +371 -0
  278. package/src/utils/discovery/cursor.ts +306 -0
  279. package/src/utils/discovery/gemini.ts +248 -0
  280. package/src/utils/discovery/index.ts +4 -0
  281. package/src/utils/discovery/openai-compatible.ts +224 -0
  282. package/src/utils/event-stream.ts +142 -0
  283. package/src/utils/fireworks-model-id.ts +30 -0
  284. package/src/utils/foundry.ts +8 -0
  285. package/src/utils/http-inspector.ts +176 -0
  286. package/src/utils/idle-iterator.ts +267 -0
  287. package/src/utils/json-parse.ts +182 -0
  288. package/src/utils/oauth/__tests__/xai-oauth.test.ts +107 -0
  289. package/src/utils/oauth/alibaba-coding-plan.ts +59 -0
  290. package/src/utils/oauth/anthropic.ts +273 -0
  291. package/src/utils/oauth/api-key-login.ts +87 -0
  292. package/src/utils/oauth/api-key-validation.ts +92 -0
  293. package/src/utils/oauth/callback-server.ts +276 -0
  294. package/src/utils/oauth/cerebras.ts +16 -0
  295. package/src/utils/oauth/cloudflare-ai-gateway.ts +48 -0
  296. package/src/utils/oauth/cursor.ts +157 -0
  297. package/src/utils/oauth/deepseek.ts +53 -0
  298. package/src/utils/oauth/firepass.ts +24 -0
  299. package/src/utils/oauth/fireworks.ts +15 -0
  300. package/src/utils/oauth/github-copilot.ts +362 -0
  301. package/src/utils/oauth/gitlab-duo.ts +123 -0
  302. package/src/utils/oauth/google-antigravity.ts +200 -0
  303. package/src/utils/oauth/google-gemini-cli.ts +256 -0
  304. package/src/utils/oauth/google-oauth-shared.ts +110 -0
  305. package/src/utils/oauth/huggingface.ts +62 -0
  306. package/src/utils/oauth/index.ts +484 -0
  307. package/src/utils/oauth/kagi.ts +47 -0
  308. package/src/utils/oauth/kilo.ts +87 -0
  309. package/src/utils/oauth/kimi.ts +254 -0
  310. package/src/utils/oauth/litellm.ts +47 -0
  311. package/src/utils/oauth/lm-studio.ts +38 -0
  312. package/src/utils/oauth/minimax-code.ts +78 -0
  313. package/src/utils/oauth/moonshot.ts +23 -0
  314. package/src/utils/oauth/nanogpt.ts +15 -0
  315. package/src/utils/oauth/nvidia.ts +70 -0
  316. package/src/utils/oauth/oauth.html +203 -0
  317. package/src/utils/oauth/ollama-cloud.ts +28 -0
  318. package/src/utils/oauth/ollama.ts +47 -0
  319. package/src/utils/oauth/openai-codex.ts +299 -0
  320. package/src/utils/oauth/opencode.ts +49 -0
  321. package/src/utils/oauth/openrouter.ts +20 -0
  322. package/src/utils/oauth/parallel.ts +46 -0
  323. package/src/utils/oauth/perplexity.ts +206 -0
  324. package/src/utils/oauth/pkce.ts +18 -0
  325. package/src/utils/oauth/qianfan.ts +58 -0
  326. package/src/utils/oauth/qwen-portal.ts +60 -0
  327. package/src/utils/oauth/synthetic.ts +15 -0
  328. package/src/utils/oauth/tavily.ts +46 -0
  329. package/src/utils/oauth/together.ts +16 -0
  330. package/src/utils/oauth/types.ts +99 -0
  331. package/src/utils/oauth/venice.ts +59 -0
  332. package/src/utils/oauth/vercel-ai-gateway.ts +47 -0
  333. package/src/utils/oauth/vllm.ts +40 -0
  334. package/src/utils/oauth/wafer.ts +50 -0
  335. package/src/utils/oauth/xai-oauth.ts +342 -0
  336. package/src/utils/oauth/xiaomi.ts +139 -0
  337. package/src/utils/oauth/zai.ts +60 -0
  338. package/src/utils/oauth/zenmux.ts +15 -0
  339. package/src/utils/oauth/zhipu.ts +60 -0
  340. package/src/utils/overflow.ts +137 -0
  341. package/src/utils/parse-bind.ts +54 -0
  342. package/src/utils/provider-response.ts +30 -0
  343. package/src/utils/request-debug.ts +336 -0
  344. package/src/utils/retry-after.ts +110 -0
  345. package/src/utils/retry.ts +54 -0
  346. package/src/utils/schema/CONSTRAINTS.md +164 -0
  347. package/src/utils/schema/adapt.ts +36 -0
  348. package/src/utils/schema/compatibility.ts +435 -0
  349. package/src/utils/schema/dereference.ts +98 -0
  350. package/src/utils/schema/draft.ts +341 -0
  351. package/src/utils/schema/equality.ts +97 -0
  352. package/src/utils/schema/fields.ts +191 -0
  353. package/src/utils/schema/index.ts +13 -0
  354. package/src/utils/schema/json-schema-validator.ts +577 -0
  355. package/src/utils/schema/meta-validator.ts +167 -0
  356. package/src/utils/schema/normalize.ts +1588 -0
  357. package/src/utils/schema/spill.ts +43 -0
  358. package/src/utils/schema/stamps.ts +97 -0
  359. package/src/utils/schema/types.ts +10 -0
  360. package/src/utils/schema/wire.ts +293 -0
  361. package/src/utils/schema/zod-decontaminate.ts +331 -0
  362. package/src/utils/sdk-stream-timeout.ts +43 -0
  363. package/src/utils/sse-debug.ts +289 -0
  364. package/src/utils/stream-markup-healing.ts +612 -0
  365. package/src/utils/tool-choice.ts +99 -0
  366. package/src/utils/validation.ts +1024 -0
  367. package/src/utils.ts +166 -0
  368. package/dist/api-registry.d.ts +0 -20
  369. package/dist/api-registry.d.ts.map +0 -1
  370. package/dist/api-registry.js +0 -44
  371. package/dist/api-registry.js.map +0 -1
  372. package/dist/bedrock-provider.d.ts +0 -5
  373. package/dist/bedrock-provider.d.ts.map +0 -1
  374. package/dist/bedrock-provider.js +0 -6
  375. package/dist/bedrock-provider.js.map +0 -1
  376. package/dist/cli.d.ts +0 -3
  377. package/dist/cli.d.ts.map +0 -1
  378. package/dist/cli.js +0 -130
  379. package/dist/cli.js.map +0 -1
  380. package/dist/env-api-keys.d.ts +0 -18
  381. package/dist/env-api-keys.d.ts.map +0 -1
  382. package/dist/env-api-keys.js +0 -178
  383. package/dist/env-api-keys.js.map +0 -1
  384. package/dist/image-models.d.ts +0 -10
  385. package/dist/image-models.d.ts.map +0 -1
  386. package/dist/image-models.generated.d.ts +0 -440
  387. package/dist/image-models.generated.d.ts.map +0 -1
  388. package/dist/image-models.generated.js +0 -442
  389. package/dist/image-models.generated.js.map +0 -1
  390. package/dist/image-models.js +0 -23
  391. package/dist/image-models.js.map +0 -1
  392. package/dist/images-api-registry.d.ts +0 -14
  393. package/dist/images-api-registry.d.ts.map +0 -1
  394. package/dist/images-api-registry.js +0 -22
  395. package/dist/images-api-registry.js.map +0 -1
  396. package/dist/images.d.ts +0 -4
  397. package/dist/images.d.ts.map +0 -1
  398. package/dist/images.js +0 -14
  399. package/dist/images.js.map +0 -1
  400. package/dist/index.d.ts +0 -32
  401. package/dist/index.d.ts.map +0 -1
  402. package/dist/index.js +0 -20
  403. package/dist/index.js.map +0 -1
  404. package/dist/models.d.ts +0 -18
  405. package/dist/models.d.ts.map +0 -1
  406. package/dist/models.generated.d.ts +0 -17480
  407. package/dist/models.generated.d.ts.map +0 -1
  408. package/dist/models.generated.js +0 -16339
  409. package/dist/models.generated.js.map +0 -1
  410. package/dist/models.js +0 -71
  411. package/dist/models.js.map +0 -1
  412. package/dist/oauth.d.ts +0 -2
  413. package/dist/oauth.d.ts.map +0 -1
  414. package/dist/oauth.js +0 -2
  415. package/dist/oauth.js.map +0 -1
  416. package/dist/providers/aery-error-formatting.d.ts +0 -13
  417. package/dist/providers/aery-error-formatting.d.ts.map +0 -1
  418. package/dist/providers/aery-error-formatting.js +0 -112
  419. package/dist/providers/aery-error-formatting.js.map +0 -1
  420. package/dist/providers/amazon-bedrock.d.ts +0 -38
  421. package/dist/providers/amazon-bedrock.d.ts.map +0 -1
  422. package/dist/providers/amazon-bedrock.js +0 -763
  423. package/dist/providers/amazon-bedrock.js.map +0 -1
  424. package/dist/providers/anthropic.d.ts +0 -71
  425. package/dist/providers/anthropic.d.ts.map +0 -1
  426. package/dist/providers/anthropic.js +0 -949
  427. package/dist/providers/anthropic.js.map +0 -1
  428. package/dist/providers/azure-openai-responses.d.ts +0 -15
  429. package/dist/providers/azure-openai-responses.d.ts.map +0 -1
  430. package/dist/providers/azure-openai-responses.js +0 -225
  431. package/dist/providers/azure-openai-responses.js.map +0 -1
  432. package/dist/providers/cloudflare.d.ts +0 -13
  433. package/dist/providers/cloudflare.d.ts.map +0 -1
  434. package/dist/providers/cloudflare.js +0 -26
  435. package/dist/providers/cloudflare.js.map +0 -1
  436. package/dist/providers/faux.d.ts +0 -56
  437. package/dist/providers/faux.d.ts.map +0 -1
  438. package/dist/providers/faux.js +0 -368
  439. package/dist/providers/faux.js.map +0 -1
  440. package/dist/providers/github-copilot-headers.d.ts +0 -8
  441. package/dist/providers/github-copilot-headers.d.ts.map +0 -1
  442. package/dist/providers/github-copilot-headers.js +0 -29
  443. package/dist/providers/github-copilot-headers.js.map +0 -1
  444. package/dist/providers/google-gemini-cli.d.ts +0 -74
  445. package/dist/providers/google-gemini-cli.d.ts.map +0 -1
  446. package/dist/providers/google-gemini-cli.js +0 -779
  447. package/dist/providers/google-gemini-cli.js.map +0 -1
  448. package/dist/providers/google-shared.d.ts +0 -70
  449. package/dist/providers/google-shared.d.ts.map +0 -1
  450. package/dist/providers/google-shared.js +0 -329
  451. package/dist/providers/google-shared.js.map +0 -1
  452. package/dist/providers/google-vertex.d.ts +0 -15
  453. package/dist/providers/google-vertex.d.ts.map +0 -1
  454. package/dist/providers/google-vertex.js +0 -442
  455. package/dist/providers/google-vertex.js.map +0 -1
  456. package/dist/providers/google.d.ts +0 -13
  457. package/dist/providers/google.d.ts.map +0 -1
  458. package/dist/providers/google.js +0 -400
  459. package/dist/providers/google.js.map +0 -1
  460. package/dist/providers/images/openrouter.d.ts +0 -3
  461. package/dist/providers/images/openrouter.d.ts.map +0 -1
  462. package/dist/providers/images/openrouter.js +0 -129
  463. package/dist/providers/images/openrouter.js.map +0 -1
  464. package/dist/providers/images/register-builtins.d.ts +0 -4
  465. package/dist/providers/images/register-builtins.d.ts.map +0 -1
  466. package/dist/providers/images/register-builtins.js +0 -34
  467. package/dist/providers/images/register-builtins.js.map +0 -1
  468. package/dist/providers/mistral.d.ts +0 -25
  469. package/dist/providers/mistral.d.ts.map +0 -1
  470. package/dist/providers/mistral.js +0 -535
  471. package/dist/providers/mistral.js.map +0 -1
  472. package/dist/providers/openai-codex-responses.d.ts +0 -30
  473. package/dist/providers/openai-codex-responses.d.ts.map +0 -1
  474. package/dist/providers/openai-codex-responses.js +0 -1090
  475. package/dist/providers/openai-codex-responses.js.map +0 -1
  476. package/dist/providers/openai-completions.d.ts +0 -19
  477. package/dist/providers/openai-completions.d.ts.map +0 -1
  478. package/dist/providers/openai-completions.js +0 -950
  479. package/dist/providers/openai-completions.js.map +0 -1
  480. package/dist/providers/openai-prompt-cache.d.ts +0 -3
  481. package/dist/providers/openai-prompt-cache.d.ts.map +0 -1
  482. package/dist/providers/openai-prompt-cache.js +0 -10
  483. package/dist/providers/openai-prompt-cache.js.map +0 -1
  484. package/dist/providers/openai-responses-shared.d.ts +0 -18
  485. package/dist/providers/openai-responses-shared.d.ts.map +0 -1
  486. package/dist/providers/openai-responses-shared.js +0 -492
  487. package/dist/providers/openai-responses-shared.js.map +0 -1
  488. package/dist/providers/openai-responses.d.ts +0 -13
  489. package/dist/providers/openai-responses.d.ts.map +0 -1
  490. package/dist/providers/openai-responses.js +0 -237
  491. package/dist/providers/openai-responses.js.map +0 -1
  492. package/dist/providers/register-builtins.d.ts +0 -38
  493. package/dist/providers/register-builtins.d.ts.map +0 -1
  494. package/dist/providers/register-builtins.js +0 -278
  495. package/dist/providers/register-builtins.js.map +0 -1
  496. package/dist/providers/simple-options.d.ts +0 -8
  497. package/dist/providers/simple-options.d.ts.map +0 -1
  498. package/dist/providers/simple-options.js +0 -41
  499. package/dist/providers/simple-options.js.map +0 -1
  500. package/dist/providers/transform-messages.d.ts.map +0 -1
  501. package/dist/providers/transform-messages.js +0 -184
  502. package/dist/providers/transform-messages.js.map +0 -1
  503. package/dist/session-resources.d.ts +0 -4
  504. package/dist/session-resources.d.ts.map +0 -1
  505. package/dist/session-resources.js +0 -22
  506. package/dist/session-resources.js.map +0 -1
  507. package/dist/stream.d.ts +0 -8
  508. package/dist/stream.d.ts.map +0 -1
  509. package/dist/stream.js +0 -27
  510. package/dist/stream.js.map +0 -1
  511. package/dist/types.d.ts +0 -498
  512. package/dist/types.d.ts.map +0 -1
  513. package/dist/types.js +0 -2
  514. package/dist/types.js.map +0 -1
  515. package/dist/utils/diagnostics.d.ts +0 -19
  516. package/dist/utils/diagnostics.d.ts.map +0 -1
  517. package/dist/utils/diagnostics.js +0 -25
  518. package/dist/utils/diagnostics.js.map +0 -1
  519. package/dist/utils/event-stream.d.ts +0 -21
  520. package/dist/utils/event-stream.d.ts.map +0 -1
  521. package/dist/utils/event-stream.js +0 -81
  522. package/dist/utils/event-stream.js.map +0 -1
  523. package/dist/utils/hash.d.ts +0 -3
  524. package/dist/utils/hash.d.ts.map +0 -1
  525. package/dist/utils/hash.js +0 -14
  526. package/dist/utils/hash.js.map +0 -1
  527. package/dist/utils/headers.d.ts +0 -2
  528. package/dist/utils/headers.d.ts.map +0 -1
  529. package/dist/utils/headers.js +0 -8
  530. package/dist/utils/headers.js.map +0 -1
  531. package/dist/utils/json-parse.d.ts +0 -16
  532. package/dist/utils/json-parse.d.ts.map +0 -1
  533. package/dist/utils/json-parse.js +0 -113
  534. package/dist/utils/json-parse.js.map +0 -1
  535. package/dist/utils/node-http-proxy.d.ts +0 -10
  536. package/dist/utils/node-http-proxy.d.ts.map +0 -1
  537. package/dist/utils/node-http-proxy.js +0 -97
  538. package/dist/utils/node-http-proxy.js.map +0 -1
  539. package/dist/utils/oauth/anthropic.d.ts +0 -25
  540. package/dist/utils/oauth/anthropic.d.ts.map +0 -1
  541. package/dist/utils/oauth/anthropic.js +0 -335
  542. package/dist/utils/oauth/anthropic.js.map +0 -1
  543. package/dist/utils/oauth/device-code.d.ts +0 -19
  544. package/dist/utils/oauth/device-code.d.ts.map +0 -1
  545. package/dist/utils/oauth/device-code.js +0 -55
  546. package/dist/utils/oauth/device-code.js.map +0 -1
  547. package/dist/utils/oauth/github-copilot.d.ts +0 -30
  548. package/dist/utils/oauth/github-copilot.d.ts.map +0 -1
  549. package/dist/utils/oauth/github-copilot.js +0 -268
  550. package/dist/utils/oauth/github-copilot.js.map +0 -1
  551. package/dist/utils/oauth/google-antigravity.d.ts +0 -26
  552. package/dist/utils/oauth/google-antigravity.d.ts.map +0 -1
  553. package/dist/utils/oauth/google-antigravity.js +0 -377
  554. package/dist/utils/oauth/google-antigravity.js.map +0 -1
  555. package/dist/utils/oauth/google-gemini-cli.d.ts +0 -26
  556. package/dist/utils/oauth/google-gemini-cli.d.ts.map +0 -1
  557. package/dist/utils/oauth/google-gemini-cli.js +0 -482
  558. package/dist/utils/oauth/google-gemini-cli.js.map +0 -1
  559. package/dist/utils/oauth/index.d.ts +0 -63
  560. package/dist/utils/oauth/index.d.ts.map +0 -1
  561. package/dist/utils/oauth/index.js +0 -131
  562. package/dist/utils/oauth/index.js.map +0 -1
  563. package/dist/utils/oauth/oauth-page.d.ts +0 -3
  564. package/dist/utils/oauth/oauth-page.d.ts.map +0 -1
  565. package/dist/utils/oauth/oauth-page.js +0 -105
  566. package/dist/utils/oauth/oauth-page.js.map +0 -1
  567. package/dist/utils/oauth/openai-codex.d.ts +0 -34
  568. package/dist/utils/oauth/openai-codex.d.ts.map +0 -1
  569. package/dist/utils/oauth/openai-codex.js +0 -385
  570. package/dist/utils/oauth/openai-codex.js.map +0 -1
  571. package/dist/utils/oauth/pkce.d.ts.map +0 -1
  572. package/dist/utils/oauth/pkce.js +0 -31
  573. package/dist/utils/oauth/pkce.js.map +0 -1
  574. package/dist/utils/oauth/types.d.ts +0 -64
  575. package/dist/utils/oauth/types.d.ts.map +0 -1
  576. package/dist/utils/oauth/types.js +0 -2
  577. package/dist/utils/oauth/types.js.map +0 -1
  578. package/dist/utils/overflow.d.ts.map +0 -1
  579. package/dist/utils/overflow.js +0 -151
  580. package/dist/utils/overflow.js.map +0 -1
  581. package/dist/utils/sanitize-unicode.d.ts +0 -22
  582. package/dist/utils/sanitize-unicode.d.ts.map +0 -1
  583. package/dist/utils/sanitize-unicode.js +0 -26
  584. package/dist/utils/sanitize-unicode.js.map +0 -1
  585. package/dist/utils/typebox-helpers.d.ts +0 -17
  586. package/dist/utils/typebox-helpers.d.ts.map +0 -1
  587. package/dist/utils/typebox-helpers.js +0 -21
  588. package/dist/utils/typebox-helpers.js.map +0 -1
  589. package/dist/utils/validation.d.ts +0 -18
  590. package/dist/utils/validation.d.ts.map +0 -1
  591. package/dist/utils/validation.js +0 -281
  592. package/dist/utils/validation.js.map +0 -1
@@ -0,0 +1,801 @@
1
+ import type { ZodType, z } from "zod/v4";
2
+ import type { BedrockOptions } from "./providers/amazon-bedrock";
3
+ import type { AnthropicOptions } from "./providers/anthropic";
4
+ import type { AzureOpenAIResponsesOptions } from "./providers/azure-openai-responses";
5
+ import type { CursorOptions } from "./providers/cursor";
6
+ import type { DeleteArgs, DeleteResult, DiagnosticsArgs, DiagnosticsResult, GrepArgs, GrepResult, LsArgs, LsResult, McpResult, ReadArgs, ReadResult, ShellArgs, ShellResult, WriteArgs, WriteResult } from "./providers/cursor/gen/agent_pb";
7
+ import type { GoogleOptions } from "./providers/google";
8
+ import type { GoogleGeminiCliOptions } from "./providers/google-gemini-cli";
9
+ import type { GoogleVertexOptions } from "./providers/google-vertex";
10
+ import type { OllamaChatOptions } from "./providers/ollama";
11
+ import type { OpenAICodexResponsesOptions } from "./providers/openai-codex-responses";
12
+ import type { OpenAICompletionsOptions } from "./providers/openai-completions";
13
+ import type { OpenAIResponsesOptions } from "./providers/openai-responses";
14
+ import type { AssistantMessageEventStream } from "./utils/event-stream";
15
+ export type { AssistantMessageEventStream } from "./utils/event-stream";
16
+ export type KnownApi = "openai-completions" | "openai-responses" | "openai-codex-responses" | "azure-openai-responses" | "anthropic-messages" | "bedrock-converse-stream" | "google-generative-ai" | "google-gemini-cli" | "google-vertex" | "ollama-chat" | "cursor-agent";
17
+ export type Api = KnownApi | (string & {});
18
+ export interface ApiOptionsMap {
19
+ "anthropic-messages": AnthropicOptions;
20
+ "bedrock-converse-stream": BedrockOptions;
21
+ "openai-completions": OpenAICompletionsOptions;
22
+ "openai-responses": OpenAIResponsesOptions;
23
+ "openai-codex-responses": OpenAICodexResponsesOptions;
24
+ "azure-openai-responses": AzureOpenAIResponsesOptions;
25
+ "google-generative-ai": GoogleOptions;
26
+ "google-gemini-cli": GoogleGeminiCliOptions;
27
+ "google-vertex": GoogleVertexOptions;
28
+ "ollama-chat": OllamaChatOptions;
29
+ "cursor-agent": CursorOptions;
30
+ }
31
+ export type OptionsForApi<TApi extends Api> = StreamOptions | (TApi extends keyof ApiOptionsMap ? ApiOptionsMap[TApi] : never);
32
+ /** Canonical thinking transport used by a model. */
33
+ export type ThinkingControlMode = "effort" | "budget" | "google-level" | "anthropic-adaptive" | "anthropic-budget-effort";
34
+ /** Per-model thinking capabilities used to clamp and map user-facing effort levels. */
35
+ export interface ThinkingConfig {
36
+ /** Least intensive supported user-facing effort level. */
37
+ minLevel: Effort;
38
+ /** Most intensive supported user-facing effort level. */
39
+ maxLevel: Effort;
40
+ /**
41
+ * Optional explicit list of supported levels. When present, takes precedence over
42
+ * the `minLevel`..`maxLevel` range — used to encode discrete sets with gaps
43
+ * (e.g. Gemini 3 Pro supports `low` and `high` but not `medium`).
44
+ */
45
+ levels?: readonly Effort[];
46
+ /** Optional default effort applied when this model is selected. Falls back to global default if absent. */
47
+ defaultLevel?: Effort;
48
+ /** Provider-specific transport used to encode the selected effort. */
49
+ mode: ThinkingControlMode;
50
+ }
51
+ export type KnownProvider = "alibaba-coding-plan" | "amazon-bedrock" | "anthropic" | "google" | "google-gemini-cli" | "google-antigravity" | "google-vertex" | "openai" | "openai-codex" | "kimi-code" | "minimax-code" | "minimax-code-cn" | "github-copilot" | "fireworks" | "firepass" | "gitlab-duo" | "cursor" | "deepseek" | "xai" | "xai-oauth" | "groq" | "cerebras" | "openrouter" | "kilo" | "vercel-ai-gateway" | "zai" | "zhipu-coding-plan" | "mistral" | "minimax" | "opencode-go" | "opencode-zen" | "synthetic" | "cloudflare-ai-gateway" | "huggingface" | "litellm" | "moonshot" | "nvidia" | "nanogpt" | "ollama" | "ollama-cloud" | "qianfan" | "qwen-portal" | "together" | "venice" | "vllm" | "xiaomi" | "wafer-pass" | "wafer-serverless" | "zenmux" | "lm-studio";
52
+ export type Provider = KnownProvider | string;
53
+ import type { Effort } from "./model-thinking";
54
+ /** Token budgets for each thinking level (token-based providers only) */
55
+ export type ThinkingBudgets = {
56
+ [key in Effort]?: number;
57
+ };
58
+ export interface TokenTaskBudget {
59
+ type: "tokens";
60
+ total: number;
61
+ remaining?: number;
62
+ }
63
+ export type MessageAttribution = "user" | "agent";
64
+ export type ToolChoice = "auto" | "none" | "any" | "required" | {
65
+ type: "function";
66
+ name: string;
67
+ } | {
68
+ type: "function";
69
+ function: {
70
+ name: string;
71
+ };
72
+ } | {
73
+ type: "tool";
74
+ name: string;
75
+ };
76
+ export type CacheRetention = "none" | "short" | "long";
77
+ /**
78
+ * Service tier hint for processing priority / cost control.
79
+ *
80
+ * The unscoped values (`"auto"`, `"default"`, `"flex"`, `"scale"`,
81
+ * `"priority"`) are passed through to providers that understand them
82
+ * (OpenAI's `service_tier` field directly; Anthropic translates
83
+ * `"priority"` into `speed: "fast"` on supported Opus models).
84
+ *
85
+ * The scoped values target a specific provider family and behave as the
86
+ * unscoped value on the matching provider, or `undefined` everywhere else.
87
+ * They let users opt into priority on one family without paying premium
88
+ * costs on the other when switching models mid-session.
89
+ *
90
+ * - `"openai-only"` → `"priority"` on `openai` and `openai-codex`; ignored elsewhere.
91
+ * - `"claude-only"` → `"priority"` on direct `anthropic` (not Bedrock/Vertex Claude); ignored elsewhere.
92
+ */
93
+ export type ServiceTier = "auto" | "default" | "flex" | "scale" | "priority" | "openai-only" | "claude-only";
94
+ /** Resolved tier — one of the values that providers actually consume on the wire. */
95
+ export type ResolvedServiceTier = Exclude<ServiceTier, "openai-only" | "claude-only">;
96
+ /**
97
+ * Resolves a possibly scoped `ServiceTier` to the effective tier for the
98
+ * given provider. Scoped values match their target family and otherwise
99
+ * collapse to `undefined`; unscoped values pass through unchanged.
100
+ */
101
+ export declare function resolveServiceTier(serviceTier: ServiceTier | null | undefined, provider: Provider | undefined): ResolvedServiceTier | undefined;
102
+ /**
103
+ * True when the (possibly scoped) tier should be sent as OpenAI's
104
+ * `service_tier` request field for the given provider. Non-OpenAI
105
+ * providers, unsupported tiers (`"auto"`, `"default"`), and scope
106
+ * mismatches all return false.
107
+ */
108
+ export declare function shouldSendServiceTier(serviceTier: ServiceTier | null | undefined, provider: Provider | undefined): boolean;
109
+ /**
110
+ * Premium-request weight contributed by sending priority to a provider
111
+ * that supports it. Mirrors GitHub Copilot's `premiumRequests` accounting
112
+ * so the "premium requests" stat aggregates priority traffic across the
113
+ * OpenAI family and Anthropic fast-mode realizations.
114
+ *
115
+ * Returns 1 per resolved priority request, 0 otherwise.
116
+ */
117
+ export declare function getPriorityPremiumRequests(serviceTier: ServiceTier | null | undefined, provider: Provider | undefined): number;
118
+ export interface ProviderSessionState {
119
+ close(): void;
120
+ }
121
+ export interface ProviderResponseMetadata {
122
+ status: number;
123
+ headers: Record<string, string>;
124
+ requestId?: string | null;
125
+ metadata?: Record<string, unknown>;
126
+ }
127
+ export interface RawSseEvent {
128
+ event: string | null;
129
+ data: string;
130
+ raw: string[];
131
+ }
132
+ /**
133
+ * `fetch`-compatible function. Accepts any callable matching the standard
134
+ * fetch signature; `preconnect` is optional because non-Bun runtimes (browsers,
135
+ * test mocks) won't expose it.
136
+ */
137
+ export type FetchImpl = ((input: string | URL | Request, init?: RequestInit) => Promise<Response>) & {
138
+ preconnect?: typeof globalThis.fetch.preconnect;
139
+ };
140
+ export interface StreamOptions {
141
+ temperature?: number;
142
+ topP?: number;
143
+ topK?: number;
144
+ minP?: number;
145
+ presencePenalty?: number;
146
+ repetitionPenalty?: number;
147
+ /**
148
+ * Stop sequences. Anthropic encodes as `stop_sequences` (array, max 4);
149
+ * OpenAI chat-completions encodes as `stop` (string or array of up to 4);
150
+ * OpenAI Responses API has no `stop` field today (silently dropped by the
151
+ * provider when present).
152
+ */
153
+ stopSequences?: string[];
154
+ /**
155
+ * Frequency penalty (OpenAI). Penalizes new tokens based on existing frequency
156
+ * in the text so far. Range -2.0 to 2.0. Parallel to {@link presencePenalty}.
157
+ */
158
+ frequencyPenalty?: number;
159
+ maxTokens?: number;
160
+ signal?: AbortSignal;
161
+ apiKey?: string;
162
+ /**
163
+ * Called when a provider returns 401 before any replay-unsafe assistant
164
+ * event has been emitted. Returning a different key retries the provider
165
+ * request once.
166
+ */
167
+ onAuthError?: (provider: string, apiKey: string, error: unknown) => Promise<string | undefined>;
168
+ cacheRetention?: CacheRetention;
169
+ /**
170
+ * Additional headers to include in provider requests.
171
+ * These are merged on top of model-defined headers.
172
+ */
173
+ headers?: Record<string, string>;
174
+ /**
175
+ * Optional explicit request attribution override for providers that support it.
176
+ */
177
+ initiatorOverride?: MessageAttribution;
178
+ /**
179
+ * Maximum delay in milliseconds to wait for a retry when the server requests a long wait.
180
+ * If the server's requested delay exceeds this value, the request fails immediately
181
+ * with an error containing the requested delay, allowing higher-level retry logic
182
+ * to handle it with user visibility.
183
+ * Default: 60000 (60 seconds). Set to 0 to disable the cap.
184
+ */
185
+ maxRetryDelayMs?: number;
186
+ /**
187
+ * Optional metadata to include in API requests.
188
+ * Providers extract the fields they understand and ignore the rest.
189
+ * For example, Anthropic uses `user_id` for abuse tracking and rate limiting.
190
+ */
191
+ metadata?: Record<string, unknown>;
192
+ /**
193
+ * Advisory token budget for a full agentic loop. Anthropic encodes this as
194
+ * `output_config.task_budget` with the `task-budgets-2026-03-13` beta header.
195
+ */
196
+ taskBudget?: TokenTaskBudget;
197
+ /**
198
+ * Optional session identifier for providers that support session-based
199
+ * routing, request affinity, or transport reuse. Providers may also use this
200
+ * as the prompt-cache key when `promptCacheKey` is not set.
201
+ */
202
+ sessionId?: string;
203
+ /**
204
+ * Optional prompt-cache identity. When set, OpenAI Responses-compatible
205
+ * providers use this for `prompt_cache_key` while keeping `sessionId` for
206
+ * provider routing / conversation headers.
207
+ */
208
+ promptCacheKey?: string;
209
+ /**
210
+ * Provider-scoped mutable state store for this agent session.
211
+ * Providers can use this to persist transport/session state between turns.
212
+ */
213
+ providerSessionState?: Map<string, ProviderSessionState>;
214
+ /**
215
+ * Optional callback for inspecting or replacing provider payloads before sending.
216
+ * Return undefined to keep the payload unchanged.
217
+ */
218
+ onPayload?: (payload: unknown, model?: Model<Api>) => unknown | undefined | Promise<unknown | undefined>;
219
+ /**
220
+ * Optional callback for provider response metadata after headers are received.
221
+ */
222
+ onResponse?: (response: ProviderResponseMetadata, model?: Model<Api>) => void | Promise<void>;
223
+ /**
224
+ * Optional callback for raw Server-Sent Events as they arrive from HTTP streaming providers,
225
+ * plus synthesized SSE-shaped frames for the Codex WebSocket transport (one synthetic frame
226
+ * per JSON request/response message). WebSocket frames are tagged with a leading
227
+ * `: ws → <type>` (outbound) or `: ws ← <type>` (inbound) comment line in `RawSseEvent.raw`.
228
+ *
229
+ * Diagnostic only: provider implementations must ignore callback failures and must not
230
+ * let observers alter stream contents.
231
+ */
232
+ onSseEvent?: (event: RawSseEvent, model?: Model<Api>) => void;
233
+ /**
234
+ * Optional override for the first-event watchdog in milliseconds. Built-in
235
+ * providers apply this budget twice when they can: once to the underlying
236
+ * SDK/request while waiting for the HTTP stream object to exist, then again
237
+ * in the iterator while waiting for the first semantic stream event. Set to
238
+ * `0` to disable both layers for this request. After the first semantic
239
+ * event arrives, `streamIdleTimeoutMs` governs inter-event stalls. Falls
240
+ * back to `PI_STREAM_FIRST_EVENT_TIMEOUT_MS` and then to a 100s default.
241
+ * OpenAI-family transports additionally honor
242
+ * `PI_OPENAI_STREAM_FIRST_EVENT_TIMEOUT_MS` as the most-specific override and
243
+ * floor the first-event budget at the resolved idle timeout (per-call
244
+ * `streamIdleTimeoutMs` or `PI_OPENAI_STREAM_IDLE_TIMEOUT_MS`) so slow local
245
+ * OpenAI-compatible servers are not undercut during prompt processing.
246
+ *
247
+ * Honored at the iterator level by every built-in provider (via the lazy-stream
247
+ * forwarder in `register-builtins`). Honored at the SDK-request level by:
249
+ * `openai-completions`, `openai-responses`, `azure-openai-responses`,
250
+ * `anthropic-messages`.
251
+ */
252
+ streamFirstEventTimeoutMs?: number;
253
+ /**
254
+ * Optional override for the maximum idle gap between streamed events in
255
+ * milliseconds. Once the first event arrives, this guards against silent
256
+ * mid-stream stalls (broker dies, half-open socket, model produces no real
257
+ * progress for too long). Set to `0` to disable. Falls back to
258
+ * `PI_STREAM_IDLE_TIMEOUT_MS` (alias: `PI_OPENAI_STREAM_IDLE_TIMEOUT_MS`)
259
+ * and then to a 120s default.
260
+ */
261
+ streamIdleTimeoutMs?: number;
262
+ /**
263
+ * Optional retry delay hook for tests and transports that need custom scheduling.
264
+ */
265
+ providerRetryWait?: (delayMs: number, signal?: AbortSignal) => Promise<void>;
266
+ /**
267
+ * Optional `fetch` implementation override. Providers route every HTTP
268
+ * request — direct calls, SDK clients, and retry helpers — through this
269
+ * implementation when set. Defaults to `globalThis.fetch`. Providers that
270
+ * do not use `fetch` (Bedrock's AWS SDK transport, Cursor's HTTP/2
271
+ * channel) silently ignore the override.
272
+ */
273
+ fetch?: FetchImpl;
274
+ /** Cursor exec/MCP tool handlers (cursor-agent only). */
275
+ execHandlers?: CursorExecHandlers;
276
+ }
277
+ export interface SimpleStreamOptions extends StreamOptions {
278
+ reasoning?: Effort;
279
+ /**
280
+ * Force-disable reasoning for the request even when the model supports it.
281
+ * Takes precedence over `reasoning`. Useful for fast utility calls
282
+ * (e.g. title generation) where the model would otherwise burn the entire
283
+ * output budget on internal thinking. Provider support is format-specific:
284
+ * some transports can disable reasoning directly, while generic
285
+ * effort-based OpenAI-compatible endpoints use the lowest supported effort.
286
+ */
287
+ disableReasoning?: boolean;
288
+ /**
289
+ * If true, request that the provider omit thinking/reasoning summaries
290
+ * from the response (e.g. Anthropic `thinking.display = "omitted"`,
291
+ * OpenAI Responses `reasoning.summary` left unset). The model still
292
+ * reasons internally; only the human-readable summary stream is dropped.
293
+ * Useful when the UI hides thinking blocks anyway and the summary is wasted bandwidth.
294
+ */
295
+ hideThinkingSummary?: boolean;
296
+ /** Custom token budgets for thinking levels (token-based providers only) */
297
+ thinkingBudgets?: ThinkingBudgets;
298
+ /** Cursor exec handlers for local tool execution */
299
+ cursorExecHandlers?: CursorExecHandlers;
300
+ /** Hook to handle tool results from Cursor exec */
301
+ cursorOnToolResult?: CursorToolResultHandler;
302
+ /** Optional tool choice override for compatible providers */
303
+ toolChoice?: ToolChoice;
304
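+ /** Service tier hint for processing priority/cost control (see {@link ServiceTier}). Sent as OpenAI's `service_tier`; Anthropic maps `"priority"` to fast mode on supported models. Providers that do not understand the tier ignore it. */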
305
+ serviceTier?: ServiceTier;
306
+ /** API format for Kimi Code provider: "openai" or "anthropic" (default: "anthropic") */
307
+ kimiApiFormat?: "openai" | "anthropic";
308
+ /** API format for Synthetic provider: "openai" or "anthropic" (default: "openai") */
309
+ syntheticApiFormat?: "openai" | "anthropic";
310
+ /** Hint that websocket transport should be preferred when supported by the provider implementation. */
311
+ preferWebsockets?: boolean;
312
+ /**
313
+ * OpenRouter routing-variant suffix automatically appended to model IDs when
314
+ * the request targets OpenRouter (`model.provider === "openrouter"`). Common
315
+ * values: `"nitro"` (throughput), `"floor"` (cheapest), `"online"` (web
316
+ * search plugin), `"exacto"` (cherry-picked high-quality providers, only
317
+ * defined for some models). Ignored when the resolved model id already
318
+ * contains a `:<variant>` suffix (e.g. the user typed `:nitro` explicitly
319
+ * or the catalog entry already names the variant).
320
+ */
321
+ openrouterVariant?: string;
322
+ }
323
+ export type StreamFunction<TApi extends Api> = (model: Model<TApi>, context: Context, options: OptionsForApi<TApi>) => AssistantMessageEventStream;
324
+ export interface TextSignatureV1 {
325
+ v: 1;
326
+ id: string;
327
+ phase?: "commentary" | "final_answer";
328
+ }
329
+ export interface TextContent {
330
+ type: "text";
331
+ text: string;
332
+ textSignature?: string;
333
+ }
334
+ export interface ThinkingContent {
335
+ type: "thinking";
336
+ thinking: string;
337
+ thinkingSignature?: string;
338
+ itemId?: string;
339
+ }
340
+ export interface RedactedThinkingContent {
341
+ type: "redactedThinking";
342
+ data: string;
343
+ }
344
+ export interface ImageContent {
345
+ type: "image";
346
+ data: string;
347
+ mimeType: string;
348
+ }
349
+ export interface ToolCall {
350
+ type: "toolCall";
351
+ id: string;
352
+ name: string;
353
+ arguments: Record<string, any>;
354
+ thoughtSignature?: string;
355
+ intent?: string;
356
+ /**
357
+ * Original wire-level name when the tool was invoked via OpenAI's custom-tool
358
+ * mechanism (e.g., `apply_patch`). Set by `openai-responses` on receive so
359
+ * the history-replay path can re-emit the call as `custom_tool_call` with
360
+ * its paired tool-result as `custom_tool_call_output`. Absent for regular
361
+ * JSON function tools.
362
+ */
363
+ customWireName?: string;
364
+ }
365
+ export interface Usage {
366
+ /** Non-cached input tokens (matches the bucket the provider bills as new input). */
367
+ input: number;
368
+ /** Total output tokens for the turn, including thinking, assistant text, and tool-call argument tokens. */
369
+ output: number;
370
+ /** Tokens read from the prompt cache. */
371
+ cacheRead: number;
372
+ /** Tokens written to the prompt cache (cache creation). */
373
+ cacheWrite: number;
374
+ /** Sum of input + output + cacheRead + cacheWrite. */
375
+ totalTokens: number;
376
+ /** Copilot premium-request counter, when applicable. */
377
+ premiumRequests?: number;
378
+ /**
379
+ * Reasoning/thinking tokens included in `output`, when the provider reports them
380
+ * (OpenAI `output_tokens_details.reasoning_tokens`, Google `thoughtsTokenCount`).
381
+ * Always a subset of `output` — non-reasoning output is `output - reasoningTokens`.
382
+ *
383
+ * Providers that don't expose this leave it undefined rather than guessing;
384
+ * `undefined` means unknown, NOT zero.
385
+ */
386
+ reasoningTokens?: number;
387
+ /**
388
+ * Cache-write TTL breakdown (Anthropic only). When set, the components sum to
389
+ * `cacheWrite`. Other providers do not populate this.
390
+ */
391
+ cttl?: {
392
+ ephemeral5m?: number;
393
+ ephemeral1h?: number;
394
+ };
395
+ /**
396
+ * Server-side tool invocations made during this turn (Anthropic web_search /
397
+ * web_fetch, OpenAI built-in tools when reported). Counts requests, not tokens.
398
+ */
399
+ server?: {
400
+ webSearch?: number;
401
+ webFetch?: number;
402
+ };
403
+ cost: {
404
+ input: number;
405
+ output: number;
406
+ cacheRead: number;
407
+ cacheWrite: number;
408
+ total: number;
409
+ };
410
+ }
411
+ export type StopReason = "stop" | "length" | "toolUse" | "error" | "aborted";
412
+ export interface OpenAIResponsesHistoryPayload {
413
+ type: "openaiResponsesHistory";
414
+ provider?: string;
415
+ dt?: boolean;
416
+ items: Array<Record<string, unknown>>;
417
+ }
418
+ export type ProviderPayload = OpenAIResponsesHistoryPayload;
419
+ export interface UserMessage {
420
+ role: "user";
421
+ content: string | (TextContent | ImageContent)[];
422
+ /** True if the message was injected by the system (e.g., auto-continue). */
423
+ synthetic?: boolean;
424
+ /** Who initiated this message for billing/attribution semantics. */
425
+ attribution?: MessageAttribution;
426
+ /** Provider-specific opaque payload used to reconstruct transport-native history. */
427
+ providerPayload?: ProviderPayload;
428
+ timestamp: number;
429
+ }
430
+ export interface DeveloperMessage {
431
+ role: "developer";
432
+ content: string | (TextContent | ImageContent)[];
433
+ /** Who initiated this message for billing/attribution semantics. */
434
+ attribution?: MessageAttribution;
435
+ /** Provider-specific opaque payload used to reconstruct transport-native history. */
436
+ providerPayload?: ProviderPayload;
437
+ timestamp: number;
438
+ }
439
+ export interface AssistantMessage {
440
+ role: "assistant";
441
+ content: (TextContent | ThinkingContent | RedactedThinkingContent | ToolCall)[];
442
+ api: Api;
443
+ provider: Provider;
444
+ model: string;
445
+ responseId?: string;
446
+ usage: Usage;
447
+ stopReason: StopReason;
448
+ errorMessage?: string;
449
+ /** HTTP status surfaced by the provider when the request failed. Populated by every provider's catch block alongside `errorMessage` so consumers (auth retry, telemetry, UI) can branch without regex-scraping the message. */
450
+ errorStatus?: number;
451
+ /**
452
+ * Stable identifiers for request features the provider silently dropped
453
+ * during this turn (e.g. `"priority"`). Set when a server-side rejection
454
+ * triggered an in-provider fallback retry that succeeded without the
455
+ * feature. Callers can use this to sync user-facing toggles back to the
456
+ * server's actual state.
457
+ */
458
+ disabledFeatures?: string[];
459
+ /** Provider-specific opaque payload used to reconstruct transport-native history. */
460
+ providerPayload?: ProviderPayload;
461
+ timestamp: number;
462
+ duration?: number;
463
+ ttft?: number;
464
+ }
465
+ export interface ToolResultMessage<TDetails = any> {
466
+ role: "toolResult";
467
+ toolCallId: string;
468
+ toolName: string;
469
+ content: (TextContent | ImageContent)[];
470
+ details?: TDetails;
471
+ isError: boolean;
472
+ /** Who initiated this message for billing/attribution semantics. */
473
+ attribution?: MessageAttribution;
474
+ /** Timestamp when output was pruned (ms since epoch). Undefined if unpruned. */
475
+ prunedAt?: number;
476
+ timestamp: number;
477
+ }
478
+ export type Message = UserMessage | DeveloperMessage | AssistantMessage | ToolResultMessage;
479
+ export type CursorExecHandlerResult<T> = {
480
+ result: T;
481
+ toolResult?: ToolResultMessage;
482
+ } | T | ToolResultMessage;
483
+ export type CursorToolResultHandler = (result: ToolResultMessage) => ToolResultMessage | undefined | Promise<ToolResultMessage | undefined>;
484
+ export interface CursorMcpCall {
485
+ name: string;
486
+ providerIdentifier: string;
487
+ toolName: string;
488
+ toolCallId: string;
489
+ args: Record<string, unknown>;
490
+ rawArgs: Record<string, Uint8Array>;
491
+ }
492
+ export interface CursorShellStreamCallbacks {
493
+ onStdout(data: string): void;
494
+ onStderr(data: string): void;
495
+ }
496
+ export interface CursorExecHandlers {
497
+ read?: (args: ReadArgs) => Promise<CursorExecHandlerResult<ReadResult>>;
498
+ ls?: (args: LsArgs) => Promise<CursorExecHandlerResult<LsResult>>;
499
+ grep?: (args: GrepArgs) => Promise<CursorExecHandlerResult<GrepResult>>;
500
+ write?: (args: WriteArgs) => Promise<CursorExecHandlerResult<WriteResult>>;
501
+ delete?: (args: DeleteArgs) => Promise<CursorExecHandlerResult<DeleteResult>>;
502
+ shell?: (args: ShellArgs) => Promise<CursorExecHandlerResult<ShellResult>>;
503
+ shellStream?: (args: ShellArgs, callbacks: CursorShellStreamCallbacks) => Promise<CursorExecHandlerResult<ShellResult>>;
504
+ diagnostics?: (args: DiagnosticsArgs) => Promise<CursorExecHandlerResult<DiagnosticsResult>>;
505
+ mcp?: (call: CursorMcpCall) => Promise<CursorExecHandlerResult<McpResult>>;
506
+ onToolResult?: CursorToolResultHandler;
507
+ }
508
+ /**
509
+ * Plain JSON Schema document used by extension-authored tools (legacy TypeBox
510
+ * emits this shape). Distinguished from Zod at runtime via {@link isZodSchema}.
511
+ */
512
+ export type TJsonSchema = Record<string, unknown>;
513
+ /**
514
+ * Schema type accepted by the {@link Tool} interface.
515
+ *
516
+ * Canonical authoring uses Zod. Extension compat may supply a JSON Schema
517
+ * object (including TypeBox static schema objects).
518
+ */
519
+ export type TSchema = ZodType | TJsonSchema;
520
+ /** Resolve parameter types for tool execution / handlers. */
521
+ export type Static<S> = S extends ZodType ? z.infer<S> : S extends {
522
+ static: infer T;
523
+ } ? T : unknown;
524
+ export interface Tool<TParameters extends TSchema = TSchema> {
525
+ name: string;
526
+ description: string;
527
+ parameters: TParameters;
528
+ /** If true, tool is strictly typed and validated against the parameters schema before execution */
529
+ strict?: boolean;
530
+ /**
531
+ * Optional grammar constraint for OpenAI custom-tool emission.
532
+ * When set, providers that support grammar-constrained tools (currently only
533
+ * `openai-responses` against models with the right capability flag) may emit
534
+ * this tool as `{type: "custom", format: {type: "grammar", …}}` instead of a
535
+ * JSON function tool. Other providers ignore the field.
536
+ */
537
+ customFormat?: {
538
+ syntax: "lark" | "regex";
539
+ definition: string;
540
+ };
541
+ /**
542
+ * Optional wire-level name used when this tool is emitted as a custom tool
543
+ * (e.g. OpenAI's `{type: "custom"}` shape). Models trained on specific tool
544
+ * names — like GPT-5 on `apply_patch` — need to see that exact name on the
545
+ * wire, but it may differ from the harness-internal `name`. The agent-loop
546
+ * dispatcher matches both `name` and `customWireName` so returned tool
547
+ * calls route correctly. Absent for regular JSON function tools.
548
+ */
549
+ customWireName?: string;
550
+ }
551
+ export interface Context {
552
+ systemPrompt?: string[];
553
+ messages: Message[];
554
+ tools?: Tool[];
555
+ }
556
+ export type AssistantMessageEvent = {
557
+ type: "start";
558
+ contentIndex?: undefined;
559
+ partial: AssistantMessage;
560
+ } | {
561
+ type: "text_start";
562
+ contentIndex: number;
563
+ partial: AssistantMessage;
564
+ } | {
565
+ type: "text_delta";
566
+ contentIndex: number;
567
+ delta: string;
568
+ partial: AssistantMessage;
569
+ } | {
570
+ type: "text_end";
571
+ contentIndex: number;
572
+ content: string;
573
+ partial: AssistantMessage;
574
+ } | {
575
+ type: "thinking_start";
576
+ contentIndex: number;
577
+ partial: AssistantMessage;
578
+ } | {
579
+ type: "thinking_delta";
580
+ contentIndex: number;
581
+ delta: string;
582
+ partial: AssistantMessage;
583
+ } | {
584
+ type: "thinking_end";
585
+ contentIndex: number;
586
+ content: string;
587
+ partial: AssistantMessage;
588
+ } | {
589
+ type: "toolcall_start";
590
+ contentIndex: number;
591
+ partial: AssistantMessage;
592
+ } | {
593
+ type: "toolcall_delta";
594
+ contentIndex: number;
595
+ delta: string;
596
+ partial: AssistantMessage;
597
+ } | {
598
+ type: "toolcall_end";
599
+ contentIndex: number;
600
+ toolCall: ToolCall;
601
+ partial: AssistantMessage;
602
+ } | {
603
+ type: "done";
604
+ contentIndex?: undefined;
605
+ reason: Extract<StopReason, "stop" | "length" | "toolUse">;
606
+ message: AssistantMessage;
607
+ } | {
608
+ type: "error";
609
+ contentIndex?: undefined;
610
+ reason: Extract<StopReason, "aborted" | "error">;
611
+ error: AssistantMessage;
612
+ };
613
+ /**
614
+ * Compatibility settings for openai-completions API.
615
+ * Use this to override URL-based auto-detection for custom providers.
616
+ */
617
+ export interface OpenAICompat {
618
+ /** Whether the provider supports the `store` field. Default: auto-detected from URL. */
619
+ supportsStore?: boolean;
620
+ /** Whether the provider supports the `developer` role (vs `system`). Default: auto-detected from URL. */
621
+ supportsDeveloperRole?: boolean;
622
+ /**
623
+ * Whether the provider's chat-completions endpoint accepts multiple
624
+ * leading `system`/`developer` messages. When false, ordered system
625
+ * prompts are coalesced into a single message joined by `\n\n` so
626
+ * strict chat templates (e.g. Qwen-served via vLLM, MiniMax) accept
627
+ * the request. Default: detected per provider/baseUrl. Canonical
628
+ * OpenAI/Azure/OpenRouter/Cerebras/Together/Fireworks/Groq/DeepSeek/
629
+ * Mistral/xAI/Z.ai/GitHub Copilot/Zenmux are treated as `true`;
630
+ * unknown or strict-template hosts default to `false`. Setting this
631
+ * to `true` preserves separate blocks, which is preferred for
632
+ * KV-cache reuse when the trailing prompt changes between calls.
633
+ */
634
+ supportsMultipleSystemMessages?: boolean;
635
+ /** Whether the provider supports `reasoning_effort`. Default: auto-detected from URL. */
636
+ supportsReasoningEffort?: boolean;
637
+ /** Optional mapping from aery-ai reasoning levels to provider/model-specific `reasoning_effort` values. */
638
+ reasoningEffortMap?: Partial<Record<Effort, string>>;
639
+ /** Whether the provider supports `stream_options: { include_usage: true }` for token usage in streaming responses. Default: true. */
640
+ supportsUsageInStreaming?: boolean;
641
+ /** Which field to use for max tokens. Default: auto-detected from URL. */
642
+ maxTokensField?: "max_completion_tokens" | "max_tokens";
643
+ /** Whether tool results require the `name` field. Default: auto-detected from URL. */
644
+ requiresToolResultName?: boolean;
645
+ /** Whether a user message after tool results requires an assistant message in between. Default: auto-detected from URL. */
646
+ requiresAssistantAfterToolResult?: boolean;
647
+ /** Whether thinking blocks must be converted to text blocks with <thinking> delimiters. Default: auto-detected from URL. */
648
+ requiresThinkingAsText?: boolean;
649
+ /** Whether tool call IDs must be normalized to Mistral format (exactly 9 alphanumeric chars). Default: auto-detected from URL. */
650
+ requiresMistralToolIds?: boolean;
651
+ /** Format for reasoning/thinking parameter. "openai" uses reasoning_effort, "openrouter" uses reasoning: { effort }, "zai" uses thinking: { type: "enabled" | "disabled" } (also used by Moonshot Kimi), "qwen" uses top-level enable_thinking, and "qwen-chat-template" uses chat_template_kwargs.enable_thinking. Default: "openai". */
652
+ thinkingFormat?: "openai" | "openrouter" | "zai" | "qwen" | "qwen-chat-template";
653
+ /** Which reasoning content field to emit on assistant messages. Default: auto-detected. */
654
+ reasoningContentField?: "reasoning_content" | "reasoning" | "reasoning_text";
655
+ /** Whether assistant tool-call messages must include reasoning content. Default: false. */
656
+ requiresReasoningContentForToolCalls?: boolean;
657
+ /** Whether the provider accepts a synthetic placeholder (e.g. ".") for missing reasoning_content on tool-call turns. Default: true. Set to false for providers like DeepSeek that validate the exact reasoning_content value. */
658
+ allowsSyntheticReasoningContentForToolCalls?: boolean;
659
+ /** Whether assistant tool-call messages must include non-empty content. Default: false. */
660
+ requiresAssistantContentForToolCalls?: boolean;
661
+ /** Whether the provider supports the `tool_choice` parameter. Default: true. */
662
+ supportsToolChoice?: boolean;
663
+ /**
664
+ * Drop reasoning fields (`reasoning_effort`, OpenRouter `reasoning`) for
665
+ * the request when `tool_choice` forces a tool call. Mirrors the Anthropic
666
+ * `disableThinkingIfToolChoiceForced` rule for backends like Kimi that
667
+ * 400 with `tool_choice 'specified' is incompatible with thinking
668
+ * enabled` whenever both are present. Default: auto-detected (Kimi).
669
+ */
670
+ disableReasoningOnForcedToolChoice?: boolean;
671
+ /**
672
+ * Drop reasoning fields (`reasoning_effort`, OpenRouter `reasoning`) for
673
+ * any request that sends `tool_choice`. Use for providers/models that accept
674
+ * tools and `tool_choice`, but reject `tool_choice` while thinking is enabled.
675
+ * Default: auto-detected (DeepSeek reasoning models).
676
+ */
677
+ disableReasoningOnToolChoice?: boolean;
678
+ /** OpenRouter-specific routing preferences. Only used when baseUrl points to OpenRouter. */
679
+ openRouterRouting?: OpenRouterRouting;
680
+ /** Vercel AI Gateway routing preferences. Only used when baseUrl points to Vercel AI Gateway. */
681
+ vercelGatewayRouting?: VercelGatewayRouting;
682
+ /** Extra fields to include in request body (e.g. gateway routing hints for OpenClaw-style proxies). */
683
+ extraBody?: Record<string, unknown>;
684
+ /** Whether the provider supports the `strict` field in tool definitions. Default: auto-detected per provider/baseUrl (conservative for unknown providers). */
685
+ supportsStrictMode?: boolean;
686
+ /** Whether tool schemas must be sent either all strict or all non-strict. Undefined keeps the existing per-tool mixed behavior. */
687
+ toolStrictMode?: "all_strict" | "none";
688
+ }
689
+ /**
690
+ * Compatibility settings for the `anthropic-messages` API.
691
+ * Use these flags to turn off features that strict-by-default Anthropic accepts but
692
+ * that proxy gateways (Vertex AI, AWS Bedrock-style fronts, etc.) reject.
693
+ */
694
+ export interface AnthropicCompat {
695
+ /**
696
+ * When true, drop the top-level `strict: true` field on tool definitions. Vertex AI's
697
+ * Anthropic-compatible endpoint rejects unknown tool fields with
698
+ * `tools.<n>.custom.strict: Extra inputs are not permitted`.
699
+ */
700
+ disableStrictTools?: boolean;
701
+ /**
702
+ * When true, map adaptive thinking (`thinking: { type: "adaptive" }`) to
703
+ * `{ type: "enabled", budget_tokens }`. Vertex AI rejects the `adaptive`
704
+ * tag with `Input tag 'adaptive' ... does not match any of the expected
705
+ * tags: 'disabled', 'enabled'`.
706
+ */
707
+ disableAdaptiveThinking?: boolean;
708
+ /** Whether tools may include Anthropic's per-tool `eager_input_streaming` flag. Default: true. */
709
+ supportsEagerToolInputStreaming?: boolean;
710
+ /** Whether long prompt-cache retention (`ttl: "1h"`) is supported. Default: true for the canonical Anthropic API. */
711
+ supportsLongCacheRetention?: boolean;
712
+ /**
713
+ * Whether mid-conversation `role: "system"` messages are accepted in the
714
+ * `messages` array (Claude Opus 4.8+ on the first-party Claude API and
715
+ * Claude Platform on AWS). When unset, auto-detected from the model id and
716
+ * base URL. Not available on Bedrock, Vertex AI, or Microsoft Foundry.
717
+ */
718
+ supportsMidConversationSystem?: boolean;
719
+ }
720
+ /**
721
+ * OpenRouter provider routing preferences.
722
+ * Controls which upstream providers OpenRouter routes requests to.
723
+ * @see https://openrouter.ai/docs/provider-routing
724
+ */
725
+ export interface OpenRouterRouting {
726
+ /** Provider slugs to use exclusively for this request (e.g., ["amazon-bedrock", "anthropic"]). */
727
+ only?: string[];
728
+ /** Provider slugs to try, in the order listed (e.g., ["anthropic", "openai"]). */
729
+ order?: string[];
730
+ }
731
+ /**
732
+ * Vercel AI Gateway routing preferences.
733
+ * Controls which upstream providers the gateway routes requests to.
734
+ * @see https://vercel.com/docs/ai-gateway/models-and-providers/provider-options
735
+ */
736
+ export interface VercelGatewayRouting {
737
+ /** Provider slugs to use exclusively for this request (e.g., ["bedrock", "anthropic"]). */
738
+ only?: string[];
739
+ /** Provider slugs to try, in the order listed (e.g., ["anthropic", "openai"]). */
740
+ order?: string[];
741
+ }
742
+ /** Metadata for a single model (identity, API/provider, base URL, pricing, context window, thinking config, …) plus optional per-model overrides. */ export interface Model<TApi extends Api = any> {
743
+ id: string;
744
+ name: string;
745
+ api: TApi;
746
+ provider: Provider;
747
+ baseUrl: string;
748
+ reasoning: boolean;
749
+ input: ("text" | "image")[]; // NOTE(review): presumably the input kinds the model accepts — confirm
750
+ cost: { // NOTE(review): units are not stated in this declaration — confirm against the model catalog
751
+ input: number;
752
+ output: number;
753
+ cacheRead: number;
754
+ cacheWrite: number;
755
+ };
756
+ /** Premium Copilot requests charged per user-initiated request (defaults to 1). */
757
+ premiumMultiplier?: number;
758
+ contextWindow: number;
759
+ maxTokens: number;
760
+ headers?: Record<string, string>;
761
+ /**
762
+ * Streaming transport override. When `"aery-native"`, `streamSimple` routes
763
+ * the request to the model's `baseUrl` via the auth-gateway's
764
+ * `POST /v1/aery/stream` endpoint instead of dispatching the per-API
765
+ * provider client. The `baseUrl` must point at an `aery auth-gateway`
766
+ * (or compatible) host; `headers.Authorization` (or `apiKey` resolved by
767
+ * the registry) carries the gateway bearer.
768
+ *
769
+ * Used by containerized aery installs (e.g. robomp slots) to route every
770
+ * LLM call through a sidecar gateway that holds the real provider
771
+ * credentials. The model's other metadata (pricing, context window,
772
+ * thinking config, …) still resolves locally; only the streaming
773
+ * dispatch is redirected.
774
+ */
775
+ transport?: "aery-native";
776
+ /** Hint that websocket transport should be preferred when supported by the provider implementation. */
777
+ preferWebsockets?: boolean;
778
+ /** Preferred model to switch to when context promotion is triggered (model id or provider/id). */
779
+ contextPromotionTarget?: string;
780
+ /** Provider-assigned priority value (lower = higher priority). */
781
+ priority?: number;
782
+ /** Canonical thinking capability metadata for this model. */
783
+ thinking?: ThinkingConfig;
784
+ /** Compatibility overrides per API. If not set, auto-detected from baseUrl. */
785
+ compat?: TApi extends "openai-completions" | "openai-responses" ? OpenAICompat : TApi extends "anthropic-messages" ? AnthropicCompat : never;
786
+ /**
787
+ * Which shape to use when exposing the Codex `apply_patch` tool to this model.
788
+ * - `"freeform"`: sends a raw patch string with no JSON envelope. Generated
789
+ *   catalog policy sets this for first-party GPT-5 Responses models that
790
+ *   support OpenAI custom tools with a Lark grammar.
791
+ * - `"function"` or undefined: JSON function-tool with `{input: string}` (spec §1.2).
792
+ */
793
+ applyPatchToolType?: "freeform" | "function";
794
+ /**
795
+ * Force OAuth-style request shaping for providers whose API key prefix doesn't
796
+ * match an OAuth token (e.g. routing Anthropic traffic through a proxy that
797
+ * expects Claude Code framing). When true, the streaming layer sets
798
+ * `options.isOAuth = true` for the underlying provider call.
799
+ */
800
+ isOAuth?: boolean;
801
+ }