@dexto/core 1.5.6 → 1.5.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (217) hide show
  1. package/dist/agent/DextoAgent.cjs +189 -30
  2. package/dist/agent/DextoAgent.d.ts +44 -9
  3. package/dist/agent/DextoAgent.d.ts.map +1 -1
  4. package/dist/agent/DextoAgent.js +190 -31
  5. package/dist/agent/schemas.cjs +5 -0
  6. package/dist/agent/schemas.d.ts +456 -66
  7. package/dist/agent/schemas.d.ts.map +1 -1
  8. package/dist/agent/schemas.js +5 -0
  9. package/dist/context/manager.cjs +1 -1
  10. package/dist/context/manager.js +1 -1
  11. package/dist/context/utils.cjs +90 -17
  12. package/dist/context/utils.d.ts.map +1 -1
  13. package/dist/context/utils.js +90 -17
  14. package/dist/errors/types.cjs +2 -1
  15. package/dist/errors/types.d.ts +2 -1
  16. package/dist/errors/types.d.ts.map +1 -1
  17. package/dist/errors/types.js +2 -1
  18. package/dist/events/index.cjs +4 -1
  19. package/dist/events/index.d.ts +37 -2
  20. package/dist/events/index.d.ts.map +1 -1
  21. package/dist/events/index.js +4 -1
  22. package/dist/image/types.d.ts +15 -0
  23. package/dist/image/types.d.ts.map +1 -1
  24. package/dist/index.browser.d.ts +1 -1
  25. package/dist/index.browser.d.ts.map +1 -1
  26. package/dist/llm/curation-config.cjs +82 -0
  27. package/dist/llm/curation-config.d.ts +13 -0
  28. package/dist/llm/curation-config.d.ts.map +1 -0
  29. package/dist/llm/curation-config.js +59 -0
  30. package/dist/llm/curation.cjs +57 -0
  31. package/dist/llm/curation.d.ts +16 -0
  32. package/dist/llm/curation.d.ts.map +1 -0
  33. package/dist/llm/curation.js +34 -0
  34. package/dist/llm/error-codes.cjs +1 -0
  35. package/dist/llm/error-codes.d.ts +1 -0
  36. package/dist/llm/error-codes.d.ts.map +1 -1
  37. package/dist/llm/error-codes.js +1 -0
  38. package/dist/llm/errors.cjs +16 -1
  39. package/dist/llm/errors.d.ts +15 -8
  40. package/dist/llm/errors.d.ts.map +1 -1
  41. package/dist/llm/errors.js +16 -1
  42. package/dist/llm/executor/provider-options.cjs +1 -1
  43. package/dist/llm/executor/provider-options.js +1 -1
  44. package/dist/llm/executor/turn-executor.cjs +35 -2
  45. package/dist/llm/executor/turn-executor.d.ts.map +1 -1
  46. package/dist/llm/executor/turn-executor.js +35 -2
  47. package/dist/llm/index.cjs +14 -3
  48. package/dist/llm/index.d.ts +3 -1
  49. package/dist/llm/index.d.ts.map +1 -1
  50. package/dist/llm/index.js +13 -2
  51. package/dist/llm/registry/auto-update.cjs +263 -0
  52. package/dist/llm/registry/auto-update.d.ts +27 -0
  53. package/dist/llm/registry/auto-update.d.ts.map +1 -0
  54. package/dist/llm/registry/auto-update.js +227 -0
  55. package/dist/llm/registry/index.cjs +806 -0
  56. package/dist/llm/{registry.d.ts → registry/index.d.ts} +67 -13
  57. package/dist/llm/registry/index.d.ts.map +1 -0
  58. package/dist/llm/registry/index.js +756 -0
  59. package/dist/llm/registry/models.generated.cjs +4861 -0
  60. package/dist/llm/registry/models.generated.d.ts +431 -0
  61. package/dist/llm/registry/models.generated.d.ts.map +1 -0
  62. package/dist/llm/registry/models.generated.js +4838 -0
  63. package/dist/llm/registry/models.manual.cjs +44 -0
  64. package/dist/llm/registry/models.manual.d.ts +22 -0
  65. package/dist/llm/registry/models.manual.d.ts.map +1 -0
  66. package/dist/llm/registry/models.manual.js +21 -0
  67. package/dist/llm/registry/sync.cjs +354 -0
  68. package/dist/llm/registry/sync.d.ts +41 -0
  69. package/dist/llm/registry/sync.d.ts.map +1 -0
  70. package/dist/llm/registry/sync.js +328 -0
  71. package/dist/llm/resolver.cjs +29 -7
  72. package/dist/llm/resolver.d.ts +1 -1
  73. package/dist/llm/resolver.d.ts.map +1 -1
  74. package/dist/llm/resolver.js +31 -8
  75. package/dist/llm/schemas.cjs +13 -1
  76. package/dist/llm/schemas.d.ts +59 -59
  77. package/dist/llm/schemas.d.ts.map +1 -1
  78. package/dist/llm/schemas.js +14 -1
  79. package/dist/llm/services/factory.cjs +43 -27
  80. package/dist/llm/services/factory.d.ts +20 -1
  81. package/dist/llm/services/factory.d.ts.map +1 -1
  82. package/dist/llm/services/factory.js +44 -28
  83. package/dist/llm/services/test-utils.integration.cjs +5 -1
  84. package/dist/llm/services/test-utils.integration.d.ts.map +1 -1
  85. package/dist/llm/services/test-utils.integration.js +5 -1
  86. package/dist/llm/services/vercel.cjs +4 -1
  87. package/dist/llm/services/vercel.d.ts +1 -0
  88. package/dist/llm/services/vercel.d.ts.map +1 -1
  89. package/dist/llm/services/vercel.js +4 -1
  90. package/dist/llm/types.cjs +5 -2
  91. package/dist/llm/types.d.ts +1 -1
  92. package/dist/llm/types.d.ts.map +1 -1
  93. package/dist/llm/types.js +5 -2
  94. package/dist/llm/validation.cjs +1 -1
  95. package/dist/llm/validation.js +1 -1
  96. package/dist/logger/v2/dexto-logger.cjs +4 -0
  97. package/dist/logger/v2/dexto-logger.d.ts +3 -0
  98. package/dist/logger/v2/dexto-logger.d.ts.map +1 -1
  99. package/dist/logger/v2/dexto-logger.js +4 -0
  100. package/dist/logger/v2/types.d.ts +2 -0
  101. package/dist/logger/v2/types.d.ts.map +1 -1
  102. package/dist/mcp/error-codes.cjs +1 -0
  103. package/dist/mcp/error-codes.d.ts +1 -0
  104. package/dist/mcp/error-codes.d.ts.map +1 -1
  105. package/dist/mcp/error-codes.js +1 -0
  106. package/dist/mcp/errors.cjs +13 -0
  107. package/dist/mcp/errors.d.ts +7 -0
  108. package/dist/mcp/errors.d.ts.map +1 -1
  109. package/dist/mcp/errors.js +13 -0
  110. package/dist/mcp/manager.cjs +46 -4
  111. package/dist/mcp/manager.d.ts +10 -2
  112. package/dist/mcp/manager.d.ts.map +1 -1
  113. package/dist/mcp/manager.js +46 -4
  114. package/dist/mcp/mcp-client.cjs +89 -5
  115. package/dist/mcp/mcp-client.d.ts +5 -1
  116. package/dist/mcp/mcp-client.d.ts.map +1 -1
  117. package/dist/mcp/mcp-client.js +89 -5
  118. package/dist/mcp/schemas.cjs +6 -1
  119. package/dist/mcp/schemas.d.ts +1 -1
  120. package/dist/mcp/schemas.d.ts.map +1 -1
  121. package/dist/mcp/schemas.js +6 -1
  122. package/dist/mcp/types.d.ts +5 -0
  123. package/dist/mcp/types.d.ts.map +1 -1
  124. package/dist/prompts/index.d.ts +1 -1
  125. package/dist/prompts/index.d.ts.map +1 -1
  126. package/dist/prompts/prompt-manager.cjs +90 -4
  127. package/dist/prompts/prompt-manager.d.ts +16 -6
  128. package/dist/prompts/prompt-manager.d.ts.map +1 -1
  129. package/dist/prompts/prompt-manager.js +90 -4
  130. package/dist/prompts/providers/config-prompt-provider.cjs +104 -10
  131. package/dist/prompts/providers/config-prompt-provider.d.ts.map +1 -1
  132. package/dist/prompts/providers/config-prompt-provider.js +105 -11
  133. package/dist/prompts/providers/custom-prompt-provider.cjs +1 -0
  134. package/dist/prompts/providers/custom-prompt-provider.d.ts.map +1 -1
  135. package/dist/prompts/providers/custom-prompt-provider.js +1 -0
  136. package/dist/prompts/providers/mcp-prompt-provider.cjs +1 -0
  137. package/dist/prompts/providers/mcp-prompt-provider.d.ts.map +1 -1
  138. package/dist/prompts/providers/mcp-prompt-provider.js +1 -0
  139. package/dist/prompts/schemas.cjs +28 -2
  140. package/dist/prompts/schemas.d.ts +130 -0
  141. package/dist/prompts/schemas.d.ts.map +1 -1
  142. package/dist/prompts/schemas.js +28 -2
  143. package/dist/prompts/types.d.ts +55 -3
  144. package/dist/prompts/types.d.ts.map +1 -1
  145. package/dist/resources/handlers/filesystem-handler.cjs +25 -0
  146. package/dist/resources/handlers/filesystem-handler.d.ts +1 -0
  147. package/dist/resources/handlers/filesystem-handler.d.ts.map +1 -1
  148. package/dist/resources/handlers/filesystem-handler.js +25 -0
  149. package/dist/session/chat-session.cjs +1 -1
  150. package/dist/session/chat-session.d.ts +1 -1
  151. package/dist/session/chat-session.d.ts.map +1 -1
  152. package/dist/session/chat-session.js +1 -1
  153. package/dist/session/index.d.ts +1 -1
  154. package/dist/session/index.d.ts.map +1 -1
  155. package/dist/session/message-queue.cjs +29 -5
  156. package/dist/session/message-queue.d.ts +3 -1
  157. package/dist/session/message-queue.d.ts.map +1 -1
  158. package/dist/session/message-queue.js +29 -5
  159. package/dist/session/session-manager.cjs +84 -3
  160. package/dist/session/session-manager.d.ts +12 -0
  161. package/dist/session/session-manager.d.ts.map +1 -1
  162. package/dist/session/session-manager.js +74 -3
  163. package/dist/session/types.d.ts +1 -0
  164. package/dist/session/types.d.ts.map +1 -1
  165. package/dist/systemPrompt/contributors.cjs +42 -0
  166. package/dist/systemPrompt/contributors.d.ts +13 -0
  167. package/dist/systemPrompt/contributors.d.ts.map +1 -1
  168. package/dist/systemPrompt/contributors.js +41 -0
  169. package/dist/tools/errors.cjs +7 -3
  170. package/dist/tools/errors.d.ts +5 -1
  171. package/dist/tools/errors.d.ts.map +1 -1
  172. package/dist/tools/errors.js +7 -3
  173. package/dist/tools/internal-tools/constants.cjs +2 -1
  174. package/dist/tools/internal-tools/constants.d.ts +1 -1
  175. package/dist/tools/internal-tools/constants.d.ts.map +1 -1
  176. package/dist/tools/internal-tools/constants.js +2 -1
  177. package/dist/tools/internal-tools/implementations/invoke-skill-tool.cjs +140 -0
  178. package/dist/tools/internal-tools/implementations/invoke-skill-tool.d.ts +24 -0
  179. package/dist/tools/internal-tools/implementations/invoke-skill-tool.d.ts.map +1 -0
  180. package/dist/tools/internal-tools/implementations/invoke-skill-tool.js +117 -0
  181. package/dist/tools/internal-tools/provider.cjs +15 -0
  182. package/dist/tools/internal-tools/provider.d.ts +15 -1
  183. package/dist/tools/internal-tools/provider.d.ts.map +1 -1
  184. package/dist/tools/internal-tools/provider.js +15 -0
  185. package/dist/tools/internal-tools/registry.cjs +6 -0
  186. package/dist/tools/internal-tools/registry.d.ts +35 -1
  187. package/dist/tools/internal-tools/registry.d.ts.map +1 -1
  188. package/dist/tools/internal-tools/registry.js +6 -0
  189. package/dist/tools/schemas.d.ts +1 -1
  190. package/dist/tools/schemas.d.ts.map +1 -1
  191. package/dist/tools/tool-call-metadata.cjs +75 -0
  192. package/dist/tools/tool-call-metadata.d.ts +16 -0
  193. package/dist/tools/tool-call-metadata.d.ts.map +1 -0
  194. package/dist/tools/tool-call-metadata.js +51 -0
  195. package/dist/tools/tool-manager.cjs +481 -103
  196. package/dist/tools/tool-manager.d.ts +131 -9
  197. package/dist/tools/tool-manager.d.ts.map +1 -1
  198. package/dist/tools/tool-manager.js +482 -104
  199. package/dist/utils/api-key-resolver.cjs +5 -2
  200. package/dist/utils/api-key-resolver.d.ts.map +1 -1
  201. package/dist/utils/api-key-resolver.js +5 -2
  202. package/dist/utils/env.cjs +49 -0
  203. package/dist/utils/env.d.ts +4 -0
  204. package/dist/utils/env.d.ts.map +1 -0
  205. package/dist/utils/env.js +24 -0
  206. package/dist/utils/index.cjs +3 -1
  207. package/dist/utils/index.d.ts +1 -0
  208. package/dist/utils/index.d.ts.map +1 -1
  209. package/dist/utils/index.js +1 -0
  210. package/dist/utils/service-initializer.cjs +25 -7
  211. package/dist/utils/service-initializer.d.ts +24 -1
  212. package/dist/utils/service-initializer.d.ts.map +1 -1
  213. package/dist/utils/service-initializer.js +25 -7
  214. package/package.json +6 -2
  215. package/dist/llm/registry.cjs +0 -1631
  216. package/dist/llm/registry.d.ts.map +0 -1
  217. package/dist/llm/registry.js +0 -1586
@@ -1,1631 +0,0 @@
1
- "use strict";
2
- var __defProp = Object.defineProperty;
3
- var __getOwnPropDesc = Object.getOwnPropertyDescriptor;
4
- var __getOwnPropNames = Object.getOwnPropertyNames;
5
- var __hasOwnProp = Object.prototype.hasOwnProperty;
6
- var __export = (target, all) => {
7
- for (var name in all)
8
- __defProp(target, name, { get: all[name], enumerable: true });
9
- };
10
- var __copyProps = (to, from, except, desc) => {
11
- if (from && typeof from === "object" || typeof from === "function") {
12
- for (let key of __getOwnPropNames(from))
13
- if (!__hasOwnProp.call(to, key) && key !== except)
14
- __defProp(to, key, { get: () => from[key], enumerable: !(desc = __getOwnPropDesc(from, key)) || desc.enumerable });
15
- }
16
- return to;
17
- };
18
- var __toCommonJS = (mod) => __copyProps(__defProp({}, "__esModule", { value: true }), mod);
19
- var registry_exports = {};
20
- __export(registry_exports, {
21
- DEFAULT_MAX_INPUT_TOKENS: () => DEFAULT_MAX_INPUT_TOKENS,
22
- LLM_REGISTRY: () => LLM_REGISTRY,
23
- MIME_TYPE_TO_FILE_TYPE: () => MIME_TYPE_TO_FILE_TYPE,
24
- acceptsAnyModel: () => acceptsAnyModel,
25
- calculateCost: () => calculateCost,
26
- getAllSupportedModels: () => getAllSupportedModels,
27
- getAllowedMimeTypes: () => getAllowedMimeTypes,
28
- getDefaultModelForProvider: () => getDefaultModelForProvider,
29
- getEffectiveMaxInputTokens: () => getEffectiveMaxInputTokens,
30
- getMaxInputTokensForModel: () => getMaxInputTokensForModel,
31
- getModelDisplayName: () => getModelDisplayName,
32
- getModelPricing: () => getModelPricing,
33
- getProviderFromModel: () => getProviderFromModel,
34
- getSupportedFileTypesForModel: () => getSupportedFileTypesForModel,
35
- getSupportedModels: () => getSupportedModels,
36
- getSupportedProviders: () => getSupportedProviders,
37
- isReasoningCapableModel: () => isReasoningCapableModel,
38
- isValidProviderModel: () => isValidProviderModel,
39
- modelSupportsFileType: () => modelSupportsFileType,
40
- requiresApiKey: () => requiresApiKey,
41
- requiresBaseURL: () => requiresBaseURL,
42
- stripBedrockRegionPrefix: () => stripBedrockRegionPrefix,
43
- supportsBaseURL: () => supportsBaseURL,
44
- supportsCustomModels: () => supportsCustomModels,
45
- validateModelFileSupport: () => validateModelFileSupport
46
- });
47
- module.exports = __toCommonJS(registry_exports);
48
- var import_errors = require("./errors.js");
49
- var import_error_codes = require("./error-codes.js");
50
- var import_DextoRuntimeError = require("../errors/DextoRuntimeError.js");
51
- var import_types = require("./types.js");
52
- var import_openrouter_model_registry = require("./providers/openrouter-model-registry.js");
53
- const MIME_TYPE_TO_FILE_TYPE = {
54
- "application/pdf": "pdf",
55
- "audio/mp3": "audio",
56
- "audio/mpeg": "audio",
57
- "audio/wav": "audio",
58
- "audio/x-wav": "audio",
59
- "audio/wave": "audio",
60
- "audio/webm": "audio",
61
- "audio/ogg": "audio",
62
- "audio/m4a": "audio",
63
- "audio/aac": "audio",
64
- // Common image MIME types
65
- "image/jpeg": "image",
66
- "image/jpg": "image",
67
- "image/png": "image",
68
- "image/webp": "image",
69
- "image/gif": "image"
70
- };
71
- function getAllowedMimeTypes() {
72
- return Object.keys(MIME_TYPE_TO_FILE_TYPE);
73
- }
74
- const DEFAULT_MAX_INPUT_TOKENS = 128e3;
75
- const LLM_REGISTRY = {
76
- openai: {
77
- models: [
78
- // GPT-5.2 series (latest, released Dec 2025)
79
- {
80
- name: "gpt-5.2-chat-latest",
81
- displayName: "GPT-5.2 Instant",
82
- maxInputTokens: 4e5,
83
- supportedFileTypes: ["pdf", "image"],
84
- pricing: {
85
- inputPerM: 1.75,
86
- outputPerM: 14,
87
- cacheReadPerM: 0.175,
88
- currency: "USD",
89
- unit: "per_million_tokens"
90
- }
91
- },
92
- {
93
- name: "gpt-5.2",
94
- displayName: "GPT-5.2 Thinking",
95
- maxInputTokens: 4e5,
96
- supportedFileTypes: ["pdf", "image"],
97
- pricing: {
98
- inputPerM: 1.75,
99
- outputPerM: 14,
100
- cacheReadPerM: 0.175,
101
- currency: "USD",
102
- unit: "per_million_tokens"
103
- }
104
- },
105
- {
106
- name: "gpt-5.2-pro",
107
- displayName: "GPT-5.2 Pro",
108
- maxInputTokens: 4e5,
109
- supportedFileTypes: ["pdf", "image"],
110
- pricing: {
111
- inputPerM: 21,
112
- outputPerM: 168,
113
- cacheReadPerM: 2.1,
114
- currency: "USD",
115
- unit: "per_million_tokens"
116
- }
117
- },
118
- {
119
- name: "gpt-5.2-codex",
120
- displayName: "GPT-5.2 Codex",
121
- maxInputTokens: 4e5,
122
- supportedFileTypes: ["pdf", "image"],
123
- pricing: {
124
- inputPerM: 1.75,
125
- outputPerM: 14,
126
- cacheReadPerM: 0.175,
127
- currency: "USD",
128
- unit: "per_million_tokens"
129
- }
130
- },
131
- // GPT-5.1 series
132
- {
133
- name: "gpt-5.1-chat-latest",
134
- displayName: "GPT-5.1 Instant",
135
- maxInputTokens: 4e5,
136
- supportedFileTypes: ["pdf", "image"],
137
- pricing: {
138
- inputPerM: 1.25,
139
- outputPerM: 10,
140
- cacheReadPerM: 0.125,
141
- currency: "USD",
142
- unit: "per_million_tokens"
143
- }
144
- },
145
- {
146
- name: "gpt-5.1",
147
- displayName: "GPT-5.1 Thinking",
148
- maxInputTokens: 4e5,
149
- supportedFileTypes: ["pdf", "image"],
150
- pricing: {
151
- inputPerM: 1.25,
152
- outputPerM: 10,
153
- cacheReadPerM: 0.125,
154
- currency: "USD",
155
- unit: "per_million_tokens"
156
- }
157
- },
158
- {
159
- name: "gpt-5.1-codex",
160
- displayName: "GPT-5.1 Codex",
161
- maxInputTokens: 4e5,
162
- supportedFileTypes: ["pdf", "image"],
163
- pricing: {
164
- inputPerM: 1.25,
165
- outputPerM: 10,
166
- cacheReadPerM: 0.125,
167
- currency: "USD",
168
- unit: "per_million_tokens"
169
- }
170
- },
171
- {
172
- name: "gpt-5.1-codex-mini",
173
- displayName: "GPT-5.1 Codex Mini",
174
- maxInputTokens: 4e5,
175
- supportedFileTypes: ["pdf", "image"],
176
- pricing: {
177
- inputPerM: 0.25,
178
- outputPerM: 2,
179
- cacheReadPerM: 0.025,
180
- currency: "USD",
181
- unit: "per_million_tokens"
182
- }
183
- },
184
- // {
185
- // name: 'gpt-5.1-codex-max',
186
- // displayName: 'GPT-5.1 Codex Max',
187
- // maxInputTokens: 400000,
188
- // supportedFileTypes: ['pdf', 'image'],
189
- // pricing: {
190
- // inputPerM: 1.25,
191
- // outputPerM: 10.0,
192
- // cacheReadPerM: 0.125,
193
- // currency: 'USD',
194
- // unit: 'per_million_tokens',
195
- // },
196
- // },
197
- {
198
- name: "gpt-5-pro",
199
- displayName: "GPT-5 Pro",
200
- maxInputTokens: 4e5,
201
- supportedFileTypes: ["pdf", "image"],
202
- pricing: {
203
- inputPerM: 15,
204
- outputPerM: 120,
205
- cacheReadPerM: 1.5,
206
- currency: "USD",
207
- unit: "per_million_tokens"
208
- }
209
- },
210
- {
211
- name: "gpt-5",
212
- displayName: "GPT-5",
213
- maxInputTokens: 4e5,
214
- supportedFileTypes: ["pdf", "image"],
215
- pricing: {
216
- inputPerM: 1.25,
217
- outputPerM: 10,
218
- cacheReadPerM: 0.125,
219
- currency: "USD",
220
- unit: "per_million_tokens"
221
- }
222
- },
223
- {
224
- name: "gpt-5-mini",
225
- displayName: "GPT-5 Mini",
226
- maxInputTokens: 4e5,
227
- default: true,
228
- supportedFileTypes: ["pdf", "image"],
229
- pricing: {
230
- inputPerM: 0.25,
231
- outputPerM: 2,
232
- cacheReadPerM: 0.025,
233
- currency: "USD",
234
- unit: "per_million_tokens"
235
- }
236
- },
237
- {
238
- name: "gpt-5-nano",
239
- displayName: "GPT-5 Nano",
240
- maxInputTokens: 4e5,
241
- supportedFileTypes: ["pdf", "image"],
242
- pricing: {
243
- inputPerM: 0.05,
244
- outputPerM: 0.4,
245
- cacheReadPerM: 5e-3,
246
- currency: "USD",
247
- unit: "per_million_tokens"
248
- }
249
- },
250
- {
251
- name: "gpt-5-codex",
252
- displayName: "GPT-5 Codex",
253
- maxInputTokens: 4e5,
254
- supportedFileTypes: ["pdf", "image"],
255
- pricing: {
256
- inputPerM: 1.25,
257
- outputPerM: 10,
258
- cacheReadPerM: 0.125,
259
- currency: "USD",
260
- unit: "per_million_tokens"
261
- }
262
- },
263
- {
264
- name: "gpt-4.1",
265
- displayName: "GPT-4.1",
266
- maxInputTokens: 1048576,
267
- supportedFileTypes: ["pdf", "image"],
268
- pricing: {
269
- inputPerM: 2,
270
- outputPerM: 8,
271
- cacheReadPerM: 0.5,
272
- currency: "USD",
273
- unit: "per_million_tokens"
274
- }
275
- },
276
- {
277
- name: "gpt-4.1-mini",
278
- displayName: "GPT-4.1 Mini",
279
- maxInputTokens: 1048576,
280
- supportedFileTypes: ["pdf", "image"],
281
- pricing: {
282
- inputPerM: 0.4,
283
- outputPerM: 1.6,
284
- cacheReadPerM: 0.1,
285
- currency: "USD",
286
- unit: "per_million_tokens"
287
- }
288
- },
289
- {
290
- name: "gpt-4.1-nano",
291
- displayName: "GPT-4.1 Nano",
292
- maxInputTokens: 1048576,
293
- supportedFileTypes: ["pdf", "image"],
294
- pricing: {
295
- inputPerM: 0.1,
296
- outputPerM: 0.4,
297
- cacheReadPerM: 0.025,
298
- currency: "USD",
299
- unit: "per_million_tokens"
300
- }
301
- },
302
- {
303
- name: "gpt-4o",
304
- displayName: "GPT-4o",
305
- maxInputTokens: 128e3,
306
- supportedFileTypes: ["pdf", "image"],
307
- pricing: {
308
- inputPerM: 2.5,
309
- outputPerM: 10,
310
- cacheReadPerM: 1.25,
311
- currency: "USD",
312
- unit: "per_million_tokens"
313
- }
314
- },
315
- {
316
- name: "gpt-4o-mini",
317
- displayName: "GPT-4o Mini",
318
- maxInputTokens: 128e3,
319
- supportedFileTypes: ["pdf", "image"],
320
- pricing: {
321
- inputPerM: 0.15,
322
- outputPerM: 0.6,
323
- cacheReadPerM: 0.075,
324
- currency: "USD",
325
- unit: "per_million_tokens"
326
- }
327
- },
328
- {
329
- name: "gpt-4o-audio-preview",
330
- displayName: "GPT-4o Audio Preview",
331
- maxInputTokens: 128e3,
332
- supportedFileTypes: ["audio"],
333
- pricing: {
334
- inputPerM: 2.5,
335
- outputPerM: 10,
336
- cacheReadPerM: 1.25,
337
- currency: "USD",
338
- unit: "per_million_tokens"
339
- }
340
- },
341
- {
342
- name: "o4-mini",
343
- displayName: "O4 Mini",
344
- maxInputTokens: 2e5,
345
- supportedFileTypes: ["pdf", "image"],
346
- pricing: {
347
- inputPerM: 1.1,
348
- outputPerM: 4.4,
349
- cacheReadPerM: 0.275,
350
- currency: "USD",
351
- unit: "per_million_tokens"
352
- }
353
- },
354
- {
355
- name: "o3",
356
- displayName: "O3",
357
- maxInputTokens: 2e5,
358
- supportedFileTypes: ["pdf", "image"],
359
- pricing: {
360
- inputPerM: 2,
361
- outputPerM: 8,
362
- cacheReadPerM: 0.5,
363
- currency: "USD",
364
- unit: "per_million_tokens"
365
- }
366
- },
367
- {
368
- name: "o3-mini",
369
- displayName: "O3 Mini",
370
- maxInputTokens: 2e5,
371
- supportedFileTypes: [],
372
- pricing: {
373
- inputPerM: 1.1,
374
- outputPerM: 4.4,
375
- cacheReadPerM: 0.55,
376
- currency: "USD",
377
- unit: "per_million_tokens"
378
- }
379
- },
380
- {
381
- name: "o1",
382
- displayName: "O1",
383
- maxInputTokens: 2e5,
384
- supportedFileTypes: ["pdf", "image"],
385
- pricing: {
386
- inputPerM: 15,
387
- outputPerM: 60,
388
- cacheReadPerM: 7.5,
389
- currency: "USD",
390
- unit: "per_million_tokens"
391
- }
392
- }
393
- ],
394
- baseURLSupport: "none",
395
- supportedFileTypes: []
396
- // No defaults - models must explicitly specify support
397
- },
398
- "openai-compatible": {
399
- models: [],
400
- // Empty - accepts any model name for custom endpoints
401
- baseURLSupport: "required",
402
- supportedFileTypes: ["pdf", "image", "audio"],
403
- // Allow all types for custom endpoints - user assumes responsibility for model capabilities
404
- supportsCustomModels: true
405
- },
406
- anthropic: {
407
- models: [
408
- {
409
- name: "claude-haiku-4-5-20251001",
410
- displayName: "Claude 4.5 Haiku",
411
- maxInputTokens: 2e5,
412
- default: true,
413
- supportedFileTypes: ["pdf", "image"],
414
- pricing: {
415
- inputPerM: 1,
416
- outputPerM: 5,
417
- cacheWritePerM: 1.25,
418
- cacheReadPerM: 0.1,
419
- currency: "USD",
420
- unit: "per_million_tokens"
421
- }
422
- },
423
- {
424
- name: "claude-sonnet-4-5-20250929",
425
- displayName: "Claude 4.5 Sonnet",
426
- maxInputTokens: 2e5,
427
- supportedFileTypes: ["pdf", "image"],
428
- pricing: {
429
- inputPerM: 3,
430
- outputPerM: 15,
431
- cacheWritePerM: 3.75,
432
- cacheReadPerM: 0.3,
433
- currency: "USD",
434
- unit: "per_million_tokens"
435
- }
436
- },
437
- {
438
- name: "claude-opus-4-5-20251101",
439
- displayName: "Claude 4.5 Opus",
440
- maxInputTokens: 2e5,
441
- supportedFileTypes: ["pdf", "image"],
442
- pricing: {
443
- inputPerM: 5,
444
- outputPerM: 25,
445
- cacheWritePerM: 6.25,
446
- cacheReadPerM: 0.5,
447
- currency: "USD",
448
- unit: "per_million_tokens"
449
- }
450
- },
451
- {
452
- name: "claude-opus-4-1-20250805",
453
- displayName: "Claude 4.1 Opus",
454
- maxInputTokens: 2e5,
455
- supportedFileTypes: ["pdf", "image"],
456
- pricing: {
457
- inputPerM: 15,
458
- outputPerM: 75,
459
- cacheWritePerM: 18.75,
460
- cacheReadPerM: 1.5,
461
- currency: "USD",
462
- unit: "per_million_tokens"
463
- }
464
- },
465
- {
466
- name: "claude-4-opus-20250514",
467
- displayName: "Claude 4 Opus",
468
- maxInputTokens: 2e5,
469
- supportedFileTypes: ["pdf", "image"],
470
- pricing: {
471
- inputPerM: 15,
472
- outputPerM: 75,
473
- cacheWritePerM: 18.75,
474
- cacheReadPerM: 1.5,
475
- currency: "USD",
476
- unit: "per_million_tokens"
477
- }
478
- },
479
- {
480
- name: "claude-4-sonnet-20250514",
481
- displayName: "Claude 4 Sonnet",
482
- maxInputTokens: 2e5,
483
- supportedFileTypes: ["pdf", "image"],
484
- pricing: {
485
- inputPerM: 3,
486
- outputPerM: 15,
487
- cacheWritePerM: 3.75,
488
- cacheReadPerM: 0.3,
489
- currency: "USD",
490
- unit: "per_million_tokens"
491
- }
492
- },
493
- {
494
- name: "claude-3-7-sonnet-20250219",
495
- displayName: "Claude 3.7 Sonnet",
496
- maxInputTokens: 2e5,
497
- supportedFileTypes: ["pdf", "image"],
498
- pricing: {
499
- inputPerM: 3,
500
- outputPerM: 15,
501
- cacheWritePerM: 3.75,
502
- cacheReadPerM: 0.3,
503
- currency: "USD",
504
- unit: "per_million_tokens"
505
- }
506
- },
507
- {
508
- name: "claude-3-5-sonnet-20240620",
509
- displayName: "Claude 3.5 Sonnet",
510
- maxInputTokens: 2e5,
511
- supportedFileTypes: ["pdf", "image"],
512
- pricing: {
513
- inputPerM: 3,
514
- outputPerM: 15,
515
- cacheWritePerM: 3.75,
516
- cacheReadPerM: 0.3,
517
- currency: "USD",
518
- unit: "per_million_tokens"
519
- }
520
- },
521
- {
522
- name: "claude-3-5-haiku-20241022",
523
- displayName: "Claude 3.5 Haiku",
524
- maxInputTokens: 2e5,
525
- supportedFileTypes: ["pdf", "image"],
526
- pricing: {
527
- inputPerM: 0.8,
528
- outputPerM: 4,
529
- cacheWritePerM: 1,
530
- cacheReadPerM: 0.08,
531
- currency: "USD",
532
- unit: "per_million_tokens"
533
- }
534
- }
535
- ],
536
- baseURLSupport: "none",
537
- supportedFileTypes: []
538
- // No defaults - models must explicitly specify support
539
- },
540
- google: {
541
- models: [
542
- {
543
- name: "gemini-3-flash-preview",
544
- displayName: "Gemini 3 Flash Preview",
545
- maxInputTokens: 1048576,
546
- default: true,
547
- supportedFileTypes: ["pdf", "image", "audio"],
548
- pricing: {
549
- inputPerM: 0.5,
550
- outputPerM: 3,
551
- cacheReadPerM: 0.05,
552
- currency: "USD",
553
- unit: "per_million_tokens"
554
- }
555
- },
556
- {
557
- name: "gemini-3-pro-preview",
558
- displayName: "Gemini 3 Pro Preview",
559
- maxInputTokens: 1048576,
560
- supportedFileTypes: ["pdf", "image", "audio"],
561
- pricing: {
562
- inputPerM: 2,
563
- outputPerM: 12,
564
- cacheReadPerM: 0.2,
565
- currency: "USD",
566
- unit: "per_million_tokens"
567
- }
568
- },
569
- {
570
- name: "gemini-3-pro-image-preview",
571
- displayName: "Gemini 3 Pro Image Preview",
572
- maxInputTokens: 1048576,
573
- supportedFileTypes: ["image"],
574
- pricing: {
575
- inputPerM: 2,
576
- outputPerM: 120,
577
- cacheReadPerM: 0.2,
578
- currency: "USD",
579
- unit: "per_million_tokens"
580
- }
581
- },
582
- {
583
- name: "gemini-2.5-pro",
584
- displayName: "Gemini 2.5 Pro",
585
- maxInputTokens: 1048576,
586
- supportedFileTypes: ["pdf", "image", "audio"],
587
- pricing: {
588
- inputPerM: 1.25,
589
- outputPerM: 10,
590
- cacheReadPerM: 0.31,
591
- currency: "USD",
592
- unit: "per_million_tokens"
593
- }
594
- },
595
- {
596
- name: "gemini-2.5-flash",
597
- displayName: "Gemini 2.5 Flash",
598
- maxInputTokens: 1048576,
599
- supportedFileTypes: ["pdf", "image", "audio"],
600
- pricing: {
601
- inputPerM: 0.3,
602
- outputPerM: 2.5,
603
- cacheReadPerM: 0.03,
604
- currency: "USD",
605
- unit: "per_million_tokens"
606
- }
607
- },
608
- {
609
- name: "gemini-2.5-flash-lite",
610
- displayName: "Gemini 2.5 Flash Lite",
611
- maxInputTokens: 1048576,
612
- supportedFileTypes: ["pdf", "image", "audio"],
613
- pricing: {
614
- inputPerM: 0.1,
615
- outputPerM: 0.4,
616
- cacheReadPerM: 0.025,
617
- currency: "USD",
618
- unit: "per_million_tokens"
619
- }
620
- },
621
- {
622
- name: "gemini-2.0-flash",
623
- displayName: "Gemini 2.0 Flash",
624
- maxInputTokens: 1048576,
625
- supportedFileTypes: ["pdf", "image", "audio"],
626
- pricing: {
627
- inputPerM: 0.15,
628
- outputPerM: 0.6,
629
- cacheReadPerM: 0.025,
630
- cacheWritePerM: 1,
631
- currency: "USD",
632
- unit: "per_million_tokens"
633
- }
634
- },
635
- {
636
- name: "gemini-2.0-flash-lite",
637
- displayName: "Gemini 2.0 Flash Lite",
638
- maxInputTokens: 1048576,
639
- supportedFileTypes: ["pdf", "image", "audio"],
640
- pricing: {
641
- inputPerM: 0.075,
642
- outputPerM: 0.3,
643
- cacheReadPerM: 0.01875,
644
- currency: "USD",
645
- unit: "per_million_tokens"
646
- }
647
- }
648
- ],
649
- baseURLSupport: "none",
650
- supportedFileTypes: []
651
- // No defaults - models must explicitly specify support
652
- },
653
- // https://console.groq.com/docs/models
654
- groq: {
655
- models: [
656
- {
657
- name: "gemma-2-9b-it",
658
- displayName: "Gemma 2 9B Instruct",
659
- maxInputTokens: 8192,
660
- supportedFileTypes: [],
661
- pricing: {
662
- inputPerM: 0.2,
663
- outputPerM: 0.2,
664
- currency: "USD",
665
- unit: "per_million_tokens"
666
- }
667
- },
668
- {
669
- name: "openai/gpt-oss-20b",
670
- displayName: "GPT OSS 20B 128k",
671
- maxInputTokens: 128e3,
672
- supportedFileTypes: [],
673
- pricing: {
674
- inputPerM: 0.1,
675
- outputPerM: 0.5,
676
- currency: "USD",
677
- unit: "per_million_tokens"
678
- }
679
- },
680
- {
681
- name: "openai/gpt-oss-120b",
682
- displayName: "GPT OSS 120B 128k",
683
- maxInputTokens: 128e3,
684
- supportedFileTypes: [],
685
- pricing: {
686
- inputPerM: 0.15,
687
- outputPerM: 0.75,
688
- currency: "USD",
689
- unit: "per_million_tokens"
690
- }
691
- },
692
- {
693
- name: "moonshotai/kimi-k2-instruct",
694
- displayName: "Kimi K2 1T 128k",
695
- maxInputTokens: 128e3,
696
- supportedFileTypes: [],
697
- pricing: {
698
- inputPerM: 1,
699
- outputPerM: 3,
700
- cacheReadPerM: 0.5,
701
- currency: "USD",
702
- unit: "per_million_tokens"
703
- }
704
- },
705
- {
706
- name: "meta-llama/llama-4-scout-17b-16e-instruct",
707
- displayName: "Llama 4 Scout (17Bx16E) 128k",
708
- maxInputTokens: 128e3,
709
- supportedFileTypes: [],
710
- pricing: {
711
- inputPerM: 0.11,
712
- outputPerM: 0.34,
713
- currency: "USD",
714
- unit: "per_million_tokens"
715
- }
716
- },
717
- {
718
- name: "meta-llama/llama-4-maverick-17b-128e-instruct",
719
- displayName: "Llama 4 Maverick (17Bx128E) 128k",
720
- maxInputTokens: 128e3,
721
- supportedFileTypes: [],
722
- pricing: {
723
- inputPerM: 0.2,
724
- outputPerM: 0.6,
725
- currency: "USD",
726
- unit: "per_million_tokens"
727
- }
728
- },
729
- {
730
- name: "deepseek-r1-distill-llama-70b",
731
- displayName: "DeepSeek R1 Distill Llama 70B 128k",
732
- maxInputTokens: 128e3,
733
- supportedFileTypes: [],
734
- pricing: {
735
- inputPerM: 0.75,
736
- outputPerM: 0.9,
737
- currency: "USD",
738
- unit: "per_million_tokens"
739
- }
740
- },
741
- {
742
- name: "qwen/qwen3-32b",
743
- displayName: "Qwen3 32B 131k",
744
- maxInputTokens: 131e3,
745
- supportedFileTypes: [],
746
- pricing: {
747
- inputPerM: 0.29,
748
- outputPerM: 0.59,
749
- currency: "USD",
750
- unit: "per_million_tokens"
751
- }
752
- },
753
- {
754
- name: "llama-3.3-70b-versatile",
755
- displayName: "Llama 3.3 70B Versatile",
756
- maxInputTokens: 128e3,
757
- default: true,
758
- supportedFileTypes: [],
759
- pricing: {
760
- inputPerM: 0.59,
761
- outputPerM: 0.79,
762
- currency: "USD",
763
- unit: "per_million_tokens"
764
- }
765
- }
766
- ],
767
- baseURLSupport: "none",
768
- supportedFileTypes: []
769
- // Groq currently doesn't support file uploads
770
- },
771
- // https://docs.x.ai/docs/models
772
- // Note: XAI API only supports image uploads (JPG/PNG up to 20MB), not PDFs
773
- xai: {
774
- models: [
775
- {
776
- name: "grok-4",
777
- displayName: "Grok 4",
778
- maxInputTokens: 256e3,
779
- default: true,
780
- supportedFileTypes: ["image"],
781
- pricing: {
782
- inputPerM: 3,
783
- outputPerM: 15,
784
- cacheReadPerM: 0.75,
785
- currency: "USD",
786
- unit: "per_million_tokens"
787
- }
788
- },
789
- {
790
- name: "grok-3",
791
- displayName: "Grok 3",
792
- maxInputTokens: 131072,
793
- supportedFileTypes: ["image"],
794
- pricing: {
795
- inputPerM: 3,
796
- outputPerM: 15,
797
- cacheReadPerM: 0.75,
798
- currency: "USD",
799
- unit: "per_million_tokens"
800
- }
801
- },
802
- {
803
- name: "grok-3-mini",
804
- displayName: "Grok 3 Mini",
805
- maxInputTokens: 131072,
806
- supportedFileTypes: ["image"],
807
- pricing: {
808
- inputPerM: 0.3,
809
- outputPerM: 0.5,
810
- cacheReadPerM: 0.075,
811
- currency: "USD",
812
- unit: "per_million_tokens"
813
- }
814
- },
815
- {
816
- name: "grok-code-fast-1",
817
- displayName: "Grok Code Fast",
818
- maxInputTokens: 131072,
819
- supportedFileTypes: [],
820
- pricing: {
821
- inputPerM: 0.2,
822
- outputPerM: 1.5,
823
- cacheReadPerM: 0.02,
824
- currency: "USD",
825
- unit: "per_million_tokens"
826
- }
827
- }
828
- ],
829
- baseURLSupport: "none",
830
- supportedFileTypes: []
831
- // XAI currently doesn't support file uploads
832
- },
833
- // https://docs.cohere.com/reference/models
834
- cohere: {
835
- models: [
836
- {
837
- name: "command-a-03-2025",
838
- displayName: "Command A (03-2025)",
839
- maxInputTokens: 256e3,
840
- default: true,
841
- supportedFileTypes: [],
842
- pricing: {
843
- inputPerM: 2.5,
844
- outputPerM: 10,
845
- currency: "USD",
846
- unit: "per_million_tokens"
847
- }
848
- },
849
- {
850
- name: "command-r-plus",
851
- displayName: "Command R+",
852
- maxInputTokens: 128e3,
853
- supportedFileTypes: [],
854
- pricing: {
855
- inputPerM: 2.5,
856
- outputPerM: 10,
857
- currency: "USD",
858
- unit: "per_million_tokens"
859
- }
860
- },
861
- {
862
- name: "command-r",
863
- displayName: "Command R",
864
- maxInputTokens: 128e3,
865
- supportedFileTypes: [],
866
- pricing: {
867
- inputPerM: 0.15,
868
- outputPerM: 0.6,
869
- currency: "USD",
870
- unit: "per_million_tokens"
871
- }
872
- },
873
- {
874
- name: "command-r7b",
875
- displayName: "Command R7B",
876
- maxInputTokens: 128e3,
877
- supportedFileTypes: [],
878
- pricing: {
879
- inputPerM: 0.0375,
880
- outputPerM: 0.15,
881
- currency: "USD",
882
- unit: "per_million_tokens"
883
- }
884
- }
885
- ],
886
- baseURLSupport: "none",
887
- supportedFileTypes: []
888
- // Cohere currently doesn't support file uploads
889
- },
890
- // https://openrouter.ai/docs
891
- // OpenRouter is a unified API gateway providing access to 100+ models from various providers.
892
- // Model validation is handled dynamically via openrouter-model-registry.ts
893
- openrouter: {
894
- models: [],
895
- // Empty - accepts any model name (validated against OpenRouter's catalog)
896
- baseURLSupport: "none",
897
- // Fixed endpoint - baseURL auto-injected in resolver, no user override allowed
898
- supportedFileTypes: ["pdf", "image", "audio"],
899
- // Allow all types - user assumes responsibility for model capabilities
900
- supportsCustomModels: true
901
- },
902
- // https://docs.litellm.ai/
903
- // LiteLLM is an OpenAI-compatible proxy that unifies 100+ LLM providers.
904
- // User must host their own LiteLLM proxy and provide the baseURL.
905
- litellm: {
906
- models: [],
907
- // Empty - accepts any model name (user's proxy determines available models)
908
- baseURLSupport: "required",
909
- // User must provide their LiteLLM proxy URL
910
- supportedFileTypes: ["pdf", "image", "audio"],
911
- // Allow all types - user assumes responsibility for model capabilities
912
- supportsCustomModels: true
913
- },
914
- // https://glama.ai/
915
- // Glama is an OpenAI-compatible gateway providing unified access to multiple LLM providers.
916
- // Fixed endpoint: https://glama.ai/api/gateway/openai/v1
917
- glama: {
918
- models: [],
919
- // Empty - accepts any model name (format: provider/model e.g., openai/gpt-4o)
920
- baseURLSupport: "none",
921
- // Fixed endpoint - baseURL auto-injected
922
- supportedFileTypes: ["pdf", "image", "audio"],
923
- // Allow all types - user assumes responsibility for model capabilities
924
- supportsCustomModels: true
925
- },
926
- // https://cloud.google.com/vertex-ai
927
- // Google Vertex AI - GCP-hosted gateway for Gemini and Claude models
928
- // Supports both Google's Gemini models and Anthropic's Claude via partnership
929
- //
930
- // Setup instructions:
931
- // 1. Create a Google Cloud account and project
932
- // 2. Enable the Vertex AI API: gcloud services enable aiplatform.googleapis.com
933
- // 3. Enable desired Claude models (requires Anthropic Model Garden)
934
- // 4. Install Google Cloud CLI: https://cloud.google.com/sdk/docs/install
935
- // 5. Configure ADC: gcloud auth application-default login
936
- // 6. Set env vars: GOOGLE_VERTEX_PROJECT (required), GOOGLE_VERTEX_LOCATION (optional)
937
- //
938
- // TODO: Add dynamic model fetching via publishers.models.list API
939
- // - Requires: projectId, region, ADC auth
940
- // - Endpoints: GET projects/{project}/locations/{location}/publishers/{google,anthropic}/models
941
- // - Note: API doesn't return aliases (e.g., gemini-2.0-flash), only versioned IDs
942
- // - Docs: https://cloud.google.com/vertex-ai/docs/reference/rest/v1/projects.locations.models/list
943
- // - Models: https://cloud.google.com/vertex-ai/generative-ai/docs/models
944
- vertex: {
945
- models: [
946
- // Gemini 3 models on Vertex AI (Preview)
947
- {
948
- name: "gemini-3-flash-preview",
949
- displayName: "Gemini 3 Flash (Vertex)",
950
- maxInputTokens: 1048576,
951
- default: true,
952
- supportedFileTypes: ["pdf", "image", "audio"],
953
- pricing: {
954
- inputPerM: 0.5,
955
- outputPerM: 3,
956
- cacheReadPerM: 0.05,
957
- currency: "USD",
958
- unit: "per_million_tokens"
959
- }
960
- },
961
- {
962
- name: "gemini-3-pro-preview",
963
- displayName: "Gemini 3 Pro (Vertex)",
964
- maxInputTokens: 1048576,
965
- supportedFileTypes: ["pdf", "image", "audio"],
966
- pricing: {
967
- inputPerM: 2,
968
- outputPerM: 12,
969
- cacheReadPerM: 0.2,
970
- currency: "USD",
971
- unit: "per_million_tokens"
972
- }
973
- },
974
- // Gemini 2.x models on Vertex AI
975
- {
976
- name: "gemini-2.5-pro",
977
- displayName: "Gemini 2.5 Pro (Vertex)",
978
- maxInputTokens: 1048576,
979
- supportedFileTypes: ["pdf", "image", "audio"],
980
- pricing: {
981
- inputPerM: 1.25,
982
- outputPerM: 10,
983
- cacheReadPerM: 0.31,
984
- currency: "USD",
985
- unit: "per_million_tokens"
986
- }
987
- },
988
- {
989
- name: "gemini-2.5-flash",
990
- displayName: "Gemini 2.5 Flash (Vertex)",
991
- maxInputTokens: 1048576,
992
- supportedFileTypes: ["pdf", "image", "audio"],
993
- pricing: {
994
- inputPerM: 0.15,
995
- outputPerM: 0.6,
996
- cacheReadPerM: 0.0375,
997
- currency: "USD",
998
- unit: "per_million_tokens"
999
- }
1000
- },
1001
- {
1002
- name: "gemini-2.0-flash",
1003
- displayName: "Gemini 2.0 Flash (Vertex)",
1004
- maxInputTokens: 1048576,
1005
- supportedFileTypes: ["pdf", "image", "audio"],
1006
- pricing: {
1007
- inputPerM: 0.1,
1008
- outputPerM: 0.4,
1009
- cacheReadPerM: 0.025,
1010
- currency: "USD",
1011
- unit: "per_million_tokens"
1012
- }
1013
- },
1014
- // Claude 4.5 models on Vertex AI (via Anthropic partnership)
1015
- // Note: Claude model IDs use @ suffix format on Vertex
1016
- {
1017
- name: "claude-opus-4-5@20251101",
1018
- displayName: "Claude 4.5 Opus (Vertex)",
1019
- maxInputTokens: 2e5,
1020
- supportedFileTypes: ["pdf", "image"],
1021
- pricing: {
1022
- inputPerM: 5,
1023
- outputPerM: 25,
1024
- cacheWritePerM: 6.25,
1025
- cacheReadPerM: 0.5,
1026
- currency: "USD",
1027
- unit: "per_million_tokens"
1028
- }
1029
- },
1030
- {
1031
- name: "claude-sonnet-4-5@20250929",
1032
- displayName: "Claude 4.5 Sonnet (Vertex)",
1033
- maxInputTokens: 2e5,
1034
- supportedFileTypes: ["pdf", "image"],
1035
- pricing: {
1036
- inputPerM: 3,
1037
- outputPerM: 15,
1038
- cacheWritePerM: 3.75,
1039
- cacheReadPerM: 0.3,
1040
- currency: "USD",
1041
- unit: "per_million_tokens"
1042
- }
1043
- },
1044
- {
1045
- name: "claude-haiku-4-5@20251001",
1046
- displayName: "Claude 4.5 Haiku (Vertex)",
1047
- maxInputTokens: 2e5,
1048
- supportedFileTypes: ["pdf", "image"],
1049
- pricing: {
1050
- inputPerM: 1,
1051
- outputPerM: 5,
1052
- cacheWritePerM: 1.25,
1053
- cacheReadPerM: 0.1,
1054
- currency: "USD",
1055
- unit: "per_million_tokens"
1056
- }
1057
- },
1058
- // Claude 4.1 and 4.0 models on Vertex AI
1059
- {
1060
- name: "claude-opus-4-1@20250805",
1061
- displayName: "Claude 4.1 Opus (Vertex)",
1062
- maxInputTokens: 2e5,
1063
- supportedFileTypes: ["pdf", "image"],
1064
- pricing: {
1065
- inputPerM: 15,
1066
- outputPerM: 75,
1067
- cacheWritePerM: 18.75,
1068
- cacheReadPerM: 1.5,
1069
- currency: "USD",
1070
- unit: "per_million_tokens"
1071
- }
1072
- },
1073
- {
1074
- name: "claude-opus-4@20250514",
1075
- displayName: "Claude 4 Opus (Vertex)",
1076
- maxInputTokens: 2e5,
1077
- supportedFileTypes: ["pdf", "image"],
1078
- pricing: {
1079
- inputPerM: 15,
1080
- outputPerM: 75,
1081
- cacheWritePerM: 18.75,
1082
- cacheReadPerM: 1.5,
1083
- currency: "USD",
1084
- unit: "per_million_tokens"
1085
- }
1086
- },
1087
- {
1088
- name: "claude-sonnet-4@20250514",
1089
- displayName: "Claude 4 Sonnet (Vertex)",
1090
- maxInputTokens: 2e5,
1091
- supportedFileTypes: ["pdf", "image"],
1092
- pricing: {
1093
- inputPerM: 3,
1094
- outputPerM: 15,
1095
- cacheWritePerM: 3.75,
1096
- cacheReadPerM: 0.3,
1097
- currency: "USD",
1098
- unit: "per_million_tokens"
1099
- }
1100
- },
1101
- // Claude 3.x models on Vertex AI
1102
- {
1103
- name: "claude-3-7-sonnet@20250219",
1104
- displayName: "Claude 3.7 Sonnet (Vertex)",
1105
- maxInputTokens: 2e5,
1106
- supportedFileTypes: ["pdf", "image"],
1107
- pricing: {
1108
- inputPerM: 3,
1109
- outputPerM: 15,
1110
- cacheWritePerM: 3.75,
1111
- cacheReadPerM: 0.3,
1112
- currency: "USD",
1113
- unit: "per_million_tokens"
1114
- }
1115
- },
1116
- {
1117
- name: "claude-3-5-sonnet-v2@20241022",
1118
- displayName: "Claude 3.5 Sonnet v2 (Vertex)",
1119
- maxInputTokens: 2e5,
1120
- supportedFileTypes: ["pdf", "image"],
1121
- pricing: {
1122
- inputPerM: 3,
1123
- outputPerM: 15,
1124
- cacheWritePerM: 3.75,
1125
- cacheReadPerM: 0.3,
1126
- currency: "USD",
1127
- unit: "per_million_tokens"
1128
- }
1129
- },
1130
- {
1131
- name: "claude-3-5-haiku@20241022",
1132
- displayName: "Claude 3.5 Haiku (Vertex)",
1133
- maxInputTokens: 2e5,
1134
- supportedFileTypes: ["pdf", "image"],
1135
- pricing: {
1136
- inputPerM: 0.8,
1137
- outputPerM: 4,
1138
- cacheWritePerM: 1,
1139
- cacheReadPerM: 0.08,
1140
- currency: "USD",
1141
- unit: "per_million_tokens"
1142
- }
1143
- }
1144
- ],
1145
- baseURLSupport: "none",
1146
- // Auto-constructed from projectId and region
1147
- supportedFileTypes: ["pdf", "image", "audio"]
1148
- },
1149
- // Amazon Bedrock - AWS-hosted gateway for Claude, Nova, and more
1150
- // Auth: AWS credentials (env vars) or Bedrock API key (AWS_BEARER_TOKEN_BEDROCK)
1151
- //
1152
- // Cross-region inference: Auto-added for anthropic.* and amazon.* models
1153
- // supportsCustomModels: true allows users to add custom model IDs beyond the fixed list
1154
- bedrock: {
1155
- supportsCustomModels: true,
1156
- models: [
1157
- // Claude 4.5 models (latest)
1158
- {
1159
- name: "anthropic.claude-sonnet-4-5-20250929-v1:0",
1160
- displayName: "Claude 4.5 Sonnet",
1161
- maxInputTokens: 2e5,
1162
- default: true,
1163
- supportedFileTypes: ["pdf", "image"],
1164
- pricing: {
1165
- inputPerM: 3,
1166
- outputPerM: 15,
1167
- cacheWritePerM: 3.75,
1168
- cacheReadPerM: 0.3,
1169
- currency: "USD",
1170
- unit: "per_million_tokens"
1171
- }
1172
- },
1173
- {
1174
- name: "anthropic.claude-haiku-4-5-20251001-v1:0",
1175
- displayName: "Claude 4.5 Haiku",
1176
- maxInputTokens: 2e5,
1177
- supportedFileTypes: ["pdf", "image"],
1178
- pricing: {
1179
- inputPerM: 1,
1180
- outputPerM: 5,
1181
- cacheWritePerM: 1.25,
1182
- cacheReadPerM: 0.1,
1183
- currency: "USD",
1184
- unit: "per_million_tokens"
1185
- }
1186
- },
1187
- {
1188
- name: "anthropic.claude-opus-4-5-20251101-v1:0",
1189
- displayName: "Claude 4.5 Opus",
1190
- maxInputTokens: 2e5,
1191
- supportedFileTypes: ["pdf", "image"],
1192
- pricing: {
1193
- inputPerM: 5,
1194
- outputPerM: 25,
1195
- cacheWritePerM: 6.25,
1196
- cacheReadPerM: 0.5,
1197
- currency: "USD",
1198
- unit: "per_million_tokens"
1199
- }
1200
- },
1201
- // Amazon Nova models
1202
- {
1203
- name: "amazon.nova-premier-v1:0",
1204
- displayName: "Nova Premier",
1205
- maxInputTokens: 1e6,
1206
- supportedFileTypes: ["image"],
1207
- pricing: {
1208
- inputPerM: 2.5,
1209
- outputPerM: 12.5,
1210
- currency: "USD",
1211
- unit: "per_million_tokens"
1212
- }
1213
- },
1214
- {
1215
- name: "amazon.nova-pro-v1:0",
1216
- displayName: "Nova Pro",
1217
- maxInputTokens: 3e5,
1218
- supportedFileTypes: ["pdf", "image"],
1219
- pricing: {
1220
- inputPerM: 0.8,
1221
- outputPerM: 3.2,
1222
- cacheReadPerM: 0.2,
1223
- currency: "USD",
1224
- unit: "per_million_tokens"
1225
- }
1226
- },
1227
- {
1228
- name: "amazon.nova-lite-v1:0",
1229
- displayName: "Nova Lite",
1230
- maxInputTokens: 3e5,
1231
- supportedFileTypes: ["pdf", "image"],
1232
- pricing: {
1233
- inputPerM: 0.06,
1234
- outputPerM: 0.24,
1235
- cacheReadPerM: 0.015,
1236
- currency: "USD",
1237
- unit: "per_million_tokens"
1238
- }
1239
- },
1240
- {
1241
- name: "amazon.nova-micro-v1:0",
1242
- displayName: "Nova Micro",
1243
- maxInputTokens: 128e3,
1244
- supportedFileTypes: [],
1245
- pricing: {
1246
- inputPerM: 0.035,
1247
- outputPerM: 0.14,
1248
- cacheReadPerM: 875e-5,
1249
- currency: "USD",
1250
- unit: "per_million_tokens"
1251
- }
1252
- },
1253
- // OpenAI GPT-OSS
1254
- {
1255
- name: "openai.gpt-oss-120b-1:0",
1256
- displayName: "GPT-OSS 120B",
1257
- maxInputTokens: 128e3,
1258
- supportedFileTypes: [],
1259
- pricing: {
1260
- inputPerM: 0.15,
1261
- outputPerM: 0.6,
1262
- currency: "USD",
1263
- unit: "per_million_tokens"
1264
- }
1265
- },
1266
- {
1267
- name: "openai.gpt-oss-20b-1:0",
1268
- displayName: "GPT-OSS 20B",
1269
- maxInputTokens: 128e3,
1270
- supportedFileTypes: [],
1271
- pricing: {
1272
- inputPerM: 0.07,
1273
- outputPerM: 0.3,
1274
- currency: "USD",
1275
- unit: "per_million_tokens"
1276
- }
1277
- },
1278
- // Qwen
1279
- {
1280
- name: "qwen.qwen3-coder-30b-a3b-v1:0",
1281
- displayName: "Qwen3 Coder 30B",
1282
- maxInputTokens: 262144,
1283
- supportedFileTypes: [],
1284
- pricing: {
1285
- inputPerM: 0.15,
1286
- outputPerM: 0.6,
1287
- currency: "USD",
1288
- unit: "per_million_tokens"
1289
- }
1290
- },
1291
- {
1292
- name: "qwen.qwen3-coder-480b-a35b-v1:0",
1293
- displayName: "Qwen3 Coder 480B",
1294
- maxInputTokens: 262144,
1295
- supportedFileTypes: [],
1296
- pricing: {
1297
- inputPerM: 0.22,
1298
- outputPerM: 1.8,
1299
- currency: "USD",
1300
- unit: "per_million_tokens"
1301
- }
1302
- }
1303
- ],
1304
- baseURLSupport: "none",
1305
- // Auto-constructed from region
1306
- supportedFileTypes: ["pdf", "image"]
1307
- },
1308
- // Native local model execution via node-llama-cpp
1309
- // Runs GGUF models directly on the machine using Metal/CUDA/Vulkan acceleration
1310
- // Models are downloaded from HuggingFace and stored in ~/.dexto/models/
1311
- local: {
1312
- models: [],
1313
- // Populated dynamically from local model registry
1314
- baseURLSupport: "none",
1315
- // No external server needed
1316
- supportedFileTypes: ["image"],
1317
- // Vision support depends on model capabilities
1318
- supportsCustomModels: true
1319
- // Allow any GGUF model path
1320
- },
1321
- // Ollama server integration
1322
- // Uses Ollama's OpenAI-compatible API for local model inference
1323
- // Requires Ollama to be installed and running (default: http://localhost:11434)
1324
- ollama: {
1325
- models: [],
1326
- // Populated dynamically from Ollama API
1327
- baseURLSupport: "optional",
1328
- // Default: http://localhost:11434, can be customized
1329
- supportedFileTypes: ["image"],
1330
- // Vision support depends on model
1331
- supportsCustomModels: true
1332
- // Accept any Ollama model name
1333
- }
1334
- // TODO: Add 'dexto' provider (similar to openrouter, uses https://api.dexto.ai/v1)
1335
- };
1336
- function stripBedrockRegionPrefix(model) {
1337
- if (model.startsWith("eu.") || model.startsWith("us.")) {
1338
- return model.slice(3);
1339
- }
1340
- if (model.startsWith("global.")) {
1341
- return model.slice(7);
1342
- }
1343
- return model;
1344
- }
1345
- function getDefaultModelForProvider(provider) {
1346
- const providerInfo = LLM_REGISTRY[provider];
1347
- return providerInfo.models.find((m) => m.default)?.name || null;
1348
- }
1349
- function getSupportedProviders() {
1350
- return [...import_types.LLM_PROVIDERS];
1351
- }
1352
- function getSupportedModels(provider) {
1353
- const providerInfo = LLM_REGISTRY[provider];
1354
- return providerInfo.models.map((m) => m.name);
1355
- }
1356
- function getMaxInputTokensForModel(provider, model, logger) {
1357
- const providerInfo = LLM_REGISTRY[provider];
1358
- const normalizedModel = stripBedrockRegionPrefix(model).toLowerCase();
1359
- const modelInfo = providerInfo.models.find((m) => m.name.toLowerCase() === normalizedModel);
1360
- if (!modelInfo) {
1361
- const supportedModels = getSupportedModels(provider).join(", ");
1362
- logger?.error(
1363
- `Model '${model}' not found for provider '${provider}' in LLM registry. Supported models: ${supportedModels}`
1364
- );
1365
- throw import_errors.LLMError.unknownModel(provider, model);
1366
- }
1367
- logger?.debug(`Found max tokens for ${provider}/${model}: ${modelInfo.maxInputTokens}`);
1368
- return modelInfo.maxInputTokens;
1369
- }
1370
- function isValidProviderModel(provider, model) {
1371
- const providerInfo = LLM_REGISTRY[provider];
1372
- const normalizedModel = stripBedrockRegionPrefix(model).toLowerCase();
1373
- return providerInfo.models.some((m) => m.name.toLowerCase() === normalizedModel);
1374
- }
1375
- function getProviderFromModel(model) {
1376
- const normalizedModel = stripBedrockRegionPrefix(model).toLowerCase();
1377
- for (const provider of import_types.LLM_PROVIDERS) {
1378
- const info = LLM_REGISTRY[provider];
1379
- if (info.models.some((m) => m.name.toLowerCase() === normalizedModel)) {
1380
- return provider;
1381
- }
1382
- }
1383
- throw import_errors.LLMError.modelProviderUnknown(model);
1384
- }
1385
- function getAllSupportedModels() {
1386
- return Object.values(LLM_REGISTRY).flatMap((info) => info.models.map((m) => m.name));
1387
- }
1388
- function supportsBaseURL(provider) {
1389
- const providerInfo = LLM_REGISTRY[provider];
1390
- return providerInfo.baseURLSupport !== "none";
1391
- }
1392
- function requiresBaseURL(provider) {
1393
- const providerInfo = LLM_REGISTRY[provider];
1394
- return providerInfo.baseURLSupport === "required";
1395
- }
1396
- function acceptsAnyModel(provider) {
1397
- const providerInfo = LLM_REGISTRY[provider];
1398
- return providerInfo.models.length === 0;
1399
- }
1400
- function supportsCustomModels(provider) {
1401
- const providerInfo = LLM_REGISTRY[provider];
1402
- return providerInfo.supportsCustomModels === true;
1403
- }
1404
- const API_KEY_OPTIONAL_PROVIDERS = /* @__PURE__ */ new Set([
1405
- "local",
1406
- // Native node-llama-cpp execution - no auth needed
1407
- "ollama",
1408
- // Ollama server - no auth needed by default
1409
- "openai-compatible",
1410
- // vLLM, LocalAI - often no auth needed
1411
- "litellm",
1412
- // Self-hosted proxy - handles auth internally
1413
- "vertex",
1414
- // Uses Google Cloud ADC (Application Default Credentials)
1415
- "bedrock"
1416
- // Uses AWS credentials (access key + secret or IAM role)
1417
- ]);
1418
- function requiresApiKey(provider) {
1419
- return !API_KEY_OPTIONAL_PROVIDERS.has(provider);
1420
- }
1421
- function getSupportedFileTypesForModel(provider, model) {
1422
- const providerInfo = LLM_REGISTRY[provider];
1423
- if (acceptsAnyModel(provider)) {
1424
- return providerInfo.supportedFileTypes;
1425
- }
1426
- const normalizedModel = stripBedrockRegionPrefix(model).toLowerCase();
1427
- const modelInfo = providerInfo.models.find((m) => m.name.toLowerCase() === normalizedModel);
1428
- if (!modelInfo) {
1429
- throw import_errors.LLMError.unknownModel(provider, model);
1430
- }
1431
- return modelInfo.supportedFileTypes;
1432
- }
1433
- function modelSupportsFileType(provider, model, fileType) {
1434
- const supportedTypes = getSupportedFileTypesForModel(provider, model);
1435
- return supportedTypes.includes(fileType);
1436
- }
1437
- function validateModelFileSupport(provider, model, mimeType) {
1438
- const baseMimeType = mimeType.toLowerCase().split(";")[0]?.trim() || mimeType.toLowerCase();
1439
- const fileType = MIME_TYPE_TO_FILE_TYPE[baseMimeType];
1440
- if (!fileType) {
1441
- return {
1442
- isSupported: false,
1443
- error: `Unsupported file type: ${mimeType}`
1444
- };
1445
- }
1446
- try {
1447
- if (!modelSupportsFileType(provider, model, fileType)) {
1448
- return {
1449
- isSupported: false,
1450
- fileType,
1451
- error: `Model '${model}' (${provider}) does not support ${fileType} files`
1452
- };
1453
- }
1454
- return {
1455
- isSupported: true,
1456
- fileType
1457
- };
1458
- } catch (error) {
1459
- return {
1460
- isSupported: false,
1461
- fileType,
1462
- error: error instanceof Error ? error.message : "Unknown error validating model file support"
1463
- };
1464
- }
1465
- }
1466
- function getEffectiveMaxInputTokens(config, logger) {
1467
- const configuredMaxInputTokens = config.maxInputTokens;
1468
- if (configuredMaxInputTokens != null) {
1469
- if (config.baseURL) {
1470
- logger.debug(
1471
- `Using maxInputTokens from configuration (with baseURL): ${configuredMaxInputTokens}`
1472
- );
1473
- return configuredMaxInputTokens;
1474
- }
1475
- try {
1476
- const registryMaxInputTokens = getMaxInputTokensForModel(
1477
- config.provider,
1478
- config.model,
1479
- logger
1480
- );
1481
- if (configuredMaxInputTokens > registryMaxInputTokens) {
1482
- logger.warn(
1483
- `Provided maxInputTokens (${configuredMaxInputTokens}) for ${config.provider}/${config.model} exceeds the known limit (${registryMaxInputTokens}) for model ${config.model}. Capping to registry limit.`
1484
- );
1485
- return registryMaxInputTokens;
1486
- } else {
1487
- logger.debug(
1488
- `Using valid maxInputTokens override from configuration: ${configuredMaxInputTokens} (Registry limit: ${registryMaxInputTokens})`
1489
- );
1490
- return configuredMaxInputTokens;
1491
- }
1492
- } catch (error) {
1493
- if (error instanceof import_DextoRuntimeError.DextoRuntimeError && error.code === import_error_codes.LLMErrorCode.MODEL_UNKNOWN) {
1494
- logger.warn(
1495
- `Registry lookup failed during maxInputTokens override check for ${config.provider}/${config.model}: ${error.message}. Proceeding with the provided maxInputTokens value (${configuredMaxInputTokens}), but it might be invalid.`
1496
- );
1497
- return configuredMaxInputTokens;
1498
- } else {
1499
- logger.error(
1500
- `Unexpected error during registry lookup for maxInputTokens override check: ${error}`
1501
- );
1502
- throw error;
1503
- }
1504
- }
1505
- }
1506
- if (config.provider === "openrouter") {
1507
- const contextLength = (0, import_openrouter_model_registry.getOpenRouterModelContextLength)(config.model);
1508
- if (contextLength !== null) {
1509
- logger.debug(
1510
- `Using maxInputTokens from OpenRouter registry for ${config.model}: ${contextLength}`
1511
- );
1512
- return contextLength;
1513
- }
1514
- logger.warn(
1515
- `OpenRouter model ${config.model} not found in cache, defaulting to ${DEFAULT_MAX_INPUT_TOKENS} tokens`
1516
- );
1517
- return DEFAULT_MAX_INPUT_TOKENS;
1518
- }
1519
- if (config.baseURL) {
1520
- logger.warn(
1521
- `baseURL is set but maxInputTokens is missing. Defaulting to ${DEFAULT_MAX_INPUT_TOKENS}. Provide 'maxInputTokens' in configuration to avoid default fallback.`
1522
- );
1523
- return DEFAULT_MAX_INPUT_TOKENS;
1524
- }
1525
- if (acceptsAnyModel(config.provider)) {
1526
- logger.debug(
1527
- `Provider ${config.provider} accepts any model, defaulting to ${DEFAULT_MAX_INPUT_TOKENS} tokens`
1528
- );
1529
- return DEFAULT_MAX_INPUT_TOKENS;
1530
- }
1531
- try {
1532
- const registryMaxInputTokens = getMaxInputTokensForModel(
1533
- config.provider,
1534
- config.model,
1535
- logger
1536
- );
1537
- logger.debug(
1538
- `Using maxInputTokens from registry for ${config.provider}/${config.model}: ${registryMaxInputTokens}`
1539
- );
1540
- return registryMaxInputTokens;
1541
- } catch (error) {
1542
- if (error instanceof import_DextoRuntimeError.DextoRuntimeError && error.code === import_error_codes.LLMErrorCode.MODEL_UNKNOWN) {
1543
- if (supportsCustomModels(config.provider)) {
1544
- logger.debug(
1545
- `Custom model ${config.model} not in ${config.provider} registry, defaulting to ${DEFAULT_MAX_INPUT_TOKENS} tokens`
1546
- );
1547
- return DEFAULT_MAX_INPUT_TOKENS;
1548
- }
1549
- logger.error(
1550
- `Registry lookup failed for ${config.provider}/${config.model}: ${error.message}. Effective maxInputTokens cannot be determined.`
1551
- );
1552
- throw import_errors.LLMError.unknownModel(config.provider, config.model);
1553
- } else {
1554
- logger.error(`Unexpected error during registry lookup for maxInputTokens: ${error}`);
1555
- throw error;
1556
- }
1557
- }
1558
- }
1559
- function getModelPricing(provider, model) {
1560
- const providerInfo = LLM_REGISTRY[provider];
1561
- if (acceptsAnyModel(provider)) {
1562
- return void 0;
1563
- }
1564
- const normalizedModel = stripBedrockRegionPrefix(model).toLowerCase();
1565
- const modelInfo = providerInfo.models.find((m) => m.name.toLowerCase() === normalizedModel);
1566
- return modelInfo?.pricing;
1567
- }
1568
- function getModelDisplayName(model, provider) {
1569
- let resolvedProvider;
1570
- try {
1571
- resolvedProvider = provider ?? getProviderFromModel(model);
1572
- } catch {
1573
- return model;
1574
- }
1575
- const providerInfo = LLM_REGISTRY[resolvedProvider];
1576
- if (!providerInfo || acceptsAnyModel(resolvedProvider)) {
1577
- return model;
1578
- }
1579
- const normalizedModel = stripBedrockRegionPrefix(model).toLowerCase();
1580
- const modelInfo = providerInfo.models.find((m) => m.name.toLowerCase() === normalizedModel);
1581
- return modelInfo?.displayName ?? model;
1582
- }
1583
- function isReasoningCapableModel(model, _provider) {
1584
- const modelLower = model.toLowerCase();
1585
- if (modelLower.includes("codex")) {
1586
- return true;
1587
- }
1588
- if (modelLower.startsWith("o1") || modelLower.startsWith("o3") || modelLower.startsWith("o4")) {
1589
- return true;
1590
- }
1591
- if (modelLower.includes("gpt-5") || modelLower.includes("gpt-5.1") || modelLower.includes("gpt-5.2")) {
1592
- return true;
1593
- }
1594
- return false;
1595
- }
1596
- function calculateCost(usage, pricing) {
1597
- const inputCost = (usage.inputTokens ?? 0) * pricing.inputPerM / 1e6;
1598
- const outputCost = (usage.outputTokens ?? 0) * pricing.outputPerM / 1e6;
1599
- const cacheReadCost = (usage.cacheReadTokens ?? 0) * (pricing.cacheReadPerM ?? 0) / 1e6;
1600
- const cacheWriteCost = (usage.cacheWriteTokens ?? 0) * (pricing.cacheWritePerM ?? 0) / 1e6;
1601
- const reasoningCost = (usage.reasoningTokens ?? 0) * pricing.outputPerM / 1e6;
1602
- return inputCost + outputCost + cacheReadCost + cacheWriteCost + reasoningCost;
1603
- }
1604
- // Annotate the CommonJS export names for ESM import in node:
1605
- 0 && (module.exports = {
1606
- DEFAULT_MAX_INPUT_TOKENS,
1607
- LLM_REGISTRY,
1608
- MIME_TYPE_TO_FILE_TYPE,
1609
- acceptsAnyModel,
1610
- calculateCost,
1611
- getAllSupportedModels,
1612
- getAllowedMimeTypes,
1613
- getDefaultModelForProvider,
1614
- getEffectiveMaxInputTokens,
1615
- getMaxInputTokensForModel,
1616
- getModelDisplayName,
1617
- getModelPricing,
1618
- getProviderFromModel,
1619
- getSupportedFileTypesForModel,
1620
- getSupportedModels,
1621
- getSupportedProviders,
1622
- isReasoningCapableModel,
1623
- isValidProviderModel,
1624
- modelSupportsFileType,
1625
- requiresApiKey,
1626
- requiresBaseURL,
1627
- stripBedrockRegionPrefix,
1628
- supportsBaseURL,
1629
- supportsCustomModels,
1630
- validateModelFileSupport
1631
- });