promptfoo 0.119.13 → 0.119.14

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (131)
  1. package/dist/package.json +28 -26
  2. package/dist/src/app/assets/index-eJ2lMe94.js +51 -0
  3. package/dist/src/app/assets/{source-map-support-Bnh0UQ2S.js → source-map-support-1v4oeb7P.js} +1 -1
  4. package/dist/src/app/assets/sync-CtLQRuC1.js +1 -0
  5. package/dist/src/app/assets/{vendor-charts-T60Uk0Z3.js → vendor-charts-DnVv66VV.js} +1 -1
  6. package/dist/src/app/assets/{vendor-markdown-DLig-KJh.js → vendor-markdown-DCpQIyMA.js} +1 -1
  7. package/dist/src/app/assets/{vendor-mui-core-5BLaiG3c.js → vendor-mui-core-Boqnpf9f.js} +1 -1
  8. package/dist/src/app/assets/{vendor-mui-icons-fn39Fu2e.js → vendor-mui-icons-B8MqoVbj.js} +1 -1
  9. package/dist/src/app/assets/vendor-mui-x-CGSS6QHF.js +45 -0
  10. package/dist/src/app/assets/{vendor-utils-DYBMEuwX.js → vendor-utils-DdfHIEy8.js} +1 -1
  11. package/dist/src/app/index.html +7 -7
  12. package/dist/src/assertions/guardrails.d.ts +1 -1
  13. package/dist/src/assertions/guardrails.js +18 -9
  14. package/dist/src/assertions/index.d.ts +1 -1
  15. package/dist/src/assertions/index.js +9 -3
  16. package/dist/src/assertions/searchRubric.d.ts +3 -0
  17. package/dist/src/assertions/searchRubric.js +18 -0
  18. package/dist/src/commands/eval.js +1 -1
  19. package/dist/src/commands/modelScan.d.ts +7 -1
  20. package/dist/src/commands/modelScan.js +121 -59
  21. package/dist/src/database/index.d.ts +6 -0
  22. package/dist/src/database/index.js +11 -0
  23. package/dist/src/database/tables.d.ts +46 -24
  24. package/dist/src/envars.d.ts +17 -0
  25. package/dist/src/generated/constants.js +1 -1
  26. package/dist/src/logger.d.ts +5 -0
  27. package/dist/src/logger.js +28 -0
  28. package/dist/src/main.js +17 -6
  29. package/dist/src/matchers.d.ts +1 -0
  30. package/dist/src/matchers.js +80 -0
  31. package/dist/src/models/eval.d.ts +2 -1
  32. package/dist/src/models/eval.js +44 -2
  33. package/dist/src/prompts/grading.d.ts +1 -0
  34. package/dist/src/prompts/grading.js +26 -1
  35. package/dist/src/prompts/index.d.ts +1 -0
  36. package/dist/src/prompts/index.js +4 -1
  37. package/dist/src/providers/adaline.gateway.js +2 -2
  38. package/dist/src/providers/anthropic/defaults.d.ts +1 -1
  39. package/dist/src/providers/anthropic/defaults.js +15 -0
  40. package/dist/src/providers/azure/chat.d.ts +3 -1
  41. package/dist/src/providers/azure/chat.js +16 -3
  42. package/dist/src/providers/azure/defaults.js +660 -141
  43. package/dist/src/providers/azure/responses.d.ts +5 -0
  44. package/dist/src/providers/azure/responses.js +33 -4
  45. package/dist/src/providers/azure/types.d.ts +4 -0
  46. package/dist/src/providers/bedrock/agents.d.ts +1 -1
  47. package/dist/src/providers/bedrock/agents.js +2 -2
  48. package/dist/src/providers/bedrock/base.d.ts +40 -0
  49. package/dist/src/providers/bedrock/base.js +171 -0
  50. package/dist/src/providers/bedrock/converse.d.ts +146 -0
  51. package/dist/src/providers/bedrock/converse.js +1044 -0
  52. package/dist/src/providers/bedrock/index.d.ts +1 -34
  53. package/dist/src/providers/bedrock/index.js +4 -159
  54. package/dist/src/providers/bedrock/knowledgeBase.d.ts +1 -1
  55. package/dist/src/providers/bedrock/knowledgeBase.js +2 -2
  56. package/dist/src/providers/bedrock/nova-sonic.d.ts +2 -1
  57. package/dist/src/providers/bedrock/nova-sonic.js +2 -2
  58. package/dist/src/providers/claude-agent-sdk.d.ts +58 -1
  59. package/dist/src/providers/claude-agent-sdk.js +22 -1
  60. package/dist/src/providers/defaults.js +4 -0
  61. package/dist/src/providers/github/defaults.js +6 -6
  62. package/dist/src/providers/google/types.d.ts +25 -0
  63. package/dist/src/providers/google/util.d.ts +2 -0
  64. package/dist/src/providers/google/vertex.js +78 -22
  65. package/dist/src/providers/{groq.d.ts → groq/chat.d.ts} +26 -20
  66. package/dist/src/providers/groq/chat.js +79 -0
  67. package/dist/src/providers/groq/index.d.ts +5 -0
  68. package/dist/src/providers/groq/index.js +24 -0
  69. package/dist/src/providers/groq/responses.d.ts +106 -0
  70. package/dist/src/providers/groq/responses.js +64 -0
  71. package/dist/src/providers/groq/types.d.ts +44 -0
  72. package/dist/src/providers/groq/types.js +3 -0
  73. package/dist/src/providers/groq/util.d.ts +15 -0
  74. package/dist/src/providers/groq/util.js +28 -0
  75. package/dist/src/providers/mcp/client.d.ts +8 -0
  76. package/dist/src/providers/mcp/client.js +60 -10
  77. package/dist/src/providers/mcp/types.d.ts +21 -0
  78. package/dist/src/providers/openai/chatkit-pool.d.ts +114 -0
  79. package/dist/src/providers/openai/chatkit-pool.js +548 -0
  80. package/dist/src/providers/openai/chatkit-types.d.ts +73 -0
  81. package/dist/src/providers/openai/chatkit-types.js +3 -0
  82. package/dist/src/providers/openai/chatkit.d.ts +76 -0
  83. package/dist/src/providers/openai/chatkit.js +879 -0
  84. package/dist/src/providers/openai/codex-sdk.d.ts +109 -0
  85. package/dist/src/providers/openai/codex-sdk.js +346 -0
  86. package/dist/src/providers/openai/defaults.d.ts +2 -0
  87. package/dist/src/providers/openai/defaults.js +10 -4
  88. package/dist/src/providers/registry.js +48 -9
  89. package/dist/src/providers/responses/types.d.ts +1 -1
  90. package/dist/src/providers/sagemaker.d.ts +2 -2
  91. package/dist/src/providers/webSearchUtils.d.ts +17 -0
  92. package/dist/src/providers/webSearchUtils.js +169 -0
  93. package/dist/src/providers/xai/chat.d.ts +61 -0
  94. package/dist/src/providers/xai/chat.js +68 -3
  95. package/dist/src/providers/xai/responses.d.ts +189 -0
  96. package/dist/src/providers/xai/responses.js +268 -0
  97. package/dist/src/redteam/constants/plugins.d.ts +1 -1
  98. package/dist/src/redteam/constants/plugins.js +1 -1
  99. package/dist/src/redteam/constants/strategies.d.ts +1 -1
  100. package/dist/src/redteam/constants/strategies.js +1 -0
  101. package/dist/src/redteam/plugins/vlguard.d.ts +53 -4
  102. package/dist/src/redteam/plugins/vlguard.js +362 -46
  103. package/dist/src/redteam/providers/constants.d.ts +2 -2
  104. package/dist/src/redteam/providers/constants.js +2 -2
  105. package/dist/src/redteam/providers/crescendo/index.d.ts +1 -1
  106. package/dist/src/redteam/providers/crescendo/index.js +5 -3
  107. package/dist/src/redteam/providers/hydra/index.js +1 -1
  108. package/dist/src/server/routes/modelAudit.js +4 -4
  109. package/dist/src/share.js +4 -2
  110. package/dist/src/telemetry.js +44 -8
  111. package/dist/src/types/env.d.ts +3 -0
  112. package/dist/src/types/env.js +1 -0
  113. package/dist/src/types/index.d.ts +896 -615
  114. package/dist/src/types/index.js +1 -0
  115. package/dist/src/types/providers.d.ts +1 -0
  116. package/dist/src/types/tracing.d.ts +3 -0
  117. package/dist/src/util/database.d.ts +6 -4
  118. package/dist/src/util/file.js +6 -4
  119. package/dist/src/util/modelAuditCliParser.d.ts +4 -4
  120. package/dist/src/util/xlsx.js +52 -26
  121. package/dist/src/validators/providers.d.ts +142 -122
  122. package/dist/src/validators/providers.js +4 -6
  123. package/dist/src/validators/redteam.d.ts +36 -28
  124. package/dist/src/validators/redteam.js +9 -3
  125. package/dist/tsconfig.tsbuildinfo +1 -1
  126. package/package.json +28 -26
  127. package/dist/drizzle/CLAUDE.md +0 -65
  128. package/dist/src/app/assets/index-DifT6VGT.js +0 -51
  129. package/dist/src/app/assets/sync-Oo-W_Rbj.js +0 -1
  130. package/dist/src/app/assets/vendor-mui-x-C2xF-yiO.js +0 -45
  131. package/dist/src/providers/groq.js +0 -48
@@ -3,216 +3,735 @@ Object.defineProperty(exports, "__esModule", { value: true });
3
3
  exports.AZURE_MODELS = exports.DEFAULT_AZURE_API_VERSION = void 0;
4
4
  exports.DEFAULT_AZURE_API_VERSION = '2024-12-01-preview';
5
5
  exports.AZURE_MODELS = [
6
- // GPT-4.1 models
6
+ // =============================================================================
7
+ // GPT-5 Series (Latest Flagship)
8
+ // Note: Pricing is provisional/estimated based on relative model capabilities
9
+ // =============================================================================
10
+ {
11
+ id: 'gpt-5',
12
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
13
+ },
14
+ {
15
+ id: 'gpt-5-2025-08-07',
16
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
17
+ },
18
+ {
19
+ id: 'gpt-5-pro',
20
+ cost: { input: 5 / 1000000, output: 20 / 1000000 },
21
+ },
22
+ {
23
+ id: 'gpt-5-pro-2025-10-06',
24
+ cost: { input: 5 / 1000000, output: 20 / 1000000 },
25
+ },
26
+ {
27
+ id: 'gpt-5-mini',
28
+ cost: { input: 0.4 / 1000000, output: 1.6 / 1000000 },
29
+ },
30
+ {
31
+ id: 'gpt-5-mini-2025-08-07',
32
+ cost: { input: 0.4 / 1000000, output: 1.6 / 1000000 },
33
+ },
34
+ {
35
+ id: 'gpt-5-nano',
36
+ cost: { input: 0.1 / 1000000, output: 0.4 / 1000000 },
37
+ },
38
+ {
39
+ id: 'gpt-5-nano-2025-08-07',
40
+ cost: { input: 0.1 / 1000000, output: 0.4 / 1000000 },
41
+ },
42
+ {
43
+ id: 'gpt-5-chat',
44
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
45
+ },
46
+ {
47
+ id: 'gpt-5-chat-2025-08-07',
48
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
49
+ },
50
+ {
51
+ id: 'gpt-5-chat-2025-10-03',
52
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
53
+ },
54
+ {
55
+ id: 'gpt-5-codex',
56
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
57
+ },
58
+ {
59
+ id: 'gpt-5-codex-2025-09-15',
60
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
61
+ },
62
+ // =============================================================================
63
+ // GPT-5.1 Series (Newest)
64
+ // Note: Pricing is provisional/estimated based on relative model capabilities
65
+ // =============================================================================
66
+ {
67
+ id: 'gpt-5.1',
68
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
69
+ },
70
+ {
71
+ id: 'gpt-5.1-2025-11-13',
72
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
73
+ },
74
+ {
75
+ id: 'gpt-5.1-chat',
76
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
77
+ },
78
+ {
79
+ id: 'gpt-5.1-chat-2025-11-13',
80
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
81
+ },
82
+ {
83
+ id: 'gpt-5.1-codex',
84
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
85
+ },
86
+ {
87
+ id: 'gpt-5.1-codex-2025-11-13',
88
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
89
+ },
90
+ {
91
+ id: 'gpt-5.1-codex-mini',
92
+ cost: { input: 0.4 / 1000000, output: 1.6 / 1000000 },
93
+ },
94
+ {
95
+ id: 'gpt-5.1-codex-mini-2025-11-13',
96
+ cost: { input: 0.4 / 1000000, output: 1.6 / 1000000 },
97
+ },
98
+ // =============================================================================
99
+ // GPT-4.1 Series (1M Context)
100
+ // =============================================================================
101
+ {
102
+ id: 'gpt-4.1',
103
+ cost: { input: 2 / 1000000, output: 8 / 1000000 },
104
+ },
7
105
  {
8
106
  id: 'gpt-4.1-2025-04-14',
9
- cost: {
10
- input: 2 / 1000000,
11
- output: 8 / 1000000,
12
- },
107
+ cost: { input: 2 / 1000000, output: 8 / 1000000 },
108
+ },
109
+ {
110
+ id: 'gpt-4.1-mini',
111
+ cost: { input: 0.4 / 1000000, output: 1.6 / 1000000 },
112
+ },
113
+ {
114
+ id: 'gpt-4.1-mini-2025-04-14',
115
+ cost: { input: 0.4 / 1000000, output: 1.6 / 1000000 },
116
+ },
117
+ {
118
+ id: 'gpt-4.1-nano',
119
+ cost: { input: 0.1 / 1000000, output: 0.4 / 1000000 },
120
+ },
121
+ {
122
+ id: 'gpt-4.1-nano-2025-04-14',
123
+ cost: { input: 0.1 / 1000000, output: 0.4 / 1000000 },
124
+ },
125
+ // =============================================================================
126
+ // Reasoning Models (o-series)
127
+ // =============================================================================
128
+ {
129
+ id: 'o4-mini',
130
+ cost: { input: 1.1 / 1000000, output: 4.4 / 1000000 },
131
+ },
132
+ {
133
+ id: 'o4-mini-2025-04-16',
134
+ cost: { input: 1.1 / 1000000, output: 4.4 / 1000000 },
135
+ },
136
+ {
137
+ id: 'o3',
138
+ cost: { input: 10 / 1000000, output: 40 / 1000000 },
139
+ },
140
+ {
141
+ id: 'o3-2025-04-16',
142
+ cost: { input: 10 / 1000000, output: 40 / 1000000 },
143
+ },
144
+ {
145
+ id: 'o3-pro',
146
+ cost: { input: 20 / 1000000, output: 80 / 1000000 },
147
+ },
148
+ {
149
+ id: 'o3-pro-2025-06-10',
150
+ cost: { input: 20 / 1000000, output: 80 / 1000000 },
151
+ },
152
+ {
153
+ id: 'o3-mini',
154
+ cost: { input: 1.1 / 1000000, output: 4.4 / 1000000 },
155
+ },
156
+ {
157
+ id: 'o3-mini-2025-01-31',
158
+ cost: { input: 1.1 / 1000000, output: 4.4 / 1000000 },
159
+ },
160
+ {
161
+ id: 'o3-deep-research',
162
+ cost: { input: 10 / 1000000, output: 40 / 1000000 },
163
+ },
164
+ {
165
+ id: 'o3-deep-research-2025-06-26',
166
+ cost: { input: 10 / 1000000, output: 40 / 1000000 },
167
+ },
168
+ {
169
+ id: 'o1',
170
+ cost: { input: 15 / 1000000, output: 60 / 1000000 },
13
171
  },
14
- // o1 reasoning models
15
172
  {
16
173
  id: 'o1-2024-12-17',
17
- cost: {
18
- input: 15 / 1000000,
19
- output: 60 / 1000000,
20
- },
174
+ cost: { input: 15 / 1000000, output: 60 / 1000000 },
175
+ },
176
+ {
177
+ id: 'o1-preview',
178
+ cost: { input: 15 / 1000000, output: 60 / 1000000 },
21
179
  },
22
180
  {
23
181
  id: 'o1-preview-2024-09-12',
24
- cost: {
25
- input: 15 / 1000000,
26
- output: 60 / 1000000,
27
- },
182
+ cost: { input: 15 / 1000000, output: 60 / 1000000 },
28
183
  },
29
- // o3 mini models
30
184
  {
31
- id: 'o3-mini-2025-01-31',
32
- cost: {
33
- input: 1.1 / 1000000,
34
- output: 4.4 / 1000000,
35
- },
185
+ id: 'o1-mini',
186
+ cost: { input: 1.1 / 1000000, output: 4.4 / 1000000 },
36
187
  },
37
188
  {
38
189
  id: 'o1-mini-2024-09-12',
39
- cost: {
40
- input: 1.1 / 1000000,
41
- output: 4.4 / 1000000,
42
- },
190
+ cost: { input: 1.1 / 1000000, output: 4.4 / 1000000 },
191
+ },
192
+ // =============================================================================
193
+ // GPT-4o Series
194
+ // =============================================================================
195
+ {
196
+ id: 'gpt-4o',
197
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
198
+ },
199
+ {
200
+ id: 'gpt-4o-2024-11-20',
201
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
202
+ },
203
+ {
204
+ id: 'gpt-4o-2024-08-06',
205
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
206
+ },
207
+ {
208
+ id: 'gpt-4o-2024-05-13',
209
+ cost: { input: 5 / 1000000, output: 15 / 1000000 },
210
+ },
211
+ {
212
+ id: 'gpt-4o-mini',
213
+ cost: { input: 0.15 / 1000000, output: 0.6 / 1000000 },
214
+ },
215
+ {
216
+ id: 'gpt-4o-mini-2024-07-18',
217
+ cost: { input: 0.15 / 1000000, output: 0.6 / 1000000 },
218
+ },
219
+ // =============================================================================
220
+ // GPT-4o Audio & Realtime Models
221
+ // =============================================================================
222
+ {
223
+ id: 'gpt-4o-realtime-preview',
224
+ cost: { input: 5 / 1000000, output: 20 / 1000000 },
43
225
  },
44
- // GPT-4o Realtime models (text only pricing)
45
226
  {
46
227
  id: 'gpt-4o-realtime-preview-2024-12-17',
47
- cost: {
48
- input: 5 / 1000000,
49
- output: 20 / 1000000,
50
- },
228
+ cost: { input: 5 / 1000000, output: 20 / 1000000 },
229
+ },
230
+ {
231
+ id: 'gpt-4o-realtime-preview-2025-06-03',
232
+ cost: { input: 5 / 1000000, output: 20 / 1000000 },
233
+ },
234
+ {
235
+ id: 'gpt-4o-mini-realtime-preview',
236
+ cost: { input: 0.6 / 1000000, output: 2.4 / 1000000 },
51
237
  },
52
238
  {
53
239
  id: 'gpt-4o-mini-realtime-preview-2024-12-17',
54
- cost: {
55
- input: 0.6 / 1000000,
56
- output: 2.4 / 1000000,
57
- },
240
+ cost: { input: 0.6 / 1000000, output: 2.4 / 1000000 },
241
+ },
242
+ {
243
+ id: 'gpt-4o-audio-preview',
244
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
58
245
  },
59
- // GPT-4o Audio models (text only pricing)
60
246
  {
61
247
  id: 'gpt-4o-audio-preview-2024-12-17',
62
- cost: {
63
- input: 2.5 / 1000000,
64
- output: 10 / 1000000,
65
- },
248
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
249
+ },
250
+ {
251
+ id: 'gpt-4o-mini-audio-preview',
252
+ cost: { input: 0.15 / 1000000, output: 0.6 / 1000000 },
66
253
  },
67
254
  {
68
255
  id: 'gpt-4o-mini-audio-preview-2024-12-17',
69
- cost: {
70
- input: 0.15 / 1000000,
71
- output: 0.6 / 1000000,
72
- },
256
+ cost: { input: 0.15 / 1000000, output: 0.6 / 1000000 },
73
257
  },
74
- // Updated GPT-4o models
75
258
  {
76
- id: 'gpt-4o-2024-1120',
77
- cost: {
78
- input: 2.5 / 1000000,
79
- output: 10 / 1000000,
80
- },
259
+ id: 'gpt-realtime',
260
+ cost: { input: 5 / 1000000, output: 20 / 1000000 },
81
261
  },
82
262
  {
83
- id: 'gpt-4o-2024-08-06',
84
- cost: {
85
- input: 2.5 / 1000000,
86
- output: 10 / 1000000,
87
- },
263
+ id: 'gpt-realtime-2025-08-28',
264
+ cost: { input: 5 / 1000000, output: 20 / 1000000 },
88
265
  },
89
266
  {
90
- id: 'gpt-4o-2024-0513',
91
- cost: {
92
- input: 5 / 1000000,
93
- output: 15 / 1000000,
94
- },
267
+ id: 'gpt-realtime-mini',
268
+ cost: { input: 0.6 / 1000000, output: 2.4 / 1000000 },
95
269
  },
96
270
  {
97
- id: 'gpt-4o-mini-0718',
98
- cost: {
99
- input: 0.15 / 1000000,
100
- output: 0.6 / 1000000,
101
- },
271
+ id: 'gpt-realtime-mini-2025-10-06',
272
+ cost: { input: 0.6 / 1000000, output: 2.4 / 1000000 },
102
273
  },
103
274
  {
104
- id: 'gpt-4o',
105
- cost: {
106
- input: 5 / 1000000,
107
- output: 15 / 1000000,
108
- },
275
+ id: 'gpt-audio',
276
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
109
277
  },
110
278
  {
111
- id: 'gpt-4o-mini',
112
- cost: {
113
- input: 0.15 / 1000000,
114
- output: 0.6 / 1000000,
115
- },
279
+ id: 'gpt-audio-2025-08-28',
280
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
116
281
  },
117
282
  {
118
- id: 'gpt-3.5-turbo-0125',
119
- cost: {
120
- input: 0.5 / 1000000,
121
- output: 1.5 / 1000000,
122
- },
283
+ id: 'gpt-audio-mini',
284
+ cost: { input: 0.15 / 1000000, output: 0.6 / 1000000 },
123
285
  },
124
286
  {
125
- id: 'gpt-3.5-turbo-instruct',
126
- cost: {
127
- input: 1.5 / 1000000,
128
- output: 2 / 1000000,
129
- },
287
+ id: 'gpt-audio-mini-2025-10-06',
288
+ cost: { input: 0.15 / 1000000, output: 0.6 / 1000000 },
289
+ },
290
+ // =============================================================================
291
+ // GPT-4o Transcription Models
292
+ // =============================================================================
293
+ {
294
+ id: 'gpt-4o-transcribe',
295
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
296
+ },
297
+ {
298
+ id: 'gpt-4o-transcribe-2025-03-20',
299
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
300
+ },
301
+ {
302
+ id: 'gpt-4o-mini-transcribe',
303
+ cost: { input: 0.15 / 1000000, output: 0.6 / 1000000 },
304
+ },
305
+ {
306
+ id: 'gpt-4o-mini-transcribe-2025-03-20',
307
+ cost: { input: 0.15 / 1000000, output: 0.6 / 1000000 },
130
308
  },
309
+ {
310
+ id: 'gpt-4o-transcribe-diarize',
311
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
312
+ },
313
+ {
314
+ id: 'gpt-4o-transcribe-diarize-2025-10-15',
315
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
316
+ },
317
+ {
318
+ id: 'gpt-4o-mini-tts',
319
+ cost: { input: 0.15 / 1000000, output: 0.6 / 1000000 },
320
+ },
321
+ {
322
+ id: 'gpt-4o-mini-tts-2025-03-20',
323
+ cost: { input: 0.15 / 1000000, output: 0.6 / 1000000 },
324
+ },
325
+ // =============================================================================
326
+ // GPT-4 Legacy
327
+ // =============================================================================
131
328
  {
132
329
  id: 'gpt-4',
133
- cost: {
134
- input: 30 / 1000000,
135
- output: 60 / 1000000,
136
- },
330
+ cost: { input: 30 / 1000000, output: 60 / 1000000 },
137
331
  },
138
332
  {
139
333
  id: 'gpt-4-32k',
140
- cost: {
141
- input: 60 / 1000000,
142
- output: 120 / 1000000,
143
- },
334
+ cost: { input: 60 / 1000000, output: 120 / 1000000 },
144
335
  },
145
336
  {
146
- id: 'babbage-002',
147
- cost: {
148
- input: 0.4 / 1000000,
149
- output: 0.4 / 1000000,
150
- },
337
+ id: 'gpt-4-turbo',
338
+ cost: { input: 10 / 1000000, output: 30 / 1000000 },
151
339
  },
152
340
  {
153
- id: 'davinci-002',
154
- cost: {
155
- input: 2 / 1000000,
156
- output: 2 / 1000000,
157
- },
341
+ id: 'gpt-4-turbo-2024-04-09',
342
+ cost: { input: 10 / 1000000, output: 30 / 1000000 },
158
343
  },
159
344
  {
160
- id: 'text-embedding-ada-002',
161
- cost: {
162
- input: 0.1 / 1000000,
163
- output: 0.1 / 1000000,
164
- },
345
+ id: 'gpt-4-turbo-vision',
346
+ cost: { input: 10 / 1000000, output: 30 / 1000000 },
347
+ },
348
+ // =============================================================================
349
+ // GPT-3.5 Legacy
350
+ // =============================================================================
351
+ {
352
+ id: 'gpt-35-turbo',
353
+ cost: { input: 0.5 / 1000000, output: 1.5 / 1000000 },
354
+ },
355
+ {
356
+ id: 'gpt-35-turbo-0125',
357
+ cost: { input: 0.5 / 1000000, output: 1.5 / 1000000 },
358
+ },
359
+ {
360
+ id: 'gpt-35-turbo-1106',
361
+ cost: { input: 1 / 1000000, output: 2 / 1000000 },
362
+ },
363
+ {
364
+ id: 'gpt-35-turbo-0613',
365
+ cost: { input: 1.5 / 1000000, output: 2 / 1000000 },
366
+ },
367
+ {
368
+ id: 'gpt-35-turbo-0301',
369
+ cost: { input: 2 / 1000000, output: 2 / 1000000 },
370
+ },
371
+ {
372
+ id: 'gpt-35-turbo-16k',
373
+ cost: { input: 3 / 1000000, output: 4 / 1000000 },
374
+ },
375
+ {
376
+ id: 'gpt-35-turbo-instruct',
377
+ cost: { input: 1.5 / 1000000, output: 2 / 1000000 },
378
+ },
379
+ // OpenAI-style naming (for compatibility)
380
+ {
381
+ id: 'gpt-3.5-turbo',
382
+ cost: { input: 0.5 / 1000000, output: 1.5 / 1000000 },
383
+ },
384
+ {
385
+ id: 'gpt-3.5-turbo-0125',
386
+ cost: { input: 0.5 / 1000000, output: 1.5 / 1000000 },
165
387
  },
388
+ {
389
+ id: 'gpt-3.5-turbo-instruct',
390
+ cost: { input: 1.5 / 1000000, output: 2 / 1000000 },
391
+ },
392
+ // =============================================================================
393
+ // Image Generation Models
394
+ // =============================================================================
395
+ {
396
+ id: 'gpt-image-1',
397
+ cost: { input: 5 / 1000000, output: 40 / 1000000 },
398
+ },
399
+ {
400
+ id: 'gpt-image-1-2025-04-15',
401
+ cost: { input: 5 / 1000000, output: 40 / 1000000 },
402
+ },
403
+ {
404
+ id: 'gpt-image-1-mini',
405
+ cost: { input: 1.25 / 1000000, output: 10 / 1000000 },
406
+ },
407
+ {
408
+ id: 'gpt-image-1-mini-2025-10-06',
409
+ cost: { input: 1.25 / 1000000, output: 10 / 1000000 },
410
+ },
411
+ {
412
+ id: 'dall-e-3',
413
+ cost: { input: 40 / 1000000, output: 40 / 1000000 },
414
+ },
415
+ {
416
+ id: 'dall-e-2',
417
+ cost: { input: 20 / 1000000, output: 20 / 1000000 },
418
+ },
419
+ // =============================================================================
420
+ // Embedding Models
421
+ // =============================================================================
166
422
  {
167
423
  id: 'text-embedding-3-large',
168
- cost: {
169
- input: 0.13 / 1000000,
170
- output: 0.13 / 1000000,
171
- },
424
+ cost: { input: 0.13 / 1000000, output: 0.13 / 1000000 },
172
425
  },
173
426
  {
174
427
  id: 'text-embedding-3-small',
175
- cost: {
176
- input: 0.02 / 1000000,
177
- output: 0.02 / 1000000,
178
- },
428
+ cost: { input: 0.02 / 1000000, output: 0.02 / 1000000 },
179
429
  },
180
- // Legacy models
181
430
  {
182
- id: 'gpt-3.5-turbo-0301',
183
- cost: {
184
- input: 2 / 1000000,
185
- output: 2 / 1000000,
186
- },
431
+ id: 'text-embedding-ada-002',
432
+ cost: { input: 0.1 / 1000000, output: 0.1 / 1000000 },
187
433
  },
434
+ // =============================================================================
435
+ // Base/Legacy Models
436
+ // =============================================================================
188
437
  {
189
- id: 'gpt-3.5-turbo-0613',
190
- cost: {
191
- input: 1.5 / 1000000,
192
- output: 2 / 1000000,
193
- },
438
+ id: 'babbage-002',
439
+ cost: { input: 0.4 / 1000000, output: 0.4 / 1000000 },
194
440
  },
195
441
  {
196
- id: 'gpt-3.5-turbo-1106',
197
- cost: {
198
- input: 1 / 1000000,
199
- output: 2 / 1000000,
200
- },
442
+ id: 'davinci-002',
443
+ cost: { input: 2 / 1000000, output: 2 / 1000000 },
201
444
  },
202
- // More legacy models from pricing sheet
203
445
  {
204
- id: 'gpt-4-turbo',
205
- cost: {
206
- input: 10 / 1000000,
207
- output: 30 / 1000000,
208
- },
446
+ id: 'codex-mini',
447
+ cost: { input: 1.5 / 1000000, output: 6 / 1000000 },
209
448
  },
210
449
  {
211
- id: 'gpt-4-turbo-vision',
212
- cost: {
213
- input: 10 / 1000000,
214
- output: 30 / 1000000,
215
- },
450
+ id: 'codex-mini-2025-05-16',
451
+ cost: { input: 1.5 / 1000000, output: 6 / 1000000 },
452
+ },
453
+ // =============================================================================
454
+ // Anthropic Claude Models (via Azure AI Foundry)
455
+ // =============================================================================
456
+ {
457
+ id: 'claude-opus-4-5',
458
+ cost: { input: 5 / 1000000, output: 25 / 1000000 },
459
+ },
460
+ {
461
+ id: 'claude-opus-4-5-20251101',
462
+ cost: { input: 5 / 1000000, output: 25 / 1000000 },
463
+ },
464
+ {
465
+ id: 'claude-opus-4-1',
466
+ cost: { input: 15 / 1000000, output: 75 / 1000000 },
467
+ },
468
+ {
469
+ id: 'claude-opus-4-1-20250805',
470
+ cost: { input: 15 / 1000000, output: 75 / 1000000 },
471
+ },
472
+ {
473
+ id: 'claude-sonnet-4-5',
474
+ cost: { input: 3 / 1000000, output: 15 / 1000000 },
475
+ },
476
+ {
477
+ id: 'claude-sonnet-4-5-20250929',
478
+ cost: { input: 3 / 1000000, output: 15 / 1000000 },
479
+ },
480
+ {
481
+ id: 'claude-haiku-4-5',
482
+ cost: { input: 0.8 / 1000000, output: 4 / 1000000 },
483
+ },
484
+ {
485
+ id: 'claude-haiku-4-5-20251001',
486
+ cost: { input: 0.8 / 1000000, output: 4 / 1000000 },
487
+ },
488
+ // =============================================================================
489
+ // Meta Llama Models (via Azure AI Foundry)
490
+ // =============================================================================
491
+ {
492
+ id: 'Llama-4-Maverick-17B-128E-Instruct-FP8',
493
+ cost: { input: 0.22 / 1000000, output: 0.88 / 1000000 },
494
+ },
495
+ {
496
+ id: 'Llama-4-Scout-17B-16E-Instruct',
497
+ cost: { input: 0.17 / 1000000, output: 0.68 / 1000000 },
498
+ },
499
+ {
500
+ id: 'Llama-3.3-70B-Instruct',
501
+ cost: { input: 0.37 / 1000000, output: 0.37 / 1000000 },
502
+ },
503
+ {
504
+ id: 'Llama-3.2-90B-Vision-Instruct',
505
+ cost: { input: 0.99 / 1000000, output: 0.99 / 1000000 },
506
+ },
507
+ {
508
+ id: 'Llama-3.2-11B-Vision-Instruct',
509
+ cost: { input: 0.037 / 1000000, output: 0.037 / 1000000 },
510
+ },
511
+ {
512
+ id: 'Meta-Llama-3.1-405B-Instruct',
513
+ cost: { input: 2.1 / 1000000, output: 2.1 / 1000000 },
514
+ },
515
+ {
516
+ id: 'Meta-Llama-3.1-70B-Instruct',
517
+ cost: { input: 0.37 / 1000000, output: 0.37 / 1000000 },
518
+ },
519
+ {
520
+ id: 'Meta-Llama-3.1-8B-Instruct',
521
+ cost: { input: 0.03 / 1000000, output: 0.03 / 1000000 },
522
+ },
523
+ {
524
+ id: 'Meta-Llama-3-70B-Instruct',
525
+ cost: { input: 0.37 / 1000000, output: 0.37 / 1000000 },
526
+ },
527
+ {
528
+ id: 'Meta-Llama-3-8B-Instruct',
529
+ cost: { input: 0.03 / 1000000, output: 0.03 / 1000000 },
530
+ },
531
+ // =============================================================================
532
+ // DeepSeek Models (via Azure AI Foundry)
533
+ // =============================================================================
534
+ {
535
+ id: 'DeepSeek-R1',
536
+ cost: { input: 0.55 / 1000000, output: 2.19 / 1000000 },
537
+ },
538
+ {
539
+ id: 'DeepSeek-R1-0528',
540
+ cost: { input: 0.55 / 1000000, output: 2.19 / 1000000 },
541
+ },
542
+ {
543
+ id: 'DeepSeek-V3',
544
+ cost: { input: 0.27 / 1000000, output: 1.1 / 1000000 },
545
+ },
546
+ {
547
+ id: 'DeepSeek-V3-0324',
548
+ cost: { input: 0.27 / 1000000, output: 1.1 / 1000000 },
549
+ },
550
+ {
551
+ id: 'DeepSeek-V3.1',
552
+ cost: { input: 0.27 / 1000000, output: 1.1 / 1000000 },
553
+ },
554
+ // =============================================================================
555
+ // xAI Grok Models (via Azure AI Foundry)
556
+ // =============================================================================
557
+ {
558
+ id: 'grok-4',
559
+ cost: { input: 3 / 1000000, output: 15 / 1000000 },
560
+ },
561
+ {
562
+ id: 'grok-4-fast-reasoning',
563
+ cost: { input: 3 / 1000000, output: 15 / 1000000 },
564
+ },
565
+ {
566
+ id: 'grok-4-fast-non-reasoning',
567
+ cost: { input: 3 / 1000000, output: 15 / 1000000 },
568
+ },
569
+ {
570
+ id: 'grok-3',
571
+ cost: { input: 3 / 1000000, output: 15 / 1000000 },
572
+ },
573
+ {
574
+ id: 'grok-3-mini',
575
+ cost: { input: 0.3 / 1000000, output: 0.5 / 1000000 },
576
+ },
577
+ {
578
+ id: 'grok-code-fast-1',
579
+ cost: { input: 0.15 / 1000000, output: 0.6 / 1000000 },
580
+ },
581
+ // =============================================================================
582
+ // Microsoft Phi Models (via Azure AI Foundry)
583
+ // =============================================================================
584
+ {
585
+ id: 'Phi-4',
586
+ cost: { input: 0.07 / 1000000, output: 0.14 / 1000000 },
587
+ },
588
+ {
589
+ id: 'Phi-4-reasoning',
590
+ cost: { input: 0.07 / 1000000, output: 0.14 / 1000000 },
591
+ },
592
+ {
593
+ id: 'Phi-4-mini-reasoning',
594
+ cost: { input: 0.035 / 1000000, output: 0.07 / 1000000 },
595
+ },
596
+ {
597
+ id: 'Phi-4-mini-instruct',
598
+ cost: { input: 0.035 / 1000000, output: 0.07 / 1000000 },
599
+ },
600
+ {
601
+ id: 'Phi-4-multimodal-instruct',
602
+ cost: { input: 0.07 / 1000000, output: 0.14 / 1000000 },
603
+ },
604
+ {
605
+ id: 'Phi-3.5-MoE-instruct',
606
+ cost: { input: 0.26 / 1000000, output: 0.52 / 1000000 },
607
+ },
608
+ {
609
+ id: 'Phi-3.5-mini-instruct',
610
+ cost: { input: 0.026 / 1000000, output: 0.052 / 1000000 },
611
+ },
612
+ {
613
+ id: 'Phi-3.5-vision-instruct',
614
+ cost: { input: 0.026 / 1000000, output: 0.052 / 1000000 },
615
+ },
616
+ {
617
+ id: 'Phi-3-medium-128k-instruct',
618
+ cost: { input: 0.14 / 1000000, output: 0.14 / 1000000 },
619
+ },
620
+ {
621
+ id: 'Phi-3-small-128k-instruct',
622
+ cost: { input: 0.052 / 1000000, output: 0.052 / 1000000 },
623
+ },
624
+ {
625
+ id: 'Phi-3-mini-128k-instruct',
626
+ cost: { input: 0.026 / 1000000, output: 0.026 / 1000000 },
627
+ },
628
+ // =============================================================================
629
+ // Mistral Models (via Azure AI Foundry)
630
+ // =============================================================================
631
+ {
632
+ id: 'Mistral-Large-2411',
633
+ cost: { input: 2 / 1000000, output: 6 / 1000000 },
634
+ },
635
+ {
636
+ id: 'Mistral-large-2407',
637
+ cost: { input: 2 / 1000000, output: 6 / 1000000 },
638
+ },
639
+ {
640
+ id: 'Mistral-large',
641
+ cost: { input: 2 / 1000000, output: 6 / 1000000 },
642
+ },
643
+ {
644
+ id: 'mistral-medium-2505',
645
+ cost: { input: 0.4 / 1000000, output: 1.5 / 1000000 },
646
+ },
647
+ {
648
+ id: 'mistral-small-2503',
649
+ cost: { input: 0.1 / 1000000, output: 0.3 / 1000000 },
650
+ },
651
+ {
652
+ id: 'Mistral-small',
653
+ cost: { input: 0.1 / 1000000, output: 0.3 / 1000000 },
654
+ },
655
+ {
656
+ id: 'Mistral-Nemo',
657
+ cost: { input: 0.15 / 1000000, output: 0.15 / 1000000 },
658
+ },
659
+ {
660
+ id: 'Ministral-3B',
661
+ cost: { input: 0.04 / 1000000, output: 0.04 / 1000000 },
662
+ },
663
+ {
664
+ id: 'Codestral-2501',
665
+ cost: { input: 0.3 / 1000000, output: 0.9 / 1000000 },
666
+ },
667
+ {
668
+ id: 'mistral-document-ai-2505',
669
+ cost: { input: 0.5 / 1000000, output: 1 / 1000000 },
670
+ },
671
+ // =============================================================================
672
+ // Cohere Models (via Azure AI Foundry)
673
+ // =============================================================================
674
+ {
675
+ id: 'cohere-command-a',
676
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
677
+ },
678
+ {
679
+ id: 'Cohere-command-r-plus',
680
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
681
+ },
682
+ {
683
+ id: 'Cohere-command-r-plus-08-2024',
684
+ cost: { input: 2.5 / 1000000, output: 10 / 1000000 },
685
+ },
686
+ {
687
+ id: 'Cohere-command-r',
688
+ cost: { input: 0.15 / 1000000, output: 0.6 / 1000000 },
689
+ },
690
+ {
691
+ id: 'Cohere-command-r-08-2024',
692
+ cost: { input: 0.15 / 1000000, output: 0.6 / 1000000 },
693
+ },
694
+ {
695
+ id: 'Cohere-embed-v3-english',
696
+ cost: { input: 0.1 / 1000000, output: 0.1 / 1000000 },
697
+ },
698
+ {
699
+ id: 'Cohere-embed-v3-multilingual',
700
+ cost: { input: 0.1 / 1000000, output: 0.1 / 1000000 },
701
+ },
702
+ {
703
+ id: 'embed-v-4-0',
704
+ cost: { input: 0.1 / 1000000, output: 0.1 / 1000000 },
705
+ },
706
+ // =============================================================================
707
+ // AI21 Labs Models (via Azure AI Foundry)
708
+ // =============================================================================
709
+ {
710
+ id: 'AI21-Jamba-1.5-Large',
711
+ cost: { input: 0.2 / 1000000, output: 0.8 / 1000000 },
712
+ },
713
+ {
714
+ id: 'AI21-Jamba-1.5-Mini',
715
+ cost: { input: 0.02 / 1000000, output: 0.08 / 1000000 },
716
+ },
717
+ {
718
+ id: 'AI21-Jamba-Instruct',
719
+ cost: { input: 0.5 / 1000000, output: 0.7 / 1000000 },
720
+ },
721
+ // =============================================================================
722
+ // Core42 Models (via Azure AI Foundry)
723
+ // =============================================================================
724
+ {
725
+ id: 'jais-30b-chat',
726
+ cost: { input: 0.1 / 1000000, output: 0.1 / 1000000 },
727
+ },
728
+ {
729
+ id: 'JAIS-70b-chat',
730
+ cost: { input: 0.2 / 1000000, output: 0.2 / 1000000 },
731
+ },
732
+ {
733
+ id: 'Falcon3-7B-Instruct',
734
+ cost: { input: 0.05 / 1000000, output: 0.05 / 1000000 },
216
735
  },
217
736
  ];
218
737
  //# sourceMappingURL=defaults.js.map