@funkai/models 0.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.generated/entries.json +23 -0
- package/.generated/req.txt +1 -0
- package/.turbo/turbo-build.log +145 -0
- package/.turbo/turbo-typecheck.log +4 -0
- package/CHANGELOG.md +23 -0
- package/README.md +95 -0
- package/dist/alibaba-B6q4Ng1R.mjs +957 -0
- package/dist/alibaba-B6q4Ng1R.mjs.map +1 -0
- package/dist/amazon-bedrock-Cv9AHQBH.mjs +2070 -0
- package/dist/amazon-bedrock-Cv9AHQBH.mjs.map +1 -0
- package/dist/anthropic-yB7ST97_.mjs +651 -0
- package/dist/anthropic-yB7ST97_.mjs.map +1 -0
- package/dist/cerebras-COfl7XM-.mjs +95 -0
- package/dist/cerebras-COfl7XM-.mjs.map +1 -0
- package/dist/cohere-B7TgO0hT.mjs +271 -0
- package/dist/cohere-B7TgO0hT.mjs.map +1 -0
- package/dist/deepinfra-B0GxUwCG.mjs +636 -0
- package/dist/deepinfra-B0GxUwCG.mjs.map +1 -0
- package/dist/deepseek-D64ZEsvS.mjs +50 -0
- package/dist/deepseek-D64ZEsvS.mjs.map +1 -0
- package/dist/fireworks-ai-DJYvdAi_.mjs +304 -0
- package/dist/fireworks-ai-DJYvdAi_.mjs.map +1 -0
- package/dist/google-BypRl349.mjs +833 -0
- package/dist/google-BypRl349.mjs.map +1 -0
- package/dist/google-vertex-DbS-zTGD.mjs +730 -0
- package/dist/google-vertex-DbS-zTGD.mjs.map +1 -0
- package/dist/groq-ei_PerYi.mjs +381 -0
- package/dist/groq-ei_PerYi.mjs.map +1 -0
- package/dist/huggingface-DaM1EeLP.mjs +456 -0
- package/dist/huggingface-DaM1EeLP.mjs.map +1 -0
- package/dist/inception-CspEzqNV.mjs +101 -0
- package/dist/inception-CspEzqNV.mjs.map +1 -0
- package/dist/index.d.mts +30314 -0
- package/dist/index.d.mts.map +1 -0
- package/dist/index.mjs +271 -0
- package/dist/index.mjs.map +1 -0
- package/dist/llama-Cf3-koap.mjs +161 -0
- package/dist/llama-Cf3-koap.mjs.map +1 -0
- package/dist/mistral-BI9MdAO4.mjs +579 -0
- package/dist/mistral-BI9MdAO4.mjs.map +1 -0
- package/dist/nvidia-COHacuoa.mjs +1625 -0
- package/dist/nvidia-COHacuoa.mjs.map +1 -0
- package/dist/openai-C0nCfZUq.mjs +1023 -0
- package/dist/openai-C0nCfZUq.mjs.map +1 -0
- package/dist/openrouter-DSFzxKQb.mjs +4608 -0
- package/dist/openrouter-DSFzxKQb.mjs.map +1 -0
- package/dist/perplexity-zeZ2WlBU.mjs +96 -0
- package/dist/perplexity-zeZ2WlBU.mjs.map +1 -0
- package/dist/providers/alibaba.d.mts +1795 -0
- package/dist/providers/alibaba.d.mts.map +1 -0
- package/dist/providers/alibaba.mjs +39 -0
- package/dist/providers/alibaba.mjs.map +1 -0
- package/dist/providers/amazon-bedrock.d.mts +3713 -0
- package/dist/providers/amazon-bedrock.d.mts.map +1 -0
- package/dist/providers/amazon-bedrock.mjs +39 -0
- package/dist/providers/amazon-bedrock.mjs.map +1 -0
- package/dist/providers/anthropic.d.mts +1109 -0
- package/dist/providers/anthropic.d.mts.map +1 -0
- package/dist/providers/anthropic.mjs +39 -0
- package/dist/providers/anthropic.mjs.map +1 -0
- package/dist/providers/cerebras.d.mts +219 -0
- package/dist/providers/cerebras.d.mts.map +1 -0
- package/dist/providers/cerebras.mjs +39 -0
- package/dist/providers/cerebras.mjs.map +1 -0
- package/dist/providers/cohere.d.mts +555 -0
- package/dist/providers/cohere.d.mts.map +1 -0
- package/dist/providers/cohere.mjs +39 -0
- package/dist/providers/cohere.mjs.map +1 -0
- package/dist/providers/deepinfra.d.mts +1245 -0
- package/dist/providers/deepinfra.d.mts.map +1 -0
- package/dist/providers/deepinfra.mjs +39 -0
- package/dist/providers/deepinfra.mjs.map +1 -0
- package/dist/providers/deepseek.d.mts +139 -0
- package/dist/providers/deepseek.d.mts.map +1 -0
- package/dist/providers/deepseek.mjs +39 -0
- package/dist/providers/deepseek.mjs.map +1 -0
- package/dist/providers/fireworks-ai.d.mts +611 -0
- package/dist/providers/fireworks-ai.d.mts.map +1 -0
- package/dist/providers/fireworks-ai.mjs +39 -0
- package/dist/providers/fireworks-ai.mjs.map +1 -0
- package/dist/providers/google-vertex.d.mts +1227 -0
- package/dist/providers/google-vertex.d.mts.map +1 -0
- package/dist/providers/google-vertex.mjs +39 -0
- package/dist/providers/google-vertex.mjs.map +1 -0
- package/dist/providers/google.d.mts +1359 -0
- package/dist/providers/google.d.mts.map +1 -0
- package/dist/providers/google.mjs +39 -0
- package/dist/providers/google.mjs.map +1 -0
- package/dist/providers/groq.d.mts +765 -0
- package/dist/providers/groq.d.mts.map +1 -0
- package/dist/providers/groq.mjs +39 -0
- package/dist/providers/groq.mjs.map +1 -0
- package/dist/providers/huggingface.d.mts +901 -0
- package/dist/providers/huggingface.d.mts.map +1 -0
- package/dist/providers/huggingface.mjs +39 -0
- package/dist/providers/huggingface.mjs.map +1 -0
- package/dist/providers/inception.d.mts +231 -0
- package/dist/providers/inception.d.mts.map +1 -0
- package/dist/providers/inception.mjs +39 -0
- package/dist/providers/inception.mjs.map +1 -0
- package/dist/providers/llama.d.mts +345 -0
- package/dist/providers/llama.d.mts.map +1 -0
- package/dist/providers/llama.mjs +39 -0
- package/dist/providers/llama.mjs.map +1 -0
- package/dist/providers/mistral.d.mts +1143 -0
- package/dist/providers/mistral.d.mts.map +1 -0
- package/dist/providers/mistral.mjs +39 -0
- package/dist/providers/mistral.mjs.map +1 -0
- package/dist/providers/nvidia.d.mts +3117 -0
- package/dist/providers/nvidia.d.mts.map +1 -0
- package/dist/providers/nvidia.mjs +39 -0
- package/dist/providers/nvidia.mjs.map +1 -0
- package/dist/providers/openai.d.mts +1963 -0
- package/dist/providers/openai.d.mts.map +1 -0
- package/dist/providers/openai.mjs +39 -0
- package/dist/providers/openai.mjs.map +1 -0
- package/dist/providers/openrouter.d.mts +8531 -0
- package/dist/providers/openrouter.d.mts.map +1 -0
- package/dist/providers/openrouter.mjs +39 -0
- package/dist/providers/openrouter.mjs.map +1 -0
- package/dist/providers/perplexity.d.mts +221 -0
- package/dist/providers/perplexity.d.mts.map +1 -0
- package/dist/providers/perplexity.mjs +39 -0
- package/dist/providers/perplexity.mjs.map +1 -0
- package/dist/providers/togetherai.d.mts +767 -0
- package/dist/providers/togetherai.d.mts.map +1 -0
- package/dist/providers/togetherai.mjs +39 -0
- package/dist/providers/togetherai.mjs.map +1 -0
- package/dist/providers/xai.d.mts +1161 -0
- package/dist/providers/xai.d.mts.map +1 -0
- package/dist/providers/xai.mjs +39 -0
- package/dist/providers/xai.mjs.map +1 -0
- package/dist/togetherai-BvcxUfPE.mjs +382 -0
- package/dist/togetherai-BvcxUfPE.mjs.map +1 -0
- package/dist/types-DjdaZckF.d.mts +71 -0
- package/dist/types-DjdaZckF.d.mts.map +1 -0
- package/dist/xai-fSuAkQJo.mjs +587 -0
- package/dist/xai-fSuAkQJo.mjs.map +1 -0
- package/docs/catalog/filtering.md +102 -0
- package/docs/catalog/overview.md +168 -0
- package/docs/catalog/providers.md +73 -0
- package/docs/cost/overview.md +125 -0
- package/docs/guides/filter-models.md +113 -0
- package/docs/guides/setup-resolver.md +106 -0
- package/docs/guides/track-costs.md +133 -0
- package/docs/overview.md +139 -0
- package/docs/provider/configuration.md +100 -0
- package/docs/provider/openrouter.md +105 -0
- package/docs/provider/overview.md +131 -0
- package/docs/troubleshooting.md +100 -0
- package/package.json +142 -0
- package/providers.json +39 -0
- package/scripts/generate-models.ts +392 -0
- package/src/catalog/index.test.ts +124 -0
- package/src/catalog/index.ts +65 -0
- package/src/catalog/providers/alibaba.ts +468 -0
- package/src/catalog/providers/amazon-bedrock.ts +941 -0
- package/src/catalog/providers/anthropic.ts +270 -0
- package/src/catalog/providers/cerebras.ts +61 -0
- package/src/catalog/providers/cohere.ts +149 -0
- package/src/catalog/providers/deepinfra.ts +325 -0
- package/src/catalog/providers/deepseek.ts +39 -0
- package/src/catalog/providers/fireworks-ai.ts +160 -0
- package/src/catalog/providers/google-vertex.ts +314 -0
- package/src/catalog/providers/google.ts +347 -0
- package/src/catalog/providers/groq.ts +204 -0
- package/src/catalog/providers/huggingface.ts +237 -0
- package/src/catalog/providers/inception.ts +61 -0
- package/src/catalog/providers/index.ts +59 -0
- package/src/catalog/providers/llama.ts +94 -0
- package/src/catalog/providers/mistral.ts +303 -0
- package/src/catalog/providers/nvidia.ts +820 -0
- package/src/catalog/providers/openai.ts +501 -0
- package/src/catalog/providers/openrouter.ts +2201 -0
- package/src/catalog/providers/perplexity.ts +61 -0
- package/src/catalog/providers/togetherai.ts +204 -0
- package/src/catalog/providers/xai.ts +292 -0
- package/src/catalog/types.ts +86 -0
- package/src/cost/calculate.test.ts +157 -0
- package/src/cost/calculate.ts +43 -0
- package/src/cost/index.ts +2 -0
- package/src/cost/types.ts +25 -0
- package/src/index.ts +25 -0
- package/src/provider/index.ts +9 -0
- package/src/provider/openrouter.test.ts +125 -0
- package/src/provider/openrouter.ts +110 -0
- package/src/provider/resolver.test.ts +138 -0
- package/src/provider/resolver.ts +125 -0
- package/src/provider/types.ts +39 -0
- package/src/providers/alibaba.ts +65 -0
- package/src/providers/amazon-bedrock.ts +67 -0
- package/src/providers/anthropic.ts +65 -0
- package/src/providers/cerebras.ts +65 -0
- package/src/providers/cohere.ts +65 -0
- package/src/providers/deepinfra.ts +65 -0
- package/src/providers/deepseek.ts +65 -0
- package/src/providers/fireworks-ai.ts +65 -0
- package/src/providers/google-vertex.ts +67 -0
- package/src/providers/google.ts +65 -0
- package/src/providers/groq.ts +65 -0
- package/src/providers/huggingface.ts +67 -0
- package/src/providers/inception.ts +65 -0
- package/src/providers/llama.ts +65 -0
- package/src/providers/mistral.ts +65 -0
- package/src/providers/nvidia.ts +65 -0
- package/src/providers/openai.ts +65 -0
- package/src/providers/openrouter.ts +67 -0
- package/src/providers/perplexity.ts +67 -0
- package/src/providers/togetherai.ts +65 -0
- package/src/providers/xai.ts +65 -0
- package/tsconfig.json +25 -0
- package/tsdown.config.ts +23 -0
- package/vitest.config.ts +29 -0
|
@@ -0,0 +1,3117 @@
|
|
|
1
|
+
import { n as ModelDefinition } from "../types-DjdaZckF.mjs";
|
|
2
|
+
import { LiteralUnion } from "type-fest";
|
|
3
|
+
|
|
4
|
+
//#region src/catalog/providers/nvidia.d.ts
|
|
5
|
+
declare const NVIDIA_MODELS: readonly [{
|
|
6
|
+
readonly id: "nvidia/llama-3.1-nemotron-70b-instruct";
|
|
7
|
+
readonly name: "Llama 3.1 Nemotron 70b Instruct";
|
|
8
|
+
readonly provider: "nvidia";
|
|
9
|
+
readonly family: "";
|
|
10
|
+
readonly pricing: {
|
|
11
|
+
readonly input: 0;
|
|
12
|
+
readonly output: 0;
|
|
13
|
+
};
|
|
14
|
+
readonly contextWindow: 128000;
|
|
15
|
+
readonly maxOutput: 4096;
|
|
16
|
+
readonly modalities: {
|
|
17
|
+
readonly input: readonly ["text"];
|
|
18
|
+
readonly output: readonly ["text"];
|
|
19
|
+
};
|
|
20
|
+
readonly capabilities: {
|
|
21
|
+
readonly reasoning: false;
|
|
22
|
+
readonly toolCall: true;
|
|
23
|
+
readonly attachment: false;
|
|
24
|
+
readonly structuredOutput: true;
|
|
25
|
+
};
|
|
26
|
+
}, {
|
|
27
|
+
readonly id: "nvidia/llama-3.1-nemotron-ultra-253b-v1";
|
|
28
|
+
readonly name: "Llama-3.1-Nemotron-Ultra-253B-v1";
|
|
29
|
+
readonly provider: "nvidia";
|
|
30
|
+
readonly family: "llama";
|
|
31
|
+
readonly pricing: {
|
|
32
|
+
readonly input: 0;
|
|
33
|
+
readonly output: 0;
|
|
34
|
+
};
|
|
35
|
+
readonly contextWindow: 131072;
|
|
36
|
+
readonly maxOutput: 8192;
|
|
37
|
+
readonly modalities: {
|
|
38
|
+
readonly input: readonly ["text"];
|
|
39
|
+
readonly output: readonly ["text"];
|
|
40
|
+
};
|
|
41
|
+
readonly capabilities: {
|
|
42
|
+
readonly reasoning: true;
|
|
43
|
+
readonly toolCall: true;
|
|
44
|
+
readonly attachment: false;
|
|
45
|
+
readonly structuredOutput: false;
|
|
46
|
+
};
|
|
47
|
+
}, {
|
|
48
|
+
readonly id: "nvidia/llama-3.1-nemotron-51b-instruct";
|
|
49
|
+
readonly name: "Llama 3.1 Nemotron 51b Instruct";
|
|
50
|
+
readonly provider: "nvidia";
|
|
51
|
+
readonly family: "";
|
|
52
|
+
readonly pricing: {
|
|
53
|
+
readonly input: 0;
|
|
54
|
+
readonly output: 0;
|
|
55
|
+
};
|
|
56
|
+
readonly contextWindow: 128000;
|
|
57
|
+
readonly maxOutput: 4096;
|
|
58
|
+
readonly modalities: {
|
|
59
|
+
readonly input: readonly ["text"];
|
|
60
|
+
readonly output: readonly ["text"];
|
|
61
|
+
};
|
|
62
|
+
readonly capabilities: {
|
|
63
|
+
readonly reasoning: false;
|
|
64
|
+
readonly toolCall: true;
|
|
65
|
+
readonly attachment: false;
|
|
66
|
+
readonly structuredOutput: true;
|
|
67
|
+
};
|
|
68
|
+
}, {
|
|
69
|
+
readonly id: "nvidia/parakeet-tdt-0.6b-v2";
|
|
70
|
+
readonly name: "Parakeet TDT 0.6B v2";
|
|
71
|
+
readonly provider: "nvidia";
|
|
72
|
+
readonly family: "parakeet";
|
|
73
|
+
readonly pricing: {
|
|
74
|
+
readonly input: 0;
|
|
75
|
+
readonly output: 0;
|
|
76
|
+
};
|
|
77
|
+
readonly contextWindow: 0;
|
|
78
|
+
readonly maxOutput: 4096;
|
|
79
|
+
readonly modalities: {
|
|
80
|
+
readonly input: readonly ["audio"];
|
|
81
|
+
readonly output: readonly ["text"];
|
|
82
|
+
};
|
|
83
|
+
readonly capabilities: {
|
|
84
|
+
readonly reasoning: false;
|
|
85
|
+
readonly toolCall: false;
|
|
86
|
+
readonly attachment: false;
|
|
87
|
+
readonly structuredOutput: false;
|
|
88
|
+
};
|
|
89
|
+
}, {
|
|
90
|
+
readonly id: "nvidia/nvidia-nemotron-nano-9b-v2";
|
|
91
|
+
readonly name: "nvidia-nemotron-nano-9b-v2";
|
|
92
|
+
readonly provider: "nvidia";
|
|
93
|
+
readonly family: "nemotron";
|
|
94
|
+
readonly pricing: {
|
|
95
|
+
readonly input: 0;
|
|
96
|
+
readonly output: 0;
|
|
97
|
+
};
|
|
98
|
+
readonly contextWindow: 131072;
|
|
99
|
+
readonly maxOutput: 131072;
|
|
100
|
+
readonly modalities: {
|
|
101
|
+
readonly input: readonly ["text"];
|
|
102
|
+
readonly output: readonly ["text"];
|
|
103
|
+
};
|
|
104
|
+
readonly capabilities: {
|
|
105
|
+
readonly reasoning: true;
|
|
106
|
+
readonly toolCall: true;
|
|
107
|
+
readonly attachment: false;
|
|
108
|
+
readonly structuredOutput: false;
|
|
109
|
+
};
|
|
110
|
+
}, {
|
|
111
|
+
readonly id: "nvidia/llama-embed-nemotron-8b";
|
|
112
|
+
readonly name: "Llama Embed Nemotron 8B";
|
|
113
|
+
readonly provider: "nvidia";
|
|
114
|
+
readonly family: "llama";
|
|
115
|
+
readonly pricing: {
|
|
116
|
+
readonly input: 0;
|
|
117
|
+
readonly output: 0;
|
|
118
|
+
};
|
|
119
|
+
readonly contextWindow: 32768;
|
|
120
|
+
readonly maxOutput: 2048;
|
|
121
|
+
readonly modalities: {
|
|
122
|
+
readonly input: readonly ["text"];
|
|
123
|
+
readonly output: readonly ["text"];
|
|
124
|
+
};
|
|
125
|
+
readonly capabilities: {
|
|
126
|
+
readonly reasoning: false;
|
|
127
|
+
readonly toolCall: false;
|
|
128
|
+
readonly attachment: false;
|
|
129
|
+
readonly structuredOutput: false;
|
|
130
|
+
};
|
|
131
|
+
}, {
|
|
132
|
+
readonly id: "nvidia/llama-3.3-nemotron-super-49b-v1.5";
|
|
133
|
+
readonly name: "Llama 3.3 Nemotron Super 49b V1.5";
|
|
134
|
+
readonly provider: "nvidia";
|
|
135
|
+
readonly family: "";
|
|
136
|
+
readonly pricing: {
|
|
137
|
+
readonly input: 0;
|
|
138
|
+
readonly output: 0;
|
|
139
|
+
};
|
|
140
|
+
readonly contextWindow: 128000;
|
|
141
|
+
readonly maxOutput: 4096;
|
|
142
|
+
readonly modalities: {
|
|
143
|
+
readonly input: readonly ["text"];
|
|
144
|
+
readonly output: readonly ["text"];
|
|
145
|
+
};
|
|
146
|
+
readonly capabilities: {
|
|
147
|
+
readonly reasoning: false;
|
|
148
|
+
readonly toolCall: false;
|
|
149
|
+
readonly attachment: false;
|
|
150
|
+
readonly structuredOutput: false;
|
|
151
|
+
};
|
|
152
|
+
}, {
|
|
153
|
+
readonly id: "nvidia/llama-3.3-nemotron-super-49b-v1";
|
|
154
|
+
readonly name: "Llama 3.3 Nemotron Super 49b V1";
|
|
155
|
+
readonly provider: "nvidia";
|
|
156
|
+
readonly family: "";
|
|
157
|
+
readonly pricing: {
|
|
158
|
+
readonly input: 0;
|
|
159
|
+
readonly output: 0;
|
|
160
|
+
};
|
|
161
|
+
readonly contextWindow: 128000;
|
|
162
|
+
readonly maxOutput: 4096;
|
|
163
|
+
readonly modalities: {
|
|
164
|
+
readonly input: readonly ["text"];
|
|
165
|
+
readonly output: readonly ["text"];
|
|
166
|
+
};
|
|
167
|
+
readonly capabilities: {
|
|
168
|
+
readonly reasoning: false;
|
|
169
|
+
readonly toolCall: false;
|
|
170
|
+
readonly attachment: false;
|
|
171
|
+
readonly structuredOutput: false;
|
|
172
|
+
};
|
|
173
|
+
}, {
|
|
174
|
+
readonly id: "nvidia/llama3-chatqa-1.5-70b";
|
|
175
|
+
readonly name: "Llama3 Chatqa 1.5 70b";
|
|
176
|
+
readonly provider: "nvidia";
|
|
177
|
+
readonly family: "";
|
|
178
|
+
readonly pricing: {
|
|
179
|
+
readonly input: 0;
|
|
180
|
+
readonly output: 0;
|
|
181
|
+
};
|
|
182
|
+
readonly contextWindow: 128000;
|
|
183
|
+
readonly maxOutput: 4096;
|
|
184
|
+
readonly modalities: {
|
|
185
|
+
readonly input: readonly ["text"];
|
|
186
|
+
readonly output: readonly ["text"];
|
|
187
|
+
};
|
|
188
|
+
readonly capabilities: {
|
|
189
|
+
readonly reasoning: false;
|
|
190
|
+
readonly toolCall: true;
|
|
191
|
+
readonly attachment: false;
|
|
192
|
+
readonly structuredOutput: true;
|
|
193
|
+
};
|
|
194
|
+
}, {
|
|
195
|
+
readonly id: "nvidia/cosmos-nemotron-34b";
|
|
196
|
+
readonly name: "Cosmos Nemotron 34B";
|
|
197
|
+
readonly provider: "nvidia";
|
|
198
|
+
readonly family: "nemotron";
|
|
199
|
+
readonly pricing: {
|
|
200
|
+
readonly input: 0;
|
|
201
|
+
readonly output: 0;
|
|
202
|
+
};
|
|
203
|
+
readonly contextWindow: 131072;
|
|
204
|
+
readonly maxOutput: 8192;
|
|
205
|
+
readonly modalities: {
|
|
206
|
+
readonly input: readonly ["text", "image", "video"];
|
|
207
|
+
readonly output: readonly ["text"];
|
|
208
|
+
};
|
|
209
|
+
readonly capabilities: {
|
|
210
|
+
readonly reasoning: true;
|
|
211
|
+
readonly toolCall: false;
|
|
212
|
+
readonly attachment: false;
|
|
213
|
+
readonly structuredOutput: false;
|
|
214
|
+
};
|
|
215
|
+
}, {
|
|
216
|
+
readonly id: "nvidia/nemoretriever-ocr-v1";
|
|
217
|
+
readonly name: "NeMo Retriever OCR v1";
|
|
218
|
+
readonly provider: "nvidia";
|
|
219
|
+
readonly family: "nemoretriever";
|
|
220
|
+
readonly pricing: {
|
|
221
|
+
readonly input: 0;
|
|
222
|
+
readonly output: 0;
|
|
223
|
+
};
|
|
224
|
+
readonly contextWindow: 0;
|
|
225
|
+
readonly maxOutput: 4096;
|
|
226
|
+
readonly modalities: {
|
|
227
|
+
readonly input: readonly ["image"];
|
|
228
|
+
readonly output: readonly ["text"];
|
|
229
|
+
};
|
|
230
|
+
readonly capabilities: {
|
|
231
|
+
readonly reasoning: false;
|
|
232
|
+
readonly toolCall: false;
|
|
233
|
+
readonly attachment: false;
|
|
234
|
+
readonly structuredOutput: false;
|
|
235
|
+
};
|
|
236
|
+
}, {
|
|
237
|
+
readonly id: "nvidia/nemotron-4-340b-instruct";
|
|
238
|
+
readonly name: "Nemotron 4 340b Instruct";
|
|
239
|
+
readonly provider: "nvidia";
|
|
240
|
+
readonly family: "";
|
|
241
|
+
readonly pricing: {
|
|
242
|
+
readonly input: 0;
|
|
243
|
+
readonly output: 0;
|
|
244
|
+
};
|
|
245
|
+
readonly contextWindow: 128000;
|
|
246
|
+
readonly maxOutput: 4096;
|
|
247
|
+
readonly modalities: {
|
|
248
|
+
readonly input: readonly ["text"];
|
|
249
|
+
readonly output: readonly ["text"];
|
|
250
|
+
};
|
|
251
|
+
readonly capabilities: {
|
|
252
|
+
readonly reasoning: false;
|
|
253
|
+
readonly toolCall: true;
|
|
254
|
+
readonly attachment: false;
|
|
255
|
+
readonly structuredOutput: true;
|
|
256
|
+
};
|
|
257
|
+
}, {
|
|
258
|
+
readonly id: "nvidia/nemotron-3-nano-30b-a3b";
|
|
259
|
+
readonly name: "nemotron-3-nano-30b-a3b";
|
|
260
|
+
readonly provider: "nvidia";
|
|
261
|
+
readonly family: "nemotron";
|
|
262
|
+
readonly pricing: {
|
|
263
|
+
readonly input: 0;
|
|
264
|
+
readonly output: 0;
|
|
265
|
+
};
|
|
266
|
+
readonly contextWindow: 131072;
|
|
267
|
+
readonly maxOutput: 131072;
|
|
268
|
+
readonly modalities: {
|
|
269
|
+
readonly input: readonly ["text"];
|
|
270
|
+
readonly output: readonly ["text"];
|
|
271
|
+
};
|
|
272
|
+
readonly capabilities: {
|
|
273
|
+
readonly reasoning: true;
|
|
274
|
+
readonly toolCall: true;
|
|
275
|
+
readonly attachment: false;
|
|
276
|
+
readonly structuredOutput: false;
|
|
277
|
+
};
|
|
278
|
+
}, {
|
|
279
|
+
readonly id: "microsoft/phi-3-small-128k-instruct";
|
|
280
|
+
readonly name: "Phi 3 Small 128k Instruct";
|
|
281
|
+
readonly provider: "nvidia";
|
|
282
|
+
readonly family: "";
|
|
283
|
+
readonly pricing: {
|
|
284
|
+
readonly input: 0;
|
|
285
|
+
readonly output: 0;
|
|
286
|
+
};
|
|
287
|
+
readonly contextWindow: 128000;
|
|
288
|
+
readonly maxOutput: 4096;
|
|
289
|
+
readonly modalities: {
|
|
290
|
+
readonly input: readonly ["text", "image"];
|
|
291
|
+
readonly output: readonly ["text"];
|
|
292
|
+
};
|
|
293
|
+
readonly capabilities: {
|
|
294
|
+
readonly reasoning: false;
|
|
295
|
+
readonly toolCall: true;
|
|
296
|
+
readonly attachment: true;
|
|
297
|
+
readonly structuredOutput: true;
|
|
298
|
+
};
|
|
299
|
+
}, {
|
|
300
|
+
readonly id: "microsoft/phi-3-medium-128k-instruct";
|
|
301
|
+
readonly name: "Phi 3 Medium 128k Instruct";
|
|
302
|
+
readonly provider: "nvidia";
|
|
303
|
+
readonly family: "";
|
|
304
|
+
readonly pricing: {
|
|
305
|
+
readonly input: 0;
|
|
306
|
+
readonly output: 0;
|
|
307
|
+
};
|
|
308
|
+
readonly contextWindow: 128000;
|
|
309
|
+
readonly maxOutput: 4096;
|
|
310
|
+
readonly modalities: {
|
|
311
|
+
readonly input: readonly ["text", "image"];
|
|
312
|
+
readonly output: readonly ["text"];
|
|
313
|
+
};
|
|
314
|
+
readonly capabilities: {
|
|
315
|
+
readonly reasoning: false;
|
|
316
|
+
readonly toolCall: true;
|
|
317
|
+
readonly attachment: true;
|
|
318
|
+
readonly structuredOutput: true;
|
|
319
|
+
};
|
|
320
|
+
}, {
|
|
321
|
+
readonly id: "microsoft/phi-3.5-moe-instruct";
|
|
322
|
+
readonly name: "Phi 3.5 Moe Instruct";
|
|
323
|
+
readonly provider: "nvidia";
|
|
324
|
+
readonly family: "";
|
|
325
|
+
readonly pricing: {
|
|
326
|
+
readonly input: 0;
|
|
327
|
+
readonly output: 0;
|
|
328
|
+
};
|
|
329
|
+
readonly contextWindow: 128000;
|
|
330
|
+
readonly maxOutput: 4096;
|
|
331
|
+
readonly modalities: {
|
|
332
|
+
readonly input: readonly ["text"];
|
|
333
|
+
readonly output: readonly ["text"];
|
|
334
|
+
};
|
|
335
|
+
readonly capabilities: {
|
|
336
|
+
readonly reasoning: false;
|
|
337
|
+
readonly toolCall: true;
|
|
338
|
+
readonly attachment: false;
|
|
339
|
+
readonly structuredOutput: true;
|
|
340
|
+
};
|
|
341
|
+
}, {
|
|
342
|
+
readonly id: "microsoft/phi-3-vision-128k-instruct";
|
|
343
|
+
readonly name: "Phi 3 Vision 128k Instruct";
|
|
344
|
+
readonly provider: "nvidia";
|
|
345
|
+
readonly family: "";
|
|
346
|
+
readonly pricing: {
|
|
347
|
+
readonly input: 0;
|
|
348
|
+
readonly output: 0;
|
|
349
|
+
};
|
|
350
|
+
readonly contextWindow: 128000;
|
|
351
|
+
readonly maxOutput: 4096;
|
|
352
|
+
readonly modalities: {
|
|
353
|
+
readonly input: readonly ["text", "image"];
|
|
354
|
+
readonly output: readonly ["text"];
|
|
355
|
+
};
|
|
356
|
+
readonly capabilities: {
|
|
357
|
+
readonly reasoning: false;
|
|
358
|
+
readonly toolCall: true;
|
|
359
|
+
readonly attachment: false;
|
|
360
|
+
readonly structuredOutput: true;
|
|
361
|
+
};
|
|
362
|
+
}, {
|
|
363
|
+
readonly id: "microsoft/phi-4-mini-instruct";
|
|
364
|
+
readonly name: "Phi-4-Mini";
|
|
365
|
+
readonly provider: "nvidia";
|
|
366
|
+
readonly family: "phi";
|
|
367
|
+
readonly pricing: {
|
|
368
|
+
readonly input: 0;
|
|
369
|
+
readonly output: 0;
|
|
370
|
+
};
|
|
371
|
+
readonly contextWindow: 131072;
|
|
372
|
+
readonly maxOutput: 8192;
|
|
373
|
+
readonly modalities: {
|
|
374
|
+
readonly input: readonly ["text", "image", "audio"];
|
|
375
|
+
readonly output: readonly ["text"];
|
|
376
|
+
};
|
|
377
|
+
readonly capabilities: {
|
|
378
|
+
readonly reasoning: true;
|
|
379
|
+
readonly toolCall: true;
|
|
380
|
+
readonly attachment: true;
|
|
381
|
+
readonly structuredOutput: false;
|
|
382
|
+
};
|
|
383
|
+
}, {
|
|
384
|
+
readonly id: "microsoft/phi-3.5-vision-instruct";
|
|
385
|
+
readonly name: "Phi 3.5 Vision Instruct";
|
|
386
|
+
readonly provider: "nvidia";
|
|
387
|
+
readonly family: "";
|
|
388
|
+
readonly pricing: {
|
|
389
|
+
readonly input: 0;
|
|
390
|
+
readonly output: 0;
|
|
391
|
+
};
|
|
392
|
+
readonly contextWindow: 128000;
|
|
393
|
+
readonly maxOutput: 4096;
|
|
394
|
+
readonly modalities: {
|
|
395
|
+
readonly input: readonly ["text", "image"];
|
|
396
|
+
readonly output: readonly ["text"];
|
|
397
|
+
};
|
|
398
|
+
readonly capabilities: {
|
|
399
|
+
readonly reasoning: false;
|
|
400
|
+
readonly toolCall: true;
|
|
401
|
+
readonly attachment: false;
|
|
402
|
+
readonly structuredOutput: true;
|
|
403
|
+
};
|
|
404
|
+
}, {
|
|
405
|
+
readonly id: "microsoft/phi-3-medium-4k-instruct";
|
|
406
|
+
readonly name: "Phi 3 Medium 4k Instruct";
|
|
407
|
+
readonly provider: "nvidia";
|
|
408
|
+
readonly family: "";
|
|
409
|
+
readonly pricing: {
|
|
410
|
+
readonly input: 0;
|
|
411
|
+
readonly output: 0;
|
|
412
|
+
};
|
|
413
|
+
readonly contextWindow: 4000;
|
|
414
|
+
readonly maxOutput: 4096;
|
|
415
|
+
readonly modalities: {
|
|
416
|
+
readonly input: readonly ["text", "image"];
|
|
417
|
+
readonly output: readonly ["text"];
|
|
418
|
+
};
|
|
419
|
+
readonly capabilities: {
|
|
420
|
+
readonly reasoning: false;
|
|
421
|
+
readonly toolCall: true;
|
|
422
|
+
readonly attachment: true;
|
|
423
|
+
readonly structuredOutput: true;
|
|
424
|
+
};
|
|
425
|
+
}, {
|
|
426
|
+
readonly id: "microsoft/phi-3-small-8k-instruct";
|
|
427
|
+
readonly name: "Phi 3 Small 8k Instruct";
|
|
428
|
+
readonly provider: "nvidia";
|
|
429
|
+
readonly family: "";
|
|
430
|
+
readonly pricing: {
|
|
431
|
+
readonly input: 0;
|
|
432
|
+
readonly output: 0;
|
|
433
|
+
};
|
|
434
|
+
readonly contextWindow: 8000;
|
|
435
|
+
readonly maxOutput: 4096;
|
|
436
|
+
readonly modalities: {
|
|
437
|
+
readonly input: readonly ["text", "image"];
|
|
438
|
+
readonly output: readonly ["text"];
|
|
439
|
+
};
|
|
440
|
+
readonly capabilities: {
|
|
441
|
+
readonly reasoning: false;
|
|
442
|
+
readonly toolCall: true;
|
|
443
|
+
readonly attachment: true;
|
|
444
|
+
readonly structuredOutput: true;
|
|
445
|
+
};
|
|
446
|
+
}, {
|
|
447
|
+
readonly id: "minimaxai/minimax-m2.1";
|
|
448
|
+
readonly name: "MiniMax-M2.1";
|
|
449
|
+
readonly provider: "nvidia";
|
|
450
|
+
readonly family: "minimax";
|
|
451
|
+
readonly pricing: {
|
|
452
|
+
readonly input: 0;
|
|
453
|
+
readonly output: 0;
|
|
454
|
+
};
|
|
455
|
+
readonly contextWindow: 204800;
|
|
456
|
+
readonly maxOutput: 131072;
|
|
457
|
+
readonly modalities: {
|
|
458
|
+
readonly input: readonly ["text"];
|
|
459
|
+
readonly output: readonly ["text"];
|
|
460
|
+
};
|
|
461
|
+
readonly capabilities: {
|
|
462
|
+
readonly reasoning: true;
|
|
463
|
+
readonly toolCall: true;
|
|
464
|
+
readonly attachment: false;
|
|
465
|
+
readonly structuredOutput: false;
|
|
466
|
+
};
|
|
467
|
+
}, {
|
|
468
|
+
readonly id: "minimaxai/minimax-m2.5";
|
|
469
|
+
readonly name: "MiniMax-M2.5";
|
|
470
|
+
readonly provider: "nvidia";
|
|
471
|
+
readonly family: "minimax";
|
|
472
|
+
readonly pricing: {
|
|
473
|
+
readonly input: 0;
|
|
474
|
+
readonly output: 0;
|
|
475
|
+
};
|
|
476
|
+
readonly contextWindow: 204800;
|
|
477
|
+
readonly maxOutput: 131072;
|
|
478
|
+
readonly modalities: {
|
|
479
|
+
readonly input: readonly ["text"];
|
|
480
|
+
readonly output: readonly ["text"];
|
|
481
|
+
};
|
|
482
|
+
readonly capabilities: {
|
|
483
|
+
readonly reasoning: true;
|
|
484
|
+
readonly toolCall: true;
|
|
485
|
+
readonly attachment: false;
|
|
486
|
+
readonly structuredOutput: false;
|
|
487
|
+
};
|
|
488
|
+
}, {
|
|
489
|
+
readonly id: "deepseek-ai/deepseek-v3.1";
|
|
490
|
+
readonly name: "DeepSeek V3.1";
|
|
491
|
+
readonly provider: "nvidia";
|
|
492
|
+
readonly family: "deepseek";
|
|
493
|
+
readonly pricing: {
|
|
494
|
+
readonly input: 0;
|
|
495
|
+
readonly output: 0;
|
|
496
|
+
};
|
|
497
|
+
readonly contextWindow: 128000;
|
|
498
|
+
readonly maxOutput: 8192;
|
|
499
|
+
readonly modalities: {
|
|
500
|
+
readonly input: readonly ["text"];
|
|
501
|
+
readonly output: readonly ["text"];
|
|
502
|
+
};
|
|
503
|
+
readonly capabilities: {
|
|
504
|
+
readonly reasoning: true;
|
|
505
|
+
readonly toolCall: true;
|
|
506
|
+
readonly attachment: false;
|
|
507
|
+
readonly structuredOutput: false;
|
|
508
|
+
};
|
|
509
|
+
}, {
|
|
510
|
+
readonly id: "deepseek-ai/deepseek-r1-0528";
|
|
511
|
+
readonly name: "Deepseek R1 0528";
|
|
512
|
+
readonly provider: "nvidia";
|
|
513
|
+
readonly family: "";
|
|
514
|
+
readonly pricing: {
|
|
515
|
+
readonly input: 0;
|
|
516
|
+
readonly output: 0;
|
|
517
|
+
};
|
|
518
|
+
readonly contextWindow: 128000;
|
|
519
|
+
readonly maxOutput: 4096;
|
|
520
|
+
readonly modalities: {
|
|
521
|
+
readonly input: readonly ["text"];
|
|
522
|
+
readonly output: readonly ["text"];
|
|
523
|
+
};
|
|
524
|
+
readonly capabilities: {
|
|
525
|
+
readonly reasoning: true;
|
|
526
|
+
readonly toolCall: true;
|
|
527
|
+
readonly attachment: false;
|
|
528
|
+
readonly structuredOutput: true;
|
|
529
|
+
};
|
|
530
|
+
}, {
|
|
531
|
+
readonly id: "deepseek-ai/deepseek-r1";
|
|
532
|
+
readonly name: "Deepseek R1";
|
|
533
|
+
readonly provider: "nvidia";
|
|
534
|
+
readonly family: "";
|
|
535
|
+
readonly pricing: {
|
|
536
|
+
readonly input: 0;
|
|
537
|
+
readonly output: 0;
|
|
538
|
+
};
|
|
539
|
+
readonly contextWindow: 128000;
|
|
540
|
+
readonly maxOutput: 4096;
|
|
541
|
+
readonly modalities: {
|
|
542
|
+
readonly input: readonly ["text"];
|
|
543
|
+
readonly output: readonly ["text"];
|
|
544
|
+
};
|
|
545
|
+
readonly capabilities: {
|
|
546
|
+
readonly reasoning: true;
|
|
547
|
+
readonly toolCall: false;
|
|
548
|
+
readonly attachment: false;
|
|
549
|
+
readonly structuredOutput: false;
|
|
550
|
+
};
|
|
551
|
+
}, {
|
|
552
|
+
readonly id: "deepseek-ai/deepseek-v3.1-terminus";
|
|
553
|
+
readonly name: "DeepSeek V3.1 Terminus";
|
|
554
|
+
readonly provider: "nvidia";
|
|
555
|
+
readonly family: "deepseek";
|
|
556
|
+
readonly pricing: {
|
|
557
|
+
readonly input: 0;
|
|
558
|
+
readonly output: 0;
|
|
559
|
+
};
|
|
560
|
+
readonly contextWindow: 128000;
|
|
561
|
+
readonly maxOutput: 8192;
|
|
562
|
+
readonly modalities: {
|
|
563
|
+
readonly input: readonly ["text"];
|
|
564
|
+
readonly output: readonly ["text"];
|
|
565
|
+
};
|
|
566
|
+
readonly capabilities: {
|
|
567
|
+
readonly reasoning: true;
|
|
568
|
+
readonly toolCall: true;
|
|
569
|
+
readonly attachment: false;
|
|
570
|
+
readonly structuredOutput: false;
|
|
571
|
+
};
|
|
572
|
+
}, {
|
|
573
|
+
readonly id: "deepseek-ai/deepseek-coder-6.7b-instruct";
|
|
574
|
+
readonly name: "Deepseek Coder 6.7b Instruct";
|
|
575
|
+
readonly provider: "nvidia";
|
|
576
|
+
readonly family: "";
|
|
577
|
+
readonly pricing: {
|
|
578
|
+
readonly input: 0;
|
|
579
|
+
readonly output: 0;
|
|
580
|
+
};
|
|
581
|
+
readonly contextWindow: 128000;
|
|
582
|
+
readonly maxOutput: 4096;
|
|
583
|
+
readonly modalities: {
|
|
584
|
+
readonly input: readonly ["text"];
|
|
585
|
+
readonly output: readonly ["text"];
|
|
586
|
+
};
|
|
587
|
+
readonly capabilities: {
|
|
588
|
+
readonly reasoning: false;
|
|
589
|
+
readonly toolCall: true;
|
|
590
|
+
readonly attachment: false;
|
|
591
|
+
readonly structuredOutput: true;
|
|
592
|
+
};
|
|
593
|
+
}, {
|
|
594
|
+
readonly id: "deepseek-ai/deepseek-v3.2";
|
|
595
|
+
readonly name: "DeepSeek V3.2";
|
|
596
|
+
readonly provider: "nvidia";
|
|
597
|
+
readonly family: "deepseek";
|
|
598
|
+
readonly pricing: {
|
|
599
|
+
readonly input: 0;
|
|
600
|
+
readonly output: 0;
|
|
601
|
+
};
|
|
602
|
+
readonly contextWindow: 163840;
|
|
603
|
+
readonly maxOutput: 65536;
|
|
604
|
+
readonly modalities: {
|
|
605
|
+
readonly input: readonly ["text"];
|
|
606
|
+
readonly output: readonly ["text"];
|
|
607
|
+
};
|
|
608
|
+
readonly capabilities: {
|
|
609
|
+
readonly reasoning: true;
|
|
610
|
+
readonly toolCall: true;
|
|
611
|
+
readonly attachment: false;
|
|
612
|
+
readonly structuredOutput: false;
|
|
613
|
+
};
|
|
614
|
+
}, {
|
|
615
|
+
readonly id: "moonshotai/kimi-k2-instruct";
|
|
616
|
+
readonly name: "Kimi K2 Instruct";
|
|
617
|
+
readonly provider: "nvidia";
|
|
618
|
+
readonly family: "kimi";
|
|
619
|
+
readonly pricing: {
|
|
620
|
+
readonly input: 0;
|
|
621
|
+
readonly output: 0;
|
|
622
|
+
};
|
|
623
|
+
readonly contextWindow: 128000;
|
|
624
|
+
readonly maxOutput: 8192;
|
|
625
|
+
readonly modalities: {
|
|
626
|
+
readonly input: readonly ["text"];
|
|
627
|
+
readonly output: readonly ["text"];
|
|
628
|
+
};
|
|
629
|
+
readonly capabilities: {
|
|
630
|
+
readonly reasoning: true;
|
|
631
|
+
readonly toolCall: true;
|
|
632
|
+
readonly attachment: false;
|
|
633
|
+
readonly structuredOutput: false;
|
|
634
|
+
};
|
|
635
|
+
}, {
|
|
636
|
+
readonly id: "moonshotai/kimi-k2-instruct-0905";
|
|
637
|
+
readonly name: "Kimi K2 0905";
|
|
638
|
+
readonly provider: "nvidia";
|
|
639
|
+
readonly family: "kimi";
|
|
640
|
+
readonly pricing: {
|
|
641
|
+
readonly input: 0;
|
|
642
|
+
readonly output: 0;
|
|
643
|
+
};
|
|
644
|
+
readonly contextWindow: 262144;
|
|
645
|
+
readonly maxOutput: 262144;
|
|
646
|
+
readonly modalities: {
|
|
647
|
+
readonly input: readonly ["text"];
|
|
648
|
+
readonly output: readonly ["text"];
|
|
649
|
+
};
|
|
650
|
+
readonly capabilities: {
|
|
651
|
+
readonly reasoning: false;
|
|
652
|
+
readonly toolCall: true;
|
|
653
|
+
readonly attachment: false;
|
|
654
|
+
readonly structuredOutput: false;
|
|
655
|
+
};
|
|
656
|
+
}, {
|
|
657
|
+
readonly id: "moonshotai/kimi-k2.5";
|
|
658
|
+
readonly name: "Kimi K2.5";
|
|
659
|
+
readonly provider: "nvidia";
|
|
660
|
+
readonly family: "kimi";
|
|
661
|
+
readonly pricing: {
|
|
662
|
+
readonly input: 0;
|
|
663
|
+
readonly output: 0;
|
|
664
|
+
};
|
|
665
|
+
readonly contextWindow: 262144;
|
|
666
|
+
readonly maxOutput: 262144;
|
|
667
|
+
readonly modalities: {
|
|
668
|
+
readonly input: readonly ["text", "image", "video"];
|
|
669
|
+
readonly output: readonly ["text"];
|
|
670
|
+
};
|
|
671
|
+
readonly capabilities: {
|
|
672
|
+
readonly reasoning: true;
|
|
673
|
+
readonly toolCall: true;
|
|
674
|
+
readonly attachment: true;
|
|
675
|
+
readonly structuredOutput: false;
|
|
676
|
+
};
|
|
677
|
+
}, {
|
|
678
|
+
readonly id: "moonshotai/kimi-k2-thinking";
|
|
679
|
+
readonly name: "Kimi K2 Thinking";
|
|
680
|
+
readonly provider: "nvidia";
|
|
681
|
+
readonly family: "kimi-thinking";
|
|
682
|
+
readonly pricing: {
|
|
683
|
+
readonly input: 0;
|
|
684
|
+
readonly output: 0;
|
|
685
|
+
};
|
|
686
|
+
readonly contextWindow: 262144;
|
|
687
|
+
readonly maxOutput: 262144;
|
|
688
|
+
readonly modalities: {
|
|
689
|
+
readonly input: readonly ["text"];
|
|
690
|
+
readonly output: readonly ["text"];
|
|
691
|
+
};
|
|
692
|
+
readonly capabilities: {
|
|
693
|
+
readonly reasoning: true;
|
|
694
|
+
readonly toolCall: true;
|
|
695
|
+
readonly attachment: false;
|
|
696
|
+
readonly structuredOutput: true;
|
|
697
|
+
};
|
|
698
|
+
}, {
|
|
699
|
+
readonly id: "google/codegemma-7b";
|
|
700
|
+
readonly name: "Codegemma 7b";
|
|
701
|
+
readonly provider: "nvidia";
|
|
702
|
+
readonly family: "";
|
|
703
|
+
readonly pricing: {
|
|
704
|
+
readonly input: 0;
|
|
705
|
+
readonly output: 0;
|
|
706
|
+
};
|
|
707
|
+
readonly contextWindow: 128000;
|
|
708
|
+
readonly maxOutput: 4096;
|
|
709
|
+
readonly modalities: {
|
|
710
|
+
readonly input: readonly ["text"];
|
|
711
|
+
readonly output: readonly ["text"];
|
|
712
|
+
};
|
|
713
|
+
readonly capabilities: {
|
|
714
|
+
readonly reasoning: false;
|
|
715
|
+
readonly toolCall: false;
|
|
716
|
+
readonly attachment: false;
|
|
717
|
+
readonly structuredOutput: false;
|
|
718
|
+
};
|
|
719
|
+
}, {
|
|
720
|
+
readonly id: "google/gemma-2-2b-it";
|
|
721
|
+
readonly name: "Gemma 2 2b It";
|
|
722
|
+
readonly provider: "nvidia";
|
|
723
|
+
readonly family: "";
|
|
724
|
+
readonly pricing: {
|
|
725
|
+
readonly input: 0;
|
|
726
|
+
readonly output: 0;
|
|
727
|
+
};
|
|
728
|
+
readonly contextWindow: 128000;
|
|
729
|
+
readonly maxOutput: 4096;
|
|
730
|
+
readonly modalities: {
|
|
731
|
+
readonly input: readonly ["text"];
|
|
732
|
+
readonly output: readonly ["text"];
|
|
733
|
+
};
|
|
734
|
+
readonly capabilities: {
|
|
735
|
+
readonly reasoning: false;
|
|
736
|
+
readonly toolCall: true;
|
|
737
|
+
readonly attachment: false;
|
|
738
|
+
readonly structuredOutput: true;
|
|
739
|
+
};
|
|
740
|
+
}, {
|
|
741
|
+
readonly id: "google/gemma-3-1b-it";
|
|
742
|
+
readonly name: "Gemma 3 1b It";
|
|
743
|
+
readonly provider: "nvidia";
|
|
744
|
+
readonly family: "";
|
|
745
|
+
readonly pricing: {
|
|
746
|
+
readonly input: 0;
|
|
747
|
+
readonly output: 0;
|
|
748
|
+
};
|
|
749
|
+
readonly contextWindow: 128000;
|
|
750
|
+
readonly maxOutput: 4096;
|
|
751
|
+
readonly modalities: {
|
|
752
|
+
readonly input: readonly ["text", "image"];
|
|
753
|
+
readonly output: readonly ["text"];
|
|
754
|
+
};
|
|
755
|
+
readonly capabilities: {
|
|
756
|
+
readonly reasoning: false;
|
|
757
|
+
readonly toolCall: true;
|
|
758
|
+
readonly attachment: true;
|
|
759
|
+
readonly structuredOutput: true;
|
|
760
|
+
};
|
|
761
|
+
}, {
|
|
762
|
+
readonly id: "google/gemma-2-27b-it";
|
|
763
|
+
readonly name: "Gemma 2 27b It";
|
|
764
|
+
readonly provider: "nvidia";
|
|
765
|
+
readonly family: "";
|
|
766
|
+
readonly pricing: {
|
|
767
|
+
readonly input: 0;
|
|
768
|
+
readonly output: 0;
|
|
769
|
+
};
|
|
770
|
+
readonly contextWindow: 128000;
|
|
771
|
+
readonly maxOutput: 4096;
|
|
772
|
+
readonly modalities: {
|
|
773
|
+
readonly input: readonly ["text"];
|
|
774
|
+
readonly output: readonly ["text"];
|
|
775
|
+
};
|
|
776
|
+
readonly capabilities: {
|
|
777
|
+
readonly reasoning: false;
|
|
778
|
+
readonly toolCall: true;
|
|
779
|
+
readonly attachment: false;
|
|
780
|
+
readonly structuredOutput: true;
|
|
781
|
+
};
|
|
782
|
+
}, {
|
|
783
|
+
readonly id: "google/gemma-3n-e2b-it";
|
|
784
|
+
readonly name: "Gemma 3n E2b It";
|
|
785
|
+
readonly provider: "nvidia";
|
|
786
|
+
readonly family: "";
|
|
787
|
+
readonly pricing: {
|
|
788
|
+
readonly input: 0;
|
|
789
|
+
readonly output: 0;
|
|
790
|
+
};
|
|
791
|
+
readonly contextWindow: 128000;
|
|
792
|
+
readonly maxOutput: 4096;
|
|
793
|
+
readonly modalities: {
|
|
794
|
+
readonly input: readonly ["text", "image"];
|
|
795
|
+
readonly output: readonly ["text"];
|
|
796
|
+
};
|
|
797
|
+
readonly capabilities: {
|
|
798
|
+
readonly reasoning: false;
|
|
799
|
+
readonly toolCall: true;
|
|
800
|
+
readonly attachment: true;
|
|
801
|
+
readonly structuredOutput: true;
|
|
802
|
+
};
|
|
803
|
+
}, {
|
|
804
|
+
readonly id: "google/codegemma-1.1-7b";
|
|
805
|
+
readonly name: "Codegemma 1.1 7b";
|
|
806
|
+
readonly provider: "nvidia";
|
|
807
|
+
readonly family: "";
|
|
808
|
+
readonly pricing: {
|
|
809
|
+
readonly input: 0;
|
|
810
|
+
readonly output: 0;
|
|
811
|
+
};
|
|
812
|
+
readonly contextWindow: 128000;
|
|
813
|
+
readonly maxOutput: 4096;
|
|
814
|
+
readonly modalities: {
|
|
815
|
+
readonly input: readonly ["text"];
|
|
816
|
+
readonly output: readonly ["text"];
|
|
817
|
+
};
|
|
818
|
+
readonly capabilities: {
|
|
819
|
+
readonly reasoning: false;
|
|
820
|
+
readonly toolCall: false;
|
|
821
|
+
readonly attachment: false;
|
|
822
|
+
readonly structuredOutput: false;
|
|
823
|
+
};
|
|
824
|
+
}, {
|
|
825
|
+
readonly id: "google/gemma-3n-e4b-it";
|
|
826
|
+
readonly name: "Gemma 3n E4b It";
|
|
827
|
+
readonly provider: "nvidia";
|
|
828
|
+
readonly family: "";
|
|
829
|
+
readonly pricing: {
|
|
830
|
+
readonly input: 0;
|
|
831
|
+
readonly output: 0;
|
|
832
|
+
};
|
|
833
|
+
readonly contextWindow: 128000;
|
|
834
|
+
readonly maxOutput: 4096;
|
|
835
|
+
readonly modalities: {
|
|
836
|
+
readonly input: readonly ["text", "image"];
|
|
837
|
+
readonly output: readonly ["text"];
|
|
838
|
+
};
|
|
839
|
+
readonly capabilities: {
|
|
840
|
+
readonly reasoning: false;
|
|
841
|
+
readonly toolCall: true;
|
|
842
|
+
readonly attachment: true;
|
|
843
|
+
readonly structuredOutput: true;
|
|
844
|
+
};
|
|
845
|
+
}, {
|
|
846
|
+
readonly id: "google/gemma-3-12b-it";
|
|
847
|
+
readonly name: "Gemma 3 12b It";
|
|
848
|
+
readonly provider: "nvidia";
|
|
849
|
+
readonly family: "";
|
|
850
|
+
readonly pricing: {
|
|
851
|
+
readonly input: 0;
|
|
852
|
+
readonly output: 0;
|
|
853
|
+
};
|
|
854
|
+
readonly contextWindow: 128000;
|
|
855
|
+
readonly maxOutput: 4096;
|
|
856
|
+
readonly modalities: {
|
|
857
|
+
readonly input: readonly ["text"];
|
|
858
|
+
readonly output: readonly ["text"];
|
|
859
|
+
};
|
|
860
|
+
readonly capabilities: {
|
|
861
|
+
readonly reasoning: false;
|
|
862
|
+
readonly toolCall: true;
|
|
863
|
+
readonly attachment: false;
|
|
864
|
+
readonly structuredOutput: true;
|
|
865
|
+
};
|
|
866
|
+
}, {
|
|
867
|
+
readonly id: "google/gemma-3-27b-it";
|
|
868
|
+
readonly name: "Gemma-3-27B-IT";
|
|
869
|
+
readonly provider: "nvidia";
|
|
870
|
+
readonly family: "gemma";
|
|
871
|
+
readonly pricing: {
|
|
872
|
+
readonly input: 0;
|
|
873
|
+
readonly output: 0;
|
|
874
|
+
};
|
|
875
|
+
readonly contextWindow: 131072;
|
|
876
|
+
readonly maxOutput: 8192;
|
|
877
|
+
readonly modalities: {
|
|
878
|
+
readonly input: readonly ["text", "image"];
|
|
879
|
+
readonly output: readonly ["text"];
|
|
880
|
+
};
|
|
881
|
+
readonly capabilities: {
|
|
882
|
+
readonly reasoning: true;
|
|
883
|
+
readonly toolCall: true;
|
|
884
|
+
readonly attachment: true;
|
|
885
|
+
readonly structuredOutput: false;
|
|
886
|
+
};
|
|
887
|
+
}, {
|
|
888
|
+
readonly id: "z-ai/glm4.7";
|
|
889
|
+
readonly name: "GLM-4.7";
|
|
890
|
+
readonly provider: "nvidia";
|
|
891
|
+
readonly family: "glm";
|
|
892
|
+
readonly pricing: {
|
|
893
|
+
readonly input: 0;
|
|
894
|
+
readonly output: 0;
|
|
895
|
+
};
|
|
896
|
+
readonly contextWindow: 204800;
|
|
897
|
+
readonly maxOutput: 131072;
|
|
898
|
+
readonly modalities: {
|
|
899
|
+
readonly input: readonly ["text"];
|
|
900
|
+
readonly output: readonly ["text"];
|
|
901
|
+
};
|
|
902
|
+
readonly capabilities: {
|
|
903
|
+
readonly reasoning: true;
|
|
904
|
+
readonly toolCall: true;
|
|
905
|
+
readonly attachment: false;
|
|
906
|
+
readonly structuredOutput: false;
|
|
907
|
+
};
|
|
908
|
+
}, {
|
|
909
|
+
readonly id: "z-ai/glm5";
|
|
910
|
+
readonly name: "GLM5";
|
|
911
|
+
readonly provider: "nvidia";
|
|
912
|
+
readonly family: "glm";
|
|
913
|
+
readonly pricing: {
|
|
914
|
+
readonly input: 0;
|
|
915
|
+
readonly output: 0;
|
|
916
|
+
};
|
|
917
|
+
readonly contextWindow: 202752;
|
|
918
|
+
readonly maxOutput: 131000;
|
|
919
|
+
readonly modalities: {
|
|
920
|
+
readonly input: readonly ["text"];
|
|
921
|
+
readonly output: readonly ["text"];
|
|
922
|
+
};
|
|
923
|
+
readonly capabilities: {
|
|
924
|
+
readonly reasoning: true;
|
|
925
|
+
readonly toolCall: true;
|
|
926
|
+
readonly attachment: false;
|
|
927
|
+
readonly structuredOutput: true;
|
|
928
|
+
};
|
|
929
|
+
}, {
|
|
930
|
+
readonly id: "stepfun-ai/step-3.5-flash";
|
|
931
|
+
readonly name: "Step 3.5 Flash";
|
|
932
|
+
readonly provider: "nvidia";
|
|
933
|
+
readonly family: "";
|
|
934
|
+
readonly pricing: {
|
|
935
|
+
readonly input: 0;
|
|
936
|
+
readonly output: 0;
|
|
937
|
+
};
|
|
938
|
+
readonly contextWindow: 256000;
|
|
939
|
+
readonly maxOutput: 16384;
|
|
940
|
+
readonly modalities: {
|
|
941
|
+
readonly input: readonly ["text"];
|
|
942
|
+
readonly output: readonly ["text"];
|
|
943
|
+
};
|
|
944
|
+
readonly capabilities: {
|
|
945
|
+
readonly reasoning: true;
|
|
946
|
+
readonly toolCall: true;
|
|
947
|
+
readonly attachment: false;
|
|
948
|
+
readonly structuredOutput: false;
|
|
949
|
+
};
|
|
950
|
+
}, {
|
|
951
|
+
readonly id: "qwen/qwen3-next-80b-a3b-thinking";
|
|
952
|
+
readonly name: "Qwen3-Next-80B-A3B-Thinking";
|
|
953
|
+
readonly provider: "nvidia";
|
|
954
|
+
readonly family: "qwen";
|
|
955
|
+
readonly pricing: {
|
|
956
|
+
readonly input: 0;
|
|
957
|
+
readonly output: 0;
|
|
958
|
+
};
|
|
959
|
+
readonly contextWindow: 262144;
|
|
960
|
+
readonly maxOutput: 16384;
|
|
961
|
+
readonly modalities: {
|
|
962
|
+
readonly input: readonly ["text"];
|
|
963
|
+
readonly output: readonly ["text"];
|
|
964
|
+
};
|
|
965
|
+
readonly capabilities: {
|
|
966
|
+
readonly reasoning: true;
|
|
967
|
+
readonly toolCall: true;
|
|
968
|
+
readonly attachment: false;
|
|
969
|
+
readonly structuredOutput: false;
|
|
970
|
+
};
|
|
971
|
+
}, {
|
|
972
|
+
readonly id: "qwen/qwen3-coder-480b-a35b-instruct";
|
|
973
|
+
readonly name: "Qwen3 Coder 480B A35B Instruct";
|
|
974
|
+
readonly provider: "nvidia";
|
|
975
|
+
readonly family: "qwen";
|
|
976
|
+
readonly pricing: {
|
|
977
|
+
readonly input: 0;
|
|
978
|
+
readonly output: 0;
|
|
979
|
+
};
|
|
980
|
+
readonly contextWindow: 262144;
|
|
981
|
+
readonly maxOutput: 66536;
|
|
982
|
+
readonly modalities: {
|
|
983
|
+
readonly input: readonly ["text"];
|
|
984
|
+
readonly output: readonly ["text"];
|
|
985
|
+
};
|
|
986
|
+
readonly capabilities: {
|
|
987
|
+
readonly reasoning: false;
|
|
988
|
+
readonly toolCall: true;
|
|
989
|
+
readonly attachment: false;
|
|
990
|
+
readonly structuredOutput: false;
|
|
991
|
+
};
|
|
992
|
+
}, {
|
|
993
|
+
readonly id: "qwen/qwq-32b";
|
|
994
|
+
readonly name: "Qwq 32b";
|
|
995
|
+
readonly provider: "nvidia";
|
|
996
|
+
readonly family: "";
|
|
997
|
+
readonly pricing: {
|
|
998
|
+
readonly input: 0;
|
|
999
|
+
readonly output: 0;
|
|
1000
|
+
};
|
|
1001
|
+
readonly contextWindow: 128000;
|
|
1002
|
+
readonly maxOutput: 4096;
|
|
1003
|
+
readonly modalities: {
|
|
1004
|
+
readonly input: readonly ["text"];
|
|
1005
|
+
readonly output: readonly ["text"];
|
|
1006
|
+
};
|
|
1007
|
+
readonly capabilities: {
|
|
1008
|
+
readonly reasoning: true;
|
|
1009
|
+
readonly toolCall: false;
|
|
1010
|
+
readonly attachment: false;
|
|
1011
|
+
readonly structuredOutput: false;
|
|
1012
|
+
};
|
|
1013
|
+
}, {
|
|
1014
|
+
readonly id: "qwen/qwen2.5-coder-7b-instruct";
|
|
1015
|
+
readonly name: "Qwen2.5 Coder 7b Instruct";
|
|
1016
|
+
readonly provider: "nvidia";
|
|
1017
|
+
readonly family: "";
|
|
1018
|
+
readonly pricing: {
|
|
1019
|
+
readonly input: 0;
|
|
1020
|
+
readonly output: 0;
|
|
1021
|
+
};
|
|
1022
|
+
readonly contextWindow: 128000;
|
|
1023
|
+
readonly maxOutput: 4096;
|
|
1024
|
+
readonly modalities: {
|
|
1025
|
+
readonly input: readonly ["text"];
|
|
1026
|
+
readonly output: readonly ["text"];
|
|
1027
|
+
};
|
|
1028
|
+
readonly capabilities: {
|
|
1029
|
+
readonly reasoning: false;
|
|
1030
|
+
readonly toolCall: true;
|
|
1031
|
+
readonly attachment: false;
|
|
1032
|
+
readonly structuredOutput: true;
|
|
1033
|
+
};
|
|
1034
|
+
}, {
|
|
1035
|
+
readonly id: "qwen/qwen3.5-397b-a17b";
|
|
1036
|
+
readonly name: "Qwen3.5-397B-A17B";
|
|
1037
|
+
readonly provider: "nvidia";
|
|
1038
|
+
readonly family: "qwen";
|
|
1039
|
+
readonly pricing: {
|
|
1040
|
+
readonly input: 0;
|
|
1041
|
+
readonly output: 0;
|
|
1042
|
+
};
|
|
1043
|
+
readonly contextWindow: 262144;
|
|
1044
|
+
readonly maxOutput: 8192;
|
|
1045
|
+
readonly modalities: {
|
|
1046
|
+
readonly input: readonly ["text", "image"];
|
|
1047
|
+
readonly output: readonly ["text"];
|
|
1048
|
+
};
|
|
1049
|
+
readonly capabilities: {
|
|
1050
|
+
readonly reasoning: true;
|
|
1051
|
+
readonly toolCall: true;
|
|
1052
|
+
readonly attachment: true;
|
|
1053
|
+
readonly structuredOutput: true;
|
|
1054
|
+
};
|
|
1055
|
+
}, {
|
|
1056
|
+
readonly id: "qwen/qwen2.5-coder-32b-instruct";
|
|
1057
|
+
readonly name: "Qwen2.5 Coder 32b Instruct";
|
|
1058
|
+
readonly provider: "nvidia";
|
|
1059
|
+
readonly family: "";
|
|
1060
|
+
readonly pricing: {
|
|
1061
|
+
readonly input: 0;
|
|
1062
|
+
readonly output: 0;
|
|
1063
|
+
};
|
|
1064
|
+
readonly contextWindow: 128000;
|
|
1065
|
+
readonly maxOutput: 4096;
|
|
1066
|
+
readonly modalities: {
|
|
1067
|
+
readonly input: readonly ["text"];
|
|
1068
|
+
readonly output: readonly ["text"];
|
|
1069
|
+
};
|
|
1070
|
+
readonly capabilities: {
|
|
1071
|
+
readonly reasoning: false;
|
|
1072
|
+
readonly toolCall: true;
|
|
1073
|
+
readonly attachment: false;
|
|
1074
|
+
readonly structuredOutput: true;
|
|
1075
|
+
};
|
|
1076
|
+
}, {
|
|
1077
|
+
readonly id: "qwen/qwen3-235b-a22b";
|
|
1078
|
+
readonly name: "Qwen3-235B-A22B";
|
|
1079
|
+
readonly provider: "nvidia";
|
|
1080
|
+
readonly family: "qwen";
|
|
1081
|
+
readonly pricing: {
|
|
1082
|
+
readonly input: 0;
|
|
1083
|
+
readonly output: 0;
|
|
1084
|
+
};
|
|
1085
|
+
readonly contextWindow: 131072;
|
|
1086
|
+
readonly maxOutput: 8192;
|
|
1087
|
+
readonly modalities: {
|
|
1088
|
+
readonly input: readonly ["text"];
|
|
1089
|
+
readonly output: readonly ["text"];
|
|
1090
|
+
};
|
|
1091
|
+
readonly capabilities: {
|
|
1092
|
+
readonly reasoning: true;
|
|
1093
|
+
readonly toolCall: true;
|
|
1094
|
+
readonly attachment: false;
|
|
1095
|
+
readonly structuredOutput: false;
|
|
1096
|
+
};
|
|
1097
|
+
}, {
|
|
1098
|
+
readonly id: "qwen/qwen3-next-80b-a3b-instruct";
|
|
1099
|
+
readonly name: "Qwen3-Next-80B-A3B-Instruct";
|
|
1100
|
+
readonly provider: "nvidia";
|
|
1101
|
+
readonly family: "qwen";
|
|
1102
|
+
readonly pricing: {
|
|
1103
|
+
readonly input: 0;
|
|
1104
|
+
readonly output: 0;
|
|
1105
|
+
};
|
|
1106
|
+
readonly contextWindow: 262144;
|
|
1107
|
+
readonly maxOutput: 16384;
|
|
1108
|
+
readonly modalities: {
|
|
1109
|
+
readonly input: readonly ["text"];
|
|
1110
|
+
readonly output: readonly ["text"];
|
|
1111
|
+
};
|
|
1112
|
+
readonly capabilities: {
|
|
1113
|
+
readonly reasoning: false;
|
|
1114
|
+
readonly toolCall: true;
|
|
1115
|
+
readonly attachment: false;
|
|
1116
|
+
readonly structuredOutput: false;
|
|
1117
|
+
};
|
|
1118
|
+
}, {
|
|
1119
|
+
readonly id: "meta/llama-3.1-70b-instruct";
|
|
1120
|
+
readonly name: "Llama 3.1 70b Instruct";
|
|
1121
|
+
readonly provider: "nvidia";
|
|
1122
|
+
readonly family: "";
|
|
1123
|
+
readonly pricing: {
|
|
1124
|
+
readonly input: 0;
|
|
1125
|
+
readonly output: 0;
|
|
1126
|
+
};
|
|
1127
|
+
readonly contextWindow: 128000;
|
|
1128
|
+
readonly maxOutput: 4096;
|
|
1129
|
+
readonly modalities: {
|
|
1130
|
+
readonly input: readonly ["text"];
|
|
1131
|
+
readonly output: readonly ["text"];
|
|
1132
|
+
};
|
|
1133
|
+
readonly capabilities: {
|
|
1134
|
+
readonly reasoning: false;
|
|
1135
|
+
readonly toolCall: true;
|
|
1136
|
+
readonly attachment: false;
|
|
1137
|
+
readonly structuredOutput: true;
|
|
1138
|
+
};
|
|
1139
|
+
}, {
|
|
1140
|
+
readonly id: "meta/llama-3.3-70b-instruct";
|
|
1141
|
+
readonly name: "Llama 3.3 70b Instruct";
|
|
1142
|
+
readonly provider: "nvidia";
|
|
1143
|
+
readonly family: "";
|
|
1144
|
+
readonly pricing: {
|
|
1145
|
+
readonly input: 0;
|
|
1146
|
+
readonly output: 0;
|
|
1147
|
+
};
|
|
1148
|
+
readonly contextWindow: 128000;
|
|
1149
|
+
readonly maxOutput: 4096;
|
|
1150
|
+
readonly modalities: {
|
|
1151
|
+
readonly input: readonly ["text"];
|
|
1152
|
+
readonly output: readonly ["text"];
|
|
1153
|
+
};
|
|
1154
|
+
readonly capabilities: {
|
|
1155
|
+
readonly reasoning: false;
|
|
1156
|
+
readonly toolCall: true;
|
|
1157
|
+
readonly attachment: false;
|
|
1158
|
+
readonly structuredOutput: true;
|
|
1159
|
+
};
|
|
1160
|
+
}, {
|
|
1161
|
+
readonly id: "meta/llama-4-scout-17b-16e-instruct";
|
|
1162
|
+
readonly name: "Llama 4 Scout 17b 16e Instruct";
|
|
1163
|
+
readonly provider: "nvidia";
|
|
1164
|
+
readonly family: "";
|
|
1165
|
+
readonly pricing: {
|
|
1166
|
+
readonly input: 0;
|
|
1167
|
+
readonly output: 0;
|
|
1168
|
+
};
|
|
1169
|
+
readonly contextWindow: 128000;
|
|
1170
|
+
readonly maxOutput: 4096;
|
|
1171
|
+
readonly modalities: {
|
|
1172
|
+
readonly input: readonly ["text", "image"];
|
|
1173
|
+
readonly output: readonly ["text"];
|
|
1174
|
+
};
|
|
1175
|
+
readonly capabilities: {
|
|
1176
|
+
readonly reasoning: false;
|
|
1177
|
+
readonly toolCall: true;
|
|
1178
|
+
readonly attachment: true;
|
|
1179
|
+
readonly structuredOutput: true;
|
|
1180
|
+
};
|
|
1181
|
+
}, {
|
|
1182
|
+
readonly id: "meta/llama-3.2-11b-vision-instruct";
|
|
1183
|
+
readonly name: "Llama 3.2 11b Vision Instruct";
|
|
1184
|
+
readonly provider: "nvidia";
|
|
1185
|
+
readonly family: "";
|
|
1186
|
+
readonly pricing: {
|
|
1187
|
+
readonly input: 0;
|
|
1188
|
+
readonly output: 0;
|
|
1189
|
+
};
|
|
1190
|
+
readonly contextWindow: 128000;
|
|
1191
|
+
readonly maxOutput: 4096;
|
|
1192
|
+
readonly modalities: {
|
|
1193
|
+
readonly input: readonly ["text", "image"];
|
|
1194
|
+
readonly output: readonly ["text"];
|
|
1195
|
+
};
|
|
1196
|
+
readonly capabilities: {
|
|
1197
|
+
readonly reasoning: false;
|
|
1198
|
+
readonly toolCall: true;
|
|
1199
|
+
readonly attachment: true;
|
|
1200
|
+
readonly structuredOutput: true;
|
|
1201
|
+
};
|
|
1202
|
+
}, {
|
|
1203
|
+
readonly id: "meta/llama3-8b-instruct";
|
|
1204
|
+
readonly name: "Llama3 8b Instruct";
|
|
1205
|
+
readonly provider: "nvidia";
|
|
1206
|
+
readonly family: "";
|
|
1207
|
+
readonly pricing: {
|
|
1208
|
+
readonly input: 0;
|
|
1209
|
+
readonly output: 0;
|
|
1210
|
+
};
|
|
1211
|
+
readonly contextWindow: 128000;
|
|
1212
|
+
readonly maxOutput: 4096;
|
|
1213
|
+
readonly modalities: {
|
|
1214
|
+
readonly input: readonly ["text"];
|
|
1215
|
+
readonly output: readonly ["text"];
|
|
1216
|
+
};
|
|
1217
|
+
readonly capabilities: {
|
|
1218
|
+
readonly reasoning: false;
|
|
1219
|
+
readonly toolCall: true;
|
|
1220
|
+
readonly attachment: false;
|
|
1221
|
+
readonly structuredOutput: true;
|
|
1222
|
+
};
|
|
1223
|
+
}, {
|
|
1224
|
+
readonly id: "meta/codellama-70b";
|
|
1225
|
+
readonly name: "Codellama 70b";
|
|
1226
|
+
readonly provider: "nvidia";
|
|
1227
|
+
readonly family: "";
|
|
1228
|
+
readonly pricing: {
|
|
1229
|
+
readonly input: 0;
|
|
1230
|
+
readonly output: 0;
|
|
1231
|
+
};
|
|
1232
|
+
readonly contextWindow: 128000;
|
|
1233
|
+
readonly maxOutput: 4096;
|
|
1234
|
+
readonly modalities: {
|
|
1235
|
+
readonly input: readonly ["text"];
|
|
1236
|
+
readonly output: readonly ["text"];
|
|
1237
|
+
};
|
|
1238
|
+
readonly capabilities: {
|
|
1239
|
+
readonly reasoning: false;
|
|
1240
|
+
readonly toolCall: false;
|
|
1241
|
+
readonly attachment: false;
|
|
1242
|
+
readonly structuredOutput: false;
|
|
1243
|
+
};
|
|
1244
|
+
}, {
|
|
1245
|
+
readonly id: "meta/llama-3.2-1b-instruct";
|
|
1246
|
+
readonly name: "Llama 3.2 1b Instruct";
|
|
1247
|
+
readonly provider: "nvidia";
|
|
1248
|
+
readonly family: "";
|
|
1249
|
+
readonly pricing: {
|
|
1250
|
+
readonly input: 0;
|
|
1251
|
+
readonly output: 0;
|
|
1252
|
+
};
|
|
1253
|
+
readonly contextWindow: 128000;
|
|
1254
|
+
readonly maxOutput: 4096;
|
|
1255
|
+
readonly modalities: {
|
|
1256
|
+
readonly input: readonly ["text"];
|
|
1257
|
+
readonly output: readonly ["text"];
|
|
1258
|
+
};
|
|
1259
|
+
readonly capabilities: {
|
|
1260
|
+
readonly reasoning: false;
|
|
1261
|
+
readonly toolCall: true;
|
|
1262
|
+
readonly attachment: false;
|
|
1263
|
+
readonly structuredOutput: true;
|
|
1264
|
+
};
|
|
1265
|
+
}, {
|
|
1266
|
+
readonly id: "meta/llama-3.1-405b-instruct";
|
|
1267
|
+
readonly name: "Llama 3.1 405b Instruct";
|
|
1268
|
+
readonly provider: "nvidia";
|
|
1269
|
+
readonly family: "";
|
|
1270
|
+
readonly pricing: {
|
|
1271
|
+
readonly input: 0;
|
|
1272
|
+
readonly output: 0;
|
|
1273
|
+
};
|
|
1274
|
+
readonly contextWindow: 128000;
|
|
1275
|
+
readonly maxOutput: 4096;
|
|
1276
|
+
readonly modalities: {
|
|
1277
|
+
readonly input: readonly ["text"];
|
|
1278
|
+
readonly output: readonly ["text"];
|
|
1279
|
+
};
|
|
1280
|
+
readonly capabilities: {
|
|
1281
|
+
readonly reasoning: false;
|
|
1282
|
+
readonly toolCall: true;
|
|
1283
|
+
readonly attachment: false;
|
|
1284
|
+
readonly structuredOutput: true;
|
|
1285
|
+
};
|
|
1286
|
+
}, {
|
|
1287
|
+
readonly id: "meta/llama3-70b-instruct";
|
|
1288
|
+
readonly name: "Llama3 70b Instruct";
|
|
1289
|
+
readonly provider: "nvidia";
|
|
1290
|
+
readonly family: "";
|
|
1291
|
+
readonly pricing: {
|
|
1292
|
+
readonly input: 0;
|
|
1293
|
+
readonly output: 0;
|
|
1294
|
+
};
|
|
1295
|
+
readonly contextWindow: 128000;
|
|
1296
|
+
readonly maxOutput: 4096;
|
|
1297
|
+
readonly modalities: {
|
|
1298
|
+
readonly input: readonly ["text"];
|
|
1299
|
+
readonly output: readonly ["text"];
|
|
1300
|
+
};
|
|
1301
|
+
readonly capabilities: {
|
|
1302
|
+
readonly reasoning: false;
|
|
1303
|
+
readonly toolCall: true;
|
|
1304
|
+
readonly attachment: false;
|
|
1305
|
+
readonly structuredOutput: true;
|
|
1306
|
+
};
|
|
1307
|
+
}, {
|
|
1308
|
+
readonly id: "meta/llama-4-maverick-17b-128e-instruct";
|
|
1309
|
+
readonly name: "Llama 4 Maverick 17b 128e Instruct";
|
|
1310
|
+
readonly provider: "nvidia";
|
|
1311
|
+
readonly family: "";
|
|
1312
|
+
readonly pricing: {
|
|
1313
|
+
readonly input: 0;
|
|
1314
|
+
readonly output: 0;
|
|
1315
|
+
};
|
|
1316
|
+
readonly contextWindow: 128000;
|
|
1317
|
+
readonly maxOutput: 4096;
|
|
1318
|
+
readonly modalities: {
|
|
1319
|
+
readonly input: readonly ["text", "image"];
|
|
1320
|
+
readonly output: readonly ["text"];
|
|
1321
|
+
};
|
|
1322
|
+
readonly capabilities: {
|
|
1323
|
+
readonly reasoning: false;
|
|
1324
|
+
readonly toolCall: true;
|
|
1325
|
+
readonly attachment: true;
|
|
1326
|
+
readonly structuredOutput: true;
|
|
1327
|
+
};
|
|
1328
|
+
}, {
|
|
1329
|
+
readonly id: "mistralai/mistral-large-3-675b-instruct-2512";
|
|
1330
|
+
readonly name: "Mistral Large 3 675B Instruct 2512";
|
|
1331
|
+
readonly provider: "nvidia";
|
|
1332
|
+
readonly family: "mistral-large";
|
|
1333
|
+
readonly pricing: {
|
|
1334
|
+
readonly input: 0;
|
|
1335
|
+
readonly output: 0;
|
|
1336
|
+
};
|
|
1337
|
+
readonly contextWindow: 262144;
|
|
1338
|
+
readonly maxOutput: 262144;
|
|
1339
|
+
readonly modalities: {
|
|
1340
|
+
readonly input: readonly ["text", "image"];
|
|
1341
|
+
readonly output: readonly ["text"];
|
|
1342
|
+
};
|
|
1343
|
+
readonly capabilities: {
|
|
1344
|
+
readonly reasoning: false;
|
|
1345
|
+
readonly toolCall: true;
|
|
1346
|
+
readonly attachment: true;
|
|
1347
|
+
readonly structuredOutput: true;
|
|
1348
|
+
};
|
|
1349
|
+
}, {
|
|
1350
|
+
readonly id: "mistralai/mamba-codestral-7b-v0.1";
|
|
1351
|
+
readonly name: "Mamba Codestral 7b V0.1";
|
|
1352
|
+
readonly provider: "nvidia";
|
|
1353
|
+
readonly family: "";
|
|
1354
|
+
readonly pricing: {
|
|
1355
|
+
readonly input: 0;
|
|
1356
|
+
readonly output: 0;
|
|
1357
|
+
};
|
|
1358
|
+
readonly contextWindow: 128000;
|
|
1359
|
+
readonly maxOutput: 4096;
|
|
1360
|
+
readonly modalities: {
|
|
1361
|
+
readonly input: readonly ["text"];
|
|
1362
|
+
readonly output: readonly ["text"];
|
|
1363
|
+
};
|
|
1364
|
+
readonly capabilities: {
|
|
1365
|
+
readonly reasoning: false;
|
|
1366
|
+
readonly toolCall: false;
|
|
1367
|
+
readonly attachment: false;
|
|
1368
|
+
readonly structuredOutput: false;
|
|
1369
|
+
};
|
|
1370
|
+
}, {
|
|
1371
|
+
readonly id: "mistralai/codestral-22b-instruct-v0.1";
|
|
1372
|
+
readonly name: "Codestral 22b Instruct V0.1";
|
|
1373
|
+
readonly provider: "nvidia";
|
|
1374
|
+
readonly family: "";
|
|
1375
|
+
readonly pricing: {
|
|
1376
|
+
readonly input: 0;
|
|
1377
|
+
readonly output: 0;
|
|
1378
|
+
};
|
|
1379
|
+
readonly contextWindow: 128000;
|
|
1380
|
+
readonly maxOutput: 4096;
|
|
1381
|
+
readonly modalities: {
|
|
1382
|
+
readonly input: readonly ["text"];
|
|
1383
|
+
readonly output: readonly ["text"];
|
|
1384
|
+
};
|
|
1385
|
+
readonly capabilities: {
|
|
1386
|
+
readonly reasoning: false;
|
|
1387
|
+
readonly toolCall: true;
|
|
1388
|
+
readonly attachment: false;
|
|
1389
|
+
readonly structuredOutput: true;
|
|
1390
|
+
};
|
|
1391
|
+
}, {
|
|
1392
|
+
readonly id: "mistralai/mistral-large-2-instruct";
|
|
1393
|
+
readonly name: "Mistral Large 2 Instruct";
|
|
1394
|
+
readonly provider: "nvidia";
|
|
1395
|
+
readonly family: "";
|
|
1396
|
+
readonly pricing: {
|
|
1397
|
+
readonly input: 0;
|
|
1398
|
+
readonly output: 0;
|
|
1399
|
+
};
|
|
1400
|
+
readonly contextWindow: 128000;
|
|
1401
|
+
readonly maxOutput: 4096;
|
|
1402
|
+
readonly modalities: {
|
|
1403
|
+
readonly input: readonly ["text"];
|
|
1404
|
+
readonly output: readonly ["text"];
|
|
1405
|
+
};
|
|
1406
|
+
readonly capabilities: {
|
|
1407
|
+
readonly reasoning: false;
|
|
1408
|
+
readonly toolCall: true;
|
|
1409
|
+
readonly attachment: false;
|
|
1410
|
+
readonly structuredOutput: true;
|
|
1411
|
+
};
|
|
1412
|
+
}, {
|
|
1413
|
+
readonly id: "mistralai/ministral-14b-instruct-2512";
|
|
1414
|
+
readonly name: "Ministral 3 14B Instruct 2512";
|
|
1415
|
+
readonly provider: "nvidia";
|
|
1416
|
+
readonly family: "ministral";
|
|
1417
|
+
readonly pricing: {
|
|
1418
|
+
readonly input: 0;
|
|
1419
|
+
readonly output: 0;
|
|
1420
|
+
};
|
|
1421
|
+
readonly contextWindow: 262144;
|
|
1422
|
+
readonly maxOutput: 262144;
|
|
1423
|
+
readonly modalities: {
|
|
1424
|
+
readonly input: readonly ["text", "image"];
|
|
1425
|
+
readonly output: readonly ["text"];
|
|
1426
|
+
};
|
|
1427
|
+
readonly capabilities: {
|
|
1428
|
+
readonly reasoning: false;
|
|
1429
|
+
readonly toolCall: true;
|
|
1430
|
+
readonly attachment: true;
|
|
1431
|
+
readonly structuredOutput: true;
|
|
1432
|
+
};
|
|
1433
|
+
}, {
|
|
1434
|
+
readonly id: "mistralai/mistral-small-3.1-24b-instruct-2503";
|
|
1435
|
+
readonly name: "Mistral Small 3.1 24b Instruct 2503";
|
|
1436
|
+
readonly provider: "nvidia";
|
|
1437
|
+
readonly family: "";
|
|
1438
|
+
readonly pricing: {
|
|
1439
|
+
readonly input: 0;
|
|
1440
|
+
readonly output: 0;
|
|
1441
|
+
};
|
|
1442
|
+
readonly contextWindow: 128000;
|
|
1443
|
+
readonly maxOutput: 4096;
|
|
1444
|
+
readonly modalities: {
|
|
1445
|
+
readonly input: readonly ["text"];
|
|
1446
|
+
readonly output: readonly ["text"];
|
|
1447
|
+
};
|
|
1448
|
+
readonly capabilities: {
|
|
1449
|
+
readonly reasoning: false;
|
|
1450
|
+
readonly toolCall: true;
|
|
1451
|
+
readonly attachment: false;
|
|
1452
|
+
readonly structuredOutput: true;
|
|
1453
|
+
};
|
|
1454
|
+
}, {
|
|
1455
|
+
readonly id: "mistralai/devstral-2-123b-instruct-2512";
|
|
1456
|
+
readonly name: "Devstral-2-123B-Instruct-2512";
|
|
1457
|
+
readonly provider: "nvidia";
|
|
1458
|
+
readonly family: "devstral";
|
|
1459
|
+
readonly pricing: {
|
|
1460
|
+
readonly input: 0;
|
|
1461
|
+
readonly output: 0;
|
|
1462
|
+
};
|
|
1463
|
+
readonly contextWindow: 262144;
|
|
1464
|
+
readonly maxOutput: 262144;
|
|
1465
|
+
readonly modalities: {
|
|
1466
|
+
readonly input: readonly ["text"];
|
|
1467
|
+
readonly output: readonly ["text"];
|
|
1468
|
+
};
|
|
1469
|
+
readonly capabilities: {
|
|
1470
|
+
readonly reasoning: true;
|
|
1471
|
+
readonly toolCall: true;
|
|
1472
|
+
readonly attachment: true;
|
|
1473
|
+
readonly structuredOutput: true;
|
|
1474
|
+
};
|
|
1475
|
+
}, {
|
|
1476
|
+
readonly id: "openai/gpt-oss-120b";
|
|
1477
|
+
readonly name: "GPT-OSS-120B";
|
|
1478
|
+
readonly provider: "nvidia";
|
|
1479
|
+
readonly family: "gpt-oss";
|
|
1480
|
+
readonly pricing: {
|
|
1481
|
+
readonly input: 0;
|
|
1482
|
+
readonly output: 0;
|
|
1483
|
+
};
|
|
1484
|
+
readonly contextWindow: 128000;
|
|
1485
|
+
readonly maxOutput: 8192;
|
|
1486
|
+
readonly modalities: {
|
|
1487
|
+
readonly input: readonly ["text"];
|
|
1488
|
+
readonly output: readonly ["text"];
|
|
1489
|
+
};
|
|
1490
|
+
readonly capabilities: {
|
|
1491
|
+
readonly reasoning: true;
|
|
1492
|
+
readonly toolCall: false;
|
|
1493
|
+
readonly attachment: true;
|
|
1494
|
+
readonly structuredOutput: false;
|
|
1495
|
+
};
|
|
1496
|
+
}, {
|
|
1497
|
+
readonly id: "openai/whisper-large-v3";
|
|
1498
|
+
readonly name: "Whisper Large v3";
|
|
1499
|
+
readonly provider: "nvidia";
|
|
1500
|
+
readonly family: "whisper";
|
|
1501
|
+
readonly pricing: {
|
|
1502
|
+
readonly input: 0;
|
|
1503
|
+
readonly output: 0;
|
|
1504
|
+
};
|
|
1505
|
+
readonly contextWindow: 0;
|
|
1506
|
+
readonly maxOutput: 4096;
|
|
1507
|
+
readonly modalities: {
|
|
1508
|
+
readonly input: readonly ["audio"];
|
|
1509
|
+
readonly output: readonly ["text"];
|
|
1510
|
+
};
|
|
1511
|
+
readonly capabilities: {
|
|
1512
|
+
readonly reasoning: false;
|
|
1513
|
+
readonly toolCall: false;
|
|
1514
|
+
readonly attachment: false;
|
|
1515
|
+
readonly structuredOutput: false;
|
|
1516
|
+
};
|
|
1517
|
+
}, {
|
|
1518
|
+
readonly id: "black-forest-labs/flux.1-dev";
|
|
1519
|
+
readonly name: "FLUX.1-dev";
|
|
1520
|
+
readonly provider: "nvidia";
|
|
1521
|
+
readonly family: "flux";
|
|
1522
|
+
readonly pricing: {
|
|
1523
|
+
readonly input: 0;
|
|
1524
|
+
readonly output: 0;
|
|
1525
|
+
};
|
|
1526
|
+
readonly contextWindow: 4096;
|
|
1527
|
+
readonly maxOutput: 0;
|
|
1528
|
+
readonly modalities: {
|
|
1529
|
+
readonly input: readonly ["text"];
|
|
1530
|
+
readonly output: readonly ["image"];
|
|
1531
|
+
};
|
|
1532
|
+
readonly capabilities: {
|
|
1533
|
+
readonly reasoning: false;
|
|
1534
|
+
readonly toolCall: false;
|
|
1535
|
+
readonly attachment: false;
|
|
1536
|
+
readonly structuredOutput: false;
|
|
1537
|
+
};
|
|
1538
|
+
}];
|
|
1539
|
+
//#endregion
|
|
1540
|
+
//#region src/providers/nvidia.d.ts
|
|
1541
|
+
/**
|
|
1542
|
+
* Known model identifiers for NVIDIA NIM.
|
|
1543
|
+
*
|
|
1544
|
+
* @example
|
|
1545
|
+
* ```typescript
|
|
1546
|
+
* import type { NvidiaModelId } from '@funkai/models/nvidia'
|
|
1547
|
+
*
|
|
1548
|
+
* const id: NvidiaModelId = 'nvidia/llama-3.1-nemotron-70b-instruct'
|
|
1549
|
+
* ```
|
|
1550
|
+
*/
|
|
1551
|
+
type NvidiaModelId = (typeof NVIDIA_MODELS)[number]["id"];
|
|
1552
|
+
/**
|
|
1553
|
+
* All NVIDIA NIM models in the catalog.
|
|
1554
|
+
*
|
|
1555
|
+
* @example
|
|
1556
|
+
* ```typescript
|
|
1557
|
+
* import { nvidiaModels } from '@funkai/models/nvidia'
|
|
1558
|
+
*
|
|
1559
|
+
* for (const m of nvidiaModels) {
|
|
1560
|
+
* console.log(m.id, m.pricing.input)
|
|
1561
|
+
* }
|
|
1562
|
+
* ```
|
|
1563
|
+
*/
|
|
1564
|
+
declare const nvidiaModels: readonly [{
|
|
1565
|
+
readonly id: "nvidia/llama-3.1-nemotron-70b-instruct";
|
|
1566
|
+
readonly name: "Llama 3.1 Nemotron 70b Instruct";
|
|
1567
|
+
readonly provider: "nvidia";
|
|
1568
|
+
readonly family: "";
|
|
1569
|
+
readonly pricing: {
|
|
1570
|
+
readonly input: 0;
|
|
1571
|
+
readonly output: 0;
|
|
1572
|
+
};
|
|
1573
|
+
readonly contextWindow: 128000;
|
|
1574
|
+
readonly maxOutput: 4096;
|
|
1575
|
+
readonly modalities: {
|
|
1576
|
+
readonly input: readonly ["text"];
|
|
1577
|
+
readonly output: readonly ["text"];
|
|
1578
|
+
};
|
|
1579
|
+
readonly capabilities: {
|
|
1580
|
+
readonly reasoning: false;
|
|
1581
|
+
readonly toolCall: true;
|
|
1582
|
+
readonly attachment: false;
|
|
1583
|
+
readonly structuredOutput: true;
|
|
1584
|
+
};
|
|
1585
|
+
}, {
|
|
1586
|
+
readonly id: "nvidia/llama-3.1-nemotron-ultra-253b-v1";
|
|
1587
|
+
readonly name: "Llama-3.1-Nemotron-Ultra-253B-v1";
|
|
1588
|
+
readonly provider: "nvidia";
|
|
1589
|
+
readonly family: "llama";
|
|
1590
|
+
readonly pricing: {
|
|
1591
|
+
readonly input: 0;
|
|
1592
|
+
readonly output: 0;
|
|
1593
|
+
};
|
|
1594
|
+
readonly contextWindow: 131072;
|
|
1595
|
+
readonly maxOutput: 8192;
|
|
1596
|
+
readonly modalities: {
|
|
1597
|
+
readonly input: readonly ["text"];
|
|
1598
|
+
readonly output: readonly ["text"];
|
|
1599
|
+
};
|
|
1600
|
+
readonly capabilities: {
|
|
1601
|
+
readonly reasoning: true;
|
|
1602
|
+
readonly toolCall: true;
|
|
1603
|
+
readonly attachment: false;
|
|
1604
|
+
readonly structuredOutput: false;
|
|
1605
|
+
};
|
|
1606
|
+
}, {
|
|
1607
|
+
readonly id: "nvidia/llama-3.1-nemotron-51b-instruct";
|
|
1608
|
+
readonly name: "Llama 3.1 Nemotron 51b Instruct";
|
|
1609
|
+
readonly provider: "nvidia";
|
|
1610
|
+
readonly family: "";
|
|
1611
|
+
readonly pricing: {
|
|
1612
|
+
readonly input: 0;
|
|
1613
|
+
readonly output: 0;
|
|
1614
|
+
};
|
|
1615
|
+
readonly contextWindow: 128000;
|
|
1616
|
+
readonly maxOutput: 4096;
|
|
1617
|
+
readonly modalities: {
|
|
1618
|
+
readonly input: readonly ["text"];
|
|
1619
|
+
readonly output: readonly ["text"];
|
|
1620
|
+
};
|
|
1621
|
+
readonly capabilities: {
|
|
1622
|
+
readonly reasoning: false;
|
|
1623
|
+
readonly toolCall: true;
|
|
1624
|
+
readonly attachment: false;
|
|
1625
|
+
readonly structuredOutput: true;
|
|
1626
|
+
};
|
|
1627
|
+
}, {
|
|
1628
|
+
readonly id: "nvidia/parakeet-tdt-0.6b-v2";
|
|
1629
|
+
readonly name: "Parakeet TDT 0.6B v2";
|
|
1630
|
+
readonly provider: "nvidia";
|
|
1631
|
+
readonly family: "parakeet";
|
|
1632
|
+
readonly pricing: {
|
|
1633
|
+
readonly input: 0;
|
|
1634
|
+
readonly output: 0;
|
|
1635
|
+
};
|
|
1636
|
+
readonly contextWindow: 0;
|
|
1637
|
+
readonly maxOutput: 4096;
|
|
1638
|
+
readonly modalities: {
|
|
1639
|
+
readonly input: readonly ["audio"];
|
|
1640
|
+
readonly output: readonly ["text"];
|
|
1641
|
+
};
|
|
1642
|
+
readonly capabilities: {
|
|
1643
|
+
readonly reasoning: false;
|
|
1644
|
+
readonly toolCall: false;
|
|
1645
|
+
readonly attachment: false;
|
|
1646
|
+
readonly structuredOutput: false;
|
|
1647
|
+
};
|
|
1648
|
+
}, {
|
|
1649
|
+
readonly id: "nvidia/nvidia-nemotron-nano-9b-v2";
|
|
1650
|
+
readonly name: "nvidia-nemotron-nano-9b-v2";
|
|
1651
|
+
readonly provider: "nvidia";
|
|
1652
|
+
readonly family: "nemotron";
|
|
1653
|
+
readonly pricing: {
|
|
1654
|
+
readonly input: 0;
|
|
1655
|
+
readonly output: 0;
|
|
1656
|
+
};
|
|
1657
|
+
readonly contextWindow: 131072;
|
|
1658
|
+
readonly maxOutput: 131072;
|
|
1659
|
+
readonly modalities: {
|
|
1660
|
+
readonly input: readonly ["text"];
|
|
1661
|
+
readonly output: readonly ["text"];
|
|
1662
|
+
};
|
|
1663
|
+
readonly capabilities: {
|
|
1664
|
+
readonly reasoning: true;
|
|
1665
|
+
readonly toolCall: true;
|
|
1666
|
+
readonly attachment: false;
|
|
1667
|
+
readonly structuredOutput: false;
|
|
1668
|
+
};
|
|
1669
|
+
}, {
|
|
1670
|
+
readonly id: "nvidia/llama-embed-nemotron-8b";
|
|
1671
|
+
readonly name: "Llama Embed Nemotron 8B";
|
|
1672
|
+
readonly provider: "nvidia";
|
|
1673
|
+
readonly family: "llama";
|
|
1674
|
+
readonly pricing: {
|
|
1675
|
+
readonly input: 0;
|
|
1676
|
+
readonly output: 0;
|
|
1677
|
+
};
|
|
1678
|
+
readonly contextWindow: 32768;
|
|
1679
|
+
readonly maxOutput: 2048;
|
|
1680
|
+
readonly modalities: {
|
|
1681
|
+
readonly input: readonly ["text"];
|
|
1682
|
+
readonly output: readonly ["text"];
|
|
1683
|
+
};
|
|
1684
|
+
readonly capabilities: {
|
|
1685
|
+
readonly reasoning: false;
|
|
1686
|
+
readonly toolCall: false;
|
|
1687
|
+
readonly attachment: false;
|
|
1688
|
+
readonly structuredOutput: false;
|
|
1689
|
+
};
|
|
1690
|
+
}, {
|
|
1691
|
+
readonly id: "nvidia/llama-3.3-nemotron-super-49b-v1.5";
|
|
1692
|
+
readonly name: "Llama 3.3 Nemotron Super 49b V1.5";
|
|
1693
|
+
readonly provider: "nvidia";
|
|
1694
|
+
readonly family: "";
|
|
1695
|
+
readonly pricing: {
|
|
1696
|
+
readonly input: 0;
|
|
1697
|
+
readonly output: 0;
|
|
1698
|
+
};
|
|
1699
|
+
readonly contextWindow: 128000;
|
|
1700
|
+
readonly maxOutput: 4096;
|
|
1701
|
+
readonly modalities: {
|
|
1702
|
+
readonly input: readonly ["text"];
|
|
1703
|
+
readonly output: readonly ["text"];
|
|
1704
|
+
};
|
|
1705
|
+
readonly capabilities: {
|
|
1706
|
+
readonly reasoning: false;
|
|
1707
|
+
readonly toolCall: false;
|
|
1708
|
+
readonly attachment: false;
|
|
1709
|
+
readonly structuredOutput: false;
|
|
1710
|
+
};
|
|
1711
|
+
}, {
|
|
1712
|
+
readonly id: "nvidia/llama-3.3-nemotron-super-49b-v1";
|
|
1713
|
+
readonly name: "Llama 3.3 Nemotron Super 49b V1";
|
|
1714
|
+
readonly provider: "nvidia";
|
|
1715
|
+
readonly family: "";
|
|
1716
|
+
readonly pricing: {
|
|
1717
|
+
readonly input: 0;
|
|
1718
|
+
readonly output: 0;
|
|
1719
|
+
};
|
|
1720
|
+
readonly contextWindow: 128000;
|
|
1721
|
+
readonly maxOutput: 4096;
|
|
1722
|
+
readonly modalities: {
|
|
1723
|
+
readonly input: readonly ["text"];
|
|
1724
|
+
readonly output: readonly ["text"];
|
|
1725
|
+
};
|
|
1726
|
+
readonly capabilities: {
|
|
1727
|
+
readonly reasoning: false;
|
|
1728
|
+
readonly toolCall: false;
|
|
1729
|
+
readonly attachment: false;
|
|
1730
|
+
readonly structuredOutput: false;
|
|
1731
|
+
};
|
|
1732
|
+
}, {
|
|
1733
|
+
readonly id: "nvidia/llama3-chatqa-1.5-70b";
|
|
1734
|
+
readonly name: "Llama3 Chatqa 1.5 70b";
|
|
1735
|
+
readonly provider: "nvidia";
|
|
1736
|
+
readonly family: "";
|
|
1737
|
+
readonly pricing: {
|
|
1738
|
+
readonly input: 0;
|
|
1739
|
+
readonly output: 0;
|
|
1740
|
+
};
|
|
1741
|
+
readonly contextWindow: 128000;
|
|
1742
|
+
readonly maxOutput: 4096;
|
|
1743
|
+
readonly modalities: {
|
|
1744
|
+
readonly input: readonly ["text"];
|
|
1745
|
+
readonly output: readonly ["text"];
|
|
1746
|
+
};
|
|
1747
|
+
readonly capabilities: {
|
|
1748
|
+
readonly reasoning: false;
|
|
1749
|
+
readonly toolCall: true;
|
|
1750
|
+
readonly attachment: false;
|
|
1751
|
+
readonly structuredOutput: true;
|
|
1752
|
+
};
|
|
1753
|
+
}, {
|
|
1754
|
+
readonly id: "nvidia/cosmos-nemotron-34b";
|
|
1755
|
+
readonly name: "Cosmos Nemotron 34B";
|
|
1756
|
+
readonly provider: "nvidia";
|
|
1757
|
+
readonly family: "nemotron";
|
|
1758
|
+
readonly pricing: {
|
|
1759
|
+
readonly input: 0;
|
|
1760
|
+
readonly output: 0;
|
|
1761
|
+
};
|
|
1762
|
+
readonly contextWindow: 131072;
|
|
1763
|
+
readonly maxOutput: 8192;
|
|
1764
|
+
readonly modalities: {
|
|
1765
|
+
readonly input: readonly ["text", "image", "video"];
|
|
1766
|
+
readonly output: readonly ["text"];
|
|
1767
|
+
};
|
|
1768
|
+
readonly capabilities: {
|
|
1769
|
+
readonly reasoning: true;
|
|
1770
|
+
readonly toolCall: false;
|
|
1771
|
+
readonly attachment: false;
|
|
1772
|
+
readonly structuredOutput: false;
|
|
1773
|
+
};
|
|
1774
|
+
}, {
|
|
1775
|
+
readonly id: "nvidia/nemoretriever-ocr-v1";
|
|
1776
|
+
readonly name: "NeMo Retriever OCR v1";
|
|
1777
|
+
readonly provider: "nvidia";
|
|
1778
|
+
readonly family: "nemoretriever";
|
|
1779
|
+
readonly pricing: {
|
|
1780
|
+
readonly input: 0;
|
|
1781
|
+
readonly output: 0;
|
|
1782
|
+
};
|
|
1783
|
+
readonly contextWindow: 0;
|
|
1784
|
+
readonly maxOutput: 4096;
|
|
1785
|
+
readonly modalities: {
|
|
1786
|
+
readonly input: readonly ["image"];
|
|
1787
|
+
readonly output: readonly ["text"];
|
|
1788
|
+
};
|
|
1789
|
+
readonly capabilities: {
|
|
1790
|
+
readonly reasoning: false;
|
|
1791
|
+
readonly toolCall: false;
|
|
1792
|
+
readonly attachment: false;
|
|
1793
|
+
readonly structuredOutput: false;
|
|
1794
|
+
};
|
|
1795
|
+
}, {
|
|
1796
|
+
readonly id: "nvidia/nemotron-4-340b-instruct";
|
|
1797
|
+
readonly name: "Nemotron 4 340b Instruct";
|
|
1798
|
+
readonly provider: "nvidia";
|
|
1799
|
+
readonly family: "";
|
|
1800
|
+
readonly pricing: {
|
|
1801
|
+
readonly input: 0;
|
|
1802
|
+
readonly output: 0;
|
|
1803
|
+
};
|
|
1804
|
+
readonly contextWindow: 128000;
|
|
1805
|
+
readonly maxOutput: 4096;
|
|
1806
|
+
readonly modalities: {
|
|
1807
|
+
readonly input: readonly ["text"];
|
|
1808
|
+
readonly output: readonly ["text"];
|
|
1809
|
+
};
|
|
1810
|
+
readonly capabilities: {
|
|
1811
|
+
readonly reasoning: false;
|
|
1812
|
+
readonly toolCall: true;
|
|
1813
|
+
readonly attachment: false;
|
|
1814
|
+
readonly structuredOutput: true;
|
|
1815
|
+
};
|
|
1816
|
+
}, {
|
|
1817
|
+
readonly id: "nvidia/nemotron-3-nano-30b-a3b";
|
|
1818
|
+
readonly name: "nemotron-3-nano-30b-a3b";
|
|
1819
|
+
readonly provider: "nvidia";
|
|
1820
|
+
readonly family: "nemotron";
|
|
1821
|
+
readonly pricing: {
|
|
1822
|
+
readonly input: 0;
|
|
1823
|
+
readonly output: 0;
|
|
1824
|
+
};
|
|
1825
|
+
readonly contextWindow: 131072;
|
|
1826
|
+
readonly maxOutput: 131072;
|
|
1827
|
+
readonly modalities: {
|
|
1828
|
+
readonly input: readonly ["text"];
|
|
1829
|
+
readonly output: readonly ["text"];
|
|
1830
|
+
};
|
|
1831
|
+
readonly capabilities: {
|
|
1832
|
+
readonly reasoning: true;
|
|
1833
|
+
readonly toolCall: true;
|
|
1834
|
+
readonly attachment: false;
|
|
1835
|
+
readonly structuredOutput: false;
|
|
1836
|
+
};
|
|
1837
|
+
}, {
|
|
1838
|
+
readonly id: "microsoft/phi-3-small-128k-instruct";
|
|
1839
|
+
readonly name: "Phi 3 Small 128k Instruct";
|
|
1840
|
+
readonly provider: "nvidia";
|
|
1841
|
+
readonly family: "";
|
|
1842
|
+
readonly pricing: {
|
|
1843
|
+
readonly input: 0;
|
|
1844
|
+
readonly output: 0;
|
|
1845
|
+
};
|
|
1846
|
+
readonly contextWindow: 128000;
|
|
1847
|
+
readonly maxOutput: 4096;
|
|
1848
|
+
readonly modalities: {
|
|
1849
|
+
readonly input: readonly ["text", "image"];
|
|
1850
|
+
readonly output: readonly ["text"];
|
|
1851
|
+
};
|
|
1852
|
+
readonly capabilities: {
|
|
1853
|
+
readonly reasoning: false;
|
|
1854
|
+
readonly toolCall: true;
|
|
1855
|
+
readonly attachment: true;
|
|
1856
|
+
readonly structuredOutput: true;
|
|
1857
|
+
};
|
|
1858
|
+
}, {
|
|
1859
|
+
readonly id: "microsoft/phi-3-medium-128k-instruct";
|
|
1860
|
+
readonly name: "Phi 3 Medium 128k Instruct";
|
|
1861
|
+
readonly provider: "nvidia";
|
|
1862
|
+
readonly family: "";
|
|
1863
|
+
readonly pricing: {
|
|
1864
|
+
readonly input: 0;
|
|
1865
|
+
readonly output: 0;
|
|
1866
|
+
};
|
|
1867
|
+
readonly contextWindow: 128000;
|
|
1868
|
+
readonly maxOutput: 4096;
|
|
1869
|
+
readonly modalities: {
|
|
1870
|
+
readonly input: readonly ["text", "image"];
|
|
1871
|
+
readonly output: readonly ["text"];
|
|
1872
|
+
};
|
|
1873
|
+
readonly capabilities: {
|
|
1874
|
+
readonly reasoning: false;
|
|
1875
|
+
readonly toolCall: true;
|
|
1876
|
+
readonly attachment: true;
|
|
1877
|
+
readonly structuredOutput: true;
|
|
1878
|
+
};
|
|
1879
|
+
}, {
|
|
1880
|
+
readonly id: "microsoft/phi-3.5-moe-instruct";
|
|
1881
|
+
readonly name: "Phi 3.5 Moe Instruct";
|
|
1882
|
+
readonly provider: "nvidia";
|
|
1883
|
+
readonly family: "";
|
|
1884
|
+
readonly pricing: {
|
|
1885
|
+
readonly input: 0;
|
|
1886
|
+
readonly output: 0;
|
|
1887
|
+
};
|
|
1888
|
+
readonly contextWindow: 128000;
|
|
1889
|
+
readonly maxOutput: 4096;
|
|
1890
|
+
readonly modalities: {
|
|
1891
|
+
readonly input: readonly ["text"];
|
|
1892
|
+
readonly output: readonly ["text"];
|
|
1893
|
+
};
|
|
1894
|
+
readonly capabilities: {
|
|
1895
|
+
readonly reasoning: false;
|
|
1896
|
+
readonly toolCall: true;
|
|
1897
|
+
readonly attachment: false;
|
|
1898
|
+
readonly structuredOutput: true;
|
|
1899
|
+
};
|
|
1900
|
+
}, {
|
|
1901
|
+
readonly id: "microsoft/phi-3-vision-128k-instruct";
|
|
1902
|
+
readonly name: "Phi 3 Vision 128k Instruct";
|
|
1903
|
+
readonly provider: "nvidia";
|
|
1904
|
+
readonly family: "";
|
|
1905
|
+
readonly pricing: {
|
|
1906
|
+
readonly input: 0;
|
|
1907
|
+
readonly output: 0;
|
|
1908
|
+
};
|
|
1909
|
+
readonly contextWindow: 128000;
|
|
1910
|
+
readonly maxOutput: 4096;
|
|
1911
|
+
readonly modalities: {
|
|
1912
|
+
readonly input: readonly ["text", "image"];
|
|
1913
|
+
readonly output: readonly ["text"];
|
|
1914
|
+
};
|
|
1915
|
+
readonly capabilities: {
|
|
1916
|
+
readonly reasoning: false;
|
|
1917
|
+
readonly toolCall: true;
|
|
1918
|
+
readonly attachment: false;
|
|
1919
|
+
readonly structuredOutput: true;
|
|
1920
|
+
};
|
|
1921
|
+
}, {
|
|
1922
|
+
readonly id: "microsoft/phi-4-mini-instruct";
|
|
1923
|
+
readonly name: "Phi-4-Mini";
|
|
1924
|
+
readonly provider: "nvidia";
|
|
1925
|
+
readonly family: "phi";
|
|
1926
|
+
readonly pricing: {
|
|
1927
|
+
readonly input: 0;
|
|
1928
|
+
readonly output: 0;
|
|
1929
|
+
};
|
|
1930
|
+
readonly contextWindow: 131072;
|
|
1931
|
+
readonly maxOutput: 8192;
|
|
1932
|
+
readonly modalities: {
|
|
1933
|
+
readonly input: readonly ["text", "image", "audio"];
|
|
1934
|
+
readonly output: readonly ["text"];
|
|
1935
|
+
};
|
|
1936
|
+
readonly capabilities: {
|
|
1937
|
+
readonly reasoning: true;
|
|
1938
|
+
readonly toolCall: true;
|
|
1939
|
+
readonly attachment: true;
|
|
1940
|
+
readonly structuredOutput: false;
|
|
1941
|
+
};
|
|
1942
|
+
}, {
|
|
1943
|
+
readonly id: "microsoft/phi-3.5-vision-instruct";
|
|
1944
|
+
readonly name: "Phi 3.5 Vision Instruct";
|
|
1945
|
+
readonly provider: "nvidia";
|
|
1946
|
+
readonly family: "";
|
|
1947
|
+
readonly pricing: {
|
|
1948
|
+
readonly input: 0;
|
|
1949
|
+
readonly output: 0;
|
|
1950
|
+
};
|
|
1951
|
+
readonly contextWindow: 128000;
|
|
1952
|
+
readonly maxOutput: 4096;
|
|
1953
|
+
readonly modalities: {
|
|
1954
|
+
readonly input: readonly ["text", "image"];
|
|
1955
|
+
readonly output: readonly ["text"];
|
|
1956
|
+
};
|
|
1957
|
+
readonly capabilities: {
|
|
1958
|
+
readonly reasoning: false;
|
|
1959
|
+
readonly toolCall: true;
|
|
1960
|
+
readonly attachment: false;
|
|
1961
|
+
readonly structuredOutput: true;
|
|
1962
|
+
};
|
|
1963
|
+
}, {
|
|
1964
|
+
readonly id: "microsoft/phi-3-medium-4k-instruct";
|
|
1965
|
+
readonly name: "Phi 3 Medium 4k Instruct";
|
|
1966
|
+
readonly provider: "nvidia";
|
|
1967
|
+
readonly family: "";
|
|
1968
|
+
readonly pricing: {
|
|
1969
|
+
readonly input: 0;
|
|
1970
|
+
readonly output: 0;
|
|
1971
|
+
};
|
|
1972
|
+
readonly contextWindow: 4000;
|
|
1973
|
+
readonly maxOutput: 4096;
|
|
1974
|
+
readonly modalities: {
|
|
1975
|
+
readonly input: readonly ["text", "image"];
|
|
1976
|
+
readonly output: readonly ["text"];
|
|
1977
|
+
};
|
|
1978
|
+
readonly capabilities: {
|
|
1979
|
+
readonly reasoning: false;
|
|
1980
|
+
readonly toolCall: true;
|
|
1981
|
+
readonly attachment: true;
|
|
1982
|
+
readonly structuredOutput: true;
|
|
1983
|
+
};
|
|
1984
|
+
}, {
|
|
1985
|
+
readonly id: "microsoft/phi-3-small-8k-instruct";
|
|
1986
|
+
readonly name: "Phi 3 Small 8k Instruct";
|
|
1987
|
+
readonly provider: "nvidia";
|
|
1988
|
+
readonly family: "";
|
|
1989
|
+
readonly pricing: {
|
|
1990
|
+
readonly input: 0;
|
|
1991
|
+
readonly output: 0;
|
|
1992
|
+
};
|
|
1993
|
+
readonly contextWindow: 8000;
|
|
1994
|
+
readonly maxOutput: 4096;
|
|
1995
|
+
readonly modalities: {
|
|
1996
|
+
readonly input: readonly ["text", "image"];
|
|
1997
|
+
readonly output: readonly ["text"];
|
|
1998
|
+
};
|
|
1999
|
+
readonly capabilities: {
|
|
2000
|
+
readonly reasoning: false;
|
|
2001
|
+
readonly toolCall: true;
|
|
2002
|
+
readonly attachment: true;
|
|
2003
|
+
readonly structuredOutput: true;
|
|
2004
|
+
};
|
|
2005
|
+
}, {
|
|
2006
|
+
readonly id: "minimaxai/minimax-m2.1";
|
|
2007
|
+
readonly name: "MiniMax-M2.1";
|
|
2008
|
+
readonly provider: "nvidia";
|
|
2009
|
+
readonly family: "minimax";
|
|
2010
|
+
readonly pricing: {
|
|
2011
|
+
readonly input: 0;
|
|
2012
|
+
readonly output: 0;
|
|
2013
|
+
};
|
|
2014
|
+
readonly contextWindow: 204800;
|
|
2015
|
+
readonly maxOutput: 131072;
|
|
2016
|
+
readonly modalities: {
|
|
2017
|
+
readonly input: readonly ["text"];
|
|
2018
|
+
readonly output: readonly ["text"];
|
|
2019
|
+
};
|
|
2020
|
+
readonly capabilities: {
|
|
2021
|
+
readonly reasoning: true;
|
|
2022
|
+
readonly toolCall: true;
|
|
2023
|
+
readonly attachment: false;
|
|
2024
|
+
readonly structuredOutput: false;
|
|
2025
|
+
};
|
|
2026
|
+
}, {
|
|
2027
|
+
readonly id: "minimaxai/minimax-m2.5";
|
|
2028
|
+
readonly name: "MiniMax-M2.5";
|
|
2029
|
+
readonly provider: "nvidia";
|
|
2030
|
+
readonly family: "minimax";
|
|
2031
|
+
readonly pricing: {
|
|
2032
|
+
readonly input: 0;
|
|
2033
|
+
readonly output: 0;
|
|
2034
|
+
};
|
|
2035
|
+
readonly contextWindow: 204800;
|
|
2036
|
+
readonly maxOutput: 131072;
|
|
2037
|
+
readonly modalities: {
|
|
2038
|
+
readonly input: readonly ["text"];
|
|
2039
|
+
readonly output: readonly ["text"];
|
|
2040
|
+
};
|
|
2041
|
+
readonly capabilities: {
|
|
2042
|
+
readonly reasoning: true;
|
|
2043
|
+
readonly toolCall: true;
|
|
2044
|
+
readonly attachment: false;
|
|
2045
|
+
readonly structuredOutput: false;
|
|
2046
|
+
};
|
|
2047
|
+
}, {
|
|
2048
|
+
readonly id: "deepseek-ai/deepseek-v3.1";
|
|
2049
|
+
readonly name: "DeepSeek V3.1";
|
|
2050
|
+
readonly provider: "nvidia";
|
|
2051
|
+
readonly family: "deepseek";
|
|
2052
|
+
readonly pricing: {
|
|
2053
|
+
readonly input: 0;
|
|
2054
|
+
readonly output: 0;
|
|
2055
|
+
};
|
|
2056
|
+
readonly contextWindow: 128000;
|
|
2057
|
+
readonly maxOutput: 8192;
|
|
2058
|
+
readonly modalities: {
|
|
2059
|
+
readonly input: readonly ["text"];
|
|
2060
|
+
readonly output: readonly ["text"];
|
|
2061
|
+
};
|
|
2062
|
+
readonly capabilities: {
|
|
2063
|
+
readonly reasoning: true;
|
|
2064
|
+
readonly toolCall: true;
|
|
2065
|
+
readonly attachment: false;
|
|
2066
|
+
readonly structuredOutput: false;
|
|
2067
|
+
};
|
|
2068
|
+
}, {
|
|
2069
|
+
readonly id: "deepseek-ai/deepseek-r1-0528";
|
|
2070
|
+
readonly name: "Deepseek R1 0528";
|
|
2071
|
+
readonly provider: "nvidia";
|
|
2072
|
+
readonly family: "";
|
|
2073
|
+
readonly pricing: {
|
|
2074
|
+
readonly input: 0;
|
|
2075
|
+
readonly output: 0;
|
|
2076
|
+
};
|
|
2077
|
+
readonly contextWindow: 128000;
|
|
2078
|
+
readonly maxOutput: 4096;
|
|
2079
|
+
readonly modalities: {
|
|
2080
|
+
readonly input: readonly ["text"];
|
|
2081
|
+
readonly output: readonly ["text"];
|
|
2082
|
+
};
|
|
2083
|
+
readonly capabilities: {
|
|
2084
|
+
readonly reasoning: true;
|
|
2085
|
+
readonly toolCall: true;
|
|
2086
|
+
readonly attachment: false;
|
|
2087
|
+
readonly structuredOutput: true;
|
|
2088
|
+
};
|
|
2089
|
+
}, {
|
|
2090
|
+
readonly id: "deepseek-ai/deepseek-r1";
|
|
2091
|
+
readonly name: "Deepseek R1";
|
|
2092
|
+
readonly provider: "nvidia";
|
|
2093
|
+
readonly family: "";
|
|
2094
|
+
readonly pricing: {
|
|
2095
|
+
readonly input: 0;
|
|
2096
|
+
readonly output: 0;
|
|
2097
|
+
};
|
|
2098
|
+
readonly contextWindow: 128000;
|
|
2099
|
+
readonly maxOutput: 4096;
|
|
2100
|
+
readonly modalities: {
|
|
2101
|
+
readonly input: readonly ["text"];
|
|
2102
|
+
readonly output: readonly ["text"];
|
|
2103
|
+
};
|
|
2104
|
+
readonly capabilities: {
|
|
2105
|
+
readonly reasoning: true;
|
|
2106
|
+
readonly toolCall: false;
|
|
2107
|
+
readonly attachment: false;
|
|
2108
|
+
readonly structuredOutput: false;
|
|
2109
|
+
};
|
|
2110
|
+
}, {
|
|
2111
|
+
readonly id: "deepseek-ai/deepseek-v3.1-terminus";
|
|
2112
|
+
readonly name: "DeepSeek V3.1 Terminus";
|
|
2113
|
+
readonly provider: "nvidia";
|
|
2114
|
+
readonly family: "deepseek";
|
|
2115
|
+
readonly pricing: {
|
|
2116
|
+
readonly input: 0;
|
|
2117
|
+
readonly output: 0;
|
|
2118
|
+
};
|
|
2119
|
+
readonly contextWindow: 128000;
|
|
2120
|
+
readonly maxOutput: 8192;
|
|
2121
|
+
readonly modalities: {
|
|
2122
|
+
readonly input: readonly ["text"];
|
|
2123
|
+
readonly output: readonly ["text"];
|
|
2124
|
+
};
|
|
2125
|
+
readonly capabilities: {
|
|
2126
|
+
readonly reasoning: true;
|
|
2127
|
+
readonly toolCall: true;
|
|
2128
|
+
readonly attachment: false;
|
|
2129
|
+
readonly structuredOutput: false;
|
|
2130
|
+
};
|
|
2131
|
+
}, {
|
|
2132
|
+
readonly id: "deepseek-ai/deepseek-coder-6.7b-instruct";
|
|
2133
|
+
readonly name: "Deepseek Coder 6.7b Instruct";
|
|
2134
|
+
readonly provider: "nvidia";
|
|
2135
|
+
readonly family: "";
|
|
2136
|
+
readonly pricing: {
|
|
2137
|
+
readonly input: 0;
|
|
2138
|
+
readonly output: 0;
|
|
2139
|
+
};
|
|
2140
|
+
readonly contextWindow: 128000;
|
|
2141
|
+
readonly maxOutput: 4096;
|
|
2142
|
+
readonly modalities: {
|
|
2143
|
+
readonly input: readonly ["text"];
|
|
2144
|
+
readonly output: readonly ["text"];
|
|
2145
|
+
};
|
|
2146
|
+
readonly capabilities: {
|
|
2147
|
+
readonly reasoning: false;
|
|
2148
|
+
readonly toolCall: true;
|
|
2149
|
+
readonly attachment: false;
|
|
2150
|
+
readonly structuredOutput: true;
|
|
2151
|
+
};
|
|
2152
|
+
}, {
|
|
2153
|
+
readonly id: "deepseek-ai/deepseek-v3.2";
|
|
2154
|
+
readonly name: "DeepSeek V3.2";
|
|
2155
|
+
readonly provider: "nvidia";
|
|
2156
|
+
readonly family: "deepseek";
|
|
2157
|
+
readonly pricing: {
|
|
2158
|
+
readonly input: 0;
|
|
2159
|
+
readonly output: 0;
|
|
2160
|
+
};
|
|
2161
|
+
readonly contextWindow: 163840;
|
|
2162
|
+
readonly maxOutput: 65536;
|
|
2163
|
+
readonly modalities: {
|
|
2164
|
+
readonly input: readonly ["text"];
|
|
2165
|
+
readonly output: readonly ["text"];
|
|
2166
|
+
};
|
|
2167
|
+
readonly capabilities: {
|
|
2168
|
+
readonly reasoning: true;
|
|
2169
|
+
readonly toolCall: true;
|
|
2170
|
+
readonly attachment: false;
|
|
2171
|
+
readonly structuredOutput: false;
|
|
2172
|
+
};
|
|
2173
|
+
}, {
|
|
2174
|
+
readonly id: "moonshotai/kimi-k2-instruct";
|
|
2175
|
+
readonly name: "Kimi K2 Instruct";
|
|
2176
|
+
readonly provider: "nvidia";
|
|
2177
|
+
readonly family: "kimi";
|
|
2178
|
+
readonly pricing: {
|
|
2179
|
+
readonly input: 0;
|
|
2180
|
+
readonly output: 0;
|
|
2181
|
+
};
|
|
2182
|
+
readonly contextWindow: 128000;
|
|
2183
|
+
readonly maxOutput: 8192;
|
|
2184
|
+
readonly modalities: {
|
|
2185
|
+
readonly input: readonly ["text"];
|
|
2186
|
+
readonly output: readonly ["text"];
|
|
2187
|
+
};
|
|
2188
|
+
readonly capabilities: {
|
|
2189
|
+
readonly reasoning: true;
|
|
2190
|
+
readonly toolCall: true;
|
|
2191
|
+
readonly attachment: false;
|
|
2192
|
+
readonly structuredOutput: false;
|
|
2193
|
+
};
|
|
2194
|
+
}, {
|
|
2195
|
+
readonly id: "moonshotai/kimi-k2-instruct-0905";
|
|
2196
|
+
readonly name: "Kimi K2 0905";
|
|
2197
|
+
readonly provider: "nvidia";
|
|
2198
|
+
readonly family: "kimi";
|
|
2199
|
+
readonly pricing: {
|
|
2200
|
+
readonly input: 0;
|
|
2201
|
+
readonly output: 0;
|
|
2202
|
+
};
|
|
2203
|
+
readonly contextWindow: 262144;
|
|
2204
|
+
readonly maxOutput: 262144;
|
|
2205
|
+
readonly modalities: {
|
|
2206
|
+
readonly input: readonly ["text"];
|
|
2207
|
+
readonly output: readonly ["text"];
|
|
2208
|
+
};
|
|
2209
|
+
readonly capabilities: {
|
|
2210
|
+
readonly reasoning: false;
|
|
2211
|
+
readonly toolCall: true;
|
|
2212
|
+
readonly attachment: false;
|
|
2213
|
+
readonly structuredOutput: false;
|
|
2214
|
+
};
|
|
2215
|
+
}, {
|
|
2216
|
+
readonly id: "moonshotai/kimi-k2.5";
|
|
2217
|
+
readonly name: "Kimi K2.5";
|
|
2218
|
+
readonly provider: "nvidia";
|
|
2219
|
+
readonly family: "kimi";
|
|
2220
|
+
readonly pricing: {
|
|
2221
|
+
readonly input: 0;
|
|
2222
|
+
readonly output: 0;
|
|
2223
|
+
};
|
|
2224
|
+
readonly contextWindow: 262144;
|
|
2225
|
+
readonly maxOutput: 262144;
|
|
2226
|
+
readonly modalities: {
|
|
2227
|
+
readonly input: readonly ["text", "image", "video"];
|
|
2228
|
+
readonly output: readonly ["text"];
|
|
2229
|
+
};
|
|
2230
|
+
readonly capabilities: {
|
|
2231
|
+
readonly reasoning: true;
|
|
2232
|
+
readonly toolCall: true;
|
|
2233
|
+
readonly attachment: true;
|
|
2234
|
+
readonly structuredOutput: false;
|
|
2235
|
+
};
|
|
2236
|
+
}, {
|
|
2237
|
+
readonly id: "moonshotai/kimi-k2-thinking";
|
|
2238
|
+
readonly name: "Kimi K2 Thinking";
|
|
2239
|
+
readonly provider: "nvidia";
|
|
2240
|
+
readonly family: "kimi-thinking";
|
|
2241
|
+
readonly pricing: {
|
|
2242
|
+
readonly input: 0;
|
|
2243
|
+
readonly output: 0;
|
|
2244
|
+
};
|
|
2245
|
+
readonly contextWindow: 262144;
|
|
2246
|
+
readonly maxOutput: 262144;
|
|
2247
|
+
readonly modalities: {
|
|
2248
|
+
readonly input: readonly ["text"];
|
|
2249
|
+
readonly output: readonly ["text"];
|
|
2250
|
+
};
|
|
2251
|
+
readonly capabilities: {
|
|
2252
|
+
readonly reasoning: true;
|
|
2253
|
+
readonly toolCall: true;
|
|
2254
|
+
readonly attachment: false;
|
|
2255
|
+
readonly structuredOutput: true;
|
|
2256
|
+
};
|
|
2257
|
+
}, {
|
|
2258
|
+
readonly id: "google/codegemma-7b";
|
|
2259
|
+
readonly name: "Codegemma 7b";
|
|
2260
|
+
readonly provider: "nvidia";
|
|
2261
|
+
readonly family: "";
|
|
2262
|
+
readonly pricing: {
|
|
2263
|
+
readonly input: 0;
|
|
2264
|
+
readonly output: 0;
|
|
2265
|
+
};
|
|
2266
|
+
readonly contextWindow: 128000;
|
|
2267
|
+
readonly maxOutput: 4096;
|
|
2268
|
+
readonly modalities: {
|
|
2269
|
+
readonly input: readonly ["text"];
|
|
2270
|
+
readonly output: readonly ["text"];
|
|
2271
|
+
};
|
|
2272
|
+
readonly capabilities: {
|
|
2273
|
+
readonly reasoning: false;
|
|
2274
|
+
readonly toolCall: false;
|
|
2275
|
+
readonly attachment: false;
|
|
2276
|
+
readonly structuredOutput: false;
|
|
2277
|
+
};
|
|
2278
|
+
}, {
|
|
2279
|
+
readonly id: "google/gemma-2-2b-it";
|
|
2280
|
+
readonly name: "Gemma 2 2b It";
|
|
2281
|
+
readonly provider: "nvidia";
|
|
2282
|
+
readonly family: "";
|
|
2283
|
+
readonly pricing: {
|
|
2284
|
+
readonly input: 0;
|
|
2285
|
+
readonly output: 0;
|
|
2286
|
+
};
|
|
2287
|
+
readonly contextWindow: 128000;
|
|
2288
|
+
readonly maxOutput: 4096;
|
|
2289
|
+
readonly modalities: {
|
|
2290
|
+
readonly input: readonly ["text"];
|
|
2291
|
+
readonly output: readonly ["text"];
|
|
2292
|
+
};
|
|
2293
|
+
readonly capabilities: {
|
|
2294
|
+
readonly reasoning: false;
|
|
2295
|
+
readonly toolCall: true;
|
|
2296
|
+
readonly attachment: false;
|
|
2297
|
+
readonly structuredOutput: true;
|
|
2298
|
+
};
|
|
2299
|
+
}, {
|
|
2300
|
+
readonly id: "google/gemma-3-1b-it";
|
|
2301
|
+
readonly name: "Gemma 3 1b It";
|
|
2302
|
+
readonly provider: "nvidia";
|
|
2303
|
+
readonly family: "";
|
|
2304
|
+
readonly pricing: {
|
|
2305
|
+
readonly input: 0;
|
|
2306
|
+
readonly output: 0;
|
|
2307
|
+
};
|
|
2308
|
+
readonly contextWindow: 128000;
|
|
2309
|
+
readonly maxOutput: 4096;
|
|
2310
|
+
readonly modalities: {
|
|
2311
|
+
readonly input: readonly ["text", "image"];
|
|
2312
|
+
readonly output: readonly ["text"];
|
|
2313
|
+
};
|
|
2314
|
+
readonly capabilities: {
|
|
2315
|
+
readonly reasoning: false;
|
|
2316
|
+
readonly toolCall: true;
|
|
2317
|
+
readonly attachment: true;
|
|
2318
|
+
readonly structuredOutput: true;
|
|
2319
|
+
};
|
|
2320
|
+
}, {
|
|
2321
|
+
readonly id: "google/gemma-2-27b-it";
|
|
2322
|
+
readonly name: "Gemma 2 27b It";
|
|
2323
|
+
readonly provider: "nvidia";
|
|
2324
|
+
readonly family: "";
|
|
2325
|
+
readonly pricing: {
|
|
2326
|
+
readonly input: 0;
|
|
2327
|
+
readonly output: 0;
|
|
2328
|
+
};
|
|
2329
|
+
readonly contextWindow: 128000;
|
|
2330
|
+
readonly maxOutput: 4096;
|
|
2331
|
+
readonly modalities: {
|
|
2332
|
+
readonly input: readonly ["text"];
|
|
2333
|
+
readonly output: readonly ["text"];
|
|
2334
|
+
};
|
|
2335
|
+
readonly capabilities: {
|
|
2336
|
+
readonly reasoning: false;
|
|
2337
|
+
readonly toolCall: true;
|
|
2338
|
+
readonly attachment: false;
|
|
2339
|
+
readonly structuredOutput: true;
|
|
2340
|
+
};
|
|
2341
|
+
}, {
|
|
2342
|
+
readonly id: "google/gemma-3n-e2b-it";
|
|
2343
|
+
readonly name: "Gemma 3n E2b It";
|
|
2344
|
+
readonly provider: "nvidia";
|
|
2345
|
+
readonly family: "";
|
|
2346
|
+
readonly pricing: {
|
|
2347
|
+
readonly input: 0;
|
|
2348
|
+
readonly output: 0;
|
|
2349
|
+
};
|
|
2350
|
+
readonly contextWindow: 128000;
|
|
2351
|
+
readonly maxOutput: 4096;
|
|
2352
|
+
readonly modalities: {
|
|
2353
|
+
readonly input: readonly ["text", "image"];
|
|
2354
|
+
readonly output: readonly ["text"];
|
|
2355
|
+
};
|
|
2356
|
+
readonly capabilities: {
|
|
2357
|
+
readonly reasoning: false;
|
|
2358
|
+
readonly toolCall: true;
|
|
2359
|
+
readonly attachment: true;
|
|
2360
|
+
readonly structuredOutput: true;
|
|
2361
|
+
};
|
|
2362
|
+
}, {
|
|
2363
|
+
readonly id: "google/codegemma-1.1-7b";
|
|
2364
|
+
readonly name: "Codegemma 1.1 7b";
|
|
2365
|
+
readonly provider: "nvidia";
|
|
2366
|
+
readonly family: "";
|
|
2367
|
+
readonly pricing: {
|
|
2368
|
+
readonly input: 0;
|
|
2369
|
+
readonly output: 0;
|
|
2370
|
+
};
|
|
2371
|
+
readonly contextWindow: 128000;
|
|
2372
|
+
readonly maxOutput: 4096;
|
|
2373
|
+
readonly modalities: {
|
|
2374
|
+
readonly input: readonly ["text"];
|
|
2375
|
+
readonly output: readonly ["text"];
|
|
2376
|
+
};
|
|
2377
|
+
readonly capabilities: {
|
|
2378
|
+
readonly reasoning: false;
|
|
2379
|
+
readonly toolCall: false;
|
|
2380
|
+
readonly attachment: false;
|
|
2381
|
+
readonly structuredOutput: false;
|
|
2382
|
+
};
|
|
2383
|
+
}, {
|
|
2384
|
+
readonly id: "google/gemma-3n-e4b-it";
|
|
2385
|
+
readonly name: "Gemma 3n E4b It";
|
|
2386
|
+
readonly provider: "nvidia";
|
|
2387
|
+
readonly family: "";
|
|
2388
|
+
readonly pricing: {
|
|
2389
|
+
readonly input: 0;
|
|
2390
|
+
readonly output: 0;
|
|
2391
|
+
};
|
|
2392
|
+
readonly contextWindow: 128000;
|
|
2393
|
+
readonly maxOutput: 4096;
|
|
2394
|
+
readonly modalities: {
|
|
2395
|
+
readonly input: readonly ["text", "image"];
|
|
2396
|
+
readonly output: readonly ["text"];
|
|
2397
|
+
};
|
|
2398
|
+
readonly capabilities: {
|
|
2399
|
+
readonly reasoning: false;
|
|
2400
|
+
readonly toolCall: true;
|
|
2401
|
+
readonly attachment: true;
|
|
2402
|
+
readonly structuredOutput: true;
|
|
2403
|
+
};
|
|
2404
|
+
}, {
|
|
2405
|
+
readonly id: "google/gemma-3-12b-it";
|
|
2406
|
+
readonly name: "Gemma 3 12b It";
|
|
2407
|
+
readonly provider: "nvidia";
|
|
2408
|
+
readonly family: "";
|
|
2409
|
+
readonly pricing: {
|
|
2410
|
+
readonly input: 0;
|
|
2411
|
+
readonly output: 0;
|
|
2412
|
+
};
|
|
2413
|
+
readonly contextWindow: 128000;
|
|
2414
|
+
readonly maxOutput: 4096;
|
|
2415
|
+
readonly modalities: {
|
|
2416
|
+
readonly input: readonly ["text"];
|
|
2417
|
+
readonly output: readonly ["text"];
|
|
2418
|
+
};
|
|
2419
|
+
readonly capabilities: {
|
|
2420
|
+
readonly reasoning: false;
|
|
2421
|
+
readonly toolCall: true;
|
|
2422
|
+
readonly attachment: false;
|
|
2423
|
+
readonly structuredOutput: true;
|
|
2424
|
+
};
|
|
2425
|
+
}, {
|
|
2426
|
+
readonly id: "google/gemma-3-27b-it";
|
|
2427
|
+
readonly name: "Gemma-3-27B-IT";
|
|
2428
|
+
readonly provider: "nvidia";
|
|
2429
|
+
readonly family: "gemma";
|
|
2430
|
+
readonly pricing: {
|
|
2431
|
+
readonly input: 0;
|
|
2432
|
+
readonly output: 0;
|
|
2433
|
+
};
|
|
2434
|
+
readonly contextWindow: 131072;
|
|
2435
|
+
readonly maxOutput: 8192;
|
|
2436
|
+
readonly modalities: {
|
|
2437
|
+
readonly input: readonly ["text", "image"];
|
|
2438
|
+
readonly output: readonly ["text"];
|
|
2439
|
+
};
|
|
2440
|
+
readonly capabilities: {
|
|
2441
|
+
readonly reasoning: true;
|
|
2442
|
+
readonly toolCall: true;
|
|
2443
|
+
readonly attachment: true;
|
|
2444
|
+
readonly structuredOutput: false;
|
|
2445
|
+
};
|
|
2446
|
+
}, {
|
|
2447
|
+
readonly id: "z-ai/glm4.7";
|
|
2448
|
+
readonly name: "GLM-4.7";
|
|
2449
|
+
readonly provider: "nvidia";
|
|
2450
|
+
readonly family: "glm";
|
|
2451
|
+
readonly pricing: {
|
|
2452
|
+
readonly input: 0;
|
|
2453
|
+
readonly output: 0;
|
|
2454
|
+
};
|
|
2455
|
+
readonly contextWindow: 204800;
|
|
2456
|
+
readonly maxOutput: 131072;
|
|
2457
|
+
readonly modalities: {
|
|
2458
|
+
readonly input: readonly ["text"];
|
|
2459
|
+
readonly output: readonly ["text"];
|
|
2460
|
+
};
|
|
2461
|
+
readonly capabilities: {
|
|
2462
|
+
readonly reasoning: true;
|
|
2463
|
+
readonly toolCall: true;
|
|
2464
|
+
readonly attachment: false;
|
|
2465
|
+
readonly structuredOutput: false;
|
|
2466
|
+
};
|
|
2467
|
+
}, {
|
|
2468
|
+
readonly id: "z-ai/glm5";
|
|
2469
|
+
readonly name: "GLM5";
|
|
2470
|
+
readonly provider: "nvidia";
|
|
2471
|
+
readonly family: "glm";
|
|
2472
|
+
readonly pricing: {
|
|
2473
|
+
readonly input: 0;
|
|
2474
|
+
readonly output: 0;
|
|
2475
|
+
};
|
|
2476
|
+
readonly contextWindow: 202752;
|
|
2477
|
+
readonly maxOutput: 131000;
|
|
2478
|
+
readonly modalities: {
|
|
2479
|
+
readonly input: readonly ["text"];
|
|
2480
|
+
readonly output: readonly ["text"];
|
|
2481
|
+
};
|
|
2482
|
+
readonly capabilities: {
|
|
2483
|
+
readonly reasoning: true;
|
|
2484
|
+
readonly toolCall: true;
|
|
2485
|
+
readonly attachment: false;
|
|
2486
|
+
readonly structuredOutput: true;
|
|
2487
|
+
};
|
|
2488
|
+
}, {
|
|
2489
|
+
readonly id: "stepfun-ai/step-3.5-flash";
|
|
2490
|
+
readonly name: "Step 3.5 Flash";
|
|
2491
|
+
readonly provider: "nvidia";
|
|
2492
|
+
readonly family: "";
|
|
2493
|
+
readonly pricing: {
|
|
2494
|
+
readonly input: 0;
|
|
2495
|
+
readonly output: 0;
|
|
2496
|
+
};
|
|
2497
|
+
readonly contextWindow: 256000;
|
|
2498
|
+
readonly maxOutput: 16384;
|
|
2499
|
+
readonly modalities: {
|
|
2500
|
+
readonly input: readonly ["text"];
|
|
2501
|
+
readonly output: readonly ["text"];
|
|
2502
|
+
};
|
|
2503
|
+
readonly capabilities: {
|
|
2504
|
+
readonly reasoning: true;
|
|
2505
|
+
readonly toolCall: true;
|
|
2506
|
+
readonly attachment: false;
|
|
2507
|
+
readonly structuredOutput: false;
|
|
2508
|
+
};
|
|
2509
|
+
}, {
|
|
2510
|
+
readonly id: "qwen/qwen3-next-80b-a3b-thinking";
|
|
2511
|
+
readonly name: "Qwen3-Next-80B-A3B-Thinking";
|
|
2512
|
+
readonly provider: "nvidia";
|
|
2513
|
+
readonly family: "qwen";
|
|
2514
|
+
readonly pricing: {
|
|
2515
|
+
readonly input: 0;
|
|
2516
|
+
readonly output: 0;
|
|
2517
|
+
};
|
|
2518
|
+
readonly contextWindow: 262144;
|
|
2519
|
+
readonly maxOutput: 16384;
|
|
2520
|
+
readonly modalities: {
|
|
2521
|
+
readonly input: readonly ["text"];
|
|
2522
|
+
readonly output: readonly ["text"];
|
|
2523
|
+
};
|
|
2524
|
+
readonly capabilities: {
|
|
2525
|
+
readonly reasoning: true;
|
|
2526
|
+
readonly toolCall: true;
|
|
2527
|
+
readonly attachment: false;
|
|
2528
|
+
readonly structuredOutput: false;
|
|
2529
|
+
};
|
|
2530
|
+
}, {
|
|
2531
|
+
readonly id: "qwen/qwen3-coder-480b-a35b-instruct";
|
|
2532
|
+
readonly name: "Qwen3 Coder 480B A35B Instruct";
|
|
2533
|
+
readonly provider: "nvidia";
|
|
2534
|
+
readonly family: "qwen";
|
|
2535
|
+
readonly pricing: {
|
|
2536
|
+
readonly input: 0;
|
|
2537
|
+
readonly output: 0;
|
|
2538
|
+
};
|
|
2539
|
+
readonly contextWindow: 262144;
|
|
2540
|
+
readonly maxOutput: 66536;
|
|
2541
|
+
readonly modalities: {
|
|
2542
|
+
readonly input: readonly ["text"];
|
|
2543
|
+
readonly output: readonly ["text"];
|
|
2544
|
+
};
|
|
2545
|
+
readonly capabilities: {
|
|
2546
|
+
readonly reasoning: false;
|
|
2547
|
+
readonly toolCall: true;
|
|
2548
|
+
readonly attachment: false;
|
|
2549
|
+
readonly structuredOutput: false;
|
|
2550
|
+
};
|
|
2551
|
+
}, {
|
|
2552
|
+
readonly id: "qwen/qwq-32b";
|
|
2553
|
+
readonly name: "Qwq 32b";
|
|
2554
|
+
readonly provider: "nvidia";
|
|
2555
|
+
readonly family: "";
|
|
2556
|
+
readonly pricing: {
|
|
2557
|
+
readonly input: 0;
|
|
2558
|
+
readonly output: 0;
|
|
2559
|
+
};
|
|
2560
|
+
readonly contextWindow: 128000;
|
|
2561
|
+
readonly maxOutput: 4096;
|
|
2562
|
+
readonly modalities: {
|
|
2563
|
+
readonly input: readonly ["text"];
|
|
2564
|
+
readonly output: readonly ["text"];
|
|
2565
|
+
};
|
|
2566
|
+
readonly capabilities: {
|
|
2567
|
+
readonly reasoning: true;
|
|
2568
|
+
readonly toolCall: false;
|
|
2569
|
+
readonly attachment: false;
|
|
2570
|
+
readonly structuredOutput: false;
|
|
2571
|
+
};
|
|
2572
|
+
}, {
|
|
2573
|
+
readonly id: "qwen/qwen2.5-coder-7b-instruct";
|
|
2574
|
+
readonly name: "Qwen2.5 Coder 7b Instruct";
|
|
2575
|
+
readonly provider: "nvidia";
|
|
2576
|
+
readonly family: "";
|
|
2577
|
+
readonly pricing: {
|
|
2578
|
+
readonly input: 0;
|
|
2579
|
+
readonly output: 0;
|
|
2580
|
+
};
|
|
2581
|
+
readonly contextWindow: 128000;
|
|
2582
|
+
readonly maxOutput: 4096;
|
|
2583
|
+
readonly modalities: {
|
|
2584
|
+
readonly input: readonly ["text"];
|
|
2585
|
+
readonly output: readonly ["text"];
|
|
2586
|
+
};
|
|
2587
|
+
readonly capabilities: {
|
|
2588
|
+
readonly reasoning: false;
|
|
2589
|
+
readonly toolCall: true;
|
|
2590
|
+
readonly attachment: false;
|
|
2591
|
+
readonly structuredOutput: true;
|
|
2592
|
+
};
|
|
2593
|
+
}, {
|
|
2594
|
+
readonly id: "qwen/qwen3.5-397b-a17b";
|
|
2595
|
+
readonly name: "Qwen3.5-397B-A17B";
|
|
2596
|
+
readonly provider: "nvidia";
|
|
2597
|
+
readonly family: "qwen";
|
|
2598
|
+
readonly pricing: {
|
|
2599
|
+
readonly input: 0;
|
|
2600
|
+
readonly output: 0;
|
|
2601
|
+
};
|
|
2602
|
+
readonly contextWindow: 262144;
|
|
2603
|
+
readonly maxOutput: 8192;
|
|
2604
|
+
readonly modalities: {
|
|
2605
|
+
readonly input: readonly ["text", "image"];
|
|
2606
|
+
readonly output: readonly ["text"];
|
|
2607
|
+
};
|
|
2608
|
+
readonly capabilities: {
|
|
2609
|
+
readonly reasoning: true;
|
|
2610
|
+
readonly toolCall: true;
|
|
2611
|
+
readonly attachment: true;
|
|
2612
|
+
readonly structuredOutput: true;
|
|
2613
|
+
};
|
|
2614
|
+
}, {
|
|
2615
|
+
readonly id: "qwen/qwen2.5-coder-32b-instruct";
|
|
2616
|
+
readonly name: "Qwen2.5 Coder 32b Instruct";
|
|
2617
|
+
readonly provider: "nvidia";
|
|
2618
|
+
readonly family: "";
|
|
2619
|
+
readonly pricing: {
|
|
2620
|
+
readonly input: 0;
|
|
2621
|
+
readonly output: 0;
|
|
2622
|
+
};
|
|
2623
|
+
readonly contextWindow: 128000;
|
|
2624
|
+
readonly maxOutput: 4096;
|
|
2625
|
+
readonly modalities: {
|
|
2626
|
+
readonly input: readonly ["text"];
|
|
2627
|
+
readonly output: readonly ["text"];
|
|
2628
|
+
};
|
|
2629
|
+
readonly capabilities: {
|
|
2630
|
+
readonly reasoning: false;
|
|
2631
|
+
readonly toolCall: true;
|
|
2632
|
+
readonly attachment: false;
|
|
2633
|
+
readonly structuredOutput: true;
|
|
2634
|
+
};
|
|
2635
|
+
}, {
|
|
2636
|
+
readonly id: "qwen/qwen3-235b-a22b";
|
|
2637
|
+
readonly name: "Qwen3-235B-A22B";
|
|
2638
|
+
readonly provider: "nvidia";
|
|
2639
|
+
readonly family: "qwen";
|
|
2640
|
+
readonly pricing: {
|
|
2641
|
+
readonly input: 0;
|
|
2642
|
+
readonly output: 0;
|
|
2643
|
+
};
|
|
2644
|
+
readonly contextWindow: 131072;
|
|
2645
|
+
readonly maxOutput: 8192;
|
|
2646
|
+
readonly modalities: {
|
|
2647
|
+
readonly input: readonly ["text"];
|
|
2648
|
+
readonly output: readonly ["text"];
|
|
2649
|
+
};
|
|
2650
|
+
readonly capabilities: {
|
|
2651
|
+
readonly reasoning: true;
|
|
2652
|
+
readonly toolCall: true;
|
|
2653
|
+
readonly attachment: false;
|
|
2654
|
+
readonly structuredOutput: false;
|
|
2655
|
+
};
|
|
2656
|
+
}, {
|
|
2657
|
+
readonly id: "qwen/qwen3-next-80b-a3b-instruct";
|
|
2658
|
+
readonly name: "Qwen3-Next-80B-A3B-Instruct";
|
|
2659
|
+
readonly provider: "nvidia";
|
|
2660
|
+
readonly family: "qwen";
|
|
2661
|
+
readonly pricing: {
|
|
2662
|
+
readonly input: 0;
|
|
2663
|
+
readonly output: 0;
|
|
2664
|
+
};
|
|
2665
|
+
readonly contextWindow: 262144;
|
|
2666
|
+
readonly maxOutput: 16384;
|
|
2667
|
+
readonly modalities: {
|
|
2668
|
+
readonly input: readonly ["text"];
|
|
2669
|
+
readonly output: readonly ["text"];
|
|
2670
|
+
};
|
|
2671
|
+
readonly capabilities: {
|
|
2672
|
+
readonly reasoning: false;
|
|
2673
|
+
readonly toolCall: true;
|
|
2674
|
+
readonly attachment: false;
|
|
2675
|
+
readonly structuredOutput: false;
|
|
2676
|
+
};
|
|
2677
|
+
}, {
|
|
2678
|
+
readonly id: "meta/llama-3.1-70b-instruct";
|
|
2679
|
+
readonly name: "Llama 3.1 70b Instruct";
|
|
2680
|
+
readonly provider: "nvidia";
|
|
2681
|
+
readonly family: "";
|
|
2682
|
+
readonly pricing: {
|
|
2683
|
+
readonly input: 0;
|
|
2684
|
+
readonly output: 0;
|
|
2685
|
+
};
|
|
2686
|
+
readonly contextWindow: 128000;
|
|
2687
|
+
readonly maxOutput: 4096;
|
|
2688
|
+
readonly modalities: {
|
|
2689
|
+
readonly input: readonly ["text"];
|
|
2690
|
+
readonly output: readonly ["text"];
|
|
2691
|
+
};
|
|
2692
|
+
readonly capabilities: {
|
|
2693
|
+
readonly reasoning: false;
|
|
2694
|
+
readonly toolCall: true;
|
|
2695
|
+
readonly attachment: false;
|
|
2696
|
+
readonly structuredOutput: true;
|
|
2697
|
+
};
|
|
2698
|
+
}, {
|
|
2699
|
+
readonly id: "meta/llama-3.3-70b-instruct";
|
|
2700
|
+
readonly name: "Llama 3.3 70b Instruct";
|
|
2701
|
+
readonly provider: "nvidia";
|
|
2702
|
+
readonly family: "";
|
|
2703
|
+
readonly pricing: {
|
|
2704
|
+
readonly input: 0;
|
|
2705
|
+
readonly output: 0;
|
|
2706
|
+
};
|
|
2707
|
+
readonly contextWindow: 128000;
|
|
2708
|
+
readonly maxOutput: 4096;
|
|
2709
|
+
readonly modalities: {
|
|
2710
|
+
readonly input: readonly ["text"];
|
|
2711
|
+
readonly output: readonly ["text"];
|
|
2712
|
+
};
|
|
2713
|
+
readonly capabilities: {
|
|
2714
|
+
readonly reasoning: false;
|
|
2715
|
+
readonly toolCall: true;
|
|
2716
|
+
readonly attachment: false;
|
|
2717
|
+
readonly structuredOutput: true;
|
|
2718
|
+
};
|
|
2719
|
+
}, {
|
|
2720
|
+
readonly id: "meta/llama-4-scout-17b-16e-instruct";
|
|
2721
|
+
readonly name: "Llama 4 Scout 17b 16e Instruct";
|
|
2722
|
+
readonly provider: "nvidia";
|
|
2723
|
+
readonly family: "";
|
|
2724
|
+
readonly pricing: {
|
|
2725
|
+
readonly input: 0;
|
|
2726
|
+
readonly output: 0;
|
|
2727
|
+
};
|
|
2728
|
+
readonly contextWindow: 128000;
|
|
2729
|
+
readonly maxOutput: 4096;
|
|
2730
|
+
readonly modalities: {
|
|
2731
|
+
readonly input: readonly ["text", "image"];
|
|
2732
|
+
readonly output: readonly ["text"];
|
|
2733
|
+
};
|
|
2734
|
+
readonly capabilities: {
|
|
2735
|
+
readonly reasoning: false;
|
|
2736
|
+
readonly toolCall: true;
|
|
2737
|
+
readonly attachment: true;
|
|
2738
|
+
readonly structuredOutput: true;
|
|
2739
|
+
};
|
|
2740
|
+
}, {
|
|
2741
|
+
readonly id: "meta/llama-3.2-11b-vision-instruct";
|
|
2742
|
+
readonly name: "Llama 3.2 11b Vision Instruct";
|
|
2743
|
+
readonly provider: "nvidia";
|
|
2744
|
+
readonly family: "";
|
|
2745
|
+
readonly pricing: {
|
|
2746
|
+
readonly input: 0;
|
|
2747
|
+
readonly output: 0;
|
|
2748
|
+
};
|
|
2749
|
+
readonly contextWindow: 128000;
|
|
2750
|
+
readonly maxOutput: 4096;
|
|
2751
|
+
readonly modalities: {
|
|
2752
|
+
readonly input: readonly ["text", "image"];
|
|
2753
|
+
readonly output: readonly ["text"];
|
|
2754
|
+
};
|
|
2755
|
+
readonly capabilities: {
|
|
2756
|
+
readonly reasoning: false;
|
|
2757
|
+
readonly toolCall: true;
|
|
2758
|
+
readonly attachment: true;
|
|
2759
|
+
readonly structuredOutput: true;
|
|
2760
|
+
};
|
|
2761
|
+
}, {
|
|
2762
|
+
readonly id: "meta/llama3-8b-instruct";
|
|
2763
|
+
readonly name: "Llama3 8b Instruct";
|
|
2764
|
+
readonly provider: "nvidia";
|
|
2765
|
+
readonly family: "";
|
|
2766
|
+
readonly pricing: {
|
|
2767
|
+
readonly input: 0;
|
|
2768
|
+
readonly output: 0;
|
|
2769
|
+
};
|
|
2770
|
+
readonly contextWindow: 128000;
|
|
2771
|
+
readonly maxOutput: 4096;
|
|
2772
|
+
readonly modalities: {
|
|
2773
|
+
readonly input: readonly ["text"];
|
|
2774
|
+
readonly output: readonly ["text"];
|
|
2775
|
+
};
|
|
2776
|
+
readonly capabilities: {
|
|
2777
|
+
readonly reasoning: false;
|
|
2778
|
+
readonly toolCall: true;
|
|
2779
|
+
readonly attachment: false;
|
|
2780
|
+
readonly structuredOutput: true;
|
|
2781
|
+
};
|
|
2782
|
+
}, {
|
|
2783
|
+
readonly id: "meta/codellama-70b";
|
|
2784
|
+
readonly name: "Codellama 70b";
|
|
2785
|
+
readonly provider: "nvidia";
|
|
2786
|
+
readonly family: "";
|
|
2787
|
+
readonly pricing: {
|
|
2788
|
+
readonly input: 0;
|
|
2789
|
+
readonly output: 0;
|
|
2790
|
+
};
|
|
2791
|
+
readonly contextWindow: 128000;
|
|
2792
|
+
readonly maxOutput: 4096;
|
|
2793
|
+
readonly modalities: {
|
|
2794
|
+
readonly input: readonly ["text"];
|
|
2795
|
+
readonly output: readonly ["text"];
|
|
2796
|
+
};
|
|
2797
|
+
readonly capabilities: {
|
|
2798
|
+
readonly reasoning: false;
|
|
2799
|
+
readonly toolCall: false;
|
|
2800
|
+
readonly attachment: false;
|
|
2801
|
+
readonly structuredOutput: false;
|
|
2802
|
+
};
|
|
2803
|
+
}, {
|
|
2804
|
+
readonly id: "meta/llama-3.2-1b-instruct";
|
|
2805
|
+
readonly name: "Llama 3.2 1b Instruct";
|
|
2806
|
+
readonly provider: "nvidia";
|
|
2807
|
+
readonly family: "";
|
|
2808
|
+
readonly pricing: {
|
|
2809
|
+
readonly input: 0;
|
|
2810
|
+
readonly output: 0;
|
|
2811
|
+
};
|
|
2812
|
+
readonly contextWindow: 128000;
|
|
2813
|
+
readonly maxOutput: 4096;
|
|
2814
|
+
readonly modalities: {
|
|
2815
|
+
readonly input: readonly ["text"];
|
|
2816
|
+
readonly output: readonly ["text"];
|
|
2817
|
+
};
|
|
2818
|
+
readonly capabilities: {
|
|
2819
|
+
readonly reasoning: false;
|
|
2820
|
+
readonly toolCall: true;
|
|
2821
|
+
readonly attachment: false;
|
|
2822
|
+
readonly structuredOutput: true;
|
|
2823
|
+
};
|
|
2824
|
+
}, {
|
|
2825
|
+
readonly id: "meta/llama-3.1-405b-instruct";
|
|
2826
|
+
readonly name: "Llama 3.1 405b Instruct";
|
|
2827
|
+
readonly provider: "nvidia";
|
|
2828
|
+
readonly family: "";
|
|
2829
|
+
readonly pricing: {
|
|
2830
|
+
readonly input: 0;
|
|
2831
|
+
readonly output: 0;
|
|
2832
|
+
};
|
|
2833
|
+
readonly contextWindow: 128000;
|
|
2834
|
+
readonly maxOutput: 4096;
|
|
2835
|
+
readonly modalities: {
|
|
2836
|
+
readonly input: readonly ["text"];
|
|
2837
|
+
readonly output: readonly ["text"];
|
|
2838
|
+
};
|
|
2839
|
+
readonly capabilities: {
|
|
2840
|
+
readonly reasoning: false;
|
|
2841
|
+
readonly toolCall: true;
|
|
2842
|
+
readonly attachment: false;
|
|
2843
|
+
readonly structuredOutput: true;
|
|
2844
|
+
};
|
|
2845
|
+
}, {
|
|
2846
|
+
readonly id: "meta/llama3-70b-instruct";
|
|
2847
|
+
readonly name: "Llama3 70b Instruct";
|
|
2848
|
+
readonly provider: "nvidia";
|
|
2849
|
+
readonly family: "";
|
|
2850
|
+
readonly pricing: {
|
|
2851
|
+
readonly input: 0;
|
|
2852
|
+
readonly output: 0;
|
|
2853
|
+
};
|
|
2854
|
+
readonly contextWindow: 128000;
|
|
2855
|
+
readonly maxOutput: 4096;
|
|
2856
|
+
readonly modalities: {
|
|
2857
|
+
readonly input: readonly ["text"];
|
|
2858
|
+
readonly output: readonly ["text"];
|
|
2859
|
+
};
|
|
2860
|
+
readonly capabilities: {
|
|
2861
|
+
readonly reasoning: false;
|
|
2862
|
+
readonly toolCall: true;
|
|
2863
|
+
readonly attachment: false;
|
|
2864
|
+
readonly structuredOutput: true;
|
|
2865
|
+
};
|
|
2866
|
+
}, {
|
|
2867
|
+
readonly id: "meta/llama-4-maverick-17b-128e-instruct";
|
|
2868
|
+
readonly name: "Llama 4 Maverick 17b 128e Instruct";
|
|
2869
|
+
readonly provider: "nvidia";
|
|
2870
|
+
readonly family: "";
|
|
2871
|
+
readonly pricing: {
|
|
2872
|
+
readonly input: 0;
|
|
2873
|
+
readonly output: 0;
|
|
2874
|
+
};
|
|
2875
|
+
readonly contextWindow: 128000;
|
|
2876
|
+
readonly maxOutput: 4096;
|
|
2877
|
+
readonly modalities: {
|
|
2878
|
+
readonly input: readonly ["text", "image"];
|
|
2879
|
+
readonly output: readonly ["text"];
|
|
2880
|
+
};
|
|
2881
|
+
readonly capabilities: {
|
|
2882
|
+
readonly reasoning: false;
|
|
2883
|
+
readonly toolCall: true;
|
|
2884
|
+
readonly attachment: true;
|
|
2885
|
+
readonly structuredOutput: true;
|
|
2886
|
+
};
|
|
2887
|
+
}, {
|
|
2888
|
+
readonly id: "mistralai/mistral-large-3-675b-instruct-2512";
|
|
2889
|
+
readonly name: "Mistral Large 3 675B Instruct 2512";
|
|
2890
|
+
readonly provider: "nvidia";
|
|
2891
|
+
readonly family: "mistral-large";
|
|
2892
|
+
readonly pricing: {
|
|
2893
|
+
readonly input: 0;
|
|
2894
|
+
readonly output: 0;
|
|
2895
|
+
};
|
|
2896
|
+
readonly contextWindow: 262144;
|
|
2897
|
+
readonly maxOutput: 262144;
|
|
2898
|
+
readonly modalities: {
|
|
2899
|
+
readonly input: readonly ["text", "image"];
|
|
2900
|
+
readonly output: readonly ["text"];
|
|
2901
|
+
};
|
|
2902
|
+
readonly capabilities: {
|
|
2903
|
+
readonly reasoning: false;
|
|
2904
|
+
readonly toolCall: true;
|
|
2905
|
+
readonly attachment: true;
|
|
2906
|
+
readonly structuredOutput: true;
|
|
2907
|
+
};
|
|
2908
|
+
}, {
|
|
2909
|
+
readonly id: "mistralai/mamba-codestral-7b-v0.1";
|
|
2910
|
+
readonly name: "Mamba Codestral 7b V0.1";
|
|
2911
|
+
readonly provider: "nvidia";
|
|
2912
|
+
readonly family: "";
|
|
2913
|
+
readonly pricing: {
|
|
2914
|
+
readonly input: 0;
|
|
2915
|
+
readonly output: 0;
|
|
2916
|
+
};
|
|
2917
|
+
readonly contextWindow: 128000;
|
|
2918
|
+
readonly maxOutput: 4096;
|
|
2919
|
+
readonly modalities: {
|
|
2920
|
+
readonly input: readonly ["text"];
|
|
2921
|
+
readonly output: readonly ["text"];
|
|
2922
|
+
};
|
|
2923
|
+
readonly capabilities: {
|
|
2924
|
+
readonly reasoning: false;
|
|
2925
|
+
readonly toolCall: false;
|
|
2926
|
+
readonly attachment: false;
|
|
2927
|
+
readonly structuredOutput: false;
|
|
2928
|
+
};
|
|
2929
|
+
}, {
|
|
2930
|
+
readonly id: "mistralai/codestral-22b-instruct-v0.1";
|
|
2931
|
+
readonly name: "Codestral 22b Instruct V0.1";
|
|
2932
|
+
readonly provider: "nvidia";
|
|
2933
|
+
readonly family: "";
|
|
2934
|
+
readonly pricing: {
|
|
2935
|
+
readonly input: 0;
|
|
2936
|
+
readonly output: 0;
|
|
2937
|
+
};
|
|
2938
|
+
readonly contextWindow: 128000;
|
|
2939
|
+
readonly maxOutput: 4096;
|
|
2940
|
+
readonly modalities: {
|
|
2941
|
+
readonly input: readonly ["text"];
|
|
2942
|
+
readonly output: readonly ["text"];
|
|
2943
|
+
};
|
|
2944
|
+
readonly capabilities: {
|
|
2945
|
+
readonly reasoning: false;
|
|
2946
|
+
readonly toolCall: true;
|
|
2947
|
+
readonly attachment: false;
|
|
2948
|
+
readonly structuredOutput: true;
|
|
2949
|
+
};
|
|
2950
|
+
}, {
|
|
2951
|
+
readonly id: "mistralai/mistral-large-2-instruct";
|
|
2952
|
+
readonly name: "Mistral Large 2 Instruct";
|
|
2953
|
+
readonly provider: "nvidia";
|
|
2954
|
+
readonly family: "";
|
|
2955
|
+
readonly pricing: {
|
|
2956
|
+
readonly input: 0;
|
|
2957
|
+
readonly output: 0;
|
|
2958
|
+
};
|
|
2959
|
+
readonly contextWindow: 128000;
|
|
2960
|
+
readonly maxOutput: 4096;
|
|
2961
|
+
readonly modalities: {
|
|
2962
|
+
readonly input: readonly ["text"];
|
|
2963
|
+
readonly output: readonly ["text"];
|
|
2964
|
+
};
|
|
2965
|
+
readonly capabilities: {
|
|
2966
|
+
readonly reasoning: false;
|
|
2967
|
+
readonly toolCall: true;
|
|
2968
|
+
readonly attachment: false;
|
|
2969
|
+
readonly structuredOutput: true;
|
|
2970
|
+
};
|
|
2971
|
+
}, {
|
|
2972
|
+
readonly id: "mistralai/ministral-14b-instruct-2512";
|
|
2973
|
+
readonly name: "Ministral 3 14B Instruct 2512";
|
|
2974
|
+
readonly provider: "nvidia";
|
|
2975
|
+
readonly family: "ministral";
|
|
2976
|
+
readonly pricing: {
|
|
2977
|
+
readonly input: 0;
|
|
2978
|
+
readonly output: 0;
|
|
2979
|
+
};
|
|
2980
|
+
readonly contextWindow: 262144;
|
|
2981
|
+
readonly maxOutput: 262144;
|
|
2982
|
+
readonly modalities: {
|
|
2983
|
+
readonly input: readonly ["text", "image"];
|
|
2984
|
+
readonly output: readonly ["text"];
|
|
2985
|
+
};
|
|
2986
|
+
readonly capabilities: {
|
|
2987
|
+
readonly reasoning: false;
|
|
2988
|
+
readonly toolCall: true;
|
|
2989
|
+
readonly attachment: true;
|
|
2990
|
+
readonly structuredOutput: true;
|
|
2991
|
+
};
|
|
2992
|
+
}, {
|
|
2993
|
+
readonly id: "mistralai/mistral-small-3.1-24b-instruct-2503";
|
|
2994
|
+
readonly name: "Mistral Small 3.1 24b Instruct 2503";
|
|
2995
|
+
readonly provider: "nvidia";
|
|
2996
|
+
readonly family: "";
|
|
2997
|
+
readonly pricing: {
|
|
2998
|
+
readonly input: 0;
|
|
2999
|
+
readonly output: 0;
|
|
3000
|
+
};
|
|
3001
|
+
readonly contextWindow: 128000;
|
|
3002
|
+
readonly maxOutput: 4096;
|
|
3003
|
+
readonly modalities: {
|
|
3004
|
+
readonly input: readonly ["text"];
|
|
3005
|
+
readonly output: readonly ["text"];
|
|
3006
|
+
};
|
|
3007
|
+
readonly capabilities: {
|
|
3008
|
+
readonly reasoning: false;
|
|
3009
|
+
readonly toolCall: true;
|
|
3010
|
+
readonly attachment: false;
|
|
3011
|
+
readonly structuredOutput: true;
|
|
3012
|
+
};
|
|
3013
|
+
}, {
|
|
3014
|
+
readonly id: "mistralai/devstral-2-123b-instruct-2512";
|
|
3015
|
+
readonly name: "Devstral-2-123B-Instruct-2512";
|
|
3016
|
+
readonly provider: "nvidia";
|
|
3017
|
+
readonly family: "devstral";
|
|
3018
|
+
readonly pricing: {
|
|
3019
|
+
readonly input: 0;
|
|
3020
|
+
readonly output: 0;
|
|
3021
|
+
};
|
|
3022
|
+
readonly contextWindow: 262144;
|
|
3023
|
+
readonly maxOutput: 262144;
|
|
3024
|
+
readonly modalities: {
|
|
3025
|
+
readonly input: readonly ["text"];
|
|
3026
|
+
readonly output: readonly ["text"];
|
|
3027
|
+
};
|
|
3028
|
+
readonly capabilities: {
|
|
3029
|
+
readonly reasoning: true;
|
|
3030
|
+
readonly toolCall: true;
|
|
3031
|
+
readonly attachment: true;
|
|
3032
|
+
readonly structuredOutput: true;
|
|
3033
|
+
};
|
|
3034
|
+
}, {
|
|
3035
|
+
readonly id: "openai/gpt-oss-120b";
|
|
3036
|
+
readonly name: "GPT-OSS-120B";
|
|
3037
|
+
readonly provider: "nvidia";
|
|
3038
|
+
readonly family: "gpt-oss";
|
|
3039
|
+
readonly pricing: {
|
|
3040
|
+
readonly input: 0;
|
|
3041
|
+
readonly output: 0;
|
|
3042
|
+
};
|
|
3043
|
+
readonly contextWindow: 128000;
|
|
3044
|
+
readonly maxOutput: 8192;
|
|
3045
|
+
readonly modalities: {
|
|
3046
|
+
readonly input: readonly ["text"];
|
|
3047
|
+
readonly output: readonly ["text"];
|
|
3048
|
+
};
|
|
3049
|
+
readonly capabilities: {
|
|
3050
|
+
readonly reasoning: true;
|
|
3051
|
+
readonly toolCall: false;
|
|
3052
|
+
readonly attachment: true;
|
|
3053
|
+
readonly structuredOutput: false;
|
|
3054
|
+
};
|
|
3055
|
+
}, {
|
|
3056
|
+
readonly id: "openai/whisper-large-v3";
|
|
3057
|
+
readonly name: "Whisper Large v3";
|
|
3058
|
+
readonly provider: "nvidia";
|
|
3059
|
+
readonly family: "whisper";
|
|
3060
|
+
readonly pricing: {
|
|
3061
|
+
readonly input: 0;
|
|
3062
|
+
readonly output: 0;
|
|
3063
|
+
};
|
|
3064
|
+
readonly contextWindow: 0;
|
|
3065
|
+
readonly maxOutput: 4096;
|
|
3066
|
+
readonly modalities: {
|
|
3067
|
+
readonly input: readonly ["audio"];
|
|
3068
|
+
readonly output: readonly ["text"];
|
|
3069
|
+
};
|
|
3070
|
+
readonly capabilities: {
|
|
3071
|
+
readonly reasoning: false;
|
|
3072
|
+
readonly toolCall: false;
|
|
3073
|
+
readonly attachment: false;
|
|
3074
|
+
readonly structuredOutput: false;
|
|
3075
|
+
};
|
|
3076
|
+
}, {
|
|
3077
|
+
readonly id: "black-forest-labs/flux.1-dev";
|
|
3078
|
+
readonly name: "FLUX.1-dev";
|
|
3079
|
+
readonly provider: "nvidia";
|
|
3080
|
+
readonly family: "flux";
|
|
3081
|
+
readonly pricing: {
|
|
3082
|
+
readonly input: 0;
|
|
3083
|
+
readonly output: 0;
|
|
3084
|
+
};
|
|
3085
|
+
readonly contextWindow: 4096;
|
|
3086
|
+
readonly maxOutput: 0;
|
|
3087
|
+
readonly modalities: {
|
|
3088
|
+
readonly input: readonly ["text"];
|
|
3089
|
+
readonly output: readonly ["image"];
|
|
3090
|
+
};
|
|
3091
|
+
readonly capabilities: {
|
|
3092
|
+
readonly reasoning: false;
|
|
3093
|
+
readonly toolCall: false;
|
|
3094
|
+
readonly attachment: false;
|
|
3095
|
+
readonly structuredOutput: false;
|
|
3096
|
+
};
|
|
3097
|
+
}];
|
|
3098
|
+
/**
|
|
3099
|
+
* Look up an NVIDIA NIM model definition by its model ID.
|
|
3100
|
+
*
|
|
3101
|
+
* @param id - The provider-native model identifier; typed as `LiteralUnion<NvidiaModelId, string>`, so known IDs and arbitrary strings are both accepted.
|
|
3102
|
+
* @returns The matching model definition, or `null` if there is no match.
|
|
3103
|
+
*
|
|
3104
|
+
* @example
|
|
3105
|
+
* ```typescript
|
|
3106
|
+
* import { nvidiaModel } from '@funkai/models/nvidia'
|
|
3107
|
+
*
|
|
3108
|
+
* const m = nvidiaModel('nvidia/llama-3.1-nemotron-70b-instruct')
|
|
3109
|
+
* if (m) {
|
|
3110
|
+
*   console.log(m.pricing.input)
|
|
3111
|
+
* }
|
|
3112
|
+
* ```
|
|
3113
|
+
*/
|
|
|
3114
|
+
declare function nvidiaModel(id: LiteralUnion<NvidiaModelId, string>): ModelDefinition | null;
|
|
3115
|
+
//#endregion
|
|
3116
|
+
export { NvidiaModelId, nvidiaModel, nvidiaModels };
|
|
3117
|
+
//# sourceMappingURL=nvidia.d.mts.map
|